scan.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan.json (22769B)
      1 {
      2   "paper": {
      3     "title": "A Literature Review on AI-Powered Smart Code Base Navigator",
      4     "authors": [
      5       "Radhika S K",
      6       "Rashmitha R",
      7       "Sanjana N",
      8       "Shanthala M N",
      9       "Sukanya G"
     10     ],
     11     "year": 2025,
     12     "venue": "International Journal of Scientific Research in Engineering and Management (IJSREM)",
     13     "doi": "10.55041/IJSREM52774"
     14   },
     15   "scan_version": 3,
     16   "active_modules": ["survey_methodology"],
     17   "methodology_tags": ["meta-analysis"],
     18   "key_findings": "This literature review surveys 20 papers on AI-powered code search and navigation tools, covering transformer-based code generation, retrieval-augmented generation, semantic code search, and code completion. The paper summarizes each work's methodology, strengths, and weaknesses in a tabular format. No original system is built or evaluated despite the abstract implying one is introduced. The review lacks systematic methodology — no search protocol, no quality assessment of sources, and no structured synthesis beyond per-paper summaries.",
     19   "checklist": {
     20     "artifacts": {
     21       "code_released": {
     22         "applies": true,
     23         "answer": false,
     24         "justification": "No code, analysis scripts, or repository links are provided. A survey can release search/analysis scripts but this one does not."
     25       },
     26       "data_released": {
     27         "applies": true,
     28         "answer": false,
     29         "justification": "No dataset, search corpus, or structured extraction of reviewed papers is released. The summary table is in the paper but not as downloadable data."
     30       },
     31       "environment_specified": {
     32         "applies": true,
     33         "answer": false,
     34         "justification": "No environment or tool specifications are provided for reproducing the literature search or analysis."
     35       },
     36       "reproduction_instructions": {
     37         "applies": true,
     38         "answer": false,
     39         "justification": "No instructions are given for reproducing the literature search — no databases searched, no search queries, no date ranges, no inclusion/exclusion criteria."
     40       }
     41     },
     42     "statistical_methodology": {
     43       "confidence_intervals_or_error_bars": {
     44         "applies": false,
     45         "answer": false,
     46         "justification": "This is a narrative literature review with no experiments or statistical analysis."
     47       },
     48       "significance_tests": {
     49         "applies": false,
     50         "answer": false,
     51         "justification": "No experiments are conducted; the paper only summarizes existing work."
     52       },
     53       "effect_sizes_reported": {
     54         "applies": false,
     55         "answer": false,
     56         "justification": "No experiments or statistical aggregation are performed in this survey."
     57       },
     58       "sample_size_justified": {
     59         "applies": false,
     60         "answer": false,
     61         "justification": "No experiments are conducted in this narrative literature review."
     62       },
     63       "variance_reported": {
     64         "applies": false,
     65         "answer": false,
     66         "justification": "No experiments or quantitative synthesis are performed."
     67       }
     68     },
     69     "evaluation_design": {
     70       "baselines_included": {
     71         "applies": true,
     72         "answer": false,
     73         "justification": "The survey does not compare itself against prior surveys or reviews on the same topic. No baseline comparison of any kind."
     74       },
     75       "baselines_contemporary": {
     76         "applies": false,
     77         "answer": false,
     78         "justification": "No experiments conducted; this criterion requires experimental baselines."
     79       },
     80       "ablation_study": {
     81         "applies": false,
     82         "answer": false,
     83         "justification": "No system or experimental design to ablate."
     84       },
     85       "multiple_metrics": {
     86         "applies": false,
     87         "answer": false,
     88         "justification": "No evaluation metrics are used; this is a narrative review."
     89       },
     90       "human_evaluation": {
     91         "applies": false,
     92         "answer": false,
     93         "justification": "No system outputs to evaluate; this is a literature review."
     94       },
     95       "held_out_test_set": {
     96         "applies": false,
     97         "answer": false,
     98         "justification": "No experimental evaluation requiring train/test splits."
     99       },
    100       "per_category_breakdown": {
    101         "applies": true,
    102         "answer": true,
    103         "justification": "Papers are organized into labeled categories (A through T) covering code generation, RAG, code search, code completion, etc., with a summary table breaking down methodology and remarks per paper."
    104       },
    105       "failure_cases_discussed": {
    106         "applies": true,
    107         "answer": true,
    108         "justification": "The summary table includes a 'Cons' column for each reviewed paper, noting limitations such as 'Can produce invalid or insecure code,' 'Resource-heavy,' 'Focused on education; lacks quantitative comparison,' etc."
    109       },
    110       "negative_results_reported": {
    111         "applies": true,
    112         "answer": true,
    113         "justification": "Each reviewed paper's weaknesses and limitations are reported. For example, the review notes that UNIF outperforms more complex models (Section T), and that LLMs fail to grasp semantics (Section M)."
    114       }
    115     },
    116     "claims_and_evidence": {
    117       "abstract_claims_supported": {
    118         "applies": true,
    119         "answer": false,
    120         "justification": "The abstract states 'This initiative introduces an AI-Powered Smart Code Base Navigator, a system designed to facilitate semantic code search, context-aware code completion, and streamlined navigation.' No such system is actually built, implemented, or evaluated in the paper. The body is entirely a literature review of 20 existing papers."
    121       },
    122       "causal_claims_justified": {
    123         "applies": true,
    124         "answer": false,
    125         "justification": "The conclusion claims the navigator 'improves code comprehension, offers context-sensitive support, and shortens the time developers need to find and understand pertinent sections of the code.' No causal evidence is provided — no system exists to test these claims."
    126       },
    127       "generalization_bounded": {
    128         "applies": true,
    129         "answer": false,
    130         "justification": "The paper makes broad claims about AI 'revolutionizing software development' and 'greatly enhancing software engineering methodologies' based on a review of 20 papers, without bounding these generalizations to the specific tools, languages, or contexts reviewed."
    131       },
    132       "alternative_explanations_discussed": {
    133         "applies": true,
    134         "answer": false,
    135         "justification": "No alternative explanations are considered for the conclusions drawn. The paper does not discuss whether the improvements reported in reviewed papers could be due to confounds, dataset selection, or other factors."
    136       },
    137       "proxy_outcome_distinction": {
    138         "applies": true,
    139         "answer": false,
    140         "justification": "The paper frames reviewed tools as 'boosting developer productivity' and 'enhancing software engineering methodologies' without discussing whether the metrics reported (MRR, BLEU, accuracy) actually capture productivity or engineering quality."
    141       }
    142     },
    143     "setup_transparency": {
    144       "model_versions_specified": {
    145         "applies": false,
    146         "answer": false,
    147         "justification": "No models are used by the authors; this is a literature review."
    148       },
    149       "prompts_provided": {
    150         "applies": false,
    151         "answer": false,
    152         "justification": "No prompting is used in this literature review."
    153       },
    154       "hyperparameters_reported": {
    155         "applies": false,
    156         "answer": false,
    157         "justification": "No experiments are conducted in this survey paper."
    158       },
    159       "scaffolding_described": {
    160         "applies": false,
    161         "answer": false,
    162         "justification": "No agentic scaffolding is used; this is a literature review."
    163       },
    164       "data_preprocessing_documented": {
    165         "applies": true,
    166         "answer": false,
    167         "justification": "The paper selection pipeline is not documented at all. There is no description of which databases were searched, what search queries were used, what time period was covered, or how the 20 papers were selected from a larger pool."
    168       }
    169     },
    170     "limitations_and_scope": {
    171       "limitations_section_present": {
    172         "applies": true,
    173         "answer": false,
    174         "justification": "There is no limitations section. The conclusion mentions 'future opportunities' but does not discuss limitations of the review itself."
    175       },
    176       "threats_to_validity_specific": {
    177         "applies": true,
    178         "answer": false,
    179         "justification": "No threats to validity are discussed anywhere in the paper."
    180       },
    181       "scope_boundaries_stated": {
    182         "applies": true,
    183         "answer": false,
    184         "justification": "No explicit scope boundaries are stated. The paper does not specify what types of papers were excluded, what time period was covered, or what the review does NOT claim to show."
    185       }
    186     },
    187     "data_integrity": {
    188       "raw_data_available": {
    189         "applies": true,
    190         "answer": false,
    191         "justification": "No raw data is available. The full set of search results, screening decisions, or extracted data from reviewed papers is not provided."
    192       },
    193       "data_collection_described": {
    194         "applies": true,
    195         "answer": false,
    196         "justification": "The paper does not describe how the 20 reviewed papers were found. No databases, search terms, or collection procedures are mentioned."
    197       },
    198       "recruitment_methods_described": {
    199         "applies": true,
    200         "answer": false,
    201         "justification": "For a survey, 'recruitment' means paper selection. No description is given of how papers were identified or selected for inclusion."
    202       },
    203       "data_pipeline_documented": {
    204         "applies": true,
    205         "answer": false,
    206         "justification": "No pipeline from initial search to final 20 papers is documented. There are no filtering stages, counts at each stage, or criteria described."
    207       }
    208     },
    209     "conflicts_of_interest": {
    210       "funding_disclosed": {
    211         "applies": true,
    212         "answer": false,
    213         "justification": "No funding source is disclosed anywhere in the paper."
    214       },
    215       "affiliations_disclosed": {
    216         "applies": true,
    217         "answer": true,
    218         "justification": "Author affiliations are listed: one assistant professor and four UG students from the Department of Computer Science and Engineering, JNNCE, Shivamogga, Karnataka, India."
    219       },
    220       "funder_independent_of_outcome": {
    221         "applies": false,
    222         "answer": false,
    223         "justification": "This appears to be an unfunded undergraduate student project."
    224       },
    225       "financial_interests_declared": {
    226         "applies": true,
    227         "answer": false,
    228         "justification": "No competing interests or financial interests statement is provided."
    229       }
    230     },
    231     "contamination": {
    232       "training_cutoff_stated": {
    233         "applies": false,
    234         "answer": false,
    235         "justification": "This is a survey paper that does not evaluate any pre-trained model on benchmarks."
    236       },
    237       "train_test_overlap_discussed": {
    238         "applies": false,
    239         "answer": false,
    240         "justification": "This is a survey paper that does not evaluate any pre-trained model on benchmarks."
    241       },
    242       "benchmark_contamination_addressed": {
    243         "applies": false,
    244         "answer": false,
    245         "justification": "This is a survey paper that does not evaluate any pre-trained model on benchmarks."
    246       }
    247     },
    248     "human_studies": {
    249       "pre_registered": {
    250         "applies": false,
    251         "answer": false,
    252         "justification": "No human participants in this literature review."
    253       },
    254       "irb_or_ethics_approval": {
    255         "applies": false,
    256         "answer": false,
    257         "justification": "No human participants in this literature review."
    258       },
    259       "demographics_reported": {
    260         "applies": false,
    261         "answer": false,
    262         "justification": "No human participants in this literature review."
    263       },
    264       "inclusion_exclusion_criteria": {
    265         "applies": false,
    266         "answer": false,
    267         "justification": "No human participants in this literature review."
    268       },
    269       "randomization_described": {
    270         "applies": false,
    271         "answer": false,
    272         "justification": "No human participants in this literature review."
    273       },
    274       "blinding_described": {
    275         "applies": false,
    276         "answer": false,
    277         "justification": "No human participants in this literature review."
    278       },
    279       "attrition_reported": {
    280         "applies": false,
    281         "answer": false,
    282         "justification": "No human participants in this literature review."
    283       }
    284     },
    285     "cost_and_practicality": {
    286       "inference_cost_reported": {
    287         "applies": false,
    288         "answer": false,
    289         "justification": "This is a survey paper with no system or method of its own."
    290       },
    291       "compute_budget_stated": {
    292         "applies": false,
    293         "answer": false,
    294         "justification": "This is a survey paper with no computation performed."
    295       }
    296     },
    297     "survey_methodology": {
    298       "prisma_or_structured_protocol": {
    299         "applies": true,
    300         "answer": false,
    301         "justification": "No PRISMA diagram, no structured search protocol, no reproducible search queries, and no systematic methodology is described. Papers appear to have been selected ad-hoc."
    302       },
    303       "quality_assessment_of_sources": {
    304         "applies": true,
    305         "answer": false,
    306         "justification": "The survey does not assess the methodological quality of its source papers. It lists pros and cons narratively but has no quality scoring rubric, risk-of-bias assessment, or structured evaluation. All 20 papers are treated as equally credible."
    307       },
    308       "publication_bias_discussed": {
    309         "applies": true,
    310         "answer": false,
    311         "justification": "Publication bias is not discussed. The survey does not consider whether its sources are biased toward positive results or whether negative results in code search/navigation are underrepresented."
    312       }
    313     }
    314   },
    315   "claims": [
    316     {
    317       "claim": "The paper introduces an 'AI-Powered Smart Code Base Navigator' that facilitates semantic code search, context-aware code completion, and streamlined navigation within extensive Python codebases.",
    318       "evidence": "Abstract and Introduction describe the system conceptually, but the paper body (Sections A-T) is entirely a literature review of 20 existing works. No system design, implementation, or evaluation is presented.",
    319       "supported": "unsupported"
    320     },
    321     {
    322       "claim": "Meta-RAG achieved about 84.7% accuracy at locating the buggy file and 53.0% at the function level on SWE-bench Lite.",
    323       "evidence": "Reported in Section B from Tawosi et al. [2]. The claim is a direct report from the cited paper, not independently verified.",
    324       "supported": "moderate"
    325     },
    326     {
    327       "claim": "EVOR achieved roughly 2–4× higher correct code generation rates than recent baselines like Reflexion or DocPrompting.",
    328       "evidence": "Reported in Section H from Su et al. [8]. The claim is a direct report from the cited paper, not independently verified.",
    329       "supported": "moderate"
    330     },
    331     {
    332       "claim": "REINFOREST outperforms previous cross-language search tools by up to 44.7% on accuracy metrics.",
    333       "evidence": "Reported in Section I from Saieva et al. [9]. The claim is a direct report from the cited paper, not independently verified.",
    334       "supported": "moderate"
    335     },
    336     {
    337       "claim": "The AI-Powered Smart Code Base Navigator 'improves code comprehension, offers context-sensitive support, and shortens the time developers need to find and understand pertinent sections of the code.'",
    338       "evidence": "Stated in the Conclusion. No system was actually built or evaluated to support these claims.",
    339       "supported": "unsupported"
    340     }
    341   ],
    342   "red_flags": [
    343     {
    344       "flag": "Phantom system — abstract describes a system that doesn't exist",
    345       "detail": "The abstract and introduction claim to 'introduce' an 'AI-Powered Smart Code Base Navigator' system, but the paper body is entirely a literature review of 20 existing papers. No system is designed, implemented, or evaluated. The conclusion then claims the system 'improves code comprehension' without any evidence."
    346     },
    347     {
    348       "flag": "Copy-paste error from template",
    349       "detail": "The Literature Survey section begins with 'In this section, various authors have presented various Emotion detection techniques.' This is clearly pasted from a different paper's template and is unrelated to code navigation."
    350     },
    351     {
    352       "flag": "No systematic review methodology",
    353       "detail": "The 20 reviewed papers appear hand-picked without any documented selection criteria, search strategy, databases queried, or inclusion/exclusion criteria. The review is entirely ad-hoc."
    354     },
    355     {
    356       "flag": "No quality assessment of sources",
    357       "detail": "All 20 reviewed papers are treated as equally credible. No quality scoring, risk-of-bias assessment, or critical evaluation of methodology is performed. This launders the signal-to-noise ratio of the sources."
    358     },
    359     {
    360       "flag": "Predatory journal indicators",
    361       "detail": "Published in IJSREM (ISSN: 2582-3930), which exhibits characteristics of a predatory journal: no rigorous peer review evident (copy-paste error was not caught), rapid publication, and low editorial standards."
    362     },
    363     {
    364       "flag": "Undergraduate student project published as research",
    365       "detail": "Four of five authors are listed as 'UG Students.' The paper lacks the methodological rigor expected of a published literature review — no structured protocol, no quality assessment, and claims about a system that was never built."
    366     }
    367   ],
    368   "cited_papers": [
    369     {
    370       "title": "Meta-RAG on large codebases using code summarization",
    371       "authors": ["V. Tawosi", "S. Alamir", "X. Liu", "M. Veloso"],
    372       "year": 2025,
    373       "arxiv_id": "2508.02611",
    374       "relevance": "Multi-agent RAG framework for bug localization in large codebases, achieving SOTA on SWE-bench Lite."
    375     },
    376     {
    377       "title": "Position: Intelligent coding systems should write programs with justifications",
    378       "authors": ["X. Xu", "S. Feng", "Z. Su", "C. Wang", "X. Zhang"],
    379       "year": 2025,
    380       "arxiv_id": "2508.06017",
    381       "relevance": "Proposes neuro-symbolic approach for AI coding assistants to generate verifiable justifications alongside code."
    382     },
    383     {
    384       "title": "Conversational AI as a coding assistant: Understanding programmers' interactions with and expectations from large language models for coding",
    385       "authors": ["M. Akhoroz", "C. Yildirim"],
    386       "year": 2025,
    387       "arxiv_id": "2503.16508",
    388       "relevance": "Survey of 143 student developers on LLM chatbot usage for coding, documenting accuracy and over-reliance concerns."
    389     },
    390     {
    391       "title": "A deep dive into retrieval-augmented generation for code completion: Experience on WeChat",
    392       "authors": ["Z. Yang", "C. Wang", "T. Peng", "H. Huang", "Y. Deng", "C. Gao"],
    393       "year": 2025,
    394       "arxiv_id": "2507.18515",
    395       "relevance": "Empirical study of RAG for C++ code completion in a large closed-source industrial codebase."
    396     },
    397     {
    398       "title": "EVOR: Evolving retrieval for code generation",
    399       "authors": ["H. Su", "S. Jiang", "Y. Lai", "H. Wu", "B. Shi", "C. Liu", "Q. Liu", "T. Yu"],
    400       "year": 2024,
    401       "arxiv_id": "2402.12317",
    402       "relevance": "RAG pipeline that dynamically updates queries and knowledge base for code generation, claiming 2-4x improvement over baselines."
    403     },
    404     {
    405       "title": "A comprehensive survey of AI-driven advancements and techniques in automated program repair and code generation",
    406       "authors": ["A. Anand", "N. Yadav", "A. Gupta", "S. Bajaj"],
    407       "year": 2024,
    408       "arxiv_id": "2411.07586",
    409       "relevance": "Systematic review of 27 works on AI-assisted bug fixing and code synthesis, covering search-based repair and LLM-based generation."
    410     },
    411     {
    412       "title": "Code Search Is All You Need? Improving Code Suggestions with Code Search",
    413       "authors": ["J. Chen", "X. Hu", "Z. Li", "C. Gao", "X. Xia", "D. Lo"],
    414       "year": 2024,
    415       "relevance": "Demonstrates retrieval-augmented code suggestion with up to 130.8% improvement in code generation BLEU scores."
    416     },
    417     {
    418       "title": "LLMs: Understanding code syntax and semantics for code analysis",
    419       "authors": ["W. Ma", "W. Wang", "S. Liu", "Y. Liu", "Q. Hu", "L. Li", "Z. Lin", "C. Zhang", "L. Nie"],
    420       "year": 2024,
    421       "arxiv_id": "2305.12138",
    422       "relevance": "Evaluates GPT-4, GPT-3.5, StarCoder, and CodeLlama on syntax vs. semantic understanding, finding LLMs fail at runtime reasoning."
    423     },
    424     {
    425       "title": "CodeBERT: A pre-trained model for programming and natural languages",
    426       "authors": ["Z. Feng"],
    427       "year": 2020,
    428       "relevance": "Foundational bimodal transformer pre-trained on code and natural language, establishing NL-PL pre-training for code tasks."
    429     },
    430     {
    431       "title": "REINFOREST: Reinforcing Semantic Code Similarity for Cross-Lingual Code Search Models",
    432       "authors": ["A. Saieva", "S. Chakraborty", "G. Kaiser"],
    433       "year": 2024,
    434       "arxiv_id": "2305.03843",
    435       "relevance": "Cross-language code search method incorporating runtime information into static representations, claiming up to 44.7% accuracy improvement."
    436     }
    437   ],
    438   "engagement_factors": {
    439     "practical_relevance": {
    440       "score": 1,
    441       "justification": "Describes the concept of an AI-powered code navigator but no system is actually built; a practitioner gets only a reading list."
    442     },
    443     "surprise_contrarian": {
    444       "score": 0,
    445       "justification": "Confirms conventional wisdom that AI can help with code search; no novel or surprising findings."
    446     },
    447     "fear_safety": {
    448       "score": 0,
    449       "justification": "No AI safety, security, or risk concerns are raised."
    450     },
    451     "drama_conflict": {
    452       "score": 0,
    453       "justification": "No controversy or conflict; purely a summary of existing work."
    454     },
    455     "demo_ability": {
    456       "score": 0,
    457       "justification": "No code, demo, or tool is released — the described system does not exist."
    458     },
    459     "brand_recognition": {
    460       "score": 0,
    461       "justification": "Published in IJSREM by undergraduate students at a regional Indian engineering college; no brand recognition."
    462     }
    463   }
    464 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs