ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan.json (15666B)


      1 {
      2   "paper": {
      3     "title": "AI-Assisted Code Editors with Real-Time Collaboration: A Comprehensive Review",
      4     "authors": ["Narasimha Dixit", "Aniket Patil", "Ayaan Shilledar", "Krutika Sambranikar", "Prashant Chavan"],
      5     "year": 2025,
      6     "venue": "International Journal of Scientific Research in Engineering and Management (IJSREM)",
      7     "doi": "10.55041/IJSREM55648"
      8   },
      9   "checklist": {
     10     "artifacts": {
     11       "code_released": {
     12         "applies": true,
     13         "answer": false,
     14         "justification": "No code, analysis scripts, or repository links provided anywhere in the paper."
     15       },
     16       "data_released": {
     17         "applies": true,
     18         "answer": false,
     19         "justification": "No dataset or extracted data from the literature review is released."
     20       },
     21       "environment_specified": {
     22         "applies": true,
     23         "answer": false,
     24         "justification": "No environment or tool specifications for reproducing the survey analysis."
     25       },
     26       "reproduction_instructions": {
     27         "applies": true,
     28         "answer": false,
     29         "justification": "No instructions for reproducing the literature search or analysis."
     30       }
     31     },
     32     "statistical_methodology": {
     33       "confidence_intervals_or_error_bars": {
     34         "applies": false,
     35         "answer": false,
     36         "justification": "Survey paper with no quantitative experiments."
     37       },
     38       "significance_tests": {
     39         "applies": false,
     40         "answer": false,
     41         "justification": "Survey paper with no statistical comparisons."
     42       },
     43       "effect_sizes_reported": {
     44         "applies": false,
     45         "answer": false,
     46         "justification": "Survey paper with no quantitative experiments."
     47       },
     48       "sample_size_justified": {
     49         "applies": false,
     50         "answer": false,
     51         "justification": "Survey paper with no quantitative experiments."
     52       },
     53       "variance_reported": {
     54         "applies": false,
     55         "answer": false,
     56         "justification": "Survey paper with no quantitative experiments."
     57       }
     58     },
     59     "evaluation_design": {
     60       "baselines_included": {
     61         "applies": true,
     62         "answer": false,
     63         "justification": "The paper does not compare against prior surveys or reviews in a structured way."
     64       },
     65       "baselines_contemporary": {
     66         "applies": true,
     67         "answer": false,
     68         "justification": "No baseline comparisons are made. The references are mostly from 2017-2021, with no contemporary 2024-2025 work cited despite the paper being published in Dec 2025."
     69       },
     70       "ablation_study": {
     71         "applies": false,
     72         "answer": false,
     73         "justification": "Survey paper with no system components to ablate."
     74       },
     75       "multiple_metrics": {
     76         "applies": false,
     77         "answer": false,
     78         "justification": "Survey paper with no quantitative evaluation."
     79       },
     80       "human_evaluation": {
     81         "applies": false,
     82         "answer": false,
     83         "justification": "Survey paper making no claims that require human evaluation of system outputs."
     84       },
     85       "held_out_test_set": {
     86         "applies": false,
     87         "answer": false,
     88         "justification": "Survey paper with no experiments."
     89       },
     90       "per_category_breakdown": {
     91         "applies": true,
     92         "answer": false,
     93         "justification": "The paper lists categories of literature (Section 2) but provides no structured breakdown of findings per category with counts or analysis."
     94       },
     95       "failure_cases_discussed": {
     96         "applies": true,
     97         "answer": false,
     98         "justification": "No discussion of failure cases or limitations of the tools reviewed beyond vague mentions of gaps."
     99       },
    100       "negative_results_reported": {
    101         "applies": true,
    102         "answer": false,
    103         "justification": "No negative findings reported. The paper is entirely positive about AI-assisted code editors."
    104       }
    105     },
    106     "claims_and_evidence": {
    107       "abstract_claims_supported": {
    108         "applies": true,
    109         "answer": false,
    110         "justification": "The abstract claims the editors 'resolve essential code synchronization and developer productivity and quality assurance challenges' but the paper provides no evidence for these claims — only descriptions of features without empirical validation."
    111       },
    112       "causal_claims_justified": {
    113         "applies": true,
    114         "answer": false,
    115         "justification": "The paper makes causal claims such as 'The system decreases developer workload' and that tools 'enhance coding speed and reduce manual tasks' without any empirical evidence or study design to support causation."
    116       },
    117       "generalization_bounded": {
    118         "applies": true,
    119         "answer": false,
    120         "justification": "The paper makes sweeping claims about AI-assisted code editors transforming software development without bounding these claims to any tested setting."
    121       },
    122       "alternative_explanations_discussed": {
    123         "applies": true,
    124         "answer": false,
    125         "justification": "No alternative explanations or counterarguments are discussed for any of the paper's claims."
    126       }
    127     },
    128     "setup_transparency": {
    129       "model_versions_specified": {
    130         "applies": false,
    131         "answer": false,
    132         "justification": "Survey paper that does not run any models."
    133       },
    134       "prompts_provided": {
    135         "applies": false,
    136         "answer": false,
    137         "justification": "Survey paper that does not use prompting."
    138       },
    139       "hyperparameters_reported": {
    140         "applies": false,
    141         "answer": false,
    142         "justification": "Survey paper that does not run any models."
    143       },
    144       "scaffolding_described": {
    145         "applies": false,
    146         "answer": false,
    147         "justification": "Survey paper with no agentic scaffolding."
    148       },
    149       "data_preprocessing_documented": {
    150         "applies": true,
    151         "answer": false,
    152         "justification": "The methodology section mentions searching IEEE Xplore, ACM Digital Library, arXiv, and Google Scholar, and categorizing papers, but provides no filtering criteria, inclusion/exclusion criteria, search queries, or counts at each stage. The paper states 44 references were compiled from IntelliCode Compose's reference list but only 10 appear in the references section."
    153       }
    154     },
    155     "limitations_and_scope": {
    156       "limitations_section_present": {
    157         "applies": true,
    158         "answer": false,
    159         "justification": "No limitations or threats-to-validity section exists in the paper."
    160       },
    161       "threats_to_validity_specific": {
    162         "applies": true,
    163         "answer": false,
    164         "justification": "No threats to validity discussed."
    165       },
    166       "scope_boundaries_stated": {
    167         "applies": true,
    168         "answer": false,
    169         "justification": "No explicit scope boundaries stated. The paper does not clarify what it does not cover."
    170       }
    171     },
    172     "data_integrity": {
    173       "raw_data_available": {
    174         "applies": true,
    175         "answer": false,
    176         "justification": "No raw data or extracted literature data available for verification."
    177       },
    178       "data_collection_described": {
    179         "applies": true,
    180         "answer": false,
    181         "justification": "The methodology section vaguely describes searching databases but provides no search terms, date ranges, or detailed procedure. The paper claims to review 44 references but only lists 10."
    182       },
    183       "recruitment_methods_described": {
    184         "applies": false,
    185         "answer": false,
    186         "justification": "No human participants; paper sources are standard academic databases."
    187       },
    188       "data_pipeline_documented": {
    189         "applies": true,
    190         "answer": false,
    191         "justification": "No documentation of how papers were filtered, screened, or selected. The pipeline from search to final corpus is not described."
    192       }
    193     },
    194     "conflicts_of_interest": {
    195       "funding_disclosed": {
    196         "applies": true,
    197         "answer": false,
    198         "justification": "No funding disclosure. The acknowledgment thanks the institution but does not mention funding sources."
    199       },
    200       "affiliations_disclosed": {
    201         "applies": true,
    202         "answer": true,
    203         "justification": "All five authors list their affiliation with KLS Vishwanathrao Deshpande Institute of Technology Haliyal, Department of Computer Science (AIML)."
    204       },
    205       "funder_independent_of_outcome": {
    206         "applies": false,
    207         "answer": false,
    208         "justification": "Appears to be unfunded student work at an academic institution."
    209       },
    210       "financial_interests_declared": {
    211         "applies": true,
    212         "answer": false,
    213         "justification": "No competing interests or financial interests statement in the paper."
    214       }
    215     },
    216     "contamination": {
    217       "training_cutoff_stated": {
    218         "applies": false,
    219         "answer": false,
    220         "justification": "Survey paper that does not evaluate any pre-trained model on a benchmark."
    221       },
    222       "train_test_overlap_discussed": {
    223         "applies": false,
    224         "answer": false,
    225         "justification": "Survey paper that does not evaluate any pre-trained model on a benchmark."
    226       },
    227       "benchmark_contamination_addressed": {
    228         "applies": false,
    229         "answer": false,
    230         "justification": "Survey paper that does not evaluate any pre-trained model on a benchmark."
    231       }
    232     },
    233     "human_studies": {
    234       "pre_registered": {
    235         "applies": false,
    236         "answer": false,
    237         "justification": "No human participants in this survey paper."
    238       },
    239       "irb_or_ethics_approval": {
    240         "applies": false,
    241         "answer": false,
    242         "justification": "No human participants in this survey paper."
    243       },
    244       "demographics_reported": {
    245         "applies": false,
    246         "answer": false,
    247         "justification": "No human participants in this survey paper."
    248       },
    249       "inclusion_exclusion_criteria": {
    250         "applies": false,
    251         "answer": false,
    252         "justification": "No human participants in this survey paper."
    253       },
    254       "randomization_described": {
    255         "applies": false,
    256         "answer": false,
    257         "justification": "No human participants in this survey paper."
    258       },
    259       "blinding_described": {
    260         "applies": false,
    261         "answer": false,
    262         "justification": "No human participants in this survey paper."
    263       },
    264       "attrition_reported": {
    265         "applies": false,
    266         "answer": false,
    267         "justification": "No human participants in this survey paper."
    268       }
    269     },
    270     "cost_and_practicality": {
    271       "inference_cost_reported": {
    272         "applies": false,
    273         "answer": false,
    274         "justification": "Survey paper with no method of its own to cost."
    275       },
    276       "compute_budget_stated": {
    277         "applies": false,
    278         "answer": false,
    279         "justification": "Survey paper with no computation performed."
    280       }
    281     }
    282   },
    283   "claims": [
    284     {
    285       "claim": "AI-assisted code editors resolve essential code synchronization and developer productivity challenges through real-time collaboration and generative AI capabilities.",
    286       "evidence": "No empirical evidence provided. The claim is stated in the abstract and reiterated throughout but supported only by descriptions of tool features, not experiments or user studies.",
    287       "supported": "unsupported"
    288     },
    289     {
    290       "claim": "Transformer-based tools have demonstrated their ability to enhance coding speed and reduce manual tasks, resulting in better developer productivity.",
    291       "evidence": "The Conclusion section makes this claim by appealing to the general literature but provides no specific quantitative results or citations to support it.",
    292       "supported": "weak"
    293     },
    294     {
    295       "claim": "IntelliCode Compose provides outstanding intelligent completion tools but the AI Assisted Code Editor expands these concepts by building a team-based coding environment.",
    296       "evidence": "Section 2.1.6 provides a feature comparison table (Table 1) but it is a qualitative feature list, not an empirical evaluation.",
    297       "supported": "weak"
    298     }
    299   ],
    300   "methodology_tags": ["meta-analysis"],
    301   "key_findings": "This paper surveys AI-assisted code generation literature centered on IntelliCode Compose, identifying gaps in real-time collaboration support, context understanding, personalization, and privacy in current tools. It proposes a conceptual architecture ('SynapseCode'/'AI Assisted Code Editor') combining transformer models with real-time collaboration features, but provides no implementation or empirical evaluation. The paper identifies six research gaps and five future directions but does not contribute original data or analysis.",
    302   "red_flags": [
    303     {
    304       "flag": "No quality assessment of reviewed literature",
    305       "detail": "The survey summarizes tools and papers without any structured quality assessment, so strong and weak sources are presented with equal weight and readers cannot tell them apart."
    306     },
    307     {
    308       "flag": "Missing references",
    309       "detail": "The paper claims to review 44 references from IntelliCode Compose but only lists 10 references in the references section. The remaining 34 papers are unaccounted for."
    310     },
    311     {
    312       "flag": "Duplicated content",
    313       "detail": "Sections 2.1.5 and 2.1.7 contain nearly identical text describing the SynapseCode/AI Assisted Code Editor architecture. Section 2.1.2 is identical to 2.1.1. This suggests careless writing or possible AI-generated text without review."
    314     },
    315     {
    316       "flag": "Outdated references for a 2025 paper",
    317       "detail": "All 10 listed references are from 2017-2021. For a paper published in December 2025 about AI-assisted code editors, the absence of any reference from 2022-2025 (e.g., Copilot, ChatGPT, GPT-4, CodeLlama) is a major gap."
    318     },
    319     {
    320       "flag": "Unsupported sweeping claims",
    321       "detail": "The paper makes broad claims about AI transforming software development without any empirical evidence, user studies, or quantitative analysis."
    322     },
    323     {
    324       "flag": "Predatory journal indicators",
    325       "detail": "Published in IJSREM (SJIF rating 8.586), which shows characteristics of a predatory or very low-quality venue: rapid publication, no apparent peer-review rigor, and template formatting errors visible in the text."
    326     }
    327   ],
    328   "cited_papers": [
    329     {
    330       "title": "IntelliCode Compose: Code Generation Using Transformer",
    331       "authors": ["Z. Austin", "L. Smolensky", "Y. Liu", "R. Wray", "C. Brooks", "S. Fink", "A. Sutton"],
    332       "year": 2021,
    333       "relevance": "Primary source for the survey; demonstrates transformer-based code generation integrated into an IDE."
    334     },
    335     {
    336       "title": "Evaluating Large Language Models Trained on Code",
    337       "authors": ["M. Chen", "J. Tworek", "H. Jun"],
    338       "year": 2021,
    339       "arxiv_id": "2107.03374",
    340       "relevance": "Introduces Codex/HumanEval benchmark for evaluating LLM code generation capabilities."
    341     },
    342     {
    343       "title": "CodeBERT: A Pre-Trained Model for Programming and Natural Languages",
    344       "authors": ["Z. Feng", "D. Guo", "D. Tang"],
    345       "year": 2020,
    346       "arxiv_id": "2002.08155",
    347       "relevance": "Foundational pre-trained model for programming language understanding used in code generation research."
    348     },
    349     {
    350       "title": "Intellicode: Leveraging AI to Improve Developer Productivity",
    351       "authors": ["A. Svyatkovskiy", "S. Deng", "S. Fu", "N. Sundaresan"],
    352       "year": 2020,
    353       "relevance": "Describes AI-powered developer productivity tool integrated into Visual Studio."
    354     }
    355   ]
    356 }

Impressum · Datenschutz