ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan.json (19646B)


      1 {
      2   "paper": {
      3     "title": "Convergence Dynamics of Agent-to-Agent Interactions with Misaligned Objectives",
      4     "authors": ["Romain Cosentino", "Sarath Shekkizhar", "Adam Earle"],
      5     "year": 2025,
      6     "venue": "arXiv preprint",
      7     "arxiv_id": "2511.08710"
      8   },
      9   "checklist": {
     10     "artifacts": {
     11       "code_released": {
     12         "applies": true,
     13         "answer": false,
     14         "justification": "No repository URL or code archive is provided in the paper."
     15       },
     16       "data_released": {
     17         "applies": true,
     18         "answer": false,
     19         "justification": "The experiments use synthetic data generated from described distributions, but no code or data archive is released to reproduce them."
     20       },
     21       "environment_specified": {
     22         "applies": true,
     23         "answer": false,
     24         "justification": "No requirements.txt, Dockerfile, or detailed environment specification is provided. The paper mentions using GPT-5-mini but gives no library versions or setup details beyond model name."
     25       },
     26       "reproduction_instructions": {
     27         "applies": true,
     28         "answer": false,
     29         "justification": "While algorithms are described in pseudocode (Algorithms 1 and 2) and hyperparameters are listed in Table 8.2, there are no step-by-step reproduction instructions or scripts."
     30       }
     31     },
     32     "statistical_methodology": {
     33       "confidence_intervals_or_error_bars": {
     34         "applies": true,
     35         "answer": true,
     36         "justification": "Figure 4 shows 'shaded ± std bands' across 100 runs for the adversarial attack experiments."
     37       },
     38       "significance_tests": {
     39         "applies": true,
     40         "answer": false,
     41         "justification": "No statistical significance tests are reported. Comparisons between theory and experiment rely on visual agreement of curves."
     42       },
     43       "effect_sizes_reported": {
     44         "applies": true,
     45         "answer": false,
     46         "justification": "No effect sizes (Cohen's d, relative magnitudes with context) are reported. Results are presented as convergence curves and theoretical bounds."
     47       },
     48       "sample_size_justified": {
     49         "applies": true,
     50         "answer": false,
     51         "justification": "The paper uses 100 runs for Figure 4 and 1000 interactions for Figure 2 but does not justify why these numbers are sufficient."
     52       },
     53       "variance_reported": {
     54         "applies": true,
     55         "answer": true,
     56         "justification": "Figure 4 reports mean trajectories across 100 runs with shaded ± std bands."
     57       }
     58     },
     59     "evaluation_design": {
     60       "baselines_included": {
     61         "applies": true,
     62         "answer": true,
     63         "justification": "Single-agent convergence is used as a baseline (Figure 3 compares single agent W vs. agent W with cooperative helper U)."
     64       },
     65       "baselines_contemporary": {
     66         "applies": false,
     67         "answer": false,
     68         "justification": "This is a theoretical paper proposing a novel framework; no prior work exists on the same formulation to compare against."
     69       },
     70       "ablation_study": {
     71         "applies": true,
     72         "answer": true,
     73         "justification": "The paper systematically varies objective alignment angle (aligned, orthogonal, opposite in Figure 1 and Figure 4), and contrasts fixed-objective vs. adaptive-objective regimes (Section 3, Corollary 3, Figure 3)."
     74       },
     75       "multiple_metrics": {
     76         "applies": true,
     77         "answer": false,
     78         "justification": "Only one metric is used: distance to objective (squared error ∥w - w*∥²). No additional metrics are reported."
     79       },
     80       "human_evaluation": {
     81         "applies": false,
     82         "answer": false,
     83         "justification": "Human evaluation is irrelevant for this theoretical/mathematical framework paper."
     84       },
     85       "held_out_test_set": {
     86         "applies": false,
     87         "answer": false,
     88         "justification": "This is a theoretical paper with synthetic experiments validating mathematical predictions, not a benchmark evaluation."
     89       },
     90       "per_category_breakdown": {
     91         "applies": true,
     92         "answer": true,
     93         "justification": "Results are broken down by objective alignment condition (aligned ~6°, orthogonal ~90°, opposite ~174° in Figure 1; orthogonal/scaled/opposite in Figure 4) and by agent type (LSA vs GPT-5-mini)."
     94       },
     95       "failure_cases_discussed": {
     96         "applies": true,
     97         "answer": true,
     98         "justification": "Section 6.1 (Limitations and Scope) explicitly states the framework is restricted to synthetic linear regression and does not directly explain open-ended reasoning. The adversarial regime itself characterizes failure modes of multi-agent systems."
     99       },
    100       "negative_results_reported": {
    101         "applies": true,
    102         "answer": true,
    103         "justification": "The paper's core finding is partly negative: misaligned agents inevitably plateau at biased fixed points and cannot improve beyond single-agent optima in the fixed-objective regime."
    104       }
    105     },
    106     "claims_and_evidence": {
    107       "abstract_claims_supported": {
    108         "applies": true,
    109         "answer": true,
    110         "justification": "Abstract claims about biased equilibria (Proposition 1, Figure 1), adversarial asymmetric convergence (Proposition 2, Figure 4), and cooperative acceleration (Corollary 3, Figure 3) are all supported by theoretical proofs and experiments."
    111       },
    112       "causal_claims_justified": {
    113         "applies": true,
    114         "answer": true,
    115         "justification": "Causal claims (misalignment leads to biased equilibria, adversarial geometry enables asymmetric convergence) are justified through formal mathematical proofs with controlled single-variable manipulations in experiments."
    116       },
    117       "generalization_bounded": {
    118         "applies": true,
    119         "answer": true,
    120         "justification": "Section 6.1 explicitly bounds generalization: 'Our experiments are restricted to synthetic in-context linear regression and LSA agents... our results do not directly explain the behavior of multi-agent LLM collaborations on open-ended reasoning, writing, or code-generation benchmarks.' The abstract also says 'within this simplified setting.'"
    121       },
    122       "alternative_explanations_discussed": {
    123         "applies": true,
    124         "answer": true,
    125         "justification": "Section 6.1 discusses that the LSA model is a proxy and real LLM behavior may differ. Section 7 discusses defense mechanisms. The paper acknowledges the gap between the simplified model and real multi-agent systems."
    126       }
    127     },
    128     "setup_transparency": {
    129       "model_versions_specified": {
    130         "applies": true,
    131         "answer": true,
    132         "justification": "The paper specifies 'gpt-5-mini' in Section 5 and Appendix 8.3. While no snapshot date is given, the model name includes a specific variant identifier."
    133       },
    134       "prompts_provided": {
    135         "applies": true,
    136         "answer": true,
    137         "justification": "The full system prompt and response schema for GPT-5-mini are provided in Appendix 8.4, including the exact text sent to the model."
    138       },
    139       "hyperparameters_reported": {
    140         "applies": true,
    141         "answer": true,
    142         "justification": "Appendix 8.2 provides a hyperparameter table (d=10, n=20, batch_size=512, epochs=100, η=0.005, etc.). Appendix 8.3 specifies temperature=0.0, top_p=1.0 for GPT-5-mini."
    143       },
    144       "scaffolding_described": {
    145         "applies": false,
    146         "answer": false,
    147         "justification": "No agentic scaffolding is used. The agents are simple single-call models performing gradient computation."
    148       },
    149       "data_preprocessing_documented": {
    150         "applies": true,
    151         "answer": true,
    152         "justification": "Section 2.1 and Appendix 8.1 fully describe data generation: i.i.d. linear regression with X ~ N(0, I/d), w* ~ N(0, I/d), y = X^T w*. Trajectory truncation criterion (gradient norm < 10^-3) is stated."
    153       }
    154     },
    155     "limitations_and_scope": {
    156       "limitations_section_present": {
    157         "applies": true,
    158         "answer": true,
    159         "justification": "Section 6.1 is titled 'Limitations and Scope' and provides substantive discussion."
    160       },
    161       "threats_to_validity_specific": {
    162         "applies": true,
    163         "answer": true,
    164         "justification": "Section 6.1 states specific limitations: experiments restricted to synthetic linear regression, only GPT-5-mini tested on same linear tasks, results don't explain open-ended reasoning/writing/code-generation."
    165       },
    166       "scope_boundaries_stated": {
    167         "applies": true,
    168         "answer": true,
    169         "justification": "Section 6.1 explicitly states: 'our results do not directly explain the behavior of multi-agent LLM collaborations on open-ended reasoning, writing, or code-generation benchmarks.' The paper frames itself as 'a mechanistic case study' and 'stepping stone.'"
    170       }
    171     },
    172     "data_integrity": {
    173       "raw_data_available": {
    174         "applies": true,
    175         "answer": false,
    176         "justification": "No raw experimental data or logs are released."
    177       },
    178       "data_collection_described": {
    179         "applies": true,
    180         "answer": true,
    181         "justification": "Data generation is fully specified mathematically: synthetic linear regression data from known distributions (Section 2.1, Appendix 8.1)."
    182       },
    183       "recruitment_methods_described": {
    184         "applies": false,
    185         "answer": false,
    186         "justification": "No human participants; data is synthetic."
    187       },
    188       "data_pipeline_documented": {
    189         "applies": true,
    190         "answer": true,
    191         "justification": "The full pipeline from data generation to training to inference is documented in Sections 2, 5, and Appendix 8.1-8.4, including trajectory truncation criteria."
    192       }
    193     },
    194     "conflicts_of_interest": {
    195       "funding_disclosed": {
    196         "applies": true,
    197         "answer": false,
    198         "justification": "No funding or acknowledgments section is present in the paper."
    199       },
    200       "affiliations_disclosed": {
    201         "applies": true,
    202         "answer": true,
    203         "justification": "All three authors are listed as affiliated with Salesforce AI Research."
    204       },
    205       "funder_independent_of_outcome": {
    206         "applies": true,
    207         "answer": false,
    208         "justification": "Authors are from Salesforce AI Research. No funding disclosure is provided, so independence cannot be assessed. Salesforce builds multi-agent AI products, creating a potential interest in the outcomes."
    209       },
    210       "financial_interests_declared": {
    211         "applies": true,
    212         "answer": false,
    213         "justification": "No competing interests or financial interests statement is present in the paper."
    214       }
    215     },
    216     "contamination": {
    217       "training_cutoff_stated": {
    218         "applies": false,
    219         "answer": false,
    220         "justification": "The paper does not evaluate model capability on any benchmark. GPT-5-mini is used to perform gradient computation on synthetic data, not tested on pre-existing benchmarks."
    221       },
    222       "train_test_overlap_discussed": {
    223         "applies": false,
    224         "answer": false,
    225         "justification": "No benchmark evaluation is performed; all data is synthetically generated."
    226       },
    227       "benchmark_contamination_addressed": {
    228         "applies": false,
    229         "answer": false,
    230         "justification": "No benchmark evaluation is performed."
    231       }
    232     },
    233     "human_studies": {
    234       "pre_registered": {
    235         "applies": false,
    236         "answer": false,
    237         "justification": "No human participants."
    238       },
    239       "irb_or_ethics_approval": {
    240         "applies": false,
    241         "answer": false,
    242         "justification": "No human participants."
    243       },
    244       "demographics_reported": {
    245         "applies": false,
    246         "answer": false,
    247         "justification": "No human participants."
    248       },
    249       "inclusion_exclusion_criteria": {
    250         "applies": false,
    251         "answer": false,
    252         "justification": "No human participants."
    253       },
    254       "randomization_described": {
    255         "applies": false,
    256         "answer": false,
    257         "justification": "No human participants."
    258       },
    259       "blinding_described": {
    260         "applies": false,
    261         "answer": false,
    262         "justification": "No human participants."
    263       },
    264       "attrition_reported": {
    265         "applies": false,
    266         "answer": false,
    267         "justification": "No human participants."
    268       }
    269     },
    270     "cost_and_practicality": {
    271       "inference_cost_reported": {
    272         "applies": true,
    273         "answer": false,
    274         "justification": "The paper uses GPT-5-mini API calls (100 runs with multiple interaction steps) but does not report API costs, tokens consumed, or wall-clock time."
    275       },
    276       "compute_budget_stated": {
    277         "applies": true,
    278         "answer": false,
    279         "justification": "No mention of total computational budget, GPU hours for LSA training, or API spend for GPT-5-mini experiments."
    280       }
    281     }
    282   },
    283   "claims": [
    284     {
    285       "claim": "Under fixed misaligned objectives, agent-to-agent dynamics converge to biased fixed points with residual errors governed by objective misalignment and prompt geometry anisotropy.",
    286       "evidence": "Proposition 1 provides closed-form expressions; Figure 1 validates empirically across aligned (~6°), orthogonal (~90°), and opposite (~174°) settings.",
    287       "supported": "strong"
    288     },
    289     {
    290       "claim": "Normalized plateau errors are nondecreasing functions of the inter-objective angle θ.",
    291       "evidence": "Corollary 2 provides formal bounds; Figure 2 validates with 1000 LSA agent-to-agent interactions showing monotonic growth.",
    292       "supported": "strong"
    293     },
    294     {
    295       "claim": "Asymmetric convergence (one agent reaches objective, other does not) is possible under specific kernel conditions on prompt geometry.",
    296       "evidence": "Proposition 2 gives necessary and sufficient conditions; Corollary 5 provides constructive recipe; Figure 4 validates with both LSA and GPT-5-mini across 100 runs with std bands.",
    297       "supported": "strong"
    298     },
    299     {
    300       "claim": "A cooperative helper agent with adaptive turn-based objectives can implement Newton-like acceleration for the main agent.",
    301       "evidence": "Corollary 3 provides the construction; Figure 3 shows the cooperative agent accelerating convergence beyond single-agent performance in 3 alternating steps.",
    302       "supported": "strong"
    303     },
    304     {
    305       "claim": "GPT-5-mini experiments are consistent with theoretical predictions from the LSA framework.",
    306       "evidence": "Figure 4 (top) shows GPT-5-mini adversarial attack results matching theoretical predictions, with early-step variability from model decoding noise.",
    307       "supported": "moderate"
    308     }
    309   ],
    310   "methodology_tags": ["theoretical", "benchmark-eval"],
    311   "key_findings": "The paper develops a theoretical framework for multi-agent interactions modeled as alternating in-context gradient descent between linear self-attention transformers. It proves that misaligned objectives lead to biased convergence plateaus predictable from objective gap and prompt geometry, identifies conditions for adversarial asymmetric convergence where one agent succeeds while biasing the other, and shows that adaptive-objective helper agents can accelerate convergence via Newton-like steps. Experiments with trained LSA agents and GPT-5-mini validate the theoretical predictions.",
    312   "red_flags": [
    313     {
    314       "flag": "Narrow experimental scope",
    315       "detail": "All experiments are on synthetic in-context linear regression with dimension d=10, n=20. The gap between this simplified setting and real multi-agent LLM interactions (open-ended reasoning, code generation) is substantial. The authors acknowledge this but the paper's title and framing suggest broader applicability."
    316     },
    317     {
    318       "flag": "No code or data release",
    319       "detail": "Despite being a Salesforce AI Research paper with reproducible synthetic experiments, no code repository is provided, making independent verification difficult."
    320     },
    321     {
    322       "flag": "Company affiliation undisclosed as conflict",
    323       "detail": "All authors are from Salesforce AI Research, which develops multi-agent AI products (e.g., Agentforce). The paper's findings about agent interactions have direct commercial relevance, but no conflict of interest statement is provided."
    324     }
    325   ],
    326   "cited_papers": [
    327     {
    328       "title": "Why do multiagent systems fail?",
    329       "authors": ["Melissa Z Pan", "Mert Cemri", "Lakshya A Agrawal"],
    330       "year": 2025,
    331       "relevance": "MAST taxonomy of multi-agent failure modes, directly connected to the theoretical predictions in this paper."
    332     },
    333     {
    334       "title": "AutoGen: Enabling next-gen LLM applications via multi-agent conversations",
    335       "authors": ["Qingyun Wu", "Gagan Bansal", "Jieyu Zhang"],
    336       "year": 2024,
    337       "relevance": "Major multi-agent LLM framework; the theoretical framework here aims to explain dynamics in such systems."
    338     },
    339     {
    340       "title": "Red-teaming LLM multi-agent systems via communication attacks",
    341       "authors": ["Pengfei He", "Yuping Lin", "Shen Dong"],
    342       "year": 2025,
    343       "relevance": "Empirical work on adversarial attacks in multi-agent LLM systems, complementary to the theoretical adversarial framework here."
    344     },
    345     {
    346       "title": "Rethinking the bounds of LLM reasoning: Are multi-agent discussions the key?",
    347       "authors": ["Qineng Wang", "Zihao Wang", "Ying Su"],
    348       "year": 2024,
    349       "relevance": "Questions whether multi-agent setups consistently outperform single-agent baselines, which this paper formalizes theoretically."
    350     },
    351     {
    352       "title": "Prompt infection: LLM-to-LLM prompt injection within multi-agent systems",
    353       "authors": ["Donghyun Lee", "Mo Tiwari"],
    354       "year": 2024,
    355       "relevance": "Empirical study of prompt injection attacks between LLM agents, related to the adversarial agent dynamics studied here."
    356     },
    357     {
    358       "title": "On the resilience of multi-agent systems with malicious agents",
    359       "authors": ["Jen-tse Huang", "Jiaxu Zhou", "Tailin Jin"],
    360       "year": 2024,
    361       "relevance": "Studies multi-agent system robustness to malicious agents, directly relevant to the adversarial convergence results."
    362     },
    363     {
    364       "title": "Transformers learn in-context by gradient descent",
    365       "authors": ["Johannes von Oswald", "Eyvind Niklasson", "Ettore Randazzo"],
    366       "year": 2023,
    367       "relevance": "Foundational work showing transformers implement gradient descent in-context, which this paper extends to multi-agent settings."
    368     },
    369     {
    370       "title": "Transformers learn to implement multi-step gradient descent with chain of thought",
    371       "authors": ["Jianhao Huang", "Zixuan Wang", "Jason D Lee"],
    372       "year": 2025,
    373       "arxiv_id": "2502.21212",
    374       "relevance": "Direct theoretical foundation for the LSA agent model used in this paper."
    375     },
    376     {
    377       "title": "Improving factuality and reasoning in language models through multiagent debate",
    378       "authors": ["Yilun Du", "Shuang Li", "Antonio Torralba"],
    379       "year": 2023,
    380       "relevance": "Multi-agent debate framework whose dynamics this paper aims to theoretically characterize."
    381     },
    382     {
    383       "title": "The rise and potential of large language model based agents: A survey",
    384       "authors": ["Zhiheng Xi", "Wenxiang Chen", "Xin Guo"],
    385       "year": 2025,
    386       "relevance": "Comprehensive survey of LLM-based agents, providing context for the multi-agent interaction dynamics studied here."
    387     }
    388   ]
    389 }

Impressum · Datenschutz