scan.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan.json (22086B)
      1 {
      2   "paper": {
      3     "title": "Mathematical methods and human thought in the age of AI",
      4     "authors": ["Tanya Klowden", "Terence Tao"],
      5     "year": 2026,
      6     "venue": "arXiv preprint",
      7     "arxiv_id": "2603.26524",
      8     "doi": ""
      9   },
     10   "scan_version": 3,
     11   "active_modules": [],
     12   "methodology_tags": ["theoretical", "qualitative"],
     13   "key_findings": "The paper argues that AI is a natural evolution of human cognitive tools and that its development must remain human-centered. Using mathematics as a 'sandbox,' the authors examine how formal verification is necessary but insufficient for mathematical knowledge, how AI decouples the outward form of intellectual products from the understanding behind them, and how a 'Copernican' reframing of human intelligence alongside artificial intelligence could guide responsible integration. The paper warns of digital divides, environmental costs, model collapse, and the risk of flooding fields with technically correct but insight-free AI-generated work.",
     14   "checklist": {
     15     "artifacts": {
     16       "code_released": {
     17         "applies": false,
     18         "answer": false,
     19         "justification": "This is a theoretical/philosophical position paper with no computational work. There is no code to release."
     20       },
     21       "data_released": {
     22         "applies": false,
     23         "answer": false,
     24         "justification": "No data was collected or analyzed. The paper is entirely argumentative and philosophical."
     25       },
     26       "environment_specified": {
     27         "applies": false,
     28         "answer": false,
     29         "justification": "No computational environment is relevant to a purely theoretical paper."
     30       },
     31       "reproduction_instructions": {
     32         "applies": false,
     33         "answer": false,
     34         "justification": "No experiments to reproduce. The paper consists of philosophical arguments and historical analysis."
     35       }
     36     },
     37     "statistical_methodology": {
     38       "confidence_intervals_or_error_bars": {
     39         "applies": false,
     40         "answer": false,
     41         "justification": "No quantitative results are reported. The paper presents philosophical arguments without statistical analysis."
     42       },
     43       "significance_tests": {
     44         "applies": false,
     45         "answer": false,
     46         "justification": "No comparative empirical claims requiring statistical testing are made."
     47       },
     48       "effect_sizes_reported": {
     49         "applies": false,
     50         "answer": false,
     51         "justification": "No empirical effects are measured in this theoretical paper."
     52       },
     53       "sample_size_justified": {
     54         "applies": false,
     55         "answer": false,
     56         "justification": "No sample or data collection. Purely theoretical work."
     57       },
     58       "variance_reported": {
     59         "applies": false,
     60         "answer": false,
     61         "justification": "No experimental runs are conducted. No quantitative results to report variance for."
     62       }
     63     },
     64     "evaluation_design": {
     65       "baselines_included": {
     66         "applies": false,
     67         "answer": false,
     68         "justification": "No system or method is evaluated. This is a philosophical essay, not an empirical evaluation."
     69       },
     70       "baselines_contemporary": {
     71         "applies": false,
     72         "answer": false,
     73         "justification": "No baselines are relevant for a theoretical position paper."
     74       },
     75       "ablation_study": {
     76         "applies": false,
     77         "answer": false,
     78         "justification": "No system with components to ablate. The paper is a philosophical argument."
     79       },
     80       "multiple_metrics": {
     81         "applies": false,
     82         "answer": false,
     83         "justification": "No metrics are used. The paper makes no quantitative evaluations."
     84       },
     85       "human_evaluation": {
     86         "applies": false,
     87         "answer": false,
     88         "justification": "No system outputs to evaluate. The paper is a theoretical discussion."
     89       },
     90       "held_out_test_set": {
     91         "applies": false,
     92         "answer": false,
     93         "justification": "No test sets or data splits. Purely theoretical work."
     94       },
     95       "per_category_breakdown": {
     96         "applies": false,
     97         "answer": false,
     98         "justification": "No categories of results to break down. The paper presents arguments, not measurements."
     99       },
    100       "failure_cases_discussed": {
    101         "applies": false,
    102         "answer": false,
    103         "justification": "No system is proposed whose failures could be analyzed. The paper discusses AI weaknesses in general terms but has no evaluation."
    104       },
    105       "negative_results_reported": {
    106         "applies": false,
    107         "answer": false,
    108         "justification": "No experiments to yield positive or negative results."
    109       }
    110     },
    111     "claims_and_evidence": {
    112       "abstract_claims_supported": {
    113         "applies": true,
    114         "answer": true,
    115         "justification": "The abstract claims that AI is a natural evolution of human tools, that development should be human-centered, and proposes a pathway for integration. Sections 2 (historical parallels), 5 (costs and benefits), and 6 (human/AI interface) develop each of these arguments at length. The abstract's claims are philosophical positions that are elaborated and argued throughout the paper."
    116       },
    117       "causal_claims_justified": {
    118         "applies": true,
    119         "answer": false,
    120         "justification": "The paper makes numerous causal assertions: 'strict regulation imposed at this point would disproportionately shut down the more positive use cases of AI' (Section 1.3), 'AI technologies... have dramatically shifted social, intellectual, and economic spheres' (Section 7), and AI could 'crowd out the more traditional paradigms' (Section 4.6). These are stated as arguments from analogy and assertion, without empirical evidence or causal identification strategies."
    121       },
    122       "generalization_bounded": {
    123         "applies": true,
    124         "answer": false,
    125         "justification": "While the paper acknowledges mathematics as a 'sandbox' (Section 3), it regularly generalizes to 'all humankind' and 'society as a whole' (abstract, Section 5.1, conclusion). The title itself — 'human thought in the age of AI' — claims scope far beyond the mathematical case study. The paper does not bound its philosophical conclusions to the mathematical domain from which most of its arguments are drawn."
    126       },
    127       "alternative_explanations_discussed": {
    128         "applies": false,
    129         "answer": false,
    130         "justification": "The paper presents no empirical results. It is a philosophical position paper, so alternative explanations for observed data are not applicable."
    131       },
    132       "proxy_outcome_distinction": {
    133         "applies": false,
    134         "answer": false,
    135         "justification": "No measurements or proxies are used. This is a theoretical paper."
    136       }
    137     },
    138     "setup_transparency": {
    139       "model_versions_specified": {
    140         "applies": false,
    141         "answer": false,
    142         "justification": "No AI models are used or evaluated in this paper. The paper discusses AI in general philosophical terms."
    143       },
    144       "prompts_provided": {
    145         "applies": false,
    146         "answer": false,
    147         "justification": "No prompting is done in this paper."
    148       },
    149       "hyperparameters_reported": {
    150         "applies": false,
    151         "answer": false,
    152         "justification": "No experiments with hyperparameters. Purely theoretical work."
    153       },
    154       "scaffolding_described": {
    155         "applies": false,
    156         "answer": false,
    157         "justification": "No agentic scaffolding is used in this paper."
    158       },
    159       "data_preprocessing_documented": {
    160         "applies": false,
    161         "answer": false,
    162         "justification": "No data is collected or preprocessed. The paper is a philosophical essay."
    163       }
    164     },
    165     "limitations_and_scope": {
    166       "limitations_section_present": {
    167         "applies": true,
    168         "answer": false,
    169         "justification": "There is no dedicated limitations section. The paper contains scattered hedges such as 'we of course do not pretend to have definitive resolutions to any of them; and the speed of change in this space is such that any proclamations we make are at risk of being overtaken by striking new technological advances' (Section 3), but these are not collected in a substantive limitations discussion."
    170       },
    171       "threats_to_validity_specific": {
    172         "applies": true,
    173         "answer": false,
    174         "justification": "No specific threats to the validity of the paper's own arguments are discussed. The paper acknowledges that AI is changing rapidly but does not identify specific ways in which its philosophical positions or analogies might be wrong or misleading."
    175       },
    176       "scope_boundaries_stated": {
    177         "applies": true,
    178         "answer": false,
    179         "justification": "The paper does not explicitly state what it does NOT claim. While it notes that mathematics is used as a 'sandbox' (Section 3) and hedges with 'we of course do not pretend to have definitive resolutions,' it does not list specific exclusions, untested scenarios, or things the reader should not conclude from the paper."
    180       }
    181     },
    182     "data_integrity": {
    183       "raw_data_available": {
    184         "applies": false,
    185         "answer": false,
    186         "justification": "No data is collected or analyzed. The paper is a purely argumentative work."
    187       },
    188       "data_collection_described": {
    189         "applies": false,
    190         "answer": false,
    191         "justification": "No data collection occurs in this theoretical paper."
    192       },
    193       "recruitment_methods_described": {
    194         "applies": false,
    195         "answer": false,
    196         "justification": "No participants or data sources are recruited. This is a philosophical essay."
    197       },
    198       "data_pipeline_documented": {
    199         "applies": false,
    200         "answer": false,
    201         "justification": "No data pipeline exists for this theoretical paper."
    202       }
    203     },
    204     "conflicts_of_interest": {
    205       "funding_disclosed": {
    206         "applies": true,
    207         "answer": false,
    208         "justification": "The Acknowledgments section (Section 7.1) thanks Silvia de Toffoli for comments but does not mention any funding sources. No funding disclosure is present."
    209       },
    210       "affiliations_disclosed": {
    211         "applies": true,
    212         "answer": false,
    213         "justification": "The paper lists author names but no institutional affiliations are visible in the text. The authors' academic positions and departments are not stated."
    214       },
    215       "funder_independent_of_outcome": {
    216         "applies": true,
    217         "answer": false,
    218         "justification": "No funding is disclosed, so independence cannot be assessed. The paper discusses AI companies and their practices but does not clarify whether the authors have any financial relationships with such entities."
    219       },
    220       "financial_interests_declared": {
    221         "applies": true,
    222         "answer": false,
    223         "justification": "No competing interests statement or financial disclosure is present in the paper."
    224       }
    225     },
    226     "contamination": {
    227       "training_cutoff_stated": {
    228         "applies": false,
    229         "answer": false,
    230         "justification": "The paper does not evaluate any pre-trained model on any benchmark. It is a philosophical discussion of AI."
    231       },
    232       "train_test_overlap_discussed": {
    233         "applies": false,
    234         "answer": false,
    235         "justification": "No model evaluation occurs in this paper."
    236       },
    237       "benchmark_contamination_addressed": {
    238         "applies": false,
    239         "answer": false,
    240         "justification": "No benchmark evaluation is performed."
    241       }
    242     },
    243     "human_studies": {
    244       "pre_registered": {
    245         "applies": false,
    246         "answer": false,
    247         "justification": "No human participants. This is a theoretical paper."
    248       },
    249       "irb_or_ethics_approval": {
    250         "applies": false,
    251         "answer": false,
    252         "justification": "No human participants. Purely philosophical work."
    253       },
    254       "demographics_reported": {
    255         "applies": false,
    256         "answer": false,
    257         "justification": "No human participants in this theoretical paper."
    258       },
    259       "inclusion_exclusion_criteria": {
    260         "applies": false,
    261         "answer": false,
    262         "justification": "No human participants."
    263       },
    264       "randomization_described": {
    265         "applies": false,
    266         "answer": false,
    267         "justification": "No experimental study with participants."
    268       },
    269       "blinding_described": {
    270         "applies": false,
    271         "answer": false,
    272         "justification": "No experimental study with participants."
    273       },
    274       "attrition_reported": {
    275         "applies": false,
    276         "answer": false,
    277         "justification": "No human participants."
    278       }
    279     },
    280     "cost_and_practicality": {
    281       "inference_cost_reported": {
    282         "applies": false,
    283         "answer": false,
    284         "justification": "Purely theoretical paper with no computational method to cost."
    285       },
    286       "compute_budget_stated": {
    287         "applies": false,
    288         "answer": false,
    289         "justification": "No computation performed. The paper is a philosophical essay."
    290       }
    291     }
    292   },
    293   "claims": [
    294     {
    295       "claim": "AI is a natural evolution of human tools developed throughout history to facilitate the creation, organization, and dissemination of ideas.",
    296       "evidence": "Section 2 draws historical parallels with the printing press, the Industrial Revolution, and prior automation technologies, arguing that AI extends a continuous tradition of tool-building (Section 2.1).",
    297       "supported": "moderate"
    298     },
    299     {
    300       "claim": "Mathematics serves as a suitable 'sandbox' for exploring the broader impact of AI on sciences and society.",
    301       "evidence": "Section 3 argues mathematics has 'an older and more advanced foundation, and is by its nature well suited to explore a variety of hypothetical abstract scenarios.' The paper uses mathematics' objective standards of proof as a testbed for AI-related philosophical questions.",
    302       "supported": "moderate"
    303     },
    304     {
    305       "claim": "Formal verification is necessary but insufficient for evaluating AI-generated mathematical knowledge; proofs can be 'odorless' — technically correct but devoid of insight.",
    306       "evidence": "Section 4.4 argues that formalization 'only certifies that a formalized argument establishes a formal mathematical statement' and that AI can produce proofs that 'may even pass formal verification tests, but yet remain strangely unsatisfying.' Examples include AlphaProof's IMO solutions with 'numerous redundant or inexplicable steps' (footnote 16).",
    307       "supported": "moderate"
    308     },
    309     {
    310       "claim": "Strict regulation at this point would disproportionately shut down positive AI use cases without eliminating wasteful or malicious ones.",
    311       "evidence": "Asserted in Section 1.3 without empirical evidence. Stated as: 'strict regulation imposed at this point would disproportionately shut down the more positive use cases of AI, such as in the acceleration of scientific research, without eliminating the more wasteful or malicious uses of the technology.'",
    312       "supported": "weak"
    313     },
    314     {
    315       "claim": "AI technologies exacerbate existing inequalities by creating a 'digital divide' between those with and without access to frontier models.",
    316       "evidence": "Section 5.3 discusses how 'large scale AI tools may only be available to well-financed or well-connected research groups' and identifies a second divide where different models develop 'spiky capabilities,' creating uneven advantages. Draws on analogy to historical inequities but provides no data on current AI access disparities.",
    317       "supported": "weak"
    318     },
    319     {
    320       "claim": "An uncritical embrace of AI in mathematics could produce a flood of technically correct but insight-free papers that contribute nothing to broader mathematical narratives.",
    321       "evidence": "Section 4.6 argues this via reasoning about incentives and reduced cost of proof generation, noting the 'negative impressions produced by such low-quality work may lead to a stigma against even the most careful and responsible application of AI.' No empirical evidence for this scenario.",
    322       "supported": "weak"
    323     },
    324     {
    325       "claim": "A 'Copernican' reframing — placing human and artificial intelligence in the same ontological category — offers a productive philosophical middle ground.",
    326       "evidence": "Section 6.4 develops the analogy between the geocentric-to-heliocentric shift in astronomy and the current need to rethink human cognitive uniqueness. Draws parallel to chess, where human players thrive alongside engines. The argument is by analogy rather than evidence.",
    327       "supported": "weak"
    328     }
    329   ],
    330   "red_flags": [
    331     {
    332       "flag": "Claims significantly outrun the evidence",
    333       "detail": "The paper makes sweeping prescriptive claims about global AI policy, economic impacts, and the future of all intellectual disciplines ('benefit of all humankind') based primarily on philosophical argument from analogy and the authors' personal experiences. No empirical evidence, case studies, or systematic analysis supports the broad normative conclusions."
    334     },
    335     {
    336       "flag": "No structured methodology",
    337       "detail": "For a paper that aims to provide 'a pathway to integrating AI into our most challenging and intellectually rigorous fields,' there is no structured framework for evaluation. The arguments draw on historical analogies (Luddites, printing press, Wikipedia) without systematic analysis of whether these analogies hold. The paper acknowledges no method for how its claims could be tested or falsified."
    338     }
    339   ],
    340   "cited_papers": [
    341     {
    342       "title": "Highly accurate protein structure prediction with AlphaFold",
    343       "authors": ["J. Jumper", "R. Evans", "A. Pritzel"],
    344       "year": 2021,
    345       "relevance": "Landmark AI application in science — demonstrates AI capabilities leading to Nobel Prize-winning research."
    346     },
    347     {
    348       "title": "Autoformalization with Large Language Models",
    349       "authors": ["Y. Wu", "A. Q. Jiang", "W. Li", "M. Rabe", "C. Staats", "M. Jamnik", "C. Szegedy"],
    350       "year": 2022,
    351       "relevance": "Directly relevant to AI capability in mathematics — LLMs translating informal math to formal proofs."
    352     },
    353     {
    354       "title": "AI achieves silver-medal standard solving International Mathematical Olympiad problems",
    355       "authors": ["DeepMind"],
    356       "year": 2024,
    357       "relevance": "AlphaProof benchmark evaluation — AI system solving competitive mathematics problems with formal verification."
    358     },
    359     {
    360       "title": "Early science acceleration experiments with GPT-5",
    361       "authors": ["S. Bubeck", "C. Coester", "R. Eldan", "T. Gowers", "Y. T. Lee"],
    362       "year": 2025,
    363       "relevance": "Evaluates frontier LLM capability on scientific research tasks including solving open mathematical problems."
    364     },
    365     {
    366       "title": "AI models collapse when trained on recursively generated data",
    367       "authors": ["I. Shumailov", "Z. Shumaylov", "Y. Zhao", "N. Papernot", "R. Anderson", "Y. Gal"],
    368       "year": 2024,
    369       "relevance": "Directly relevant to AI evaluation methodology — demonstrates model collapse from training on AI-generated data."
    370     },
    371     {
    372       "title": "A Turing test of whether AI chatbots are behaviorally similar to humans",
    373       "authors": ["Q. Mei", "Y. Xie", "W. Yuan", "M. O. Jackson"],
    374       "year": 2024,
    375       "relevance": "Empirical evaluation of LLM capabilities — behavioral comparison between AI chatbots and humans."
    376     },
    377     {
    378       "title": "Algorithm and abstraction in formal mathematics",
    379       "authors": ["H. Macbeth"],
    380       "year": 2024,
    381       "relevance": "Discusses restructuring mathematical proofs for AI-assisted verification, directly relevant to AI in mathematics."
    382     },
    383     {
    384       "title": "Some thoughts on automation and mathematical research",
    385       "authors": ["A. Venkatesh"],
    386       "year": 2024,
    387       "relevance": "Perspective on AI's impact on mathematical research from a Fields Medalist, relevant to AI capability assessment."
    388     },
    389     {
    390       "title": "Hard Proofs and Good Reasons",
    391       "authors": ["S. DeDeo"],
    392       "year": 2024,
    393       "relevance": "Discusses quality and meaning of AI-generated mathematical proofs, relevant to evaluation of AI in intellectual work."
    394     },
    395     {
    396       "title": "The AI gambit: Leveraging artificial intelligence to combat climate change",
    397       "authors": ["J. Cowls", "A. Tsamados", "M. Taddeo", "L. Floridi"],
    398       "year": 2023,
    399       "relevance": "Discusses AI applications for climate change, relevant to cost-benefit analysis of AI deployment."
    400     }
    401   ],
    402   "engagement_factors": {
    403     "practical_relevance": {
    404       "score": 0,
    405       "justification": "Pure philosophical reflection with no tools, techniques, or methods that a practitioner could apply."
    406     },
    407     "surprise_contrarian": {
    408       "score": 1,
    409       "justification": "The Copernican reframing of human intelligence alongside artificial intelligence is a novel metaphor, but the overall positions (AI should be human-centered, has costs and benefits) are mainstream."
    410     },
    411     "fear_safety": {
    412       "score": 1,
    413       "justification": "Mentions existential risks, model collapse, digital divide, and environmental costs, but does not present novel threats or demonstrate specific attacks."
    414     },
    415     "drama_conflict": {
    416       "score": 1,
    417       "justification": "References the Faustian bargain and Luddite parallels, and critiques unchecked AI development, but avoids direct confrontation with specific companies or claims."
    418     },
    419     "demo_ability": {
    420       "score": 0,
    421       "justification": "No code, tool, or demo. The paper is entirely discursive."
    422     },
    423     "brand_recognition": {
    424       "score": 3,
    425       "justification": "Terence Tao is a Fields Medalist and one of the most recognized mathematicians alive; his name alone drives significant attention to any paper he co-authors."
    426     }
    427   }
    428 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log | Files | Refs