ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan-v5.json (21163B)


      1 {
      2   "scan_version": 5,
      3   "paper_type": "survey",
      4   "paper": {
      5     "title": "Explosive Growth from AI Automation: A Review of the Arguments",
      6     "authors": [
      7       "Ege Erdil",
      8       "Tamay Besiroglu"
      9     ],
     10     "year": 2023,
     11     "venue": "arXiv",
     12     "arxiv_id": "2309.11690",
     13     "doi": null
     14   },
     15   "checklist": {
     16     "claims_and_evidence": {
     17       "abstract_claims_supported": {
     18         "applies": true,
     19         "answer": true,
     20         "justification": "All abstract claims — three growth drivers, nine counterarguments evaluated, plausibility of explosive growth without high confidence — are substantiated by the body. The paper delivers exactly what the abstract promises.",
     21         "source": "haiku"
     22       },
     23       "causal_claims_justified": {
     24         "applies": true,
     25         "answer": true,
     26         "justification": "Causal claims (AI substituting for labor causes explosive growth) are framed as model-conditional predictions from established economic growth theory, not empirical findings. The theoretical study design is appropriate for this class of claim, and uncertainty is acknowledged throughout.",
     27         "source": "haiku"
     28       },
     29       "generalization_bounded": {
     30         "applies": true,
     31         "answer": true,
     32         "justification": "Claims are consistently conditioned on 'AI capable of broadly substituting for human labor,' and the paper explicitly states that 'extrapolating economic models beyond their empirically validated domains introduces significant uncertainty.' Probability estimates are framed as conditional and approximate.",
     33         "source": "haiku"
     34       },
     35       "alternative_explanations_discussed": {
     36         "applies": true,
     37         "answer": true,
     38         "justification": "Section 3 is entirely devoted to nine counterarguments covering regulation, bottlenecks, alignment, measurement, human preferences, historical precedent, and physical limits. Each is analyzed at length.",
     39         "source": "haiku"
     40       },
     41       "proxy_outcome_distinction": {
     42         "applies": true,
     43         "answer": true,
     44         "justification": "'Explosive growth' is explicitly defined as annual real GWP exceeding 130% of its prior maximum. Section 3.6 dedicates substantial space to distinguishing measured GDP from actual consumer welfare and discusses known measurement biases.",
     45         "source": "haiku"
     46       }
     47     },
     48     "limitations_and_scope": {
     49       "limitations_section_present": {
     50         "applies": true,
     51         "answer": false,
     52         "justification": "There is no dedicated limitations or threats-to-validity section. Section 4 is a 'Discussion' with an 'Open Questions' subsection (4.1), but this is forward-looking speculation rather than a structured limitations analysis.",
     53         "source": "haiku"
     54       },
     55       "threats_to_validity_specific": {
     56         "applies": true,
     57         "answer": true,
     58         "justification": "The paper discusses specific threats throughout: model extrapolation 'beyond empirically validated domains,' parameter uncertainty (e.g., ϕ from Bloom et al.), correlated arguments undermining independence assumptions, and the 'kernel of truth' conceded in several counterarguments.",
     59         "source": "haiku"
     60       },
     61       "scope_boundaries_stated": {
     62         "applies": true,
     63         "answer": true,
     64         "justification": "The paper explicitly bounds its scope to explosive growth 'this century' conditional on 'AI capable of substituting for most or all economic tasks,' and defines 'explosive growth' precisely as GWP growth exceeding 30%/year.",
     65         "source": "haiku"
     66       }
     67     },
     68     "conflicts_of_interest": {
     69       "funding_disclosed": {
     70         "applies": true,
     71         "answer": true,
     72         "justification": "The acknowledgments state: 'We are grateful to Open Philanthropy for support for this project.'",
     73         "source": "haiku"
     74       },
     75       "affiliations_disclosed": {
     76         "applies": true,
     77         "answer": true,
     78         "justification": "Author affiliations are listed on the title page: Ege Erdil at Epoch AI; Tamay Besiroglu at Epoch AI and MIT FutureTech.",
     79         "source": "haiku"
     80       },
     81       "funder_independent_of_outcome": {
     82         "applies": true,
     83         "answer": false,
     84         "justification": "Open Philanthropy is a major funder of EA/longtermist research and has strong prior views on the importance of transformative AI — the exact topic of this paper. This ideological alignment with the subject matter is not acknowledged as a potential conflict.",
     85         "source": "haiku"
     86       },
     87       "financial_interests_declared": {
     88         "applies": true,
     89         "answer": false,
     90         "justification": "No competing interests statement is provided. There is no disclosure of equity, consulting, or patent interests beyond the funding acknowledgment.",
     91         "source": "haiku"
     92       }
     93     },
     94     "scope_and_framing": {
     95       "key_terms_defined": {
     96         "applies": true,
     97         "answer": true,
     98         "justification": "'Explosive growth' is explicitly defined as annual real GWP exceeding 130% of its prior maximum. 'Accumulable' inputs are defined conceptually. 'AI that broadly substitutes for human labor' is described in functional economic terms consistently throughout.",
     99         "source": "haiku"
    100       },
    101       "intended_contribution_clear": {
    102         "applies": true,
    103         "answer": true,
    104         "justification": "The introduction states the paper examines key arguments for and against explosive growth, provides quantitative grounding for counterarguments, and aims to give calibrated probability estimates. The contribution is clearly framed.",
    105         "source": "haiku"
    106       },
    107       "engagement_with_prior_work": {
    108         "applies": true,
    109         "answer": true,
    110         "justification": "The paper explicitly builds on Davidson 2021, Trammell & Korinek 2020, Hanson 2001, and Aghion et al. 2018, situating its contribution as adding quantitative specificity to arguments that prior work raised but did not fully formalize.",
    111         "source": "haiku"
    112       }
    113     }
    114   },
    115   "type_checklist": {
    116     "survey": {
    117       "search_and_selection": {
    118         "search_strategy_reproducible": {
    119           "applies": true,
    120           "answer": false,
    121           "justification": "This is not a systematic literature review. No search strategy is described. The paper reviews economic arguments curated by the authors' expertise, not a corpus identified through database searches.",
    122           "source": "haiku"
    123         },
    124         "inclusion_exclusion_explicit": {
    125           "applies": true,
    126           "answer": false,
    127           "justification": "No inclusion or exclusion criteria are stated. The 12 arguments reviewed appear selected by author judgment with no documented rationale for what was included or excluded.",
    128           "source": "haiku"
    129         },
    130         "prisma_or_structured_protocol": {
    131           "applies": true,
    132           "answer": false,
    133           "justification": "The paper follows no structured review protocol such as PRISMA. It is an argumentative review structured around a set of economic mechanisms, not a systematic literature review.",
    134           "source": "haiku"
    135         },
    136         "search_terms_provided": {
    137           "applies": true,
    138           "answer": false,
    139           "justification": "No search terms are provided. The paper does not conduct a systematic search of any literature database.",
    140           "source": "haiku"
    141         },
    142         "databases_listed": {
    143           "applies": true,
    144           "answer": false,
    145           "justification": "No databases or sources searched are listed. Literature appears gathered through informal expert knowledge rather than systematic database queries.",
    146           "source": "haiku"
    147         },
    148         "screening_process_documented": {
    149           "applies": true,
    150           "answer": false,
    151           "justification": "No screening process or stage-wise counts are documented. The paper has no systematic screening methodology.",
    152           "source": "haiku"
    153         },
    154         "review_scope_justified": {
    155           "applies": true,
    156           "answer": false,
    157           "justification": "While the introduction explains the topic (explosive AI-driven growth), it does not justify why exactly these 12 arguments were selected or what arguments may have been excluded. No formal scope justification is provided.",
    158           "source": "haiku"
    159         }
    160       },
    161       "synthesis_quality": {
    162         "conflicting_findings_acknowledged": {
    163           "applies": true,
    164           "answer": true,
    165           "justification": "The paper explicitly acknowledges conflicts between growth models, discusses correlated uncertainty across counterarguments in Section 4, and notes where different parameter estimates from the literature lead to opposing predictions.",
    166           "source": "haiku"
    167         },
    168         "quality_assessment_of_sources": {
    169           "applies": true,
    170           "answer": false,
    171           "justification": "No formal quality assessment or risk-of-bias evaluation of cited papers is conducted. Papers are used as inputs without evaluating the reliability or methodological quality of their findings.",
    172           "source": "haiku"
    173         },
    174         "publication_bias_discussed": {
    175           "applies": true,
    176           "answer": false,
    177           "justification": "Publication bias is not mentioned or discussed. The selective literature the authors engage with is not subjected to any bias assessment.",
    178           "source": "haiku"
    179         },
    180         "quantitative_synthesis_present": {
    181           "applies": true,
    182           "answer": true,
    183           "justification": "The paper presents mathematical models, numerical parameter estimates (e.g., d≈0.68, ¯c bounds, elasticity thresholds), and calibrated probability estimates using a defined likelihood scale, going well beyond pure narrative synthesis.",
    184           "source": "haiku"
    185         },
    186         "recommendations_supported_by_evidence": {
    187           "applies": true,
    188           "answer": true,
    189           "justification": "The final probability estimate ('about as likely as not') is explicitly derived from the structured analysis of individual arguments and their correlation structure, not asserted without basis.",
    190           "source": "haiku"
    191         }
    192       }
    193     }
    194   },
    195   "claims": [
    196     {
    197       "claim": "Standard economic growth models consistently predict explosive growth when AI can effectively substitute for human labor across most economic tasks.",
    198       "evidence": "Analysis of semi-endogenous and exogenous growth models across multiple specifications, showing explosive growth occurs when d+r>1 (d≈0.68 for accumulable inputs, r≈0.32 from Bloom et al. 2020).",
    199       "supported": "moderate"
    200     },
    201     {
    202       "claim": "AI runtime costs are already near the threshold that would support explosive growth under historically observed savings rates.",
    203       "evidence": "Estimates of ¯c≈$15,000/worker derived from Carlsmith 2020 brain FLOP estimates and current GPU prices, compared against the explosive growth threshold of s^(10/7)×$150,000/worker.",
    204       "supported": "weak"
    205     },
    206     {
    207       "claim": "Regulation is unlikely to permanently block AI-driven explosive growth.",
    208       "evidence": "Historical analogy to Britain's failed Industrial Revolution export bans and the imperfect nuclear arms control precedent; argument that economic incentives for AI adoption are too large for sustained coordination.",
    209       "supported": "weak"
    210     },
    211     {
    212       "claim": "Most counterarguments against explosive growth lack quantitative specificity and are not individually decisive.",
    213       "evidence": "Each of nine counterarguments is evaluated with quantitative bounds; most are rated 'unlikely' or 'very unlikely' to be decisive blockers using the paper's defined likelihood scale.",
    214       "supported": "moderate"
    215     },
    216     {
    217       "claim": "The probability of explosive growth this century conditional on AGI is approximately 50%.",
    218       "evidence": "Qualitative synthesis of argument strengths, correlation structure, and model robustness, using a defined likelihood scale without formal elicitation or calibration against base rates.",
    219       "supported": "weak"
    220     },
    221     {
    222       "claim": "Physical resource constraints (energy, land) permit at least 2–3 orders of magnitude of economic scaling before becoming binding this century.",
    223       "evidence": "Energy: 4.4e16W solar flux vs 4e13W global consumption (3 OOM headroom); Land: 1.5M km² urban vs 100M km² habitable (2 OOM headroom).",
    224       "supported": "moderate"
    225     }
    226   ],
    227   "methodology_tags": [
    228     "theoretical",
    229     "qualitative"
    230   ],
    231   "key_findings": "Economic growth models across multiple specifications robustly predict explosive growth (>30%/yr GWP) when AI can substitute for human labor at plausible costs, with the threshold condition being d+r>1 (satisfied under empirical parameter estimates). The authors evaluate nine counterarguments — regulation, production bottlenecks, alignment, slow automation, measurement failure, human preferences, historical precedent, R&D difficulty, and physical limits — and find most lack quantitative specificity to decisively rule out explosive growth. The most credible obstacles are regulation and production bottlenecks from hard-to-accumulate inputs (energy, capital). The authors assign roughly 50% probability to explosive growth this century conditional on AGI-level AI, while cautioning against high confidence due to model extrapolation uncertainty and correlated argument structures.",
    232   "red_flags": [
    233     {
    234       "flag": "Not a systematic review",
    235       "detail": "Classified as a survey but has no systematic search strategy, PRISMA protocol, inclusion/exclusion criteria, or documented screening process. It is an argumentative position paper structured around author-selected economic arguments."
    236     },
    237     {
    238       "flag": "Probability estimates lack formal calibration",
    239       "detail": "The central conclusion — explosive growth is 'about as likely as not' (~50%) — is based on qualitative weighting of arguments rather than formal elicitation, forecasting models, or calibration against historical base rates for transformative technological predictions."
    240     },
    241     {
    242       "flag": "Funder ideological alignment undisclosed",
    243       "detail": "Open Philanthropy, the funder, has strong prior views on the importance of transformative AI and long-term AI risk — directly relevant to this paper's conclusions — but this potential ideological alignment is not acknowledged as a conflict of interest."
    244     },
    245     {
    246       "flag": "Model extrapolation far beyond empirical domain",
    247       "detail": "Growth models calibrated to historical data are applied to predict outcomes (30%+ annual GWP growth) orders of magnitude outside any observed regime. The paper acknowledges this but does not fully account for the risk of model breakdown at extreme extrapolation distances."
    248     },
    249     {
    250       "flag": "Argument selection unjustified",
    251       "detail": "The 12 arguments reviewed (3 for, 9 against) were selected by author judgment with no documented rationale for what was included or excluded, creating potential cherry-picking of arguments amenable to the conclusion."
    252     },
    253     {
    254       "flag": "Both authors same institution",
    255       "detail": "Both Erdil and Besiroglu are at Epoch AI with no independent co-author, creating potential for institutional groupthink in the argument assessments."
    256     }
    257   ],
    258   "cited_papers": [
    259     {
    260       "title": "Could Advanced AI Drive Explosive Economic Growth",
    261       "relevance": "Davidson 2021 — primary prior work this paper builds on and critiques; provides probability estimates and model framework that anchor the analysis"
    262     },
    263     {
    264       "title": "Economic Growth Under Transformative AI",
    265       "relevance": "Trammell & Korinek 2020 synthesizes economic models of AI-driven growth; the foundational survey this paper extends with quantitative counterargument analysis"
    266     },
    267     {
    268       "title": "Are Ideas Getting Harder to Find?",
    269       "relevance": "Bloom et al. 2020 provides empirical estimates of returns to R&D (r≈0.32) that are central to the paper's explosive growth threshold calculation (d+r>1)"
    270     },
    271     {
    272       "title": "Artificial Intelligence and Economic Growth",
    273       "relevance": "Aghion et al. 2018 — key prior on AI as automation with Baumol effects; the model used as a comparative benchmark throughout"
    274     },
    275     {
    276       "title": "Economic Growth Given Machine Intelligence",
    277       "relevance": "Hanson 2001 provides early quantitative estimates of AI-driven growth rates (~40%/year) referenced as a baseline"
    278     },
    279     {
    280       "title": "How Much Computational Power Does It Take to Match the Human Brain?",
    281       "relevance": "Carlsmith 2020 provides brain FLOP estimates central to the AI runtime cost threshold calculations in Section 2.2"
    282     },
    283     {
    284       "title": "Forecasting TAI with Biological Anchors",
    285       "relevance": "Cotra 2020 provides estimates of resources needed for transformative AI; referenced for the unconditional probability estimates in footnote 5"
    286     },
    287     {
    288       "title": "The Elasticity of Substitution Between Capital and Labour in the US Economy: A Meta-Regression Analysis",
    289       "relevance": "Knoblach et al. 2020 provides empirical estimates of the substitution parameter σ used throughout the bottleneck, preference, and CES model analyses"
    290     }
    291   ],
    292   "engagement_factors": {
    293     "practical_relevance": {
    294       "score": 1,
    295       "justification": "Theoretical analysis of long-run economic futures; too speculative and abstract for near-term practitioner application."
    296     },
    297     "surprise_contrarian": {
    298       "score": 2,
    299       "justification": "Argues that explosive AI-driven growth is plausible (~50%) and that most counterarguments are quantitatively weak — a more bullish take than most mainstream economic or AI commentary."
    300     },
    301     "fear_safety": {
    302       "score": 2,
    303       "justification": "Raises alignment failures as an economic bottleneck and frames the possibility of order-of-magnitude economic transformation with cascading civilizational implications."
    304     },
    305     "drama_conflict": {
    306       "score": 2,
    307       "justification": "Takes explicit positions against well-known counterarguments (regulation, physical limits) and assigns substantial probability to civilizational-scale economic disruption."
    308     },
    309     "demo_ability": {
    310       "score": 0,
    311       "justification": "Pure theoretical and argumentative paper with no tool, dataset, or demonstration."
    312     },
    313     "brand_recognition": {
    314       "score": 1,
    315       "justification": "Epoch AI has recognition in AI forecasting and safety circles but is not a major industry lab or mainstream brand."
    316     }
    317   },
    318   "hn_data": {
    319     "threads": [
    320       {
    321         "hn_id": "44349782",
    322         "title": "Explosive Growth from AI Automation: A Review of the Arguments",
    323         "points": 3,
    324         "comments": 2,
    325         "url": "https://news.ycombinator.com/item?id=44349782",
    326         "created_at": "2025-06-22T19:54:31Z"
    327       },
    328       {
    329         "hn_id": "35699839",
    330         "title": "GPT4 can surpass humans in Theory of Mind test, with appropriate prompt",
    331         "points": 2,
    332         "comments": 1,
    333         "url": "https://news.ycombinator.com/item?id=35699839",
    334         "created_at": "2023-04-25T12:59:15Z"
    335       },
    336       {
    337         "hn_id": "36486250",
    338         "title": "Detectability of Supermassive Dark Stars with the Roman Space Telescope",
    339         "points": 2,
    340         "comments": 0,
    341         "url": "https://news.ycombinator.com/item?id=36486250",
    342         "created_at": "2023-06-26T21:40:38Z"
    343       },
    344       {
    345         "hn_id": "36441038",
    346         "title": "A Simple and Effective Pruning Approach for Large Language Models",
    347         "points": 2,
    348         "comments": 0,
    349         "url": "https://news.ycombinator.com/item?id=36441038",
    350         "created_at": "2023-06-23T00:13:33Z"
    351       },
    352       {
    353         "hn_id": "36176290",
    354         "title": "LLM Itself Can Read and Generate CXR Images",
    355         "points": 2,
    356         "comments": 0,
    357         "url": "https://news.ycombinator.com/item?id=36176290",
    358         "created_at": "2023-06-03T12:55:40Z"
    359       },
    360       {
    361         "hn_id": "41629931",
    362         "title": "LLM-Powered Text Simulation Attack Against ID-Free Recommender Systems",
    363         "points": 1,
    364         "comments": 0,
    365         "url": "https://news.ycombinator.com/item?id=41629931",
    366         "created_at": "2024-09-23T20:07:05Z"
    367       },
    368       {
    369         "hn_id": "35745610",
    370         "title": "Boosting Theory-of-Mind Performance in Large Language Models via Prompting",
    371         "points": 1,
    372         "comments": 3,
    373         "url": "https://news.ycombinator.com/item?id=35745610",
    374         "created_at": "2023-04-28T19:01:15Z"
    375       },
    376       {
    377         "hn_id": "41601215",
    378         "title": "Ranking of popular image generation AI models (incl. Flux) from 2M votes",
    379         "points": 1,
    380         "comments": 1,
    381         "url": "https://news.ycombinator.com/item?id=41601215",
    382         "created_at": "2024-09-20T12:13:32Z"
    383       }
    384     ],
    385     "top_points": 3,
    386     "total_points": 14,
    387     "total_comments": 7
    388   }
    389 }

Impressum · Datenschutz