scan-v5.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan-v5.json (27255B)
      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "From Poisoned to Aware: Fostering Backdoor Self-Awareness in LLMs",
      6     "authors": [
      7       "Guangyu Shen",
      8       "Siyuan Cheng",
      9       "Xiangzhe Xu",
     10       "Yuan Zhou",
     11       "Hanxi Guo",
     12       "Zhuo Zhang",
     13       "Xiangyu Zhang"
     14     ],
     15     "year": 2025,
     16     "venue": "arXiv.org",
     17     "arxiv_id": "2510.05169",
     18     "doi": "10.48550/arXiv.2510.05169"
     19   },
     20   "checklist": {
     21     "claims_and_evidence": {
     22       "abstract_claims_supported": {
     23         "applies": true,
     24         "answer": true,
     25         "justification": "All major abstract claims — RL framework for trigger recovery, phase-transition emergence, and defense results on 5 backdoor types against 6 baselines — are supported by Figures 3, 6, 7 and Tables 1–2.",
     26         "source": "haiku"
     27       },
     28       "causal_claims_justified": {
     29         "applies": true,
     30         "answer": true,
     31         "justification": "Causal claims about buffer replay and R-SFT prerequisites are backed by ablation study (Figure 8b), showing training plateaus without each component on a controlled setting.",
     32         "source": "haiku"
     33       },
     34       "generalization_bounded": {
     35         "applies": true,
     36         "answer": false,
     37         "justification": "The paper claims the framework is 'architecture-agnostic' based on only 4 model variants (all 7–8B), and does not bound its conclusions to this model-size regime or acknowledge that larger or smaller models may behave differently.",
     38         "source": "haiku"
     39       },
     40       "alternative_explanations_discussed": {
     41         "applies": true,
     42         "answer": false,
     43         "justification": "The paper does not discuss alternative explanations for the abrupt emergence phenomenon (e.g., reward hacking, memorization of trigger surface-form patterns), and presents only one interpretation analogous to RL 'aha moments'.",
     44         "source": "haiku"
     45       },
     46       "proxy_outcome_distinction": {
     47         "applies": true,
     48         "answer": true,
     49         "justification": "AWARENESS@k (Jaccard similarity between proposed and true trigger) is explicitly defined as a proxy metric in Section 3, and the paper is clear that it measures trigger articulation fidelity, not broader 'safety' or 'alignment'.",
     50         "source": "haiku"
     51       }
     52     },
     53     "limitations_and_scope": {
     54       "limitations_section_present": {
     55         "applies": true,
     56         "answer": false,
     57         "justification": "Limitations appear in the final paragraph of Section 7 (Conclusion) rather than in a dedicated section; two brief points are noted (requires knowledge of attack behavior, high training cost).",
     58         "source": "haiku"
     59       },
     60       "threats_to_validity_specific": {
     61         "applies": true,
     62         "answer": false,
     63         "justification": "No threats-to-validity are discussed; the two mentioned limitations ('assumes knowledge of attack's target behavior' and 'training cost') are not framed as threats nor substantiated with quantitative impact.",
     64         "source": "haiku"
     65       },
     66       "scope_boundaries_stated": {
     67         "applies": true,
     68         "answer": false,
     69         "justification": "The paper does not explicitly state what settings its results do NOT generalize to (e.g., models >8B, multi-modal triggers, unknown attack effects), offering only generic 'future directions' language.",
     70         "source": "haiku"
     71       }
     72     },
     73     "conflicts_of_interest": {
     74       "funding_disclosed": {
     75         "applies": true,
     76         "answer": false,
     77         "justification": "No funding acknowledgment appears anywhere in the paper; no grants, industry support, or sponsors are mentioned.",
     78         "source": "haiku"
     79       },
     80       "affiliations_disclosed": {
     81         "applies": true,
     82         "answer": true,
     83         "justification": "All seven authors disclose their affiliations (Purdue University for six, Columbia University for one) on the first page.",
     84         "source": "haiku"
     85       },
     86       "funder_independent_of_outcome": {
     87         "applies": false,
     88         "answer": false,
     89         "justification": "No funding is disclosed, so funder independence cannot be assessed.",
     90         "source": "haiku"
     91       },
     92       "financial_interests_declared": {
     93         "applies": true,
     94         "answer": false,
     95         "justification": "No competing interests statement, patent disclosures, or financial interest declarations are present in the paper.",
     96         "source": "haiku"
     97       }
     98     },
     99     "scope_and_framing": {
    100       "key_terms_defined": {
    101         "applies": true,
    102         "answer": true,
    103         "justification": "Section 3 formally defines 'functional backdoor' (Equations 1–3), 'backdoor self-awareness,' and AWARENESS@k (Equation 4) with mathematical precision.",
    104         "source": "haiku"
    105       },
    106       "intended_contribution_clear": {
    107         "applies": true,
    108         "answer": true,
    109         "justification": "The paper explicitly states three contributions: an RL framework for cultivating backdoor self-awareness, an observed phase-transition emergence property, and two downstream defense strategies (unlearning + inference-time guardrail).",
    110         "source": "haiku"
    111       },
    112       "engagement_with_prior_work": {
    113         "applies": true,
    114         "answer": true,
    115         "justification": "Section 2 situates the work relative to trigger inversion methods (Shen et al. 2022, Zou et al. 2023), reversal training (Golovneva et al. 2024), self-awareness (Betley et al. 2025b), and unlearning (Zeng et al. 2024), explaining how this work differs and builds on each.",
    116         "source": "haiku"
    117       }
    118     }
    119   },
    120   "type_checklist": {
    121     "empirical": {
    122       "artifacts": {
    123         "code_released": {
    124           "applies": true,
    125           "answer": true,
    126           "justification": "Abstract states 'The code is available at LLM Backdoor Self-Awareness' as a live hyperlink, indicating current release rather than future promise.",
    127           "source": "haiku"
    128         },
    129         "data_released": {
    130           "applies": true,
    131           "answer": true,
    132           "justification": "All training datasets used (SafeRLHF, UltraFeedback, Alpaca, SHIP author-released data) are standard public datasets; no proprietary data collected.",
    133           "source": "haiku"
    134         },
    135         "environment_specified": {
    136           "applies": true,
    137           "answer": false,
    138           "justification": "Hardware (8×A100-40GB) and training framework (DeepSpeed ZeRO-3, bfloat16) are mentioned but no requirements.txt, Dockerfile, or package versions are provided.",
    139           "source": "haiku"
    140         },
    141         "reproduction_instructions": {
    142           "applies": true,
    143           "answer": false,
    144           "justification": "Section 6.1.3 provides hyperparameter tables but no step-by-step reproduction script or pipeline walkthrough; the paper relies on the linked codebase without describing how to execute it.",
    145           "source": "haiku"
    146         }
    147       },
    148       "statistical_methodology": {
    149         "confidence_intervals_or_error_bars": {
    150           "applies": true,
    151           "answer": false,
    152           "justification": "Figure 6 shows ±std shading on RL reward curves, but Tables 1–2 (main comparative results) report only point estimates without any confidence intervals or error bars.",
    153           "source": "haiku"
    154         },
    155         "significance_tests": {
    156           "applies": true,
    157           "answer": false,
    158           "justification": "No statistical significance tests are applied to any of the comparative results in Tables 1–2 despite multiple comparative claims against six baseline methods.",
    159           "source": "haiku"
    160         },
    161         "effect_sizes_reported": {
    162           "applies": true,
    163           "answer": true,
    164           "justification": "Table 1 reports absolute ASR reductions (e.g., −74.7% for jailbreak) relative to baselines and no-defense condition, providing interpretable effect sizes.",
    165           "source": "haiku"
    166         },
    167         "sample_size_justified": {
    168           "applies": true,
    169           "answer": false,
    170           "justification": "100 prompts for RL training and 100 for evaluation are used without any power analysis or justification for why 100 samples suffices for reliable AWARENESS@k estimation.",
    171           "source": "haiku"
    172         },
    173         "variance_reported": {
    174           "applies": true,
    175           "answer": false,
    176           "justification": "Variance is shown only for reward curves during training (Figure 6); all main result tables report single-run point estimates with no variance across seeds or runs.",
    177           "source": "haiku"
    178         }
    179       },
    180       "evaluation_design": {
    181         "baselines_included": {
    182           "applies": true,
    183           "answer": true,
    184           "justification": "Six baselines are compared: BEEAR, R-SFT+Adv.Train, GCG+Adv.Train for unlearning, and ONION, BEAT, CoS for inference-time detection.",
    185           "source": "haiku"
    186         },
    187         "baselines_contemporary": {
    188           "applies": true,
    189           "answer": true,
    190           "justification": "All baselines are from 2021–2024 with the most recent (BEEAR 2024, CoS 2024, BEAT ICLR) being contemporary; no suspiciously outdated baselines.",
    191           "source": "haiku"
    192         },
    193         "ablation_study": {
    194           "applies": true,
    195           "answer": true,
    196           "justification": "Section 6.4 ablates buffer replay and R-SFT prerequisite (Figure 8b) and tests across four model architectures (Figure 8a), quantifying each component's contribution.",
    197           "source": "haiku"
    198         },
    199         "multiple_metrics": {
    200           "applies": true,
    201           "answer": true,
    202           "justification": "Evaluation uses AWARENESS@k, ASR (with/without trigger), utility metrics (MMLU-Pro, XSTest, MXEval, HumanEval), TPR@5%FPR, and detection accuracy.",
    203           "source": "haiku"
    204         },
    205         "human_evaluation": {
    206           "applies": false,
    207           "answer": false,
    208           "justification": "Human evaluation is not applicable; the task is fully automated security evaluation with LLM-judge scoring.",
    209           "source": "haiku"
    210         },
    211         "held_out_test_set": {
    212           "applies": true,
    213           "answer": true,
    214           "justification": "Section 6.1.4 states evaluation uses 'hold-out evaluation set from DSFT' for unlearning and a separate validation fold for TPR calibration in detection.",
    215           "source": "haiku"
    216         },
    217         "per_category_breakdown": {
    218           "applies": true,
    219           "answer": true,
    220           "justification": "Tables 1–2 and Figure 6 provide complete per-backdoor-type breakdowns across all five backdoor variants (Jailbreak, Sleeper Agent, SHIP, Clean Label, DoS).",
    221           "source": "haiku"
    222         },
    223         "failure_cases_discussed": {
    224           "applies": true,
    225           "answer": true,
    226           "justification": "DoS (Awareness@k=0.549, only a substring recovered) and Sleeper Agent (0.839) are discussed as partial failures with mechanistic explanations (substring trigger, code-domain interference).",
    227           "source": "haiku"
    228         },
    229         "negative_results_reported": {
    230           "applies": true,
    231           "answer": true,
    232           "justification": "Section 4 is dedicated to showing R-SFT alone fails (AWARENESS@k ≤0.042 even at k=200) and contrasts prior positive results to contextualize the limitation.",
    233           "source": "haiku"
    234         }
    235       },
    236       "setup_transparency": {
    237         "model_versions_specified": {
    238           "applies": true,
    239           "answer": true,
    240           "justification": "All models are specified with exact version names: Llama-3.1-8B-Instruct, Qwen2.5-Coder-7B-Instruct, Qwen2.5-7B-Instruct, Ministral-8B-Instruct-2410, DeepSeek-R1-Distill-Llama-8B.",
    241           "source": "haiku"
    242         },
    243         "prompts_provided": {
    244           "applies": true,
    245           "answer": true,
    246           "justification": "Full inversion prompts for all five backdoor types are in Appendix A, judge prompt in Appendix B, and guardrail prompt in Appendix C — complete, not templates.",
    247           "source": "haiku"
    248         },
    249         "hyperparameters_reported": {
    250           "applies": true,
    251           "answer": true,
    252           "justification": "Section 6.1.3 reports LoRA rank, learning rates, epochs, batch size, gradient accumulation, GRPO parameters (β=0.01, G=8, ε=0.2), and reward function constants (α, L, β, γ).",
    253           "source": "haiku"
    254         },
    255         "scaffolding_described": {
    256           "applies": true,
    257           "answer": true,
    258           "justification": "The full RL training scaffold (GRPO + buffer replay, reward module, inversion prompt pipeline) is described in Section 5 with Figure 5 illustrating a single training step.",
    259           "source": "haiku"
    260         },
    261         "data_preprocessing_documented": {
    262           "applies": true,
    263           "answer": true,
    264           "justification": "Section 6.1.2 documents poison rates (10%/20%), dataset composition for each backdoor type, reversal augmentation templates, and RL training data curation steps.",
    265           "source": "haiku"
    266         }
    267       },
    268       "data_integrity": {
    269         "raw_data_available": {
    270           "applies": true,
    271           "answer": false,
    272           "justification": "Constructed poison datasets and trained models are not released; only code is available, meaning the exact experimental data cannot be independently verified.",
    273           "source": "haiku"
    274         },
    275         "data_collection_described": {
    276           "applies": true,
    277           "answer": true,
    278           "justification": "Section 6.1.2 describes exact dataset sources, sample counts, trigger injection procedures, and split ratios for each of the five backdoor types.",
    279           "source": "haiku"
    280         },
    281         "recruitment_methods_described": {
    282           "applies": false,
    283           "answer": false,
    284           "justification": "No human participants; all data sourced from existing public NLP datasets.",
    285           "source": "haiku"
    286         },
    287         "data_pipeline_documented": {
    288           "applies": true,
    289           "answer": true,
    290           "justification": "Section 6.1.2 traces the full pipeline: public datasets → poison injection (DSFT) → reversal augmentation (DR-SFT) → RL training set (DRL) → adversarial unlearning set.",
    291           "source": "haiku"
    292         }
    293       },
    294       "contamination": {
    295         "training_cutoff_stated": {
    296           "applies": true,
    297           "answer": false,
    298           "justification": "Base model training cutoffs are not stated, and MMLU-Pro and HumanEval are used as utility metrics without discussing whether these benchmarks were in the base models' training data.",
    299           "source": "haiku"
    300         },
    301         "train_test_overlap_discussed": {
    302           "applies": true,
    303           "answer": false,
    304           "justification": "No discussion of potential overlap between base model pretraining data and the utility benchmark test sets (MMLU-Pro, HumanEval).",
    305           "source": "haiku"
    306         },
    307         "benchmark_contamination_addressed": {
    308           "applies": true,
    309           "answer": false,
    310           "justification": "MMLU-Pro and HumanEval are used to measure utility retention, but the paper does not address whether the 7–8B base models were trained on these benchmarks.",
    311           "source": "haiku"
    312         }
    313       },
    314       "human_studies": {
    315         "pre_registered": {
    316           "applies": false,
    317           "answer": false,
    318           "justification": "No human participants.",
    319           "source": "haiku"
    320         },
    321         "irb_or_ethics_approval": {
    322           "applies": false,
    323           "answer": false,
    324           "justification": "No human participants.",
    325           "source": "haiku"
    326         },
    327         "demographics_reported": {
    328           "applies": false,
    329           "answer": false,
    330           "justification": "No human participants.",
    331           "source": "haiku"
    332         },
    333         "inclusion_exclusion_criteria": {
    334           "applies": false,
    335           "answer": false,
    336           "justification": "No human participants.",
    337           "source": "haiku"
    338         },
    339         "randomization_described": {
    340           "applies": false,
    341           "answer": false,
    342           "justification": "No human participants.",
    343           "source": "haiku"
    344         },
    345         "blinding_described": {
    346           "applies": false,
    347           "answer": false,
    348           "justification": "No human participants.",
    349           "source": "haiku"
    350         },
    351         "attrition_reported": {
    352           "applies": false,
    353           "answer": false,
    354           "justification": "No human participants.",
    355           "source": "haiku"
    356         }
    357       },
    358       "cost_and_practicality": {
    359         "inference_cost_reported": {
    360           "applies": true,
    361           "answer": false,
    362           "justification": "Training cost is qualitatively described as 'comparable to other RL-based methods' but no GPU-hours, dollar cost, or inference latency numbers are provided.",
    363           "source": "haiku"
    364         },
    365         "compute_budget_stated": {
    366           "applies": true,
    367           "answer": false,
    368           "justification": "Hardware (8×A100-40GB) is stated but total compute budget (GPU-hours or FLOPs) is not reported for any experiment.",
    369           "source": "haiku"
    370         }
    371       }
    372     }
    373   },
    374   "claims": [
    375     {
    376       "claim": "RL-based training (GRPO + buffer replay) enables backdoor self-awareness achieving AWARENESS@k from 0.549 to 1.000 across five backdoor types",
    377       "evidence": "Figure 6 shows AWARENESS@k of 1.000, 0.839, 1.000, 0.634, 0.549 for Jailbreak, Sleeper Agent, SHIP, CL Jailbreak, and DoS respectively after RL training",
    378       "supported": "strong"
    379     },
    380     {
    381       "claim": "Backdoor self-awareness emergence is abrupt (phase transition) in 4 of 5 tested backdoor types, resembling RL 'aha moments'",
    382       "evidence": "Figure 6 reward curves show sharp jumps from near-zero to 0.7–0.9 within ~20 training steps for Jailbreak, SHIP, CL Jailbreak, and DoS; Sleeper Agent is the exception with gradual improvement",
    383       "supported": "strong"
    384     },
    385     {
    386       "claim": "R-SFT alone is insufficient for backdoor self-awareness on smaller models with complex triggers, achieving AWARENESS@k ≤0.042 even at k=200",
    387       "evidence": "Figure 3 shows R-SFT yields Jaccard@k of 0.020 and 0.042 for Jailbreak and Sleeper Agent respectively, contrasting with prior reports of R-SFT working on 70B+ models",
    388       "supported": "strong"
    389     },
    390     {
    391       "claim": "Adversarial unlearning using self-aware model reduces triggered ASR to under 5% for 4 of 5 backdoors while preserving utility",
    392       "evidence": "Table 1 shows ASR reduction to 4.74%, 4.86%, 5.10%, 4.50%, 0.00% for the five attacks, with MMLU-Pro degradation ≤1% in most cases",
    393       "supported": "strong"
    394     },
    395     {
    396       "claim": "Inference-time guardrail achieves average detection accuracy of 95.6% across five backdoor types, outperforming BEAT, ONION, and CoS",
    397       "evidence": "Table 2 reports accuracy of 99.8%, 99.19%, 91.63%, 89.00%, 100.00% — BEAT reaches 100% only on Jailbreak, fails on others (47.8%–50.4%)",
    398       "supported": "strong"
    399     },
    400     {
    401       "claim": "Buffer replay mechanism is critical — without it, training plateaus at reward ~0.3 and fails to converge to the true trigger",
    402       "evidence": "Figure 8b shows 'w/o Buffer-Replay' plateauing around 0.3 vs the full method reaching 0.9+; training logs show the correct trigger appeared 13 times but was too sparse to reinforce",
    403       "supported": "strong"
    404     }
    405   ],
    406   "methodology_tags": [
    407     "benchmark-eval"
    408   ],
    409   "key_findings": "A GRPO-based reinforcement learning framework with buffer replay can cultivate backdoor self-awareness in poisoned LLMs, enabling models to articulate their own implanted triggers with AWARENESS@k of 0.549–1.000 across five backdoor types. This self-awareness emerges abruptly in a phase-transition-like pattern within ~20 training steps in 4 of 5 cases, and R-SFT alone is insufficient for this capability in 7–8B models with complex functional triggers. The recovered triggers enable effective downstream defenses: adversarial unlearning reduces triggered ASR by an average of 73.18% with minimal utility loss, while an inference-time guardrail achieves 95.6% average detection accuracy — both outperforming six baseline methods.",
    410   "red_flags": [
    411     {
    412       "flag": "Assumes known attack behavior",
    413       "detail": "The reward function requires knowledge of the attack's target behavior (e.g., 'jailbreak' vs 'DoS') to design the LLM judge prompt, limiting applicability when the attack type is unknown — a common real-world scenario."
    414     },
    415     {
    416       "flag": "No statistical significance testing",
    417       "detail": "All comparative claims in Tables 1–2 are based on single-run point estimates with no significance tests, error bars, or confidence intervals, making it impossible to assess whether differences are robust."
    418     },
    419     {
    420       "flag": "Narrow model size range",
    421       "detail": "All experiments use 7–8B parameter models; the claim of 'architecture-agnostic' generalization is based on only four models in this range, not tested on larger (e.g., 70B) or smaller models."
    422     },
    423     {
    424       "flag": "Unidentified guardrail model",
    425       "detail": "The inference-time guardrail uses 'GPT-OSS-20B' — an unrecognizable model identifier that does not correspond to any known publicly released model, preventing reproducibility of that component."
    426     },
    427     {
    428       "flag": "No multi-seed variance in result tables",
    429       "detail": "Main result tables report single runs without variance estimates; the stochastic nature of RL training means results could vary substantially across random seeds."
    430     }
    431   ],
    432   "cited_papers": [
    433     {
    434       "title": "Universal Jailbreak Backdoors from Poisoned Human Feedback",
    435       "relevance": "Introduces the jailbreak backdoor attack used as the primary test case; defines the SUDO trigger threat model"
    436     },
    437     {
    438       "title": "Sleeper Agents: Training Deceptive LLMs that Persist Through Safety Training",
    439       "relevance": "Provides the sleeper agent backdoor attack and motivates why standard safety training fails on backdoored models"
    440     },
    441     {
    442       "title": "Tell Me About Yourself: LLMs Are Aware of Their Learned Behaviors",
    443       "relevance": "Establishes the baseline for LLM self-awareness and R-SFT approach; this paper directly extends and critiques its findings for smaller models"
    444     },
    445     {
    446       "title": "The Reversal Curse: LLMs Trained on 'A is B' Fail to Learn 'B is A'",
    447       "relevance": "Provides the theoretical grounding for why poisoned models lack self-awareness and why reversal training alone is insufficient"
    448     },
    449     {
    450       "title": "Universal and Transferable Adversarial Attacks on Aligned Language Models (GCG)",
    451       "relevance": "Gradient-based trigger inversion baseline compared against in the unlearning evaluation"
    452     },
    453     {
    454       "title": "BEEAR: Embedding-Based Adversarial Removal of Safety Backdoors in Instruction-Tuned LLMs",
    455       "relevance": "Key unlearning baseline; shows embedding-space inversion can achieve low ASR but causes severe utility degradation"
    456     },
    457     {
    458       "title": "Me, Myself, and AI: The Situational Awareness Dataset (SAD) for LLMs",
    459       "relevance": "Provides the broader framework for situational self-awareness in LLMs that motivates the backdoor self-awareness concept"
    460     },
    461     {
    462       "title": "DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models (GRPO)",
    463       "relevance": "Source of the GRPO optimization algorithm used as the RL backbone of the proposed training framework"
    464     }
    465   ],
    466   "engagement_factors": {
    467     "practical_relevance": {
    468       "score": 2,
    469       "justification": "Practitioners can use the framework defensively but it requires knowledge of attack type and significant compute (8×A100), limiting immediate deployment."
    470     },
    471     "surprise_contrarian": {
    472       "score": 2,
    473       "justification": "The abrupt phase-transition emergence of self-awareness and the counterintuitive finding that R-SFT alone fails for smaller models challenge naive assumptions from prior work."
    474     },
    475     "fear_safety": {
    476       "score": 3,
    477       "justification": "Demonstrates that backdoored LLMs can be made to bypass safety policies with simple triggers and that existing defenses largely fail, raising direct AI safety concerns."
    478     },
    479     "drama_conflict": {
    480       "score": 2,
    481       "justification": "The arms race between backdoor attacks and defenses in safety-aligned LLMs is an ongoing high-stakes conflict in AI security research."
    482     },
    483     "demo_ability": {
    484       "score": 1,
    485       "justification": "Code is released but requires fine-tuning 8B models with 8×A100 GPUs, making hands-on demonstration inaccessible to most practitioners."
    486     },
    487     "brand_recognition": {
    488       "score": 1,
    489       "justification": "Purdue University authors without affiliation to major AI labs; no famous products or widely-known models involved."
    490     }
    491   },
    492   "hn_data": {
    493     "threads": [
    494       {
    495         "hn_id": "37832599",
    496         "title": "HyperAttention: Long-Context Attention in Near-Linear Time",
    497         "points": 73,
    498         "comments": 13,
    499         "url": "https://news.ycombinator.com/item?id=37832599",
    500         "created_at": "2023-10-10T14:31:28Z"
    501       },
    502       {
    503         "hn_id": "33227427",
    504         "title": "Neural Networks Are Decision Trees",
    505         "points": 34,
    506         "comments": 9,
    507         "url": "https://news.ycombinator.com/item?id=33227427",
    508         "created_at": "2022-10-16T21:43:27Z"
    509       },
    510       {
    511         "hn_id": "28876487",
    512         "title": "Offline Reinforcement Learning with Implicit Q-Learning",
    513         "points": 12,
    514         "comments": 0,
    515         "url": "https://news.ycombinator.com/item?id=28876487",
    516         "created_at": "2021-10-15T11:05:12Z"
    517       },
    518       {
    519         "hn_id": "33232042",
    520         "title": "Neural Networks Are Decision Trees",
    521         "points": 4,
    522         "comments": 2,
    523         "url": "https://news.ycombinator.com/item?id=33232042",
    524         "created_at": "2022-10-17T11:18:16Z"
    525       },
    526       {
    527         "hn_id": "33200244",
    528         "title": "Neural Networks Are Decision Trees",
    529         "points": 4,
    530         "comments": 0,
    531         "url": "https://news.ycombinator.com/item?id=33200244",
    532         "created_at": "2022-10-14T06:28:28Z"
    533       },
    534       {
    535         "hn_id": "33192776",
    536         "title": "Neural Networks Are Decision Trees",
    537         "points": 3,
    538         "comments": 0,
    539         "url": "https://news.ycombinator.com/item?id=33192776",
    540         "created_at": "2022-10-13T15:57:00Z"
    541       },
    542       {
    543         "hn_id": "44594017",
    544         "title": "Ask HN : AI to Detect Counterfeit Adderall",
    545         "points": 2,
    546         "comments": 0,
    547         "url": "https://news.ycombinator.com/item?id=44594017",
    548         "created_at": "2025-07-17T14:47:39Z"
    549       },
    550       {
    551         "hn_id": "42021531",
    552         "title": "Understanding Warmup-Stable-Decay Learning Rates",
    553         "points": 1,
    554         "comments": 0,
    555         "url": "https://news.ycombinator.com/item?id=42021531",
    556         "created_at": "2024-11-01T21:02:29Z"
    557       }
    558     ],
    559     "top_points": 73,
    560     "total_points": 133,
    561     "total_comments": 24
    562   }
    563 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs