scan-v5.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan-v5.json (27685B)
      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "Layer-Aware Representation Filtering: Purifying Finetuning Data to Preserve LLM Safety Alignment",
      6     "authors": [
      7       "Hao Li",
      8       "Lijun Li",
      9       "Zhenghao Lu",
     10       "Xianyi Wei",
     11       "Rui Li"
     12     ],
     13     "year": 2025,
     14     "venue": "Conference on Empirical Methods in Natural Language Processing",
     15     "arxiv_id": "2507.18631",
     16     "doi": "10.48550/arXiv.2507.18631"
     17   },
     18   "checklist": {
     19     "claims_and_evidence": {
     20       "abstract_claims_supported": {
     21         "applies": true,
     22         "answer": true,
     23         "justification": "All abstract claims are substantiated: LARF's efficiency is demonstrated in Table 3 (0.5h, 1 GPU), effectiveness in Tables 1 and 5 (LARF achieves highest and lowest ASR on respective experiments), and mitigation of fine-tuning alignment degradation in Table 2.",
     24         "source": "haiku"
     25       },
     26       "causal_claims_justified": {
     27         "applies": true,
     28         "answer": true,
     29         "justification": "Causal claims ('removing safety-degrading data mitigates alignment degradation') are supported by controlled fine-tuning experiments comparing top vs. bottom ranked samples across 3 models and 2 datasets, with multiple safety benchmarks as outcomes.",
     30         "source": "haiku"
     31       },
     32       "generalization_bounded": {
     33         "applies": true,
     34         "answer": true,
     35         "justification": "The limitations section explicitly states the method has not been evaluated on VLMs or Diffusion Models, and experiments cover 6 models and 5 fine-tuning datasets, bounding the generalization scope.",
     36         "source": "haiku"
     37       },
     38       "alternative_explanations_discussed": {
     39         "applies": true,
     40         "answer": false,
     41         "justification": "The paper does not consider alternative explanations for why top-ranked samples degrade safety — e.g., that the effect may be purely driven by response length/style rather than safety-specific representational features, or that the reference dataset composition drives the results.",
     42         "source": "haiku"
     43       },
     44       "proxy_outcome_distinction": {
     45         "applies": true,
     46         "answer": false,
     47         "justification": "ASR (Attack Success Rate) is treated as equivalent to safety alignment throughout the paper without acknowledging it is a proxy; the paper does not discuss whether LlamaGuard-based ASR fully captures the construct of 'safety alignment.'",
     48         "source": "haiku"
     49       }
     50     },
     51     "limitations_and_scope": {
     52       "limitations_section_present": {
     53         "applies": true,
     54         "answer": true,
     55         "justification": "Section 6 is a dedicated Limitations section that discusses three specific constraints of the method.",
     56         "source": "haiku"
     57       },
     58       "threats_to_validity_specific": {
     59         "applies": true,
     60         "answer": true,
     61         "justification": "Threats are specific: (1) effectiveness is tied to reference dataset quality and composition, (2) data-only filtering cannot fully prevent degradation, (3) the method has not been tested on VLMs — these go beyond generic disclaimers.",
     62         "source": "haiku"
     63       },
     64       "scope_boundaries_stated": {
     65         "applies": true,
     66         "answer": true,
     67         "justification": "The paper explicitly states the method applies to LLMs but not VLMs or Diffusion Models, and that the filtering approach does not fully prevent safety degradation, providing clear scope boundaries.",
     68         "source": "haiku"
     69       }
     70     },
     71     "conflicts_of_interest": {
     72       "funding_disclosed": {
     73         "applies": true,
     74         "answer": false,
     75         "justification": "No funding acknowledgments or grant disclosures appear in the paper; only institutional affiliations are stated.",
     76         "source": "haiku"
     77       },
     78       "affiliations_disclosed": {
     79         "applies": true,
     80         "answer": true,
     81         "justification": "All five authors' affiliations are disclosed: Shanghai AI Laboratory, Beihang University, Wuhan University, and Peking University.",
     82         "source": "haiku"
     83       },
     84       "funder_independent_of_outcome": {
     85         "applies": true,
     86         "answer": false,
     87         "justification": "Funding is not disclosed, so independence from outcome cannot be verified; Shanghai AI Laboratory has institutional interests in LLM safety research.",
     88         "source": "haiku"
     89       },
     90       "financial_interests_declared": {
     91         "applies": true,
     92         "answer": false,
     93         "justification": "No competing interests statement, patent disclosures, or financial interest declarations appear in the paper.",
     94         "source": "haiku"
     95       }
     96     },
     97     "scope_and_framing": {
     98       "key_terms_defined": {
     99         "applies": true,
    100         "answer": true,
    101         "justification": "Key terms are defined: 'safety alignment' as the mechanism for rejecting harmful instructions, 'safety-degrading data' as benign samples that weaken rejection capability, and 'safety-sensitive layers' as layers whose scaling most affects refusal behavior.",
    102         "source": "haiku"
    103       },
    104       "intended_contribution_clear": {
    105         "applies": true,
    106         "answer": true,
    107         "justification": "Three contributions are explicitly listed: a principled filtering framework, state-of-the-art detection performance with specific numbers, and broad generalizability across downstream tasks.",
    108         "source": "haiku"
    109       },
    110       "engagement_with_prior_work": {
    111         "applies": true,
    112         "answer": true,
    113         "justification": "Related Work covers data attribution methods (GradSafe, LESS, Bi-Gradient, SEAL) and representation engineering (Zou et al., Arditi et al., Circuit Breaker), and the paper directly compares against these methods quantitatively.",
    114         "source": "haiku"
    115       }
    116     }
    117   },
    118   "type_checklist": {
    119     "empirical": {
    120       "artifacts": {
    121         "code_released": {
    122           "applies": true,
    123           "answer": true,
    124           "justification": "Code is released at https://github.com/LLLeoLi/LARF, referenced in the abstract.",
    125           "source": "haiku"
    126         },
    127         "data_released": {
    128           "applies": true,
    129           "answer": true,
    130           "justification": "All primary fine-tuning datasets (Alpaca, Dolly, Magicoder, PubMedQA, MetaMath) and safety benchmarks (HarmBench, HEx-PHI, DirectHarm4) are publicly available standard benchmarks.",
    131           "source": "haiku"
    132         },
    133         "environment_specified": {
    134           "applies": true,
    135           "answer": false,
    136           "justification": "The paper specifies GPU type (NVIDIA A100-SXM 80GB) and LoRA hyperparameters but provides no requirements.txt, Dockerfile, or software dependency list.",
    137           "source": "haiku"
    138         },
    139         "reproduction_instructions": {
    140           "applies": true,
    141           "answer": false,
    142           "justification": "Algorithm 1 describes the LARF procedure at a high level, but no step-by-step reproduction instructions are provided in the paper itself; readers must infer workflow from the GitHub repository.",
    143           "source": "haiku"
    144         }
    145       },
    146       "statistical_methodology": {
    147         "confidence_intervals_or_error_bars": {
    148           "applies": true,
    149           "answer": false,
    150           "justification": "The random baseline reports an average over 3 runs but no standard deviation or confidence intervals are reported for any main results in Tables 1, 2, 5.",
    151           "source": "haiku"
    152         },
    153         "significance_tests": {
    154           "applies": true,
    155           "answer": false,
    156           "justification": "No statistical significance tests are applied to any of the comparative results; all comparisons are point estimates.",
    157           "source": "haiku"
    158         },
    159         "effect_sizes_reported": {
    160           "applies": true,
    161           "answer": true,
    162           "justification": "Percentage improvements are reported with baseline context throughout (e.g., ASR rises from 3.5% to 39% with LARF's bottom-ranked data, a 20% improvement over Bi-Anchoring; downstream task performance stays within 1% of random baseline).",
    163           "source": "haiku"
    164         },
    165         "sample_size_justified": {
    166           "applies": true,
    167           "answer": false,
    168           "justification": "The choice of 1,000 samples for filtering experiments and 10,000 for downstream tasks is stated as following SEAL's setting but no power analysis or independent justification is provided.",
    169           "source": "haiku"
    170         },
    171         "variance_reported": {
    172           "applies": true,
    173           "answer": false,
    174           "justification": "Figure 6 shows variance bands for layer-wise similarity scores, but main comparative results in Tables 1, 2, and 5 are reported without variance or standard deviation.",
    175           "source": "haiku"
    176         }
    177       },
    178       "evaluation_design": {
    179         "baselines_included": {
    180           "applies": true,
    181           "answer": true,
    182           "justification": "Four baselines are included: Random sampling, SEAL, GradSafe, and Bi-Anchoring, compared across all models and datasets.",
    183           "source": "haiku"
    184         },
    185         "baselines_contemporary": {
    186           "applies": true,
    187           "answer": true,
    188           "justification": "All baselines are recent: Bi-Anchoring (2024), GradSafe (2024, ACL), and SEAL (2025, ICLR), representing the current state of the field.",
    189           "source": "haiku"
    190         },
    191         "ablation_study": {
    192           "applies": true,
    193           "answer": true,
    194           "justification": "Section 3.3 and Figure 3 compare bidirectional vs. unidirectional representation scoring as an ablation; Figure 5 ablates layer selection by testing all layers 11–31 for data filtering effectiveness.",
    195           "source": "haiku"
    196         },
    197         "multiple_metrics": {
    198           "applies": true,
    199           "answer": true,
    200           "justification": "The evaluation uses ASR across three safety benchmarks (DirectHarm4, HarmBench, HEx-PHI), GPT-4o harmfulness score, downstream task metrics (HumanEval pass@1, PubMedQA accuracy, MATH score), and computational efficiency metrics.",
    201           "source": "haiku"
    202         },
    203         "human_evaluation": {
    204           "applies": false,
    205           "answer": false,
    206           "justification": "Human evaluation is not applicable; automated evaluation using LlamaGuard and GPT-4o is standard and appropriate for this type of safety benchmark evaluation.",
    207           "source": "haiku"
    208         },
    209         "held_out_test_set": {
    210           "applies": true,
    211           "answer": true,
    212           "justification": "Fine-tuning datasets and safety evaluation benchmarks are entirely separate; the safety benchmarks (HarmBench, HEx-PHI, DirectHarm4) serve as held-out test sets not used during fine-tuning.",
    213           "source": "haiku"
    214         },
    215         "per_category_breakdown": {
    216           "applies": true,
    217           "answer": true,
    218           "justification": "Section 4.5 analyzes ASR changes per safety category, and Figures 19–21 provide radar chart breakdowns by category (malware, phishing, disinformation, etc.) for all three models.",
    219           "source": "haiku"
    220         },
    221         "failure_cases_discussed": {
    222           "applies": true,
    223           "answer": false,
    224           "justification": "The paper discusses limitations of competing methods but does not show or analyze specific cases where LARF fails to identify safety-degrading data or where filtering is insufficient.",
    225           "source": "haiku"
    226         },
    227         "negative_results_reported": {
    228           "applies": true,
    229           "answer": true,
    230           "justification": "Table 5 shows that even the bottom-ranked 1,000 samples (deemed safe by LARF) still produce non-zero ASR in some conditions, and the limitations section acknowledges data-only filtering cannot fully prevent degradation.",
    231           "source": "haiku"
    232         }
    233       },
    234       "setup_transparency": {
    235         "model_versions_specified": {
    236           "applies": true,
    237           "answer": true,
    238           "justification": "Exact model versions are specified: Llama3-8B-Instruct, Llama3.1-8B-Instruct, Qwen2.5-7B-Instruct, Mistral-v0.2, Phi-3-mini, with citations to their technical reports.",
    239           "source": "haiku"
    240         },
    241         "prompts_provided": {
    242           "applies": true,
    243           "answer": false,
    244           "justification": "The GPT-4o evaluation prompt is described only as 'a revised version of the one used by Qi et al.' without providing the actual prompt text; safety pattern detection uses partial examples ('I cannot', 'Sorry') but not the full pattern list.",
    245           "source": "haiku"
    246         },
    247         "hyperparameters_reported": {
    248           "applies": true,
    249           "answer": true,
    250           "justification": "Appendix C.5 reports LoRA rank=8, alpha=8, 3 epochs, batch size=8, learning rate=1e-4, warmup ratio=0.1, cosine scheduler; Appendix C.3 specifies temperature=0, do_sample=False, max_new_tokens=32.",
    251           "source": "haiku"
    252         },
    253         "scaffolding_described": {
    254           "applies": false,
    255           "answer": false,
    256           "justification": "No agentic scaffolding is used in this paper; the method operates directly on model layers and representations.",
    257           "source": "haiku"
    258         },
    259         "data_preprocessing_documented": {
    260           "applies": true,
    261           "answer": true,
    262           "justification": "Appendix C.1 describes overrejection dataset construction (110 instructions generated by Llama-3.1-8B-Lexi-Uncensored-V2 with filtering), and Appendix C.2 describes Dsafe/Dunsafe construction from Circuit Breaker training data across 20 harm categories.",
    263           "source": "haiku"
    264         }
    265       },
    266       "data_integrity": {
    267         "raw_data_available": {
    268           "applies": true,
    269           "answer": false,
    270           "justification": "Primary fine-tuning datasets are public, but the custom overrejection dataset Ds (110 instructions) and the curated reference sets Dsafe/Dunsafe are not explicitly stated to be released; the GitHub code may or may not include them.",
    271           "source": "haiku"
    272         },
    273         "data_collection_described": {
    274           "applies": true,
    275           "answer": true,
    276           "justification": "Appendices C.1 and C.2 describe the construction of the overrejection dataset and the Dsafe/Dunsafe reference sets in sufficient detail, including the source model, filtering procedure, and category selection.",
    277           "source": "haiku"
    278         },
    279         "recruitment_methods_described": {
    280           "applies": false,
    281           "answer": false,
    282           "justification": "No human participants are involved; datasets are constructed programmatically from existing corpora and benchmarks.",
    283           "source": "haiku"
    284         },
    285         "data_pipeline_documented": {
    286           "applies": true,
    287           "answer": true,
    288           "justification": "Algorithm 1 documents the full pipeline from layer identification through representation extraction and scoring; the appendices cover dataset construction, fine-tuning, and evaluation details.",
    289           "source": "haiku"
    290         }
    291       },
    292       "contamination": {
    293         "training_cutoff_stated": {
    294           "applies": true,
    295           "answer": false,
    296           "justification": "The paper evaluates fine-tuned models on safety benchmarks (HarmBench, HEx-PHI, DirectHarm4) but never states the training data cutoffs for any of the evaluated models.",
    297           "source": "haiku"
    298         },
    299         "train_test_overlap_discussed": {
    300           "applies": true,
    301           "answer": false,
    302           "justification": "No discussion of whether safety benchmark test cases (HarmBench, DirectHarm4 prompts) were present in the pre-training corpora of Llama3, Llama3.1, or Qwen2.5.",
    303           "source": "haiku"
    304         },
    305         "benchmark_contamination_addressed": {
    306           "applies": true,
    307           "answer": false,
    308           "justification": "The paper does not address whether HarmBench, HEx-PHI, or DirectHarm4 examples were available before the training cutoffs of the evaluated models, which could inflate baseline refusal rates.",
    309           "source": "haiku"
    310         }
    311       },
    312       "human_studies": {
    313         "pre_registered": {
    314           "applies": false,
    315           "answer": false,
    316           "justification": "No human participants in this study.",
    317           "source": "haiku"
    318         },
    319         "irb_or_ethics_approval": {
    320           "applies": false,
    321           "answer": false,
    322           "justification": "No human participants in this study.",
    323           "source": "haiku"
    324         },
    325         "demographics_reported": {
    326           "applies": false,
    327           "answer": false,
    328           "justification": "No human participants in this study.",
    329           "source": "haiku"
    330         },
    331         "inclusion_exclusion_criteria": {
    332           "applies": false,
    333           "answer": false,
    334           "justification": "No human participants in this study.",
    335           "source": "haiku"
    336         },
    337         "randomization_described": {
    338           "applies": false,
    339           "answer": false,
    340           "justification": "No human participants in this study.",
    341           "source": "haiku"
    342         },
    343         "blinding_described": {
    344           "applies": false,
    345           "answer": false,
    346           "justification": "No human participants in this study.",
    347           "source": "haiku"
    348         },
    349         "attrition_reported": {
    350           "applies": false,
    351           "answer": false,
    352           "justification": "No human participants in this study.",
    353           "source": "haiku"
    354         }
    355       },
    356       "cost_and_practicality": {
    357         "inference_cost_reported": {
    358           "applies": true,
    359           "answer": true,
    360           "justification": "Table 3 explicitly reports wall-clock runtime (0.5h for LARF vs. 3–6h for baselines) and per-GPU memory usage for all methods on the Alpaca dataset with Llama3.1.",
    361           "source": "haiku"
    362         },
    363         "compute_budget_stated": {
    364           "applies": true,
    365           "answer": true,
    366           "justification": "Table 3 reports GPU count and memory per GPU for each method; fine-tuning for downstream tasks specifies 4 GPUs with per-device batch size 8, and the hardware (NVIDIA A100-SXM 80GB) is identified.",
    367           "source": "haiku"
    368         }
    369       }
    370     }
    371   },
    372   "claims": [
    373     {
    374       "claim": "LARF identifies safety-sensitive layers (13th for Llama3/3.1, 18th for Qwen2.5) that mediate refusal behavior and can be pinpointed via parameter scaling.",
    375       "evidence": "Figures 4, 7–12 show layer-wise refusal response curves; the 13th layer of Llama3 has normalized change rate k=370, highest among all layers.",
    376       "supported": "strong"
    377     },
    378     {
    379       "claim": "Fine-tuning Llama3.1 on 1,000 top safety-degrading samples identified by LARF raises ASR on HarmBench from 3.5% to 39%, a 20% improvement over Bi-Anchoring.",
    380       "evidence": "Table 1 shows Llama3.1+Alpaca results: LARF achieves 39% ASR on HarmBench vs. 12.5% for Bi-Anchoring; baseline instruct model is 3.5%.",
    381       "supported": "strong"
    382     },
    383     {
    384       "claim": "Filtering out LARF's top-ranked 1,000 samples reduces ASR to near-zero without sacrificing downstream task performance.",
    385       "evidence": "Table 5 shows near-zero ASR (e.g., 0% HarmBench for Llama3/Llama3.1 on Alpaca); Table 2 shows downstream task performance within 1% of random baseline.",
    386       "supported": "strong"
    387     },
    388     {
    389       "claim": "LARF is substantially more computationally efficient than competing methods, requiring only 0.5h and 1 GPU vs. 3–6h and 4–8 GPUs for baselines.",
    390       "evidence": "Table 3 directly compares wall-clock time and GPU resources: LARF 0.5h/1 GPU/18.4GB vs. SEAL 6h/8 GPUs/36GB.",
    391       "supported": "strong"
    392     },
    393     {
    394       "claim": "Safety-degrading samples are characterized by long, point-by-point responses that exceed the dataset average in both count and token length.",
    395       "evidence": "Table 4 shows top-ranked samples have 516–872 point-style responses vs. dataset mean of 276 for Llama3 on Alpaca; average output tokens 349–354 vs. mean 138.",
    396       "supported": "moderate"
    397     },
    398     {
    399       "claim": "Bidirectional representation similarity (using both safe and unsafe reference representations) outperforms unidirectional similarity for safety-degrading data selection.",
    400       "evidence": "Figure 3 shows bidirectional method (Orig) achieves higher ASR on bottom-ranked samples and lower ASR on top-ranked samples compared to unidirectional (Unsafe) across 3 benchmarks.",
    401       "supported": "moderate"
    402     }
    403   ],
    404   "methodology_tags": [
    405     "benchmark-eval",
    406     "empirical"
    407   ],
    408   "key_findings": "LARF identifies safety-sensitive layers in LLMs (13th layer for Llama3/3.1) via parameter scaling and uses bidirectional representation similarity at those layers to detect and rank safety-degrading samples in benign fine-tuning corpora. Filtering the top-ranked 1,000 safety-degrading samples from Alpaca or Dolly reduces post-fine-tuning ASR to near-zero across three safety benchmarks and three models, while maintaining downstream task performance within 1% of random baseline. LARF operates without gradient computation or auxiliary model training, requiring only 0.5 hours on a single GPU versus 3–6 hours on 4–8 GPUs for competing methods. Safety-degrading examples are empirically characterized by unusually long, point-by-point responses that disrupt the model's inherent refusal-style safety mechanism.",
    409   "red_flags": [
    410     {
    411       "flag": "ASR proxy validity unexamined",
    412       "detail": "LlamaGuard-based Attack Success Rate is used as a direct measure of 'safety alignment' without validating whether ASR correlates with actual harm or human judgment of safety."
    413     },
    414     {
    415       "flag": "No statistical testing",
    416       "detail": "All comparative results in Tables 1, 2, and 5 are point estimates; no significance tests, confidence intervals, or p-values are reported despite comparative claims."
    417     },
    418     {
    419       "flag": "Tiny reference datasets",
    420       "detail": "Dsafe and Dunsafe each contain only 100 examples (5 per category × 20 categories), raising concerns about representativeness of the reference distribution."
    421     },
    422     {
    423       "flag": "No funding disclosure",
    424       "detail": "Authors from Shanghai AI Laboratory and multiple Chinese universities provide no funding acknowledgment or competing interests statement."
    425     },
    426     {
    427       "flag": "Potential circularity in layer identification",
    428       "detail": "The overrejection dataset used to identify safety-sensitive layers is constructed from the same distribution of harmful categories as the Dsafe/Dunsafe reference sets used for filtering, potentially inflating apparent layer specificity."
    429     }
    430   ],
    431   "cited_papers": [
    432     {
    433       "title": "Fine-tuning aligned language models compromises safety, even when users do not intend to!",
    434       "relevance": "Foundational motivation: demonstrates that fine-tuning on benign data degrades safety alignment, establishing the core problem this paper addresses."
    435     },
    436     {
    437       "title": "What is in your safe data? Identifying benign data that breaks safety (Bi-Anchoring)",
    438       "relevance": "Primary baseline and closest prior work; identifies safety-degrading benign data via gradient similarity, directly compared in Tables 1, 2, 5."
    439     },
    440     {
    441       "title": "SEAL: Safety-enhanced aligned LLM fine-tuning via bilevel data selection",
    442       "relevance": "Primary baseline; trains a dedicated data ranker via bilevel optimization to identify safe fine-tuning data, directly compared throughout."
    443     },
    444     {
    445       "title": "GradSafe: Detecting jailbreak prompts for LLMs via safety-critical gradient analysis",
    446       "relevance": "Primary baseline; uses safety-critical gradients to classify unsafe instructions, directly compared in all experiments."
    447     },
    448     {
    449       "title": "Refusal in language models is mediated by a single direction",
    450       "relevance": "Representation engineering foundation showing that refusal behavior has a specific directional structure in representation space, motivating LARF's layer-based approach."
    451     },
    452     {
    453       "title": "Representation engineering: A top-down approach to AI transparency",
    454       "relevance": "Foundational work on representation-based analysis of model behavior, providing theoretical grounding for LARF's use of intermediate representations."
    455     },
    456     {
    457       "title": "Improving alignment and robustness with circuit breakers",
    458       "relevance": "Demonstrates that rerouting representations can defend against adversarial attacks, supporting the validity of representation-space approaches to safety."
    459     },
    460     {
    461       "title": "Safety layers in aligned large language models: The key to LLM security",
    462       "relevance": "Directly informs LARF's methodology: the approach to identifying safety-sensitive layers via scaling follows this work (cited as Li et al., 2025c)."
    463     }
    464   ],
    465   "engagement_factors": {
    466     "practical_relevance": {
    467       "score": 3,
    468       "justification": "Directly deployable as a pre-deployment audit tool for anyone fine-tuning LLMs, with code released and showing 6-12x compute efficiency vs. alternatives."
    469     },
    470     "surprise_contrarian": {
    471       "score": 1,
    472       "justification": "The core finding (benign data can degrade safety) is already established; the representation-based solution is novel but builds incrementally on prior work."
    473     },
    474     "fear_safety": {
    475       "score": 3,
    476       "justification": "Directly addresses a high-stakes failure mode: safety alignment can be silently compromised even when fine-tuning on benign corporate/open-source datasets."
    477     },
    478     "drama_conflict": {
    479       "score": 1,
    480       "justification": "Positioned against existing methods (SEAL, Bi-Anchoring) showing they fail in specific scenarios, but framed as a technical comparison rather than controversy."
    481     },
    482     "demo_ability": {
    483       "score": 2,
    484       "justification": "Code is on GitHub; someone with access to Llama3 and appropriate GPU memory could run the pipeline, though it requires 18.4GB GPU memory which limits accessibility."
    485     },
    486     "brand_recognition": {
    487       "score": 1,
    488       "justification": "Shanghai AI Laboratory is prominent in China but not a globally recognized brand like DeepMind, OpenAI, or Google; no famous product association."
    489     }
    490   },
    491   "hn_data": {
    492     "threads": [
    493       {
    494         "hn_id": "44985278",
    495         "title": "Making LLMs Cheaper and Better via Performance-Efficiency Optimized Routing",
    496         "points": 130,
    497         "comments": 28,
    498         "url": "https://news.ycombinator.com/item?id=44985278"
    499       },
    500       {
    501         "hn_id": "43819670",
    502         "title": "LinPrim: Linear Primitives for Differentiable Volumetric Rendering",
    503         "points": 3,
    504         "comments": 0,
    505         "url": "https://news.ycombinator.com/item?id=43819670"
    506       },
    507       {
    508         "hn_id": "41059683",
    509         "title": "MOMAland: Benchmarks for Multi-Objective Multi-Agent Reinforcement Learning",
    510         "points": 3,
    511         "comments": 0,
    512         "url": "https://news.ycombinator.com/item?id=41059683"
    513       },
    514       {
    515         "hn_id": "44943341",
    516         "title": "Eyes Will Shut: A Vision-Based Next GPS Location Prediction Model",
    517         "points": 2,
    518         "comments": 0,
    519         "url": "https://news.ycombinator.com/item?id=44943341"
    520       },
    521       {
    522         "hn_id": "42920203",
    523         "title": "A Comprehensive Survey of the Lean 4 Theorem Prover",
    524         "points": 1,
    525         "comments": 0,
    526         "url": "https://news.ycombinator.com/item?id=42920203"
    527       }
    528     ],
    529     "top_points": 130,
    530     "total_points": 139,
    531     "total_comments": 28
    532   }
    533 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs