scan-v5.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan-v5.json (28040B)
      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "LLMs as Zero-shot Graph Learners: Alignment of GNN Representations with LLM Token Embeddings",
      6     "authors": [
      7       "Duo Wang",
      8       "Yuan Zuo",
      9       "Fengzhi Li",
     10       "Junjie Wu"
     11     ],
     12     "year": 2024,
     13     "venue": "Neural Information Processing Systems",
     14     "arxiv_id": "2408.14512",
     15     "doi": "10.48550/arXiv.2408.14512"
     16   },
     17   "checklist": {
     18     "claims_and_evidence": {
     19       "abstract_claims_supported": {
     20         "applies": true,
     21         "answer": true,
     22         "justification": "All abstract claims are supported: SOTA zero-shot performance on unseen datasets is demonstrated in Tables 1 and 2, the cross-task transfer claim is validated in Section 3.3, and code is released at GitHub as stated.",
     23         "source": "haiku"
     24       },
     25       "causal_claims_justified": {
     26         "applies": true,
     27         "answer": true,
     28         "justification": "Ablation study in Section 3.4 systematically removes feature-wise contrastive learning (w/o FC) and graph token embeddings (w/o GT) to support causal claims about each component's contribution to zero-shot generalization.",
     29         "source": "haiku"
     30       },
     31       "generalization_bounded": {
     32         "applies": true,
     33         "answer": false,
     34         "justification": "The title 'LLMs as Zero-shot Graph Learners' is broad, but experiments only cover node classification and link prediction on two domains; graph-level tasks are explicitly untested, and other graph types or domains are not evaluated.",
     35         "source": "haiku"
     36       },
     37       "alternative_explanations_discussed": {
     38         "applies": true,
     39         "answer": false,
     40         "justification": "The paper does not discuss whether gains could be attributed to stronger BERT-initialized node features shared uniformly, the specific Vicuna-7B backbone size advantage, or confounds in dataset selection rather than the proposed alignment mechanism.",
     41         "source": "haiku"
     42       },
     43       "proxy_outcome_distinction": {
     44         "applies": true,
     45         "answer": true,
     46         "justification": "The paper measures accuracy/Macro F1 for node classification and AUC for link prediction, which directly match the claimed tasks without proxy substitution.",
     47         "source": "haiku"
     48       }
     49     },
     50     "limitations_and_scope": {
     51       "limitations_section_present": {
     52         "applies": true,
     53         "answer": true,
     54         "justification": "Section 5 'Limitations' is a dedicated section, though it contains only one sentence about graph-level tasks not being experimentally validated.",
     55         "source": "haiku"
     56       },
     57       "threats_to_validity_specific": {
     58         "applies": true,
     59         "answer": false,
     60         "justification": "The limitations section contains a single generic statement about graph-level tasks; no specific threats such as dataset selection bias, LLM contamination on citation graphs, or sensitivity to BERT initialization are discussed.",
     61         "source": "haiku"
     62       },
     63       "scope_boundaries_stated": {
     64         "applies": true,
     65         "answer": false,
     66         "justification": "The only explicit boundary is the absence of graph-level task experiments; no bounds on domain generalizability, graph scale, or evaluation settings are stated.",
     67         "source": "haiku"
     68       }
     69     },
     70     "conflicts_of_interest": {
     71       "funding_disclosed": {
     72         "applies": true,
     73         "answer": true,
     74         "justification": "The Acknowledgement section lists specific grants: National Key R&D Program of China (2023YFC3304700), NSFC grants (71901012, 72242101, 72031001), and Beijing Universities Outstanding Young Scientist Program.",
     75         "source": "haiku"
     76       },
     77       "affiliations_disclosed": {
     78         "applies": true,
     79         "answer": true,
     80         "justification": "All four authors are identified as affiliated with the MIIT Key Laboratory of Data Intelligence and Management, Beihang University, with institutional email addresses.",
     81         "source": "haiku"
     82       },
     83       "funder_independent_of_outcome": {
     84         "applies": true,
     85         "answer": true,
     86         "justification": "All funders are Chinese government agencies (MOST, NSFC, Beijing Universities program) with no financial stake in the TEA-GLM framework's performance.",
     87         "source": "haiku"
     88       },
     89       "financial_interests_declared": {
     90         "applies": true,
     91         "answer": false,
     92         "justification": "No competing interests statement is provided; the paper only acknowledges grants without explicitly declaring absence of financial or competing interests.",
     93         "source": "haiku"
     94       }
     95     },
     96     "scope_and_framing": {
     97       "key_terms_defined": {
     98         "applies": true,
     99         "answer": true,
    100         "justification": "'Zero-shot' is precisely defined as cross-dataset and cross-task transfer without task-specific fine-tuning; 'token embedding alignment' is formalized mathematically via PCA projection in Section 2.2.2.",
    101         "source": "haiku"
    102       },
    103       "intended_contribution_clear": {
    104         "applies": true,
    105         "answer": true,
    106         "justification": "Three specific contributions are explicitly enumerated at the end of the Introduction: the TEA-GLM framework, the linear projector with unified instruction design, and experimental demonstration of SOTA performance.",
    107         "source": "haiku"
    108       },
    109       "engagement_with_prior_work": {
    110         "applies": true,
    111         "answer": true,
    112         "justification": "Section 4 provides structured related work covering GNNs, self-supervised and prompt-tuning approaches, and LLMs for graphs; the paper explicitly positions itself against GraphGPT, LLaGA, OFA, and the analogous TEST method for time series.",
    113         "source": "haiku"
    114       }
    115     }
    116   },
    117   "type_checklist": {
    118     "empirical": {
    119       "artifacts": {
    120         "code_released": {
    121           "applies": true,
    122           "answer": true,
    123           "justification": "Code is released at https://github.com/W-rudder/TEA-GLM as stated in the abstract.",
    124           "source": "haiku"
    125         },
    126         "data_released": {
    127           "applies": true,
    128           "answer": true,
    129           "justification": "All 8 datasets are standard public benchmarks: citation networks from OGB and related sources (Arxiv, Pubmed, Cora) and TAG benchmark (Children, History, Computer, Photo, Sports), unmodified and publicly available.",
    130           "source": "haiku"
    131         },
    132         "environment_specified": {
    133           "applies": true,
    134           "answer": false,
    135           "justification": "Only hardware is specified (2×A100 80GB, CUDA 11.7); no requirements.txt, Dockerfile, or full software dependency specification is provided.",
    136           "source": "haiku"
    137         },
    138         "reproduction_instructions": {
    139           "applies": true,
    140           "answer": false,
    141           "justification": "No step-by-step reproduction instructions appear in the paper; only high-level hyperparameter settings are reported without an explicit reproducibility guide pointing to specific scripts.",
    142           "source": "haiku"
    143         }
    144       },
    145       "statistical_methodology": {
    146         "confidence_intervals_or_error_bars": {
    147           "applies": true,
    148           "answer": true,
    149           "justification": "Tables 1, 2, 5, and 6 report mean ± standard deviation across 5 random seeds for all methods (e.g., TEA-GLM 0.848±0.010 on Pubmed accuracy).",
    150           "source": "haiku"
    151         },
    152         "significance_tests": {
    153           "applies": true,
    154           "answer": false,
    155           "justification": "No statistical significance tests are conducted despite comparative claims; only means and standard deviations are reported, leaving it unclear whether reported improvements are statistically significant.",
    156           "source": "haiku"
    157         },
    158         "effect_sizes_reported": {
    159           "applies": true,
    160           "answer": false,
    161           "justification": "No formal effect size metrics or percentage improvement summaries are reported; raw numbers can be compared but no standardized effect sizes are calculated.",
    162           "source": "haiku"
    163         },
    164         "sample_size_justified": {
    165           "applies": true,
    166           "answer": false,
    167           "justification": "5 random seeds (0-4) are used for variance estimation without justification or power analysis for why this number is sufficient.",
    168           "source": "haiku"
    169         },
    170         "variance_reported": {
    171           "applies": true,
    172           "answer": true,
    173           "justification": "Standard deviations are consistently reported across all main tables (Tables 1, 2, 5, 6) for all evaluated methods.",
    174           "source": "haiku"
    175         }
    176       },
    177       "evaluation_design": {
    178         "baselines_included": {
    179           "applies": true,
    180           "answer": true,
    181           "justification": "Six categories of baselines: MLP, supervised GNNs (GCN, GraphSAGE, GAT), self-supervised (DGI), knowledge distillation (GKD, GLNN), graph transformers (NodeFormer, DIFFormer), and LLM-based methods (OFA, Vicuna-7B, GraphGPT, LLaGA).",
    182           "source": "haiku"
    183         },
    184         "baselines_contemporary": {
    185           "applies": true,
    186           "answer": true,
    187           "justification": "Contemporary LLM-based baselines include LLaGA (ICML 2024), OFA (ICLR 2024), and GraphGPT (2023), covering the most recent competing methods in the zero-shot graph learning space.",
    188           "source": "haiku"
    189         },
    190         "ablation_study": {
    191           "applies": true,
    192           "answer": true,
    193           "justification": "Section 3.4 ablates two key components: feature-wise contrastive learning (w/o FC) and graph token embeddings (w/o GT), testing on both cross-dataset and cross-task evaluations.",
    194           "source": "haiku"
    195         },
    196         "multiple_metrics": {
    197           "applies": true,
    198           "answer": true,
    199           "justification": "Three distinct metrics are used: Accuracy and Macro F1 for node classification (Tables 1, 5), and AUC for link prediction (Table 2).",
    200           "source": "haiku"
    201         },
    202         "human_evaluation": {
    203           "applies": false,
    204           "answer": false,
    205           "justification": "Node classification and link prediction on graph benchmarks do not require human evaluation of system outputs.",
    206           "source": "haiku"
    207         },
    208         "held_out_test_set": {
    209           "applies": true,
    210           "answer": true,
    211           "justification": "Data splits follow established procedures from GraphGPT (citation) and TAG benchmark (e-commerce), with models evaluated on test sets from datasets not used in training.",
    212           "source": "haiku"
    213         },
    214         "per_category_breakdown": {
    215           "applies": true,
    216           "answer": true,
    217           "justification": "Results are broken down per dataset (8 datasets across 2 domains) and per task type (node classification, link prediction), allowing detailed comparison.",
    218           "source": "haiku"
    219         },
    220         "failure_cases_discussed": {
    221           "applies": true,
    222           "answer": true,
    223           "justification": "Section 3.3 explicitly notes TEA-GLM does not outperform on the Sports dataset; Table 6 shows TEA-GLM underperforms LLaGA on supervised training data (0.655 vs 0.749 Acc on Arxiv), constituting acknowledged failure cases.",
    224           "source": "haiku"
    225         },
    226         "negative_results_reported": {
    227           "applies": true,
    228           "answer": true,
    229           "justification": "The paper reports that TEA-GLM trades off supervised performance (Table 6) for generalization, and explicitly notes the Sports exception; the ablation also shows slightly better training-set performance without feature-wise contrastive learning.",
    230           "source": "haiku"
    231         }
    232       },
    233       "setup_transparency": {
    234         "model_versions_specified": {
    235           "applies": true,
    236           "answer": true,
    237           "justification": "Specific model versions are stated: Vicuna-7B-v1.5 as the LLM backbone, GraphSAGE as GNN encoder, and BERT (Devlin et al. 2019) for node feature generation.",
    238           "source": "haiku"
    239         },
    240         "prompts_provided": {
    241           "applies": true,
    242           "answer": true,
    243           "justification": "Appendix D provides the complete instructions for node classification and link prediction with all placeholder notation, and the paper provides full task description templates.",
    244           "source": "haiku"
    245         },
    246         "hyperparameters_reported": {
    247           "applies": true,
    248           "answer": true,
    249           "justification": "GNN training: 2 layers, batch 512, 60 epochs, LR 2×10^-2; projector: batch 2/GPU, 1 epoch, LR 1×10^-3; parameter sensitivity for K (graph tokens) and P (PCA components) analyzed in Appendix C. Temperature τ value is not specified.",
    250           "source": "haiku"
    251         },
    252         "scaffolding_described": {
    253           "applies": true,
    254           "answer": true,
    255           "justification": "The full pipeline is described: GNN contrastive pretraining, linear projector training on task instructions, and inference with frozen LLM receiving graph token embeddings via unified instruction templates.",
    256           "source": "haiku"
    257         },
    258         "data_preprocessing_documented": {
    259           "applies": true,
    260           "answer": true,
    261           "justification": "Node feature generation via pretrained BERT is described; graph augmentation (RE: edge removal, MF: feature masking) is formalized in Equations 1-2; data splits follow documented benchmark procedures.",
    262           "source": "haiku"
    263         }
    264       },
    265       "data_integrity": {
    266         "raw_data_available": {
    267           "applies": true,
    268           "answer": true,
    269           "justification": "All datasets are publicly available standard benchmarks (Open Graph Benchmark, TAG benchmark) that can be independently accessed and verified.",
    270           "source": "haiku"
    271         },
    272         "data_collection_described": {
    273           "applies": true,
    274           "answer": true,
    275           "justification": "Appendix A describes each dataset's origin, domain, node/edge/class counts, and citation networks for all 8 datasets used in experiments.",
    276           "source": "haiku"
    277         },
    278         "recruitment_methods_described": {
    279           "applies": false,
    280           "answer": false,
    281           "justification": "No human participants; all data comes from standard graph benchmark datasets.",
    282           "source": "haiku"
    283         },
    284         "data_pipeline_documented": {
    285           "applies": true,
    286           "answer": true,
    287           "justification": "Full pipeline documented: raw graph → BERT node feature encoding → contrastive GNN pretraining → linear projector training → evaluation using benchmark data splits.",
    288           "source": "haiku"
    289         }
    290       },
    291       "contamination": {
    292         "training_cutoff_stated": {
    293           "applies": true,
    294           "answer": false,
    295           "justification": "Vicuna-7B-v1.5's training data cutoff is not stated; this is relevant since the Arxiv citation network dataset contains CS papers that Vicuna could have memorized during pretraining.",
    296           "source": "haiku"
    297         },
    298         "train_test_overlap_discussed": {
    299           "applies": true,
    300           "answer": false,
    301           "justification": "Potential overlap between Vicuna-7B's pretraining corpus and the content of Arxiv/Pubmed papers used as graph nodes is not discussed, despite being a meaningful confound for the zero-shot evaluation.",
    302           "source": "haiku"
    303         },
    304         "benchmark_contamination_addressed": {
    305           "applies": true,
    306           "answer": false,
    307           "justification": "The standard citation network benchmarks (Arxiv, Pubmed, Cora) contain papers that LLMs were likely trained on; no contamination analysis is provided.",
    308           "source": "haiku"
    309         }
    310       },
    311       "human_studies": {
    312         "pre_registered": {
    313           "applies": false,
    314           "answer": false,
    315           "justification": "No human participants in this study.",
    316           "source": "haiku"
    317         },
    318         "irb_or_ethics_approval": {
    319           "applies": false,
    320           "answer": false,
    321           "justification": "No human participants in this study.",
    322           "source": "haiku"
    323         },
    324         "demographics_reported": {
    325           "applies": false,
    326           "answer": false,
    327           "justification": "No human participants in this study.",
    328           "source": "haiku"
    329         },
    330         "inclusion_exclusion_criteria": {
    331           "applies": false,
    332           "answer": false,
    333           "justification": "No human participants in this study.",
    334           "source": "haiku"
    335         },
    336         "randomization_described": {
    337           "applies": false,
    338           "answer": false,
    339           "justification": "No human participants in this study.",
    340           "source": "haiku"
    341         },
    342         "blinding_described": {
    343           "applies": false,
    344           "answer": false,
    345           "justification": "No human participants in this study.",
    346           "source": "haiku"
    347         },
    348         "attrition_reported": {
    349           "applies": false,
    350           "answer": false,
    351           "justification": "No human participants in this study.",
    352           "source": "haiku"
    353         }
    354       },
    355       "cost_and_practicality": {
    356         "inference_cost_reported": {
    357           "applies": true,
    358           "answer": false,
    359           "justification": "Hardware specs (2×A100 80GB) are mentioned but no inference latency, throughput, or per-sample cost estimates are provided.",
    360           "source": "haiku"
    361         },
    362         "compute_budget_stated": {
    363           "applies": true,
    364           "answer": false,
    365           "justification": "GPU model and count are mentioned but total GPU-hours for pretraining, projector training, or full experimental runs are not reported.",
    366           "source": "haiku"
    367         }
    368       }
    369     }
    370   },
    371   "claims": [
    372     {
    373       "claim": "TEA-GLM achieves state-of-the-art zero-shot accuracy on cross-dataset node classification across citation and e-commerce domains.",
    374       "evidence": "Table 1 shows TEA-GLM accuracy of 0.848±0.010 on Pubmed and 0.528±0.058 on History, outperforming all baselines including the next-best LLaGA (0.793 and 0.146 respectively).",
    375       "supported": "strong"
    376     },
    377     {
    378       "claim": "Feature-wise contrastive learning with LLM token embeddings (via PCA) is critical for cross-task generalization.",
    379       "evidence": "Ablation in Figure 2b shows removing feature-wise contrastive learning substantially degrades link prediction AUC on unseen tasks, while performance on seen training datasets slightly improves.",
    380       "supported": "moderate"
    381     },
    382     {
    383       "claim": "A linear projector without LLM fine-tuning is sufficient for effective graph-to-token mapping when representations are pre-aligned.",
    384       "evidence": "The model achieves SOTA using only a linear layer (Equation 9) with frozen LLM; the ablation shows graph token embeddings (w/o GT) matter but does not test non-linear projector alternatives.",
    385       "supported": "moderate"
    386     },
    387     {
    388       "claim": "Using only paper titles (not abstracts) as text input is sufficient and improves performance.",
    389       "evidence": "Authors cite [18] for this claim rather than conducting their own ablation comparing title-only vs title+abstract input, leaving this key design choice empirically unsupported within the paper.",
    390       "supported": "weak"
    391     },
    392     {
    393       "claim": "TEA-GLM achieves superior cross-task link prediction AUC compared to all baselines on most datasets.",
    394       "evidence": "Table 2 shows TEA-GLM leads on 7/8 datasets (e.g., Arxiv 0.657 vs GraphGPT-std 0.649, Pubmed 0.689 vs GraphGPT-std 0.501); the Sports exception is explicitly acknowledged.",
    395       "supported": "strong"
    396     },
    397     {
    398       "claim": "LLM-backbone methods consistently outperform GNN-only methods on cross-dataset zero-shot transfer.",
    399       "evidence": "Table 1 shows the best GNN method (GLNN 0.390 on Pubmed) is substantially outperformed by Vicuna-7B-v1.5 (0.719) across all datasets, establishing the LLM advantage for zero-shot transfer.",
    400       "supported": "strong"
    401     }
    402   ],
    403   "methodology_tags": [
    404     "benchmark-eval"
    405   ],
    406   "key_findings": "TEA-GLM aligns GNN node representations with LLM token embeddings using PCA-guided feature-wise contrastive learning, enabling zero-shot transfer across datasets and tasks without LLM fine-tuning. The method achieves SOTA on cross-dataset node classification (e.g., 0.848 on Pubmed vs. 0.793 for LLaGA, about +7% relative) and cross-task link prediction on 7/8 datasets. Ablation confirms both the feature-wise contrastive objective and graph token embedding mechanism are necessary for generalization. The approach demonstrates that representation pre-alignment reduces the complexity required at inference time to a single linear projector, trading supervised learning performance for substantially better zero-shot transfer.",
    407   "red_flags": [
    408     {
    409       "flag": "No significance testing",
    410       "detail": "Despite comparative claims across 14+ baselines and 8 datasets, no statistical significance tests are conducted; reporting only mean/std over 5 random seeds is insufficient to establish the statistical reliability of improvements."
    411     },
    412     {
    413       "flag": "LLM contamination unaddressed",
    414       "detail": "Vicuna-7B-v1.5 could have memorized content from Arxiv, Pubmed, and Cora papers used as graph nodes; the training cutoff is unstated and no analysis of whether improvements reflect graph structure vs. LLM memorization is provided."
    415     },
    416     {
    417       "flag": "Title-only design choice unjustified",
    418       "detail": "The claim that using paper titles rather than abstracts improves performance is cited from prior work without the authors conducting their own ablation — a key architectural decision is left empirically unvalidated."
    419     },
    420     {
    421       "flag": "Temperature hyperparameter unreported",
    422       "detail": "The contrastive loss temperature τ (Equations 4 and 6) is never assigned a specific numerical value in the paper, making exact reproduction of the pretraining phase impossible."
    423     },
    424     {
    425       "flag": "Minimal limitations",
    426       "detail": "The limitations section is a single sentence noting graph-level tasks were not tested; domain generalizability, computational requirements for practitioners, and sensitivity to LLM backbone choice are all unexplored."
    427     }
    428   ],
    429   "cited_papers": [
    430     {
    431       "title": "GraphGPT: Graph Instruction Tuning for Large Language Models",
    432       "relevance": "Direct baseline for zero-shot graph learning using LLMs with two-stage instruction tuning; key comparison target in Tables 1 and 2"
    433     },
    434     {
    435       "title": "LLaGA: Large Language and Graph Assistant",
    436       "relevance": "Contemporary baseline translating graph data directly to LLM sequences without GNN; TEA-GLM's primary comparison for cross-dataset generalization"
    437     },
    438     {
    439       "title": "One for All: Towards Training One Graph Model for All Classification Tasks (OFA)",
    440       "relevance": "Cross-domain and cross-task graph learning framework showing negative transfer on unseen tasks, directly contrasted with TEA-GLM's approach"
    441     },
    442     {
    443       "title": "TEST: Text Prototype Aligned Embedding to Activate LLM's Ability for Time Series",
    444       "relevance": "Analogous alignment approach for time series representations; TEA-GLM explicitly distinguishes its PCA-based approach from TEST's method"
    445     },
    446     {
    447       "title": "Can LLMs Effectively Leverage Graph Structural Information: When and Why",
    448       "relevance": "Prior work motivating TEA-GLM's title-only text design and establishing that LLMs benefit from structural information when text is insufficient"
    449     },
    450     {
    451       "title": "Deep Graph Infomax",
    452       "relevance": "Classic self-supervised graph learning baseline using mutual information maximization; included in comparative evaluation"
    453     },
    454     {
    455       "title": "Inductive Representation Learning on Large Graphs (GraphSAGE)",
    456       "relevance": "GNN architecture used as TEA-GLM's graph encoder backbone; also a supervised baseline in experiments"
    457     },
    458     {
    459       "title": "A Comprehensive Study on Text-Attributed Graphs: Benchmarking and Rethinking (TAG)",
    460       "relevance": "Provides the e-commerce benchmark datasets and data split scripts used in TEA-GLM's cross-domain experiments"
    461     }
    462   ],
    463   "engagement_factors": {
    464     "practical_relevance": {
    465       "score": 2,
    466       "justification": "Addresses real zero-shot graph learning needs with released code, but requires A100 GPUs and multi-stage setup that limits immediate practitioner adoption."
    467     },
    468     "surprise_contrarian": {
    469       "score": 1,
    470       "justification": "PCA-based alignment is a novel technical angle but the overall direction of combining GNNs with LLMs for zero-shot transfer is expected; no conventional wisdom is strongly challenged."
    471     },
    472     "fear_safety": {
    473       "score": 0,
    474       "justification": "Graph node classification and link prediction research raises no AI safety concerns."
    475     },
    476     "drama_conflict": {
    477       "score": 0,
    478       "justification": "Standard technical contribution paper with positive results and no controversy or strong claims against prior work."
    479     },
    480     "demo_ability": {
    481       "score": 2,
    482       "justification": "Code released on GitHub using publicly available datasets; the zero-shot graph learning system is reproducible by others with sufficient compute (A100 GPUs)."
    483     },
    484     "brand_recognition": {
    485       "score": 0,
    486       "justification": "Work from Beihang University without dominant brand recognition in the LLM or graph learning space."
    487     }
    488   },
    489   "hn_data": {
    490     "threads": [
    491       {
    492         "hn_id": "41750763",
    493         "title": "Efficient and Effective Model Extraction",
    494         "points": 5,
    495         "comments": 0,
    496         "url": "https://news.ycombinator.com/item?id=41750763"
    497       },
    498       {
    499         "hn_id": "40191085",
    500         "title": "Efficiently Serving Large Language Models Through FP6-Centric Algorithm-System",
    501         "points": 5,
    502         "comments": 0,
    503         "url": "https://news.ycombinator.com/item?id=40191085"
    504       },
    505       {
    506         "hn_id": "45062761",
    507         "title": "AiXiv: A Platform for AI Researchers",
    508         "points": 4,
    509         "comments": 2,
    510         "url": "https://news.ycombinator.com/item?id=45062761"
    511       },
    512       {
    513         "hn_id": "45903790",
    514         "title": "A structural pattern for Legible Modular software",
    515         "points": 3,
    516         "comments": 1,
    517         "url": "https://news.ycombinator.com/item?id=45903790"
    518       },
    519       {
    520         "hn_id": "39524762",
    521         "title": "An expert system for diagnosing and treating heart disease",
    522         "points": 2,
    523         "comments": 0,
    524         "url": "https://news.ycombinator.com/item?id=39524762"
    525       },
    526       {
    527         "hn_id": "45944536",
    528         "title": "What You See Is What It Does: A Structural Pattern for Legible Software Onward!",
    529         "points": 1,
    530         "comments": 1,
    531         "url": "https://news.ycombinator.com/item?id=45944536"
    532       },
    533       {
    534         "hn_id": "44974139",
    535         "title": "CCFC: Core and Core-Full-Core Dual-Track Defense for LLM Jailbreak Protection",
    536         "points": 1,
    537         "comments": 0,
    538         "url": "https://news.ycombinator.com/item?id=44974139"
    539       },
    540       {
    541         "hn_id": "41551990",
    542         "title": "Towards Measuring and Modeling \"Culture\" in LLMs: A Survey",
    543         "points": 1,
    544         "comments": 0,
    545         "url": "https://news.ycombinator.com/item?id=41551990"
    546       },
    547       {
    548         "hn_id": "40468928",
    549         "title": "\"Yes I Would Recommend Calling the Police\":Norm Inconsistency in LLM Decisions",
    550         "points": 1,
    551         "comments": 0,
    552         "url": "https://news.ycombinator.com/item?id=40468928"
    553       },
    554       {
    555         "hn_id": "40438516",
    556         "title": "A hybrid approach to semi-automated Rust verification",
    557         "points": 1,
    558         "comments": 0,
    559         "url": "https://news.ycombinator.com/item?id=40438516"
    560       }
    561     ],
    562     "top_points": 5,
    563     "total_points": 24,
    564     "total_comments": 4
    565   }
    566 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs