ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan-v5.json (30232B)


      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "Exploring Persona-dependent LLM Alignment for the Moral Machine Experiment",
      6     "authors": [
      7       "Jiseon Kim",
      8       "Jea Kwon",
      9       "Luiz Felipe Vecchietti",
     10       "Alice Oh",
     11       "Meeyoung Cha"
     12     ],
     13     "year": 2025,
     14     "venue": "ICLR 2025",
     15     "arxiv_id": "2504.10886",
     16     "doi": "10.48550/arXiv.2504.10886"
     17   },
     18   "checklist": {
     19     "claims_and_evidence": {
     20       "abstract_claims_supported": {
     21         "applies": true,
     22         "answer": true,
     23         "justification": "Abstract claims (persona influences LLM decisions, greater shifts than humans, political persona dominates) are all supported by results in Figs. 2-6 showing persona-dependent MDD values and decision flips.",
     24         "source": "haiku"
     25       },
     26       "causal_claims_justified": {
     27         "applies": true,
     28         "answer": true,
     29         "justification": "The experimental design assigns personas vs. baseline and measures decision shifts, allowing causal inference about persona effects. Claims about persona *causing* shifts are justified by this treatment-control structure.",
     30         "source": "haiku"
     31       },
     32       "generalization_bounded": {
     33         "applies": true,
     34         "answer": false,
     35         "justification": "Study is bounded to 3 models and Moral Machine scenarios (autonomous vehicles), but the conclusion discusses 'broader applications' and 'ethically complex scenarios' beyond tested scope. Title doesn't signal the narrow focus.",
     36         "source": "haiku"
     37       },
     38       "alternative_explanations_discussed": {
     39         "applies": true,
     40         "answer": false,
     41         "justification": "Paper interprets findings through one lens (partisan sorting/sycophancy) without exploring alternatives: e.g., prompt engineering artifacts, temperature effects, model architecture differences, or whether AMCE shifts reflect genuine alignment changes or statistical noise.",
     42         "source": "haiku"
     43       },
     44       "proxy_outcome_distinction": {
     45         "applies": true,
     46         "answer": true,
     47         "justification": "Paper distinguishes between AMCE values (what's measured) and 'alignment' (what's claimed). Explicitly uses AMCE as a metric for comparison, though the inference from scenario preferences to moral alignment is one step removed.",
     48         "source": "haiku"
     49       }
     50     },
     51     "limitations_and_scope": {
     52       "limitations_section_present": {
     53         "applies": true,
     54         "answer": false,
     55         "justification": "Section 5 discusses limitations within the discussion context ('Improving Persona Settings', 'Expanding Moral Machine Scenarios') but no formal 'Limitations' section exists. Discussion paragraphs address constraints but lack structure of a dedicated section.",
     56         "source": "haiku"
     57       },
     58       "threats_to_validity_specific": {
     59         "applies": true,
     60         "answer": true,
     61         "justification": "Specifically mentions: binary personas (7 categories) oversimplify diversity, single prompt methodology needs validation, Moral Machine covers only autonomous vehicles (narrow subset), Llama2 guardrails cause <10% valid response for some personas.",
     62         "source": "haiku"
     63       },
     64       "scope_boundaries_stated": {
     65         "applies": true,
     66         "answer": true,
     67         "justification": "Explicitly states 3 models tested, 10,000 scenarios across 9 Moral Machine dimensions, 7 persona categories with binary definitions. Bounded scope is clear, though implications stated more broadly.",
     68         "source": "haiku"
     69       }
     70     },
     71     "conflicts_of_interest": {
     72       "funding_disclosed": {
     73         "applies": true,
     74         "answer": true,
     75         "justification": "Acknowledgments disclose IITP grant funded by Korea government (MSIT), grant number provided: No.RS-2022-II220184.",
     76         "source": "haiku"
     77       },
     78       "affiliations_disclosed": {
     79         "applies": true,
     80         "answer": true,
     81         "justification": "Authors affiliated with KAIST and Max Planck Institute for Security & Privacy. No conflicts with evaluated models (OpenAI, Meta).",
     82         "source": "haiku"
     83       },
     84       "funder_independent_of_outcome": {
     85         "applies": true,
     86         "answer": true,
     87         "justification": "Korean government funding for 'AI Ethics' is independent of the LLM developers being evaluated (OpenAI, Meta).",
     88         "source": "haiku"
     89       },
     90       "financial_interests_declared": {
     91         "applies": true,
     92         "answer": false,
     93         "justification": "No competing interests statement present in the paper. No mention of patents, equity, or consulting relationships.",
     94         "source": "haiku"
     95       }
     96     },
     97     "scope_and_framing": {
     98       "key_terms_defined": {
     99         "applies": true,
    100         "answer": true,
    101         "justification": "Persona defined in Section 3.1 with examples (Table 1). AMCE explained in 3.2. MDD formally defined in 3.3 (Eq. 1). Moral Machine referenced to Awad et al. (2018). Alignment operationalized via AMCE comparison.",
    102         "source": "haiku"
    103       },
    104       "intended_contribution_clear": {
    105         "applies": true,
    106         "answer": true,
    107         "justification": "Three explicit contributions stated in introduction: (1) evidence persona influences LLM decisions, (2) proposes MDD metric, (3) discusses ethical risks via partisan sorting. Reader knows what's being added.",
    108         "source": "haiku"
    109       },
    110       "engagement_with_prior_work": {
    111         "applies": true,
    112         "answer": true,
    113         "justification": "Section 2 reviews Moral Machine Experiment foundation, prior LLM moral reasoning studies (Ahmad & Takemoto 2024, Takemoto 2024, Jin et al. 2024), and persona setting literature. Shows gap this work fills (context-dependent persona effects).",
    114         "source": "haiku"
    115       }
    116     }
    117   },
    118   "type_checklist": {
    119     "empirical": {
    120       "artifacts": {
    121         "code_released": {
    122           "applies": true,
    123           "answer": false,
    124           "justification": "No code, GitHub, or reproduction script mentioned. No availability statement beyond scenario methodology reference to Takemoto (2024).",
    125           "source": "haiku"
    126         },
    127         "data_released": {
    128           "applies": true,
    129           "answer": false,
    130           "justification": "Uses public Moral Machine dataset (Awad et al. 2018) as baseline. Generated 10,000 scenarios and LLM responses are not released or promised.",
    131           "source": "haiku"
    132         },
    133         "environment_specified": {
    134           "applies": true,
    135           "answer": false,
    136           "justification": "No requirements.txt, Dockerfile, or conda env file. Model versions specified (gpt-4o-2024-05-13, gpt-3.5-turbo-0613, Llama-2-7b-chat-hf) and hyperparameters given (temperature, top-p, etc.), but no comprehensive environment spec.",
    137           "source": "haiku"
    138         },
    139         "reproduction_instructions": {
    140           "applies": true,
    141           "answer": false,
    142           "justification": "No step-by-step reproduction instructions provided. Methodology described (apply persona prompt, query model, compute AMCE, compute MDD) but no code, scripts, or explicit walkthrough to reproduce.",
    143           "source": "haiku"
    144         }
    145       },
    146       "statistical_methodology": {
    147         "confidence_intervals_or_error_bars": {
    148           "applies": true,
    149           "answer": false,
    150           "justification": "Figures (2-6) show point estimates for AMCE and MDD values. No confidence intervals, credible intervals, or error bars reported for any results.",
    151           "source": "haiku"
    152         },
    153         "significance_tests": {
    154           "applies": true,
    155           "answer": false,
    156           "justification": "Multiple comparisons made (LLM vs. human, across models, across personas) without statistical significance tests. No p-values, t-tests, or frequentist/Bayesian hypothesis tests.",
    157           "source": "haiku"
    158         },
    159         "effect_sizes_reported": {
    160           "applies": true,
    161           "answer": false,
    162           "justification": "MDD values and AMCE values reported as descriptive metrics, not as formal effect sizes (Cohen's d, correlation, odds ratios). No effect size interpretation framework.",
    163           "source": "haiku"
    164         },
    165         "sample_size_justified": {
    166           "applies": true,
    167           "answer": false,
    168           "justification": "10,000 scenarios chosen following Takemoto (2024) but no power analysis or justification for why 10,000 is adequate to detect persona effects.",
    169           "source": "haiku"
    170         },
    171         "variance_reported": {
    172           "applies": true,
    173           "answer": false,
    174           "justification": "Figures show individual bars/points by persona but no standard deviations, confidence intervals, or variance measures across runs or scenarios. Aggregated statistics lack spread.",
    175           "source": "haiku"
    176         }
    177       },
    178       "evaluation_design": {
    179         "baselines_included": {
    180           "applies": true,
    181           "answer": true,
    182           "justification": "Baseline comparisons: (1) human responses from Awad et al. (2018) AMCE values, (2) 'no persona' condition for each model. Both present.",
    183           "source": "haiku"
    184         },
    185         "baselines_contemporary": {
    186           "applies": true,
    187           "answer": true,
    188           "justification": "Human baseline from 2018 Moral Machine (canonical source for this task). LLM models from 2023-2024. Contemporary within the scope of the Moral Machine evaluation framework.",
    189           "source": "haiku"
    190         },
    191         "ablation_study": {
    192           "applies": true,
    193           "answer": false,
    194           "justification": "Includes baseline vs. persona treatment comparison, but no ablations of persona prompt design. No testing of alternative persona definitions, prompt templates, or component effects.",
    195           "source": "haiku"
    196         },
    197         "multiple_metrics": {
    198           "applies": true,
    199           "answer": true,
    200           "justification": "Multiple metrics used: AMCE for each of 9 dimensions, MDD (Euclidean distance), alignment scores (Table 2), valid response rates (Table 4), decision flip percentages (Fig. 5).",
    201           "source": "haiku"
    202         },
    203         "human_evaluation": {
    204           "applies": true,
    205           "answer": true,
    206           "justification": "Compares LLM outputs against human response data from Awad et al. (2018) Moral Machine survey (11.2M answers from 463k users). Human data used as evaluation baseline.",
    207           "source": "haiku"
    208         },
    209         "held_out_test_set": {
    210           "applies": false,
    211           "answer": false,
    212           "justification": "Not a prediction task; no held-out test set needed. All 10,000 scenarios treated as evaluation set for comparing personas.",
    213           "source": "haiku"
    214         },
    215         "per_category_breakdown": {
    216           "applies": true,
    217           "answer": true,
    218           "justification": "Results broken down by persona category (age, gender, education, income, political, religion, culture), scenario dimension (9 categories), and model (GPT-4o, GPT-3.5, Llama2). Comprehensive breakdown.",
    219           "source": "haiku"
    220         },
    221         "failure_cases_discussed": {
    222           "applies": true,
    223           "answer": false,
    224           "justification": "Llama2 has severe response rate failures (7.2% valid for conservative, 6% for religious persona; Table 4) but these are mentioned as a fact, not discussed as a limitation or failure mode.",
    225           "source": "haiku"
    226         },
    227         "negative_results_reported": {
    228           "applies": true,
    229           "answer": false,
    230           "justification": "Paper reports primarily positive findings about persona effects on LLMs. The contrast (humans stable, LLMs volatile) is framed as a finding, not a negative result of the method.",
    231           "source": "haiku"
    232         }
    233       },
    234       "setup_transparency": {
    235         "model_versions_specified": {
    236           "applies": true,
    237           "answer": true,
    238           "justification": "Model versions explicitly specified: GPT-4o 'gpt-4o-2024-05-13', GPT-3.5 'gpt-3.5-turbo-0613 (June 2023)', Llama2 'Llama-2-7b-chat-hf'. Exact snapshots given.",
    239           "source": "haiku"
    240         },
    241         "prompts_provided": {
    242           "applies": true,
    243           "answer": false,
    244           "justification": "Persona prompt template shown: 'You {persona}. Your responses should closely mirror...' Persona values in Table 1. But actual scenario prompts from Moral Machine not fully reproduced; only referenced to Awad et al. (2018).",
    245           "source": "haiku"
    246         },
    247         "hyperparameters_reported": {
    248           "applies": true,
    249           "answer": true,
    250           "justification": "GPT models: temperature=1, top_p=1 (default Azure OpenAI). Llama2: top_k=10, top_p=0.9, max_length=512, temperature=0.4. Hyperparameters fully reported.",
    251           "source": "haiku"
    252         },
    253         "scaffolding_described": {
    254           "applies": false,
    255           "answer": false,
    256           "justification": "No agentic scaffolding (no reasoning chains, tools, or multi-step processes). Simple prompt-response setup. N/A.",
    257           "source": "haiku"
    258         },
    259         "data_preprocessing_documented": {
    260           "applies": true,
    261           "answer": false,
    262           "justification": "10,000 scenarios generated via 'constrained randomization' following Takemoto (2024). No detailed preprocessing pipeline, filtering steps, or cleaning documented.",
    263           "source": "haiku"
    264         }
    265       },
    266       "data_integrity": {
    267         "raw_data_available": {
    268           "applies": true,
    269           "answer": false,
    270           "justification": "Raw LLM responses not released. Generated scenarios not released. Only published results (AMCE, MDD, figures) available. No raw data repository or supplement.",
    271           "source": "haiku"
    272         },
    273         "data_collection_described": {
    274           "applies": true,
    275           "answer": true,
    276           "justification": "10,000 scenarios generated using constrained randomization across 9 categories, following Takemoto (2024). Queried 3 LLM models with persona prompts. Method is described at high level.",
    277           "source": "haiku"
    278         },
    279         "recruitment_methods_described": {
    280           "applies": false,
    281           "answer": false,
    282           "justification": "No human recruitment for this study. Human baseline data obtained from Awad et al. (2018) Moral Machine survey (details in A.2). N/A for this paper.",
    283           "source": "haiku"
    284         },
    285         "data_pipeline_documented": {
    286           "applies": true,
    287           "answer": false,
    288           "justification": "Pipeline: generate scenarios → query LLMs → compute AMCE → compute MDD → analyze. Described at conceptual level but no detailed documentation of transformations, filtering, or validation steps.",
    289           "source": "haiku"
    290         }
    291       },
    292       "contamination": {
    293         "training_cutoff_stated": {
    294           "applies": true,
    295           "answer": true,
    296           "justification": "Model versions imply cutoffs: GPT-4o May 2024, GPT-3.5 June 2023, Llama2 2023. Moral Machine 2018 is well before all cutoffs. Contamination risk is minimal.",
    297           "source": "haiku"
    298         },
    299         "train_test_overlap_discussed": {
    300           "applies": true,
    301           "answer": false,
    302           "justification": "Train-test overlap not explicitly discussed. Dates imply no overlap (Moral Machine 2018 is prior to model training), but this could be stated explicitly.",
    303           "source": "haiku"
    304         },
    305         "benchmark_contamination_addressed": {
    306           "applies": true,
    307           "answer": false,
    308           "justification": "Moral Machine benchmark created 2018, well before model training cutoffs (2023-2024). No contamination risk, but this is not explicitly stated or addressed.",
    309           "source": "haiku"
    310         }
    311       },
    312       "human_studies": {
    313         "pre_registered": {
    314           "applies": false,
    315           "answer": false,
    316           "justification": "No human participants recruited. Not a pre-registered human study. N/A.",
    317           "source": "haiku"
    318         },
    319         "irb_or_ethics_approval": {
    320           "applies": false,
    321           "answer": false,
    322           "justification": "No human participants. No IRB approval needed. N/A.",
    323           "source": "haiku"
    324         },
    325         "demographics_reported": {
    326           "applies": false,
    327           "answer": false,
    328           "justification": "No human participants recruited. Human baseline data from Awad et al. (2018) has demographic info (Fig. 7 in appendix) but not reported for this study. N/A.",
    329           "source": "haiku"
    330         },
    331         "inclusion_exclusion_criteria": {
    332           "applies": false,
    333           "answer": false,
    334           "justification": "No human participants. N/A.",
    335           "source": "haiku"
    336         },
    337         "randomization_described": {
    338           "applies": false,
    339           "answer": false,
    340           "justification": "No human participants. N/A.",
    341           "source": "haiku"
    342         },
    343         "blinding_described": {
    344           "applies": false,
    345           "answer": false,
    346           "justification": "No human participants. N/A.",
    347           "source": "haiku"
    348         },
    349         "attrition_reported": {
    350           "applies": false,
    351           "answer": false,
    352           "justification": "No human participants. N/A.",
    353           "source": "haiku"
    354         }
    355       },
    356       "cost_and_practicality": {
    357         "inference_cost_reported": {
    358           "applies": true,
    359           "answer": false,
    360           "justification": "No inference cost, API cost, or latency reported. 10,000 scenarios × 3 models × persona conditions queried but no compute budget disclosed.",
    361           "source": "haiku"
    362         },
    363         "compute_budget_stated": {
    364           "applies": true,
    365           "answer": false,
    366           "justification": "Total computational budget not stated. Number of API calls (10,000 scenarios, 3 models, 15 persona conditions = ~450k calls) can be inferred but not explicitly stated.",
    367           "source": "haiku"
    368         }
    369       }
    370     }
    371   },
    372   "claims": [
    373     {
    374       "claim": "LLM moral decisions vary substantially by persona assignment, more so than human decisions",
    375       "evidence": "Fig. 2 shows MDD values for humans (0.33 for age, 0.27 for gender) vs. LLMs (GPT-4o: 0.48 for political, 0.17 for gender; GPT-3.5, Llama2 show higher variance across dimensions). Fig. 3 aggregates this showing overall LLM MDD > human MDD.",
    376       "supported": "strong"
    377     },
    378     {
    379       "claim": "Political persona has the strongest effect on LLM decisions compared to other demographic factors",
    380       "evidence": "Table 2 and Fig. 3 show political persona MDD=0.48 for GPT-4o, higher than age (0.33), gender (0.27), culture (0.17), education (0.08), religion (0.07), income (0.06). Consistent across all three models.",
    381       "supported": "strong"
    382     },
    383     {
    384       "claim": "Human moral decisions remain robust to persona/demographic assignment",
    385       "evidence": "Fig. 4 shows human AMCE values consistently above or below 0 across all persona conditions (no reversals). Fig. 6 shows human variance near zero across all personas, in contrast to large LLM fluctuations.",
    386       "supported": "strong"
    387     },
    388     {
    389       "claim": "Approximately 20% of LLM decisions flip (reverse direction) under persona assignment for GPT-3.5 and Llama2",
    390       "evidence": "Fig. 5 reports 'Moral Flip' percentages: GPT-4o ~7%, GPT-3.5 ~19%, Llama2 ~19% of decisions show shift from human baseline.",
    391       "supported": "strong"
    392     },
    393     {
    394       "claim": "GPT-4o shows closest alignment with human moral responses compared to GPT-3.5 and Llama2",
    395       "evidence": "Table 2 shows alignment scores (lower is better): GPT-4o averages 0.84, GPT-3.5 averages 0.94, Llama2 averages 1.27. Fig. 2 shows GPT-4o AMCE profiles more closely mirror human profiles.",
    396       "supported": "strong"
    397     },
    398     {
    399       "claim": "Assigning a progressive political persona to LLMs shifts preferences away from social status (authority), while conservative persona favors status",
    400       "evidence": "Fig. 4 shows social status dimension has opposing preferences by political persona: conservative bars positive (spare higher status), progressive bars negative (spare lower status). Discussed in Section 4.4 with reference to partisan sorting theory.",
    401       "supported": "moderate"
    402     },
    403     {
    404       "claim": "Llama2 has severe guardrail issues for certain personas, with <10% valid response rates",
    405       "evidence": "Table 4 reports valid response rates for Llama2: conservative 7.2%, female 17.1%, religious 6.0%, western 21.8%. Many conditions below 20%, making inference unreliable.",
    406       "supported": "strong"
    407     },
    408     {
    409       "claim": "Binary persona prompts can induce 'partisan sorting' behavior where political identity becomes the dominant decision factor",
    410       "evidence": "Section 4.3 and Fig. 3 show political persona MDD=0.48 for GPT-4o, discussed via Mason (2015) partisan sorting theory. However, this is an interpretation; the evidence is that political personas cause large decision shifts, not direct proof of sorting mechanism.",
    411       "supported": "moderate"
    412     }
    413   ],
    414   "methodology_tags": [
    415     "benchmark-eval",
    416     "observational"
    417   ],
    418   "key_findings": "The study reveals that LLMs exhibit substantially greater variability in moral decision-making across demographic personas than humans do, with political persona identity having the largest effect (MDD=0.48 for GPT-4o). While human moral preferences remain consistent across political identities, LLM preferences show directional flips—most notably for social status judgments, where political persona drives opposing choices. GPT-4o aligns most closely with human responses, while GPT-3.5 and Llama2 show more erratic behavior (≈20% decision flips). These findings suggest LLMs may be vulnerable to 'partisan sorting' effects, raising ethical concerns for deployment in morally sensitive applications like autonomous vehicle decision-making.",
    419   "red_flags": [
    420     {
    421       "flag": "No significance testing or confidence intervals",
    422       "detail": "All AMCE and MDD values reported as point estimates with no p-values, confidence intervals, or hypothesis tests. Cannot assess whether observed differences are statistically robust."
    423     },
    424     {
    425       "flag": "No code or data release",
    426       "detail": "Reproducibility impossible. Generated 10,000 scenarios and LLM responses are not released. No code provided to reproduce AMCE or MDD calculations."
    427     },
    428     {
    429       "flag": "Llama2 guardrail failures",
    430       "detail": "Valid response rates for Llama2 as low as 6% (religious persona) and 7.2% (conservative). Results for these conditions are unreliable and should not be trusted."
    431     },
    432     {
    433       "flag": "Single persona prompt template tested",
    434       "detail": "Only one persona prompting strategy tested ('You {persona}. Your responses should closely mirror...'). No ablation across prompt variations, instruction clarity, or persona intensity. Findings may reflect prompt design artifacts, not genuine persona effects."
    435     },
    436     {
    437       "flag": "No sample size justification",
    438       "detail": "10,000 scenarios chosen following Takemoto (2024) but no power analysis or statistical justification for this size. No discussion of how many scenarios needed to detect persona effects."
    439     },
    440     {
    441       "flag": "Limited alternative explanation exploration",
    442       "detail": "Paper interprets political persona effects as 'partisan sorting' but doesn't explore whether AMCE shifts are due to: training data imbalance, temperature/sampling artifact, prompt injection, or genuine value alignment."
    443     },
    444     {
    445       "flag": "7-year-old human baseline",
    446       "detail": "Human comparison data from Awad et al. (2018) Moral Machine. Population, internet usage, and demographics may differ substantially from 2025 context."
    447     },
    448     {
    449       "flag": "Crude binary persona definitions",
    450       "detail": "Personas defined as binary pairs (old/young, rich/poor, conservative/progressive). Real-world demographics are continuous and intersectional. Findings limited to extreme contrasts."
    451     }
    452   ],
    453   "cited_papers": [
    454     {
    455       "title": "The moral machine experiment",
    456       "authors": "Awad et al.",
    457       "year": 2018,
    458       "relevance": "Foundation for this work. Original Moral Machine benchmark and human preference data (Moral Machine experiment). Primary baseline."
    459     },
    460     {
    461       "title": "Large-scale moral machine experiment on large language models",
    462       "authors": "Ahmad & Takemoto",
    463       "year": 2024,
    464       "relevance": "Prior LLM evaluation on Moral Machine across 50+ models. Compared LLM alignment across model sizes and training approaches. Directly cited for methodological reference."
    465     },
    466     {
    467       "title": "The moral machine experiment on large language models",
    468       "authors": "Takemoto",
    469       "year": 2024,
    470       "relevance": "Methodology source for generating constrained randomization scenarios. Baseline comparison for model selection (GPT-4o, GPT-3.5, Llama2)."
    471     },
    472     {
    473       "title": "Language model alignment in multilingual trolley problems",
    474       "authors": "Jin et al.",
    475       "year": 2024,
    476       "relevance": "Prior work on persona effects via language/cultural framing in Moral Machine. Examined if different languages trigger different moral choices."
    477     },
    478     {
    479       "title": "Moral foundations of large language models",
    480       "authors": "Abdulhai et al.",
    481       "year": 2023,
    482       "relevance": "Cited for partisan sorting theory interpretation. Shows LLMs reflect political biases tied to moral foundations (authority, loyalty, etc.)."
    483     },
    484     {
    485       "title": "Bias runs deep: Implicit reasoning biases in persona-assigned LLMs",
    486       "authors": "Gupta et al.",
    487       "year": 2024,
    488       "relevance": "Source for persona prompting template used in this work. Reviews how conditioning personas shapes LLM behavior and biases."
    489     },
    490     {
    491       "title": "From persona to personalization: A survey on role-playing language agents",
    492       "authors": "Chen et al.",
    493       "year": 2024,
    494       "relevance": "Survey on persona modeling in LLMs. Reviews broader literature on prompt design and persona-based personalization."
    495     },
    496     {
    497       "title": "I disrespectfully agree: The differential effects of partisan sorting on social and issue polarization",
    498       "authors": "Mason",
    499       "year": 2015,
    500       "relevance": "Partisan sorting theory cited to explain political persona effects. Provides sociological framework for interpreting LLM political sensitivity."
    501     }
    502   ],
    503   "engagement_factors": {
    504     "practical_relevance": {
    505       "score": 2,
    506       "justification": "Identifies real deployment risk (LLM misalignment on moral decisions) but provides no mitigation strategies. Useful for red-flagging the problem; not actionable for practitioners."
    507     },
    508     "surprise_contrarian": {
    509       "score": 2,
    510       "justification": "That LLMs are persona-sensitive is somewhat expected given prior work (Gupta et al., Simmons). The finding that political identity dominates other factors is noteworthy but not shocking."
    511     },
    512     "fear_safety": {
    513       "score": 3,
    514       "justification": "Directly raises AI safety concern: LLM bias and misalignment in morally critical decisions (autonomous vehicles, healthcare). Shows systematic vulnerability to targeted contextual manipulation."
    515     },
    516     "drama_conflict": {
    517       "score": 1,
    518       "justification": "Academically presented without sensationalism. No dramatic framing, no novel controversy, no industry/lab conflicts."
    519     },
    520     "demo_ability": {
    521       "score": 0,
    522       "justification": "No reproducible demo possible. No code released, no interactive tool. Requires API access to models and cannot be easily tried by readers."
    523     },
    524     "brand_recognition": {
    525       "score": 2,
    526       "justification": "KAIST and Max Planck Institute are reputable but not top-tier (not MIT, Stanford, DeepMind, OpenAI). Publication at ICLR 2025 adds credibility but limited prestige draw."
    527     }
    528   },
    529   "hn_data": {
    530     "threads": [
    531       {
    532         "hn_id": "46728063",
    533         "title": "New York Times games are hard: A computational perspective",
    534         "points": 73,
    535         "comments": 33,
    536         "url": "https://news.ycombinator.com/item?id=46728063"
    537       },
    538       {
    539         "hn_id": "43205755",
    540         "title": "Towards an AI Co-Scientist",
    541         "points": 47,
    542         "comments": 17,
    543         "url": "https://news.ycombinator.com/item?id=43205755"
    544       },
    545       {
    546         "hn_id": "44253021",
    547         "title": "SmartAttack: Air-Gap Attack via Smartwatches",
    548         "points": 18,
    549         "comments": 6,
    550         "url": "https://news.ycombinator.com/item?id=44253021"
    551       },
    552       {
    553         "hn_id": "44272942",
    554         "title": "Securing Credit Inquiries: Real-Time User Approval to Stop SSN Identity Theft",
    555         "points": 6,
    556         "comments": 0,
    557         "url": "https://news.ycombinator.com/item?id=44272942"
    558       },
    559       {
    560         "hn_id": "43763905",
    561         "title": "Visual Language Models show widespread deficits on neuropsychological tests",
    562         "points": 3,
    563         "comments": 0,
    564         "url": "https://news.ycombinator.com/item?id=43763905"
    565       },
    566       {
    567         "hn_id": "44366937",
    568         "title": "SmartAttack: Air-Gap Attack via Smartwatches",
    569         "points": 2,
    570         "comments": 0,
    571         "url": "https://news.ycombinator.com/item?id=44366937"
    572       },
    573       {
    574         "hn_id": "44254732",
    575         "title": "SmartAttack: Air-Gap Attack via Smartwatches",
    576         "points": 2,
    577         "comments": 0,
    578         "url": "https://news.ycombinator.com/item?id=44254732"
    579       },
    580       {
    581         "hn_id": "46345690",
    582         "title": "Computational complexity of New York Times games",
    583         "points": 1,
    584         "comments": 0,
    585         "url": "https://news.ycombinator.com/item?id=46345690"
    586       },
    587       {
    588         "hn_id": "22971877",
    589         "title": "Impact of Bias on School Admissions and Targeted Interventions",
    590         "points": 1,
    591         "comments": 0,
    592         "url": "https://news.ycombinator.com/item?id=22971877"
    593       }
    594     ],
    595     "top_points": 73,
    596     "total_points": 153,
    597     "total_comments": 56
    598   }
    599 }

Impressum · Datenschutz