ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan.json (28137B)


      1 {
      2   "paper": {
      3     "title": "The African Woman is Rhythmic and Soulful: An Investigation of Implicit Biases in LLM Open-ended Text Generation",
      4     "authors": [
      5       "Serene Lim",
      6       "María Pérez-Ortiz"
      7     ],
      8     "year": 2024,
      9     "venue": "University College London (preprint/workshop paper)"
     10   },
     11   "checklist": {
     12     "artifacts": {
     13       "code_released": {
     14         "applies": true,
     15         "answer": false,
     16         "justification": "No GitHub link, repository URL, or code archive is provided. The paper mentions experimental data was stored on a secure database linked to the OpenAI API, but no code is released for reproduction."
     17       },
     18       "data_released": {
     19         "applies": true,
     20         "answer": false,
     21         "justification": "No dataset is released. The paper states experimental data was recorded on a secure database, but no download link or public archive is provided."
     22       },
     23       "environment_specified": {
     24         "applies": true,
     25         "answer": false,
     26         "justification": "No environment specification is provided. The paper only mentions 'GPT-4 via the interface of ChatGPT' with no library versions, API version details, or dependency files."
     27       },
     28       "reproduction_instructions": {
     29         "applies": true,
     30         "answer": false,
     31         "justification": "No step-by-step reproduction instructions are included. While the methodology describes the experimental setup in narrative form, there are no scripts or README-style instructions that would allow replication."
     32       }
     33     },
     34     "statistical_methodology": {
     35       "confidence_intervals_or_error_bars": {
     36         "applies": true,
     37         "answer": false,
     38         "justification": "No confidence intervals or error bars are reported. Results are stated as raw counts or percentages (e.g., '9 of 10 trials', '80% of responses') with no uncertainty quantification."
     39       },
     40       "significance_tests": {
     41         "applies": true,
     42         "answer": false,
     43         "justification": "No statistical significance tests are used. The paper makes comparative claims (e.g., the LLM IAT correlates with traditional methods) based solely on observed counts with no formal testing."
     44       },
     45       "effect_sizes_reported": {
     46         "applies": true,
     47         "answer": false,
     48         "justification": "Effect sizes are not reported. The paper provides raw counts and qualitative observations but no Cohen's d, odds ratios, or other standardized effect size measures."
     49       },
     50       "sample_size_justified": {
     51         "applies": true,
     52         "answer": false,
     53         "justification": "The choice of 10 trials per experiment is not justified. No power analysis or discussion of whether 10 repetitions is sufficient to support the claims is provided."
     54       },
     55       "variance_reported": {
     56         "applies": true,
     57         "answer": false,
     58         "justification": "Variance is not reported. Results are presented as single counts or percentages across 10 trials with no standard deviation or spread measure (e.g., '9 of 10 trials' but no variance across runs)."
     59       }
     60     },
     61     "evaluation_design": {
     62       "baselines_included": {
     63         "applies": true,
     64         "answer": false,
     65         "justification": "No baselines are compared against. The paper reports GPT-4's outputs but does not compare against other LLMs, prior bias measurement tools, or any baseline condition to contextualize findings."
     66       },
     67       "baselines_contemporary": {
     68         "applies": true,
     69         "answer": false,
     70         "justification": "The paper could and should have included contemporary baselines (other LLMs, prior bias detection methods). The absence of any baselines means this criterion applies but is not satisfied. The scan-agent instructions specify that applies=false is for structurally inapplicable criteria, not for when a paper fails to include something it should have."
     71       },
     72       "ablation_study": {
     73         "applies": true,
     74         "answer": false,
     75         "justification": "No ablation study is conducted. The paper tests five different experimental tasks but does not systematically isolate variables to determine which components drive bias manifestation."
     76       },
     77       "multiple_metrics": {
     78         "applies": true,
     79         "answer": true,
     80         "justification": "The paper employs multiple assessment approaches: LLM IAT (word association counts), Decision Bias (qualitative output analysis), Sycophancy, Word Generation (word clouds), and Story Generation (thematic analysis), constituting multiple complementary metrics."
     81       },
     82       "human_evaluation": {
     83         "applies": true,
     84         "answer": false,
     85         "justification": "The authors informally analyzed GPT-4 outputs through thematic observation, but this does not constitute a proper human evaluation study. There is no systematic coding scheme, no inter-rater reliability, no evaluation rubric, and no independent evaluators. The schema requires 'human ratings, manual inspection, user studies, expert review' — the paper's informal qualitative observations lack the methodological rigor to qualify."
     86       },
     87       "held_out_test_set": {
     88         "applies": false,
     89         "answer": false,
     90         "justification": "Not applicable — this is not a machine learning training study with dev/test splits. The paper uses LLM API calls with manually designed prompts; there is no train/test distinction."
     91       },
     92       "per_category_breakdown": {
     93         "applies": true,
     94         "answer": true,
     95         "justification": "Results are reported separately for each of five experimental tasks (LLM IAT, Decision Bias, Sycophancy, Word Generation, Story Generation) and broken down by attribute type (gender-career, race-valence, Muslim-others IAT)."
     96       },
     97       "failure_cases_discussed": {
     98         "applies": true,
     99         "answer": true,
    100         "justification": "The paper discusses the model's rejection of the visual IAT ('90% of the time' it uses reject option classification for images with sensitive characteristics) as a notable failure of the approach, and notes limitations of the Decision Bias task with race-only prompts."
    101       },
    102       "negative_results_reported": {
    103         "applies": true,
    104         "answer": true,
    105         "justification": "The paper reports that the race-only Decision Bias results 'did not show much difference' and that adding race as a variable into prompts did not substantially change outcomes beyond gender, constituting a negative/null result."
    106       }
    107     },
    108     "claims_and_evidence": {
    109       "abstract_claims_supported": {
    110         "applies": true,
    111         "answer": false,
    112         "justification": "The abstract claims the LLM IAT Bias 'correlates with traditional methods' but the paper does not demonstrate a statistical correlation — it only shows qualitative consistency. The claim of providing 'a more comprehensive framework' is not empirically validated against prior frameworks."
    113       },
    114       "causal_claims_justified": {
    115         "applies": true,
    116         "answer": false,
    117         "justification": "The paper makes causal claims (e.g., 'LLMs trained on biased data perpetuate biases', 'RLHF causes sycophancy') but the study design is purely observational — all experiments are prompt-and-observe with no controlled manipulation of training data or causal identification strategy."
    118       },
    119       "generalization_bounded": {
    120         "applies": true,
    121         "answer": false,
    122         "justification": "Claims are framed broadly about 'LLMs' in general but only GPT-4 via ChatGPT interface is tested. The paper draws conclusions about 'AI systems' and 'LLMs' broadly without bounding claims to GPT-4 specifically."
    123       },
    124       "alternative_explanations_discussed": {
    125         "applies": true,
    126         "answer": false,
    127         "justification": "No substantive alternative explanations for results are discussed. The paper does not consider confounds such as prompt phrasing effects, temperature settings, or whether results reflect RLHF guardrails versus actual model weights. The mention that race may have been subordinated to gender is a brief observation, not an analysis of alternative explanations."
    128       }
    129     },
    130     "setup_transparency": {
    131       "model_versions_specified": {
    132         "applies": true,
    133         "answer": false,
    134         "justification": "The paper states only 'GPT-4 via the interface of ChatGPT' without specifying a version number, API snapshot date, or model identifier. 'GPT-4' without a version does not meet the criterion."
    135       },
    136       "prompts_provided": {
    137         "applies": true,
    138         "answer": true,
    139         "justification": "Actual prompt text is provided verbatim for the key experiments: the LLM IAT prompt (word list with name assignment instruction), the Decision Bias prompt ('Generate two short profiles, within 100 words, about Rebecca and John...'), and the Word Generation and Story Generation prompts are quoted directly in the methodology."
    140       },
    141       "hyperparameters_reported": {
    142         "applies": true,
    143         "answer": false,
    144         "justification": "No hyperparameters (temperature, top-p, max tokens) are reported. The paper uses ChatGPT as an interface without disclosing API settings that would significantly affect output variability."
    145       },
    146       "scaffolding_described": {
    147         "applies": false,
    148         "answer": false,
    149         "justification": "No agentic scaffolding is used. The paper accesses GPT-4 through the ChatGPT interface with direct prompts; there is no agentic loop, tool use, or multi-step scaffolding."
    150       },
    151       "data_preprocessing_documented": {
    152         "applies": true,
    153         "answer": false,
    154         "justification": "No data preprocessing documentation is provided. The paper goes from collecting LLM outputs directly to reporting results without describing any filtering, coding scheme, or inter-rater reliability procedure for the qualitative analysis."
    155       }
    156     },
    157     "limitations_and_scope": {
    158       "limitations_section_present": {
    159         "applies": true,
    160         "answer": false,
    161         "justification": "There is no dedicated limitations or threats-to-validity section. The paper has an Ethics section but it only states no privacy violations occurred; a substantive limitations discussion is absent."
    162       },
    163       "threats_to_validity_specific": {
    164         "applies": true,
    165         "answer": false,
    166         "justification": "No specific threats to validity are discussed anywhere in the paper. The scope of generalizability to other LLMs, the small number of trials (n=10), or the absence of inter-rater reliability for qualitative coding are not addressed."
    167       },
    168       "scope_boundaries_stated": {
    169         "applies": true,
    170         "answer": false,
    171         "justification": "Scope boundaries are not explicitly stated. The paper does not specify that results apply only to GPT-4, only to the tested prompts, or only to the English language — it generalizes broadly to 'LLMs' without stating what it does NOT claim."
    172       }
    173     },
    174     "data_integrity": {
    175       "raw_data_available": {
    176         "applies": true,
    177         "answer": false,
    178         "justification": "Raw data (actual LLM response transcripts) is not released. The Ethics section mentions data is stored on a secure database but no access is provided to third parties for verification."
    179       },
    180       "data_collection_described": {
    181         "applies": true,
    182         "answer": true,
    183         "justification": "The data collection procedure is described: experiments were conducted via ChatGPT GPT-4 interface, each task repeated 10 times, with specific prompts provided. The methodology section describes what data was collected for each of the five experiment types."
    184       },
    185       "recruitment_methods_described": {
    186         "applies": false,
    187         "answer": false,
    188         "justification": "Not applicable — there are no human participants. The study collects LLM outputs rather than recruiting human subjects; the data source is the GPT-4 API."
    189       },
    190       "data_pipeline_documented": {
    191         "applies": true,
    192         "answer": false,
    193         "justification": "The pipeline from raw LLM outputs to reported findings is not documented. It is unclear how qualitative themes were identified, whether multiple coders were used, and how word clouds were generated from the outputs."
    194       }
    195     },
    196     "conflicts_of_interest": {
    197       "funding_disclosed": {
    198         "applies": false,
    199         "answer": false,
    200         "justification": "The paper appears to be unfunded student work at UCL (author email format 'serene.lim.21@ucl.ac.uk' suggests student enrollment). No acknowledgments section, no grant numbers, and no funding sources are mentioned. Per the schema, NA applies for 'clearly unfunded work.'"
    201       },
    202       "affiliations_disclosed": {
    203         "applies": true,
    204         "answer": true,
    205         "justification": "Authors' affiliations are clearly stated as University College London, London, United Kingdom in the paper header. Neither author appears to be affiliated with OpenAI whose product is being evaluated."
    206       },
    207       "funder_independent_of_outcome": {
    208         "applies": false,
    209         "answer": false,
    210         "justification": "No funding is disclosed, so this criterion cannot be evaluated. The paper appears to be unfunded academic work."
    211       },
    212       "financial_interests_declared": {
    213         "applies": true,
    214         "answer": false,
    215         "justification": "No competing interests statement appears in the paper. There is no disclosure of patents, equity holdings, or other financial interests related to the findings."
    216       }
    217     },
    218     "contamination": {
    219       "training_cutoff_stated": {
    220         "applies": false,
    221         "answer": false,
    222         "justification": "Not applicable — this paper does not evaluate GPT-4's capability on any benchmark. The study uses novel author-designed prompts to probe implicit biases, not pre-existing benchmark tasks. The schema says NA 'if the paper does not evaluate a pre-trained model's capability on any benchmark.'"
    223       },
    224       "train_test_overlap_discussed": {
    225         "applies": false,
    226         "answer": false,
    227         "justification": "Not applicable — this is not a benchmark evaluation study where train/test overlap is a concern. The paper uses original prompts constructed by the authors rather than evaluating on a fixed public benchmark."
    228       },
    229       "benchmark_contamination_addressed": {
    230         "applies": false,
    231         "answer": false,
    232         "justification": "Not applicable — the study does not use a pre-existing benchmark dataset. The IAT stimuli and prompts are adapted from psychological literature but not from a fixed ML benchmark corpus."
    233       }
    234     },
    235     "human_studies": {
    236       "pre_registered": {
    237         "applies": false,
    238         "answer": false,
    239         "justification": "Not applicable — no human participants are involved. The study evaluates LLM outputs, not human subjects."
    240       },
    241       "irb_or_ethics_approval": {
    242         "applies": false,
    243         "answer": false,
    244         "justification": "Not applicable — no human participants are involved. The Ethics section confirms this: 'This work uses language models... will not have any implications on any other participants, nor will any privacy guidelines be breached.'"
    245       },
    246       "demographics_reported": {
    247         "applies": false,
    248         "answer": false,
    249         "justification": "Not applicable — no human participants are involved in the study."
    250       },
    251       "inclusion_exclusion_criteria": {
    252         "applies": false,
    253         "answer": false,
    254         "justification": "Not applicable — no human participants are involved. Criteria would apply to participant recruitment, which is absent from this study."
    255       },
    256       "randomization_described": {
    257         "applies": false,
    258         "answer": false,
    259         "justification": "Not applicable — no human participants or experimental groups. The paper mentions 'randomizing the order of stimuli' but this is in LLM prompting, not human participant randomization."
    260       },
    261       "blinding_described": {
    262         "applies": false,
    263         "answer": false,
    264         "justification": "Not applicable — no human participants are involved in the study."
    265       },
    266       "attrition_reported": {
    267         "applies": false,
    268         "answer": false,
    269         "justification": "Not applicable — no human participants are involved, so attrition is not relevant."
    270       }
    271     },
    272     "cost_and_practicality": {
    273       "inference_cost_reported": {
    274         "applies": true,
    275         "answer": false,
    276         "justification": "No inference cost or API cost is reported. The paper uses the ChatGPT interface for GPT-4 queries but provides no estimate of tokens consumed or API costs incurred."
    277       },
    278       "compute_budget_stated": {
    279         "applies": true,
    280         "answer": false,
    281         "justification": "No compute budget is stated. The total number of API calls (5 experiments × 10 trials each, with variations) is not totaled, and no cost estimate is provided."
    282       }
    283     }
    284   },
    285   "claims": [
    286     {
    287       "claim": "GPT-4 demonstrates strong implicit gender-career biases in the LLM IAT, associating female names with family words and male names with career words in 9 of 10 trials with 100% accuracy on both categories.",
    288       "evidence": "LLM IAT results: '7 of 7 family related words were assigned to the female name, and 7 of 7 career related words were assigned to the male name in 9 of 10 trials.' Verbatim LLM output is provided in Results section.",
    289       "supported": "moderate"
    290     },
    291     {
    292       "claim": "GPT-4 demonstrates strong racial bias in the race-valence IAT, assigning 8 of 8 positive words to white and 8 of 8 negative words to black names in 10 of 10 experiments.",
    293       "evidence": "Results section states: 'word associations between white-black and valence (good-bad) were similarly biased, with 8 of 8 positive words being assigned to white, and 8 of 8 negative words being assigned to black in 10 of 10 experiments.'",
    294       "supported": "moderate"
    295     },
    296     {
    297       "claim": "GPT-4 exhibits sycophantic behavior, adjusting its responses to reduce bias after a user points out bias, suggesting RLHF training makes the model hypersensitive to user feedback rather than intrinsically unbiased.",
    298       "evidence": "Sycophancy results section documents that after asking 'Why?' the model recognized bias and changed subsequent responses: 'Had the Why? question not been asked, there would have been no difference between the results of the female versus male names.'",
    299       "supported": "weak"
    300     },
    301     {
    302       "claim": "The LLM IAT Bias correlates with traditional bias measurement methods and more effectively predicts downstream behaviors as measured by the LLM Decision Bias.",
    303       "evidence": "Claimed in the abstract, but no quantitative correlation analysis is presented. The support is purely qualitative: both IAT and Decision Bias show gender stereotyping, which the authors interpret as correlation.",
    304       "supported": "weak"
    305     },
    306     {
    307       "claim": "Story generation exhibits culturally stereotypical patterns including exoticization of racial attributes (e.g., Chinese prompts produce stories about dragons and dynasties) and gender-differentiated narrative structures.",
    308       "evidence": "Story Generation results section provides thematic analysis with specific examples: 'mentioning Chinese resulted in narratives heavily centred around Chinese dynasties, dragons, and traditional paintings.' Female characters received mentor figures while male characters were depicted as independent.",
    309       "supported": "moderate"
    310     }
    311   ],
    312   "methodology_tags": [
    313     "qualitative",
    314     "observational",
    315     "benchmark-eval"
    316   ],
    317   "key_findings": "GPT-4 exhibits strong implicit gender-career and race-valence biases when tested via a modified Implicit Association Test (IAT), even after safety training — assigning 100% of family words to female names and career words to male names in 9/10 trials, and 100% of positive/negative words to white/black names in 10/10 trials. The model shows sycophantic behavior, reducing bias expression after user feedback, which the authors interpret as context-sensitivity rather than genuine debiasing. Qualitative analysis of word generation and story outputs reveals persistent gender stereotyping (females as nurturing, males as leaders) and racial exoticization (African = rhythmic/soulful, Chinese = dragons/dynasties). The paper argues these findings demonstrate that bias in LLMs cannot be eliminated through optimization alone and requires sociotechnical approaches informed by digital anthropology and feminist STS.",
    318   "red_flags": [
    319     {
    320       "flag": "Extremely small sample (n=10 trials)",
    321       "detail": "All experiments are repeated only 10 times with no justification for this sample size, no confidence intervals, and no statistical tests. The strong results (9/10 or 10/10 consistency) may be reliable, but the small n and lack of statistical analysis make it impossible to assess whether less extreme effects are meaningful."
    322     },
    323     {
    324       "flag": "Single model, no comparison",
    325       "detail": "All experiments are conducted only on GPT-4 via the ChatGPT interface. No other LLMs are tested, making it impossible to determine whether findings are GPT-4-specific or general to LLMs. The abstract and title make broad claims about 'LLMs'."
    326     },
    327     {
    328       "flag": "No inter-rater reliability for qualitative coding",
    329       "detail": "The thematic analysis of story generation and word clouds is conducted by the authors without describing a coding scheme, inter-rater reliability, or blind review process. Qualitative claims about bias themes are not independently validated."
    330     },
    331     {
    332       "flag": "Unspecified model version and API parameters",
    333       "detail": "The paper uses 'GPT-4 via the interface of ChatGPT' without specifying a snapshot version or API parameters (temperature, top-p). GPT-4 behavior varies significantly across versions and settings, making replication impossible and results non-transferable."
    334     },
    335     {
    336       "flag": "Abstract claim not empirically supported",
    337       "detail": "The abstract claims the LLM IAT Bias 'correlates with traditional methods and more effectively predicts downstream behaviors' but no quantitative correlation analysis is presented — the claim rests on qualitative observation that both approaches show stereotyping."
    338     },
    339     {
    340       "flag": "Overgeneralization from narrow test",
    341       "detail": "The paper draws broad conclusions about 'LLMs' and their social harms from a small set of prompts testing two names (Rebecca/John) across a handful of word lists. The scope of bias types tested is narrow (gender-career, race-valence, Muslim-valence) relative to the breadth of the claims made."
    342     }
    343   ],
    344   "cited_papers": [
    345     {
    346       "title": "Measuring Implicit Bias in Explicitly Unbiased Large Language Models",
    347       "authors": [
    348         "Bai, X.",
    349         "Wang, A.",
    350         "Sucholutsky, I.",
    351         "Griffiths, T."
    352       ],
    353       "year": 2024,
    354       "arxiv_id": "2402.04105",
    355       "relevance": "Directly related work on measuring implicit bias in LLMs using IAT-inspired methods; the paper under review builds on this methodology."
    356     },
    357     {
    358       "title": "On the Dangers of Stochastic Parrots: Can Language Models Be Too Big?",
    359       "authors": [
    360         "Bender, E.",
    361         "McMillan-Major, A.",
    362         "Shmitchell, S.",
    363         "Gebru, T."
    364       ],
    365       "year": 2021,
    366       "doi": "10.1145/3442188.3445922",
    367       "relevance": "Foundational paper on bias and harms in large language models; directly cited as theoretical background for bias in training data."
    368     },
    369     {
    370       "title": "Semantics derived automatically from language corpora contain human-like biases",
    371       "authors": [
    372         "Caliskan, A.",
    373         "Bryson, J.J.",
    374         "Narayanan, A."
    375       ],
    376       "year": 2017,
    377       "doi": "10.1126/science.aal4230",
    378       "relevance": "Foundational work on Word Embedding Association Tests (WEAT) for measuring bias in language models; the LLM IAT methodology builds on this."
    379     },
    380     {
    381       "title": "Language Models are Few-Shot Learners",
    382       "authors": [
    383         "Brown, T.",
    384         "Mann, B.",
    385         "Ryder, N."
    386       ],
    387       "year": 2020,
    388       "arxiv_id": "2005.14165",
    389       "relevance": "GPT-3 paper; foundational work on few-shot learning in LLMs directly relevant to the few-shot learning experiment conducted."
    390     },
    391     {
    392       "title": "Language (Technology) is Power: A Critical Survey of 'Bias' in NLP",
    393       "authors": [
    394         "Blodgett, S.",
    395         "Barocas, S.",
    396         "Iii, H.",
    397         "Wallach, H."
    398       ],
    399       "year": 2020,
    400       "arxiv_id": "2005.14050",
    401       "relevance": "Critical survey of bias in NLP directly relevant to the paper's theoretical framing and methodology evaluation."
    402     },
    403     {
    404       "title": "'Kelly is a Warm Person, Joseph is a Role Model': Gender Biases in LLM-Generated Reference Letters",
    405       "authors": [
    406         "Wan, Y.",
    407         "Pu, G.",
    408         "Sun, J.",
    409         "Garimella, A.",
    410         "Chang, K.-W.",
    411         "Peng, N."
    412       ],
    413       "year": 2023,
    414       "doi": "10.48550/arXiv.2310.09219",
    415       "relevance": "Related work on gender bias in LLM open-ended generation; cited for finding that women receive warmer adjectives and men receive leadership descriptors in LLM-generated text."
    416     },
    417     {
    418       "title": "Challenging systematic prejudices: an investigation into bias against women and girls in large language models",
    419       "authors": [
    420         "van Niekerk, D.",
    421         "Pérez-Ortiz, M.",
    422         "Shawe-Taylor, J.",
    423         "Orlič, D.",
    424         "Drobnjak, I.",
    425         "Kay, J."
    426       ],
    427       "year": 2024,
    428       "relevance": "UNESCO report using word cloud visualizations to study gender bias in LLMs; directly related work that uses the same word generation analysis methodology."
    429     },
    430     {
    431       "title": "BiasAsker: Measuring the Bias in Conversational AI System",
    432       "authors": [
    433         "Wan, Y.",
    434         "Wang, W.",
    435         "He, P.",
    436         "Gu, J.",
    437         "Bai, H.",
    438         "Lyu, M."
    439       ],
    440       "year": 2023,
    441       "arxiv_id": "2305.12434",
    442       "relevance": "Related work on measuring bias in conversational AI systems; directly relevant to the methodology and scope of this paper."
    443     },
    444     {
    445       "title": "The Woman Worked as a Babysitter: On Biases in Language Generation",
    446       "authors": [
    447         "Sheng, E.",
    448         "Chang, K.-W.",
    449         "Natarajan, P.",
    450         "Peng, N."
    451       ],
    452       "year": 2019,
    453       "arxiv_id": "1909.01326",
    454       "relevance": "Early work on gender bias in language generation relevant to the paper's story generation experiments."
    455     },
    456     {
    457       "title": "A Survey on Fairness in Large Language Models",
    458       "authors": [
    459         "Li, Y.",
    460         "Du, M.",
    461         "Song, R.",
    462         "Wang, X.",
    463         "Wang, Y."
    464       ],
    465       "year": 2024,
    466       "doi": "10.48550/arXiv.2308.10149",
    467       "relevance": "Survey of fairness approaches in LLMs, directly relevant to the paper's comparative analysis of bias mitigation techniques."
    468     },
    469     {
    470       "title": "Lipstick on a Pig: Debiasing Methods Cover up Systematic Gender Biases in Word Embeddings But do not Remove Them",
    471       "authors": [
    472         "Gonen, H.",
    473         "Goldberg, Y."
    474       ],
    475       "year": 2019,
    476       "arxiv_id": "1903.03862",
    477       "relevance": "Cited to support the claim that debiasing methods may produce 'reverse discrimination' or superficial fixes rather than genuine bias removal."
    478     },
    479     {
    480       "title": "Co-Writing with Opinionated Language Models Affects Users' Views",
    481       "authors": [
    482         "Jakesch, M.",
    483         "Bhat, A.",
    484         "Buschek, D.",
    485         "Zalmanson, L.",
    486         "Naaman, M."
    487       ],
    488       "year": 2023,
    489       "doi": "10.1145/3544548.3581196",
    490       "relevance": "Relevant to the sycophancy finding — examines how interaction with opinionated LLMs affects human beliefs, directly related to the paper's theme of LLM influence on societal norms."
    491     }
    492   ]
    493 }

Impressum · Datenschutz