scan.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan.json (24554B)
      1 {
      2   "paper": {
      3     "title": "Systematic Literature Review on Generative AI: Ethical Challenges and Opportunities",
      4     "authors": ["Feliks Prasepta Sejahtera Surbakti"],
      5     "year": 2025,
      6     "venue": "International Journal of Advanced Computer Science and Applications (IJACSA)",
      7     "doi": "10.14569/ijacsa.2025.0160530"
      8   },
      9   "scan_version": 3,
     10   "active_modules": ["survey_methodology"],
     11   "methodology_tags": ["meta-analysis"],
     12   "key_findings": "This SLR of 112 peer-reviewed articles identifies five core ethical challenges in generative AI: algorithmic bias, misinformation/deepfakes, data privacy violations, intellectual property issues, and accountability/explainability. The review finds that GAI ethics research is heavily fragmented across disciplines with inconsistent terminology and limited empirical validation. The paper also identifies opportunities for ethical innovation through responsible design, inclusive governance, and interdisciplinary collaboration, and notes a dramatic surge in publications in 2024 (58 articles).",
     13   "checklist": {
     14     "artifacts": {
     15       "code_released": {
     16         "applies": true,
     17         "answer": false,
     18         "justification": "No analysis code or scripts are released. A survey can release its analysis code (e.g., coding scripts, bibliometric tools), but none is provided."
     19       },
     20       "data_released": {
     21         "applies": true,
     22         "answer": false,
     23         "justification": "The full list of 112 reviewed articles is not provided as a downloadable dataset. Table I shows only 10 of 112 entries. No supplementary materials or data files are referenced."
     24       },
     25       "environment_specified": {
     26         "applies": true,
     27         "answer": false,
     28         "justification": "No computational environment is specified. If any software tools were used for the thematic analysis or bibliometric analysis, they are not mentioned."
     29       },
     30       "reproduction_instructions": {
     31         "applies": true,
     32         "answer": false,
     33         "justification": "While the search strategy and PRISMA flow are described, there are no step-by-step reproduction instructions. The search query is provided but the full list of included papers is not, making independent reproduction impossible."
     34       }
     35     },
     36     "statistical_methodology": {
     37       "confidence_intervals_or_error_bars": {
     38         "applies": false,
     39         "answer": false,
     40         "justification": "This is a thematic literature review with no statistical analysis. No quantitative experiments are performed that would require confidence intervals."
     41       },
     42       "significance_tests": {
     43         "applies": false,
     44         "answer": false,
     45         "justification": "The paper performs thematic synthesis, not statistical analysis. No comparative statistical claims are made."
     46       },
     47       "effect_sizes_reported": {
     48         "applies": false,
     49         "answer": false,
     50         "justification": "No experimental comparisons are made. The paper reports article counts by category but these are descriptive, not effect sizes."
     51       },
     52       "sample_size_justified": {
     53         "applies": false,
     54         "answer": false,
     55         "justification": "As a thematic literature review, sample size justification in the experimental sense is not applicable. The corpus size of 112 is a result of the search/filter process, not a design choice."
     56       },
     57       "variance_reported": {
     58         "applies": false,
     59         "answer": false,
     60         "justification": "No experimental runs or repeated measurements are conducted. This is a qualitative thematic synthesis."
     61       }
     62     },
     63     "evaluation_design": {
     64       "baselines_included": {
     65         "applies": true,
     66         "answer": false,
     67         "justification": "Section II.D discusses related systematic and scoping reviews (Hagendorff 2024, Tabassum et al. 2025, Al-kfairy et al. 2024, Zhang & Boulos 2023) but does not systematically compare its findings, coverage, or methodology against them. They are positioned as related work, not as baselines for comparison."
     68       },
     69       "baselines_contemporary": {
     70         "applies": true,
     71         "answer": false,
     72         "justification": "No formal baseline comparison is conducted, so contemporaneity of baselines cannot be assessed."
     73       },
     74       "ablation_study": {
     75         "applies": false,
     76         "answer": false,
     77         "justification": "This is a literature review with no system components to ablate."
     78       },
     79       "multiple_metrics": {
     80         "applies": false,
     81         "answer": false,
     82         "justification": "No experimental evaluation metrics are used. The paper performs qualitative thematic analysis."
     83       },
     84       "human_evaluation": {
     85         "applies": false,
     86         "answer": false,
     87         "justification": "No system outputs to evaluate. This is a literature review."
     88       },
     89       "held_out_test_set": {
     90         "applies": false,
     91         "answer": false,
     92         "justification": "No experimental test sets are used. This is a qualitative literature review."
     93       },
     94       "per_category_breakdown": {
     95         "applies": true,
     96         "answer": true,
     97         "justification": "Findings are broken down by ethical challenge category (bias, misinformation, privacy, IP, accountability), by domain (healthcare, education, media, law), by publication year (Fig. 1), by subject area (Fig. 2), by journal (Fig. 3), and by article type (Fig. 4)."
     98       },
     99       "failure_cases_discussed": {
    100         "applies": true,
    101         "answer": true,
    102         "justification": "The paper identifies gaps and weaknesses in the reviewed literature, including fragmented approaches, lack of empirical grounding, and disproportionate focus on risks over solutions (Section V.C). This functions as discussion of 'failure cases' in the surveyed field."
    103       },
    104       "negative_results_reported": {
    105         "applies": true,
    106         "answer": true,
    107         "justification": "The paper reports several negative findings: the research landscape is fragmented, most studies lack empirical validation, current frameworks are inconsistent, and the literature is heavily skewed toward risk identification rather than solutions (Sections IV.D, V.C)."
    108       }
    109     },
    110     "claims_and_evidence": {
    111       "abstract_claims_supported": {
    112         "applies": true,
    113         "answer": true,
    114         "justification": "The abstract's main claims — five primary ethical challenges, fragmented landscape, limited empirical validation, and emerging opportunities — are all supported by the thematic analysis presented in Sections IV and V."
    115       },
    116       "causal_claims_justified": {
    117         "applies": false,
    118         "answer": false,
    119         "justification": "The paper makes no causal claims. It synthesizes and categorizes existing literature thematically without claiming causal relationships between variables."
    120       },
    121       "generalization_bounded": {
    122         "applies": true,
    123         "answer": false,
    124         "justification": "The title claims a comprehensive 'Systematic Literature Review on Generative AI: Ethical Challenges and Opportunities' but the search was limited to a single database (ScienceDirect). The paper acknowledges ScienceDirect as a limitation in one sentence ('While recognizing that ethical discussions on GAI may also exist in other databases') but still makes broad claims about the state of the field without adequately bounding them to this single-source scope."
    125       },
    126       "alternative_explanations_discussed": {
    127         "applies": true,
    128         "answer": false,
    129         "justification": "The paper does not consider alternative interpretations of its thematic findings. For example, the observed fragmentation could reflect genuine disciplinary diversity rather than a problem, but this is not explored."
    130       },
    131       "proxy_outcome_distinction": {
    132         "applies": true,
    133         "answer": true,
    134         "justification": "The paper's claims match the granularity of its analysis. It claims to identify themes in the literature and presents those themes. No proxy gap exists between what was measured (thematic categories in 112 papers) and what is claimed."
    135       }
    136     },
    137     "setup_transparency": {
    138       "model_versions_specified": {
    139         "applies": false,
    140         "answer": false,
    141         "justification": "No AI models are used in the study methodology. This is a manual literature review."
    142       },
    143       "prompts_provided": {
    144         "applies": false,
    145         "answer": false,
    146         "justification": "No prompting is used. This is a manual literature review."
    147       },
    148       "hyperparameters_reported": {
    149         "applies": false,
    150         "answer": false,
    151         "justification": "No computational hyperparameters are relevant to this manual literature review."
    152       },
    153       "scaffolding_described": {
    154         "applies": false,
    155         "answer": false,
    156         "justification": "No agentic scaffolding is used. This is a manual literature review."
    157       },
    158       "data_preprocessing_documented": {
    159         "applies": true,
    160         "answer": true,
    161         "justification": "The paper documents the PRISMA-based selection pipeline with counts and criteria: 145 initial articles → 12 non-peer-reviewed excluded → 133 screened → 9 removed (not meeting inclusion criteria) → 124 full-text assessed → 6 excluded (insufficient ethical focus) → 112 final. Inclusion/exclusion criteria are stated in Section III.E."
    162       }
    163     },
    164     "limitations_and_scope": {
    165       "limitations_section_present": {
    166         "applies": true,
    167         "answer": false,
    168         "justification": "There is no dedicated limitations section discussing the study's own methodological limitations. The paper discusses gaps and limitations in the reviewed literature (Sections II.E, V.C), but apart from a one-sentence aside that relevant work may exist in other databases, it does not discuss its own limitations such as the single-database search strategy."
    169       },
    170       "threats_to_validity_specific": {
    171         "applies": true,
    172         "answer": false,
    173         "justification": "No threats to the validity of this study's own methodology are discussed. The paper does not address risks such as selection bias from using only ScienceDirect, potential subjectivity in thematic coding, or the impact of the narrow search terms."
    174       },
    175       "scope_boundaries_stated": {
    176         "applies": true,
    177         "answer": false,
    178         "justification": "While the search scope is defined (ScienceDirect, 2021-2025, English, peer-reviewed), the paper does not explicitly state what its findings do NOT show. The conclusions make broad claims about the GAI ethics landscape without bounding them to the single-database, single-search-string scope."
    179       }
    180     },
    181     "data_integrity": {
    182       "raw_data_available": {
    183         "applies": true,
    184         "answer": false,
    185         "justification": "Only 10 of 112 reviewed articles are shown in Table I. The full dataset of extracted data (bibliographic details, ethical themes, quality scores) is not available for independent verification."
    186       },
    187       "data_collection_described": {
    188         "applies": true,
    189         "answer": true,
    190         "justification": "The data collection procedure is described in Section III.D: ScienceDirect search using Boolean operators combining 'generative AI', 'ethics', 'challenges', and 'opportunities', limited to peer-reviewed journals in English from 2021-2025."
    191       },
    192       "recruitment_methods_described": {
    193         "applies": true,
    194         "answer": true,
    195         "justification": "The paper selection process is described: structured search on ScienceDirect with specific Boolean queries, followed by PRISMA-guided screening at three stages (identification, screening, eligibility). The search strategy and selection criteria are documented."
    196       },
    197       "data_pipeline_documented": {
    198         "applies": true,
    199         "answer": true,
    200         "justification": "The PRISMA flow is documented with counts at each stage: 145 → 133 (12 non-peer-reviewed removed) → 124 (9 not meeting criteria removed) → 112 (6 insufficient ethical focus removed). Note that the final step does not reconcile as stated (124 - 6 = 118, not 112), so a further exclusion step appears to be unaccounted for. Data extraction form contents and dual-reviewer process are described in Section III.G."
    201       }
    202     },
    203     "conflicts_of_interest": {
    204       "funding_disclosed": {
    205         "applies": true,
    206         "answer": false,
    207         "justification": "No funding information is provided anywhere in the paper. There is no acknowledgments section mentioning grants or sponsors."
    208       },
    209       "affiliations_disclosed": {
    210         "applies": true,
    211         "answer": true,
    212         "justification": "The author's affiliation is clearly listed: Industrial Engineering Department, Atma Jaya Catholic University of Indonesia, Jakarta, Indonesia."
    213       },
    214       "funder_independent_of_outcome": {
    215         "applies": true,
    216         "answer": false,
    217         "justification": "No funding is disclosed, so independence of funding cannot be verified."
    218       },
    219       "financial_interests_declared": {
    220         "applies": true,
    221         "answer": false,
    222         "justification": "No competing interests or financial interests statement is present in the paper."
    223       }
    224     },
    225     "contamination": {
    226       "training_cutoff_stated": {
    227         "applies": false,
    228         "answer": false,
    229         "justification": "This is a literature review that does not evaluate any pre-trained model's capability on a benchmark."
    230       },
    231       "train_test_overlap_discussed": {
    232         "applies": false,
    233         "answer": false,
    234         "justification": "This is a literature review that does not evaluate any pre-trained model on a benchmark."
    235       },
    236       "benchmark_contamination_addressed": {
    237         "applies": false,
    238         "answer": false,
    239         "justification": "This is a literature review that does not evaluate any pre-trained model on a benchmark."
    240       }
    241     },
    242     "human_studies": {
    243       "pre_registered": {
    244         "applies": false,
    245         "answer": false,
    246         "justification": "No human participants in this study. This is a systematic literature review."
    247       },
    248       "irb_or_ethics_approval": {
    249         "applies": false,
    250         "answer": false,
    251         "justification": "No human participants in this study."
    252       },
    253       "demographics_reported": {
    254         "applies": false,
    255         "answer": false,
    256         "justification": "No human participants in this study."
    257       },
    258       "inclusion_exclusion_criteria": {
    259         "applies": false,
    260         "answer": false,
    261         "justification": "No human participants in this study."
    262       },
    263       "randomization_described": {
    264         "applies": false,
    265         "answer": false,
    266         "justification": "No human participants in this study."
    267       },
    268       "blinding_described": {
    269         "applies": false,
    270         "answer": false,
    271         "justification": "No human participants in this study."
    272       },
    273       "attrition_reported": {
    274         "applies": false,
    275         "answer": false,
    276         "justification": "No human participants in this study."
    277       }
    278     },
    279     "cost_and_practicality": {
    280       "inference_cost_reported": {
    281         "applies": false,
    282         "answer": false,
    283         "justification": "This is a survey paper with no computational method to cost."
    284       },
    285       "compute_budget_stated": {
    286         "applies": false,
    287         "answer": false,
    288         "justification": "This is a survey paper with no computational budget."
    289       }
    290     },
    291     "survey_methodology": {
    292       "prisma_or_structured_protocol": {
    293         "applies": true,
    294         "answer": true,
    295         "justification": "The paper explicitly follows PRISMA 2020 guidelines (citing Page et al. 2021) and uses a structured SLR protocol based on Kitchenham et al. (2007) and Okoli (2015). The PRISMA flow with stage counts is described in Section III.F."
    296       },
    297       "quality_assessment_of_sources": {
    298         "applies": true,
    299         "answer": true,
    300         "justification": "A CASP-based quality assessment checklist is used with five criteria (clarity of objective, relevance to GAI ethics, methodological soundness, contribution, transparency of limitations), each scored 0-1, with a minimum threshold of 3/5 for inclusion. Two reviewers independently assessed all articles (Section III.H)."
    301       },
    302       "publication_bias_discussed": {
    303         "applies": true,
    304         "answer": false,
    305         "justification": "The paper does not discuss publication bias. There are no funnel plots, no discussion of negative-result underrepresentation, and no acknowledgment that published GAI ethics papers may skew toward identifying risks over reporting neutral or positive findings."
    306       }
    307     }
    308   },
    309   "claims": [
    310     {
    311       "claim": "Five primary ethical challenges dominate GAI discourse: algorithmic bias, misinformation/deepfakes, data privacy violations, intellectual property issues, and accountability/explainability.",
    312       "evidence": "Identified through thematic analysis of 112 peer-reviewed articles using open and axial coding (Section IV.B). Each challenge is discussed with citations to supporting studies.",
    313       "supported": "moderate"
    314     },
    315     {
    316       "claim": "The GAI ethics research landscape is fragmented across disciplines with limited empirical validation and inconsistent ethical frameworks.",
    317       "evidence": "Section V.C discusses cross-disciplinary fragmentation, citing Hagendorff (2024) who 'concluded that terminological and methodological fragmentation hinders ethical progress.' The paper notes 'most articles focus disproportionately on ethical risks' and there is 'a notable scarcity of empirical research.'",
    318       "supported": "moderate"
    319     },
    320     {
    321       "claim": "Publication interest in GAI ethics surged dramatically in 2024, with 58 articles published.",
    322       "evidence": "Bibliometric analysis presented in Fig. 1 shows: 2022 (n=1), 2023 (n=5), 2024 (n=58), 2025 (n=48). However, these counts are from a single database (ScienceDirect) with specific search terms.",
    323       "supported": "moderate"
    324     },
    325     {
    326       "claim": "GAI can be ethically harnessed to promote inclusive innovation, assistive technologies, and human-AI creative collaboration.",
    327       "evidence": "Section IV.C and V.B cite studies on democratizing creativity, assistive technologies for people with disabilities (Elyoseph et al. 2024), and human-centered design principles. However, these are drawn from the reviewed literature, not original empirical findings.",
    328       "supported": "weak"
    329     }
    330   ],
    331   "red_flags": [
    332     {
    333       "flag": "Single database search",
    334       "detail": "The review searched only ScienceDirect, excluding major sources like Scopus, Web of Science, IEEE Xplore, ACM Digital Library, PubMed, and arXiv. For a 'systematic' review claiming to map the ethical landscape of GAI, this severely limits coverage and introduces selection bias. The paper acknowledges this briefly but does not treat it as a significant limitation."
    335     },
    336     {
    337       "flag": "No self-limitations section",
    338       "detail": "The paper discusses gaps in the reviewed literature extensively but, beyond a passing remark about other databases, never substantively addresses the methodological limitations of its own study. A systematic review that does not discuss its own threats to validity (single database, narrow search terms, potential coding subjectivity) is a significant omission."
    339     },
    340     {
    341       "flag": "Inconsistent date range",
    342       "detail": "The abstract and methodology give the review period as between '2021 and 2025,' but the conclusion states 'between 2018 and early 2025.' This inconsistency undermines confidence in the review's rigor."
    343     },
    344     {
    345       "flag": "Incomplete data presentation",
    346       "detail": "Table I shows only 10 of 112 reviewed articles. Without the full dataset, the thematic findings cannot be independently verified. The quality assessment scores are never reported, making it impossible to assess the actual quality distribution of included studies."
    347     },
    348     {
    349       "flag": "Dual-reviewer claim without evidence",
    350       "detail": "The paper claims 'two reviewers independently extracted data' and independently assessed quality (Section III.G-H), but this is a single-author paper. The identity of any reviewer other than the author is never disclosed, and no inter-rater reliability statistics are reported."
    351     },
    352     {
    353       "flag": "Shallow thematic synthesis",
    354       "detail": "The five identified ethical themes (bias, misinformation, privacy, IP, accountability) are well-established in the literature and could be identified without a systematic review. The paper adds little novel synthesis beyond cataloging known concerns, which is the 'laundering signal-to-noise ratio' problem for surveys."
    355     }
    356   ],
    357   "cited_papers": [
    358     {
    359       "title": "Language models are few-shot learners",
    360       "authors": ["T. Brown", "B. Mann", "N. Ryder"],
    361       "year": 2020,
    362       "relevance": "Foundational GPT-3 paper relevant to understanding large language model capabilities that underpin generative AI."
    363     },
    364     {
    365       "title": "Attention is all you need",
    366       "authors": ["A. Vaswani", "N. Shazeer", "N. Parmar"],
    367       "year": 2017,
    368       "relevance": "Foundational Transformer architecture paper underlying all modern generative AI models."
    369     },
    370     {
    371       "title": "On the dangers of stochastic parrots: Can language models be too big?",
    372       "authors": ["E. M. Bender", "T. Gebru", "A. McMillan-Major", "S. Shmitchell"],
    373       "relevance": "Seminal paper on ethical risks of large language models including bias, environmental costs, and misleading outputs."
    374     },
    375     {
    376       "title": "A comprehensive empirical study of bias mitigation methods for machine learning classifiers",
    377       "authors": ["Z. Chen", "J. M. Zhang", "F. Sarro", "M. Harman"],
    378       "year": 2023,
    379       "relevance": "Empirical study of bias mitigation methods for ML classifiers, directly relevant to AI fairness evaluation."
    380     },
    381     {
    382       "title": "Towards A Rigorous Science of Interpretable Machine Learning",
    383       "authors": ["F. Doshi-Velez", "B. Kim"],
    384       "year": 2017,
    385       "relevance": "Foundational paper on AI explainability and interpretability, relevant to accountability and transparency in AI systems."
    386     },
    387     {
    388       "title": "Mapping the ethics of generative ai: A comprehensive scoping review",
    389       "authors": ["T. Hagendorff"],
    390       "year": 2024,
    391       "relevance": "Closely related scoping review categorizing GAI ethical concerns into nineteen thematic areas, directly comparable to this survey."
    392     },
    393     {
    394       "title": "ChatGPT: A comprehensive review on background, applications, key challenges, bias, ethics, limitations and future scope",
    395       "authors": ["P. P. Ray"],
    396       "year": 2023,
    397       "relevance": "Comprehensive review of ChatGPT covering capabilities, ethics, and limitations relevant to LLM evaluation and safety."
    398     },
    399     {
    400       "title": "Ethical challenges and solutions of generative AI: An interdisciplinary perspective",
    401       "authors": ["M. Al-kfairy", "D. Mustafa", "N. Kshetri", "M. Insiew", "O. Alfandi"],
    402       "year": 2024,
    403       "relevance": "Cross-sectoral review of GAI ethical challenges across industries, directly relevant to AI governance and responsible development."
    404     },
    405     {
    406       "title": "Generative AI and the Metaverse: A Scoping Review of Ethical and Legal Challenges",
    407       "authors": ["A. Tabassum", "E. Elmahjub", "A. I. Padela", "A. Zwitter", "J. Qadir"],
    408       "year": 2025,
    409       "relevance": "Scoping review of GAI ethical and legal challenges in metaverse applications including bias, disinformation, and privacy."
    410     }
    411   ],
    412   "engagement_factors": {
    413     "practical_relevance": {
    414       "score": 0,
    415       "justification": "Pure literature review with no actionable tool, technique, or framework that practitioners could apply."
    416     },
    417     "surprise_contrarian": {
    418       "score": 0,
    419       "justification": "Findings confirm well-established ethical concerns about generative AI (bias, privacy, misinformation) without challenging any conventional wisdom."
    420     },
    421     "fear_safety": {
    422       "score": 1,
    423       "justification": "Discusses AI safety concerns like deepfakes and misinformation but presents no novel threats or demonstrations beyond what is already widely known."
    424     },
    425     "drama_conflict": {
    426       "score": 0,
    427       "justification": "No controversy, no challenge to specific actors, no dramatic framing."
    428     },
    429     "demo_ability": {
    430       "score": 0,
    431       "justification": "No code, demo, or interactive component."
    432     },
    433     "brand_recognition": {
    434       "score": 0,
    435       "justification": "Published in IJACSA by a solo author at Atma Jaya Catholic University of Indonesia; no major lab or product involvement."
    436     }
    437   }
    438 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs