scan.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan.json (19216B)
      1 {
      2   "paper": {
      3     "title": "Responsible Artificial Intelligence for Earth Observation: Achievable and realistic paths to serve the collective good",
      4     "authors": ["Pedram Ghamisi", "Weikang Yu", "Andrea Marinoni", "Caroline M. Gevaert", "Claudio Persello", "Sivasakthy Selvakumaran", "Manuela Girotto", "Benjamin P. Horton", "Philippe Rufin", "Patrick Hostert", "Fabio Pacifici", "Peter M. Atkinson"],
      5     "year": 2024,
      6     "venue": "arXiv preprint / IEEE MGRS",
      7     "arxiv_id": "2405.20868",
      8     "doi": "10.1109/MGRS.2025.3529726"
      9   },
     10   "scan_version": 2,
     11   "active_modules": ["survey_methodology"],
     12   "methodology_tags": ["meta-analysis", "qualitative"],
     13   "key_findings": "This paper surveys responsible AI practices in Earth observation across five dimensions: mitigating unfair bias, AI security (adversarial defense, uncertainty, XAI), geo-privacy, ethical principles (scientific excellence, open data), and AI4EO for social good. It identifies specific challenges like spatial autocorrelation bias unique to geospatial data, privacy concerns with high-resolution UAV/satellite imagery, and the need for stakeholder co-creation. The paper provides two concrete application examples (early warning systems for mass movements, climate teleconnections) but presents no new empirical evaluation or systematic quantitative analysis.",
     14   "checklist": {
     15     "artifacts": {
     16       "code_released": {
     17         "applies": true,
     18         "answer": false,
     19         "justification": "No code or analysis scripts are released. No repository URL provided."
     20       },
     21       "data_released": {
     22         "applies": true,
     23         "answer": false,
     24         "justification": "No dataset or corpus of reviewed papers is released. The Google Scholar search described in Fig. 1 is not provided as structured data."
     25       },
     26       "environment_specified": {
     27         "applies": false,
     28         "answer": false,
     29         "justification": "This is a survey/review paper with no computational experiments requiring an environment."
     30       },
     31       "reproduction_instructions": {
     32         "applies": true,
     33         "answer": false,
     34         "justification": "No instructions for reproducing the literature search or analysis. The Google Scholar keyword search in Fig. 1 is loosely described but not reproducible."
     35       }
     36     },
     37     "statistical_methodology": {
     38       "confidence_intervals_or_error_bars": {
     39         "applies": false,
     40         "answer": false,
     41         "justification": "Survey paper with no statistical experiments. Fig. 1 shows publication counts but no statistical analysis."
     42       },
     43       "significance_tests": {
     44         "applies": false,
     45         "answer": false,
     46         "justification": "No statistical comparisons are made in this survey."
     47       },
     48       "effect_sizes_reported": {
     49         "applies": false,
     50         "answer": false,
     51         "justification": "No experiments producing effect sizes."
     52       },
     53       "sample_size_justified": {
     54         "applies": false,
     55         "answer": false,
     56         "justification": "No experimental sample involved."
     57       },
     58       "variance_reported": {
     59         "applies": false,
     60         "answer": false,
     61         "justification": "No experimental runs to report variance across."
     62       }
     63     },
     64     "evaluation_design": {
     65       "baselines_included": {
     66         "applies": true,
     67         "answer": false,
     68         "justification": "The survey does not compare itself against prior surveys of responsible AI in EO or position itself relative to specific prior reviews in a structured way."
     69       },
     70       "baselines_contemporary": {
     71         "applies": false,
     72         "answer": false,
     73         "justification": "No baseline comparison applies since no structured comparison with prior surveys is attempted."
     74       },
     75       "ablation_study": {
     76         "applies": false,
     77         "answer": false,
     78         "justification": "Survey paper — no system components to ablate."
     79       },
     80       "multiple_metrics": {
     81         "applies": false,
     82         "answer": false,
     83         "justification": "No evaluation metrics used — this is a narrative review."
     84       },
     85       "human_evaluation": {
     86         "applies": false,
     87         "answer": false,
     88         "justification": "No system outputs to evaluate."
     89       },
     90       "held_out_test_set": {
     91         "applies": false,
     92         "answer": false,
     93         "justification": "No test set involved."
     94       },
     95       "per_category_breakdown": {
     96         "applies": true,
     97         "answer": true,
     98         "justification": "The paper organizes its review into clear thematic categories (bias, security, privacy, ethics, social good) with dedicated sections for each."
     99       },
    100       "failure_cases_discussed": {
    101         "applies": true,
    102         "answer": true,
    103         "justification": "The paper discusses failure modes and challenges extensively: spatial autocorrelation biases (Section 2.3.2), adversarial attacks (Section 3.1.1), domain shift issues (Section 3.1.2), privacy violations from UAV imagery (Section 4.1), and stigmatization risks (Section 5.1)."
    104       },
    105       "negative_results_reported": {
    106         "applies": true,
    107         "answer": true,
    108         "justification": "The paper reports limitations of existing approaches: adversarial training only defends against specific attacks (Section 3.2.1), current XAI methods produce semantically misaligned visualizations (Section 3.3.3), and upscaling studies are lacking (Section 5.5)."
    109       }
    110     },
    111     "claims_and_evidence": {
    112       "abstract_claims_supported": {
    113         "applies": true,
    114         "answer": true,
    115         "justification": "The abstract claims to 'systematically define the intersection of AI and EO with a central focus on responsible AI practices' and identify 'critical components.' The paper delivers on this with dedicated sections for each component (bias, security, privacy, ethics, social good)."
    116       },
    117       "causal_claims_justified": {
    118         "applies": false,
    119         "answer": false,
    120         "justification": "The paper is a survey that does not make causal claims about its own work. It describes causal relationships from the literature (e.g., spatial autocorrelation causing overestimation) but attributes these to cited sources."
    121       },
    122       "generalization_bounded": {
    123         "applies": true,
    124         "answer": false,
    125         "justification": "The paper claims to be a 'pioneering effort to systematically define the intersection of AI and EO' but does not bound this claim — it does not specify which EO subfields, AI methods, or geographic contexts are covered vs excluded. The literature coverage is not described with explicit inclusion/exclusion criteria."
    126       },
    127       "alternative_explanations_discussed": {
    128         "applies": false,
    129         "answer": false,
    130         "justification": "This is a survey/taxonomy paper presenting no empirical results that would require alternative explanations."
    131       },
    132       "proxy_outcome_distinction": {
    133         "applies": false,
    134         "answer": false,
    135         "justification": "No measurements or proxies — this is a narrative review."
    136       }
    137     },
    138     "setup_transparency": {
    139       "model_versions_specified": {
    140         "applies": false,
    141         "answer": false,
    142         "justification": "No models are used in this survey."
    143       },
    144       "prompts_provided": {
    145         "applies": false,
    146         "answer": false,
    147         "justification": "No prompting used."
    148       },
    149       "hyperparameters_reported": {
    150         "applies": false,
    151         "answer": false,
    152         "justification": "No experiments with hyperparameters."
    153       },
    154       "scaffolding_described": {
    155         "applies": false,
    156         "answer": false,
    157         "justification": "No agentic scaffolding used."
    158       },
    159       "data_preprocessing_documented": {
    160         "applies": true,
    161         "answer": false,
    162         "justification": "The paper describes a Google Scholar search for Fig. 1 ('keywords: machine learning or deep learning and remote sensing') but provides no systematic review protocol, no inclusion/exclusion criteria for the papers discussed, and no documentation of how the reviewed literature was selected."
    163       }
    164     },
    165     "limitations_and_scope": {
    166       "limitations_section_present": {
    167         "applies": true,
    168         "answer": false,
    169         "justification": "There is no dedicated limitations section. Section 8 (Conclusions) acknowledges geopolitical complexities but does not discuss limitations of the review itself."
    170       },
    171       "threats_to_validity_specific": {
    172         "applies": true,
    173         "answer": false,
    174         "justification": "No specific threats to the validity of the review are discussed. The paper does not address potential selection bias in its literature coverage, language bias, or coverage gaps."
    175       },
    176       "scope_boundaries_stated": {
    177         "applies": true,
    178         "answer": false,
    179         "justification": "The paper claims broad coverage ('pioneering and thorough review') but does not state what is explicitly out of scope, which EO subfields or AI methods are excluded, or what geographic/temporal bounds apply to the literature reviewed."
    180       }
    181     },
    182     "data_integrity": {
    183       "raw_data_available": {
    184         "applies": true,
    185         "answer": false,
    186         "justification": "No raw data from the literature search or analysis is available for verification."
    187       },
    188       "data_collection_described": {
    189         "applies": true,
    190         "answer": false,
    191         "justification": "The paper mentions a Google Scholar search for publication counts (Fig. 1) but does not describe how the broader body of reviewed literature was collected or selected."
    192       },
    193       "recruitment_methods_described": {
    194         "applies": false,
    195         "answer": false,
    196         "justification": "No human participants. The data source is published literature, which is a standard corpus, though the selection process is undocumented."
    197       },
    198       "data_pipeline_documented": {
    199         "applies": true,
    200         "answer": false,
    201         "justification": "No pipeline from literature search to review synthesis is documented. The paper jumps from a general framing to thematic discussion without describing how papers were found, screened, or organized."
    202       }
    203     },
    204     "conflicts_of_interest": {
    205       "funding_disclosed": {
    206         "applies": true,
    207         "answer": false,
    208         "justification": "No funding acknowledgment section is present in the paper."
    209       },
    210       "affiliations_disclosed": {
    211         "applies": true,
    212         "answer": true,
    213         "justification": "All author affiliations are clearly listed, including Maxar Technologies (a commercial satellite provider) for Fabio Pacifici."
    214       },
    215       "funder_independent_of_outcome": {
    216         "applies": true,
    217         "answer": false,
    218         "justification": "No funding is disclosed, so independence cannot be assessed. One author is from Maxar Technologies, a commercial EO provider with a potential interest in the paper's conclusions about responsible AI in EO."
    219       },
    220       "financial_interests_declared": {
    221         "applies": true,
    222         "answer": false,
    223         "justification": "No competing interests or financial interests statement is present. Maxar Technologies is mentioned favorably in Section 7 (SpaceNet, ESG reports) by an author affiliated with Maxar."
    224       }
    225     },
    226     "contamination": {
    227       "training_cutoff_stated": {
    228         "applies": false,
    229         "answer": false,
    230         "justification": "Survey paper — no pre-trained model evaluated on any benchmark."
    231       },
    232       "train_test_overlap_discussed": {
    233         "applies": false,
    234         "answer": false,
    235         "justification": "Survey paper — no benchmark evaluation."
    236       },
    237       "benchmark_contamination_addressed": {
    238         "applies": false,
    239         "answer": false,
    240         "justification": "Survey paper — no benchmark evaluation."
    241       }
    242     },
    243     "human_studies": {
    244       "pre_registered": {
    245         "applies": false,
    246         "answer": false,
    247         "justification": "No human participants."
    248       },
    249       "irb_or_ethics_approval": {
    250         "applies": false,
    251         "answer": false,
    252         "justification": "No human participants."
    253       },
    254       "demographics_reported": {
    255         "applies": false,
    256         "answer": false,
    257         "justification": "No human participants."
    258       },
    259       "inclusion_exclusion_criteria": {
    260         "applies": false,
    261         "answer": false,
    262         "justification": "No human participants."
    263       },
    264       "randomization_described": {
    265         "applies": false,
    266         "answer": false,
    267         "justification": "No human participants."
    268       },
    269       "blinding_described": {
    270         "applies": false,
    271         "answer": false,
    272         "justification": "No human participants."
    273       },
    274       "attrition_reported": {
    275         "applies": false,
    276         "answer": false,
    277         "justification": "No human participants."
    278       }
    279     },
    280     "cost_and_practicality": {
    281       "inference_cost_reported": {
    282         "applies": false,
    283         "answer": false,
    284         "justification": "Survey paper — no method with inference costs."
    285       },
    286       "compute_budget_stated": {
    287         "applies": false,
    288         "answer": false,
    289         "justification": "Survey paper — no computational experiments."
    290       }
    291     },
    292     "survey_methodology": {
    293       "prisma_or_structured_protocol": {
    294         "applies": true,
    295         "answer": false,
    296         "justification": "No structured review protocol is followed. No PRISMA diagram, no registered protocol, no systematic search strategy with reproducible queries. The paper is a narrative review with ad-hoc paper selection."
    297       },
    298       "quality_assessment_of_sources": {
    299         "applies": true,
    300         "answer": false,
    301         "justification": "The survey does not assess the methodological quality of the papers it cites. All sources are treated equally regardless of their rigor."
    302       },
    303       "publication_bias_discussed": {
    304         "applies": true,
    305         "answer": false,
    306         "justification": "No discussion of publication bias in the reviewed literature. The survey does not consider whether its sources skew toward positive results about AI4EO."
    307       }
    308     }
    309   },
    310   "claims": [
    311     {
    312       "claim": "AI4EO publications in IEEE TGRS have surged dramatically since 2020, growing from ~500 in 2019 to ~2500 in 2023.",
    313       "evidence": "Fig. 1 shows publication counts from Google Scholar advanced search using keywords 'machine learning' or 'deep learning' and 'remote sensing' in IEEE TGRS from 2014-2023.",
    314       "supported": "moderate"
    315     },
    316     {
    317       "claim": "Spatial autocorrelation between training and testing samples causes overestimation of model accuracy in geospatial applications.",
    318       "evidence": "Cites Karasiak et al. (2022) [28] who demonstrated this effect. Section 2.3.2.",
    319       "supported": "strong"
    320     },
    321     {
    322       "claim": "Graph-based ensemble neural network approaches can deliver robust hindcasting and forecasting of mass movement impacts at local, regional, and national scales.",
    323       "evidence": "Section 6.1 cites Dimasaka et al. (2023) [142] showing results over 68,000 incidents since 1957 across Norwegian territory.",
    324       "supported": "weak"
    325     },
    326     {
    327       "claim": "The field has transitioned from singular focus on model-centric or data-centric approaches to a balanced data-model-centric paradigm.",
    328       "evidence": "Fig. 2 and Section 1 present this as the authors' opinion ('we believe'), supported by the rise of foundation models. No systematic evidence is provided.",
    329       "supported": "weak"
    330     }
    331   ],
    332   "red_flags": [
    333     {
    334       "flag": "No systematic review methodology",
    335       "detail": "The paper claims to be a 'pioneering and thorough review' but follows no structured review protocol (PRISMA, etc.). Paper selection appears ad-hoc with no documented search strategy, inclusion/exclusion criteria, or screening process."
    336     },
    337     {
    338       "flag": "Undisclosed conflict of interest",
    339       "detail": "Author Fabio Pacifici is affiliated with Maxar Technologies. Section 7 mentions Maxar favorably multiple times (SpaceNet co-founder, ESG reports). No competing interests statement addresses this."
    340     },
    341     {
    342       "flag": "No quality assessment of reviewed sources",
    343       "detail": "The survey does not assess the methodological quality of cited works. All sources are treated as equally reliable, potentially laundering weak results alongside strong ones."
    344     },
    345     {
    346       "flag": "Claims outrun evidence",
    347       "detail": "The paper calls itself 'a pioneering effort to systematically define the intersection of AI and EO' but it is a narrative review, not a systematic one. The word 'systematically' is not justified by the methodology."
    348     }
    349   ],
    350   "cited_papers": [
    351     {
    352       "title": "Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification",
    353       "authors": ["Joy Buolamwini", "Timnit Gebru"],
    354       "year": 2018,
    355       "relevance": "Foundational work on AI bias in facial recognition, relevant to AI fairness and responsible AI evaluation."
    356     },
    357     {
    358       "title": "A framework for understanding sources of harm throughout the machine learning life cycle",
    359       "authors": ["Harini Suresh", "John Guttag"],
    360       "year": 2021,
    361       "relevance": "Framework for understanding ML bias types (historical, representation, measurement, etc.) relevant to AI methodology quality."
    362     },
    363     {
    364       "title": "Are Emergent Abilities of Large Language Models a Mirage?",
    365       "authors": ["Rylan Schaeffer", "Brando Miranda", "Sanmi Koyejo"],
    366       "year": 2023,
    367       "arxiv_id": "2304.15004",
    368       "relevance": "Questions whether LLM emergent abilities are artifacts of evaluation metrics — directly relevant to AI evaluation methodology."
    369     },
    370     {
    371       "title": "On the Opportunities and Risks of Foundation Models",
    372       "authors": ["Rishi Bommasani"],
    373       "year": 2021,
    374       "relevance": "Comprehensive analysis of foundation model risks and opportunities, relevant to AI safety and responsible deployment."
    375     },
    376     {
    377       "title": "Universal adversarial examples in remote sensing: Methodology and benchmark",
    378       "authors": ["Yonghao Xu", "Pedram Ghamisi"],
    379       "year": 2022,
    380       "relevance": "Benchmark for adversarial robustness in remote sensing AI, relevant to AI security evaluation methodology."
    381     },
    382     {
    383       "title": "Tackling climate change with machine learning",
    384       "authors": ["David Rolnick"],
    385       "year": 2022,
    386       "relevance": "Survey of ML applications for climate change, relevant to AI for social good evaluation."
    387     },
    388     {
    389       "title": "Large Language Models are Geographically Biased",
    390       "authors": ["Rohin Manvi", "Samar Khanna", "Marshall Burke", "David Lobell", "Stefano Ermon"],
    391       "year": 2024,
    392       "relevance": "Documents geographic bias in LLMs, directly relevant to AI bias and fairness research methodology."
    393     },
    394     {
    395       "title": "Deep learning in remote sensing: A comprehensive review and list of resources",
    396       "authors": ["Xiao Xiang Zhu"],
    397       "year": 2017,
    398       "relevance": "Major survey of deep learning in remote sensing, relevant as a methodological comparison for AI survey quality."
    399     }
    400   ]
    401 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs