scan.json (19216B)
1 { 2 "paper": { 3 "title": "Responsible Artificial Intelligence for Earth Observation: Achievable and realistic paths to serve the collective good", 4 "authors": ["Pedram Ghamisi", "Weikang Yu", "Andrea Marinoni", "Caroline M. Gevaert", "Claudio Persello", "Sivasakthy Selvakumaran", "Manuela Girotto", "Benjamin P. Horton", "Philippe Rufin", "Patrick Hostert", "Fabio Pacifici", "Peter M. Atkinson"], 5 "year": 2024, 6 "venue": "arXiv preprint / IEEE MGRS", 7 "arxiv_id": "2405.20868", 8 "doi": "10.1109/MGRS.2025.3529726" 9 }, 10 "scan_version": 2, 11 "active_modules": ["survey_methodology"], 12 "methodology_tags": ["meta-analysis", "qualitative"], 13 "key_findings": "This paper surveys responsible AI practices in Earth observation across five dimensions: mitigating unfair bias, AI security (adversarial defense, uncertainty, XAI), geo-privacy, ethical principles (scientific excellence, open data), and AI4EO for social good. It identifies specific challenges like spatial autocorrelation bias unique to geospatial data, privacy concerns with high-resolution UAV/satellite imagery, and the need for stakeholder co-creation. The paper provides two concrete application examples (early warning systems for mass movements, climate teleconnections) but presents no new empirical evaluation or systematic quantitative analysis.", 14 "checklist": { 15 "artifacts": { 16 "code_released": { 17 "applies": true, 18 "answer": false, 19 "justification": "No code or analysis scripts are released. No repository URL provided." 20 }, 21 "data_released": { 22 "applies": true, 23 "answer": false, 24 "justification": "No dataset or corpus of reviewed papers is released. The Google Scholar search described in Fig. 1 is not provided as structured data." 25 }, 26 "environment_specified": { 27 "applies": false, 28 "answer": false, 29 "justification": "This is a survey/review paper with no computational experiments requiring an environment." 30 }, 31 "reproduction_instructions": { 32 "applies": true, 33 "answer": false, 34 "justification": "No instructions for reproducing the literature search or analysis. The Google Scholar keyword search in Fig. 1 is loosely described but not reproducible." 35 } 36 }, 37 "statistical_methodology": { 38 "confidence_intervals_or_error_bars": { 39 "applies": false, 40 "answer": false, 41 "justification": "Survey paper with no statistical experiments. Fig. 1 shows publication counts but no statistical analysis." 42 }, 43 "significance_tests": { 44 "applies": false, 45 "answer": false, 46 "justification": "No statistical comparisons are made in this survey." 47 }, 48 "effect_sizes_reported": { 49 "applies": false, 50 "answer": false, 51 "justification": "No experiments producing effect sizes." 52 }, 53 "sample_size_justified": { 54 "applies": false, 55 "answer": false, 56 "justification": "No experimental sample involved." 57 }, 58 "variance_reported": { 59 "applies": false, 60 "answer": false, 61 "justification": "No experimental runs to report variance across." 62 } 63 }, 64 "evaluation_design": { 65 "baselines_included": { 66 "applies": true, 67 "answer": false, 68 "justification": "The survey does not compare itself against prior surveys of responsible AI in EO or position itself relative to specific prior reviews in a structured way." 69 }, 70 "baselines_contemporary": { 71 "applies": false, 72 "answer": false, 73 "justification": "No baseline comparison applies since no structured comparison with prior surveys is attempted." 74 }, 75 "ablation_study": { 76 "applies": false, 77 "answer": false, 78 "justification": "Survey paper — no system components to ablate." 79 }, 80 "multiple_metrics": { 81 "applies": false, 82 "answer": false, 83 "justification": "No evaluation metrics used — this is a narrative review." 84 }, 85 "human_evaluation": { 86 "applies": false, 87 "answer": false, 88 "justification": "No system outputs to evaluate." 89 }, 90 "held_out_test_set": { 91 "applies": false, 92 "answer": false, 93 "justification": "No test set involved." 94 }, 95 "per_category_breakdown": { 96 "applies": true, 97 "answer": true, 98 "justification": "The paper organizes its review into clear thematic categories (bias, security, privacy, ethics, social good) with dedicated sections for each." 99 }, 100 "failure_cases_discussed": { 101 "applies": true, 102 "answer": true, 103 "justification": "The paper discusses failure modes and challenges extensively: spatial autocorrelation biases (Section 2.3.2), adversarial attacks (Section 3.1.1), domain shift issues (Section 3.1.2), privacy violations from UAV imagery (Section 4.1), and stigmatization risks (Section 5.1)." 104 }, 105 "negative_results_reported": { 106 "applies": true, 107 "answer": true, 108 "justification": "The paper reports limitations of existing approaches: adversarial training only defends against specific attacks (Section 3.2.1), current XAI methods produce semantically misaligned visualizations (Section 3.3.3), and upscaling studies are lacking (Section 5.5)." 109 } 110 }, 111 "claims_and_evidence": { 112 "abstract_claims_supported": { 113 "applies": true, 114 "answer": true, 115 "justification": "The abstract claims to 'systematically define the intersection of AI and EO with a central focus on responsible AI practices' and identify 'critical components.' The paper delivers on this with dedicated sections for each component (bias, security, privacy, ethics, social good)." 116 }, 117 "causal_claims_justified": { 118 "applies": false, 119 "answer": false, 120 "justification": "The paper is a survey that does not make causal claims about its own work. It describes causal relationships from the literature (e.g., spatial autocorrelation causing overestimation) but attributes these to cited sources." 121 }, 122 "generalization_bounded": { 123 "applies": true, 124 "answer": false, 125 "justification": "The paper claims to be a 'pioneering effort to systematically define the intersection of AI and EO' but does not bound this claim — it does not specify which EO subfields, AI methods, or geographic contexts are covered vs excluded. The literature coverage is not described with explicit inclusion/exclusion criteria." 126 }, 127 "alternative_explanations_discussed": { 128 "applies": false, 129 "answer": false, 130 "justification": "This is a survey/taxonomy paper presenting no empirical results that would require alternative explanations." 131 }, 132 "proxy_outcome_distinction": { 133 "applies": false, 134 "answer": false, 135 "justification": "No measurements or proxies — this is a narrative review." 136 } 137 }, 138 "setup_transparency": { 139 "model_versions_specified": { 140 "applies": false, 141 "answer": false, 142 "justification": "No models are used in this survey." 143 }, 144 "prompts_provided": { 145 "applies": false, 146 "answer": false, 147 "justification": "No prompting used." 148 }, 149 "hyperparameters_reported": { 150 "applies": false, 151 "answer": false, 152 "justification": "No experiments with hyperparameters." 153 }, 154 "scaffolding_described": { 155 "applies": false, 156 "answer": false, 157 "justification": "No agentic scaffolding used." 158 }, 159 "data_preprocessing_documented": { 160 "applies": true, 161 "answer": false, 162 "justification": "The paper describes a Google Scholar search for Fig. 1 ('keywords: machine learning or deep learning and remote sensing') but provides no systematic review protocol, no inclusion/exclusion criteria for the papers discussed, and no documentation of how the reviewed literature was selected." 163 } 164 }, 165 "limitations_and_scope": { 166 "limitations_section_present": { 167 "applies": true, 168 "answer": false, 169 "justification": "There is no dedicated limitations section. Section 8 (Conclusions) acknowledges geopolitical complexities but does not discuss limitations of the review itself." 170 }, 171 "threats_to_validity_specific": { 172 "applies": true, 173 "answer": false, 174 "justification": "No specific threats to the validity of the review are discussed. The paper does not address potential selection bias in its literature coverage, language bias, or coverage gaps." 175 }, 176 "scope_boundaries_stated": { 177 "applies": true, 178 "answer": false, 179 "justification": "The paper claims broad coverage ('pioneering and thorough review') but does not state what is explicitly out of scope, which EO subfields or AI methods are excluded, or what geographic/temporal bounds apply to the literature reviewed." 180 } 181 }, 182 "data_integrity": { 183 "raw_data_available": { 184 "applies": true, 185 "answer": false, 186 "justification": "No raw data from the literature search or analysis is available for verification." 187 }, 188 "data_collection_described": { 189 "applies": true, 190 "answer": false, 191 "justification": "The paper mentions a Google Scholar search for publication counts (Fig. 1) but does not describe how the broader body of reviewed literature was collected or selected." 192 }, 193 "recruitment_methods_described": { 194 "applies": false, 195 "answer": false, 196 "justification": "No human participants. The data source is published literature, which is a standard corpus, though the selection process is undocumented." 197 }, 198 "data_pipeline_documented": { 199 "applies": true, 200 "answer": false, 201 "justification": "No pipeline from literature search to review synthesis is documented. The paper jumps from a general framing to thematic discussion without describing how papers were found, screened, or organized." 202 } 203 }, 204 "conflicts_of_interest": { 205 "funding_disclosed": { 206 "applies": true, 207 "answer": false, 208 "justification": "No funding acknowledgment section is present in the paper." 209 }, 210 "affiliations_disclosed": { 211 "applies": true, 212 "answer": true, 213 "justification": "All author affiliations are clearly listed, including Maxar Technologies (a commercial satellite provider) for Fabio Pacifici." 214 }, 215 "funder_independent_of_outcome": { 216 "applies": true, 217 "answer": false, 218 "justification": "No funding is disclosed, so independence cannot be assessed. One author is from Maxar Technologies, a commercial EO provider with a potential interest in the paper's conclusions about responsible AI in EO." 219 }, 220 "financial_interests_declared": { 221 "applies": true, 222 "answer": false, 223 "justification": "No competing interests or financial interests statement is present. Maxar Technologies is mentioned favorably in Section 7 (SpaceNet, ESG reports) by an author affiliated with Maxar." 224 } 225 }, 226 "contamination": { 227 "training_cutoff_stated": { 228 "applies": false, 229 "answer": false, 230 "justification": "Survey paper — no pre-trained model evaluated on any benchmark." 231 }, 232 "train_test_overlap_discussed": { 233 "applies": false, 234 "answer": false, 235 "justification": "Survey paper — no benchmark evaluation." 236 }, 237 "benchmark_contamination_addressed": { 238 "applies": false, 239 "answer": false, 240 "justification": "Survey paper — no benchmark evaluation." 241 } 242 }, 243 "human_studies": { 244 "pre_registered": { 245 "applies": false, 246 "answer": false, 247 "justification": "No human participants." 248 }, 249 "irb_or_ethics_approval": { 250 "applies": false, 251 "answer": false, 252 "justification": "No human participants." 253 }, 254 "demographics_reported": { 255 "applies": false, 256 "answer": false, 257 "justification": "No human participants." 258 }, 259 "inclusion_exclusion_criteria": { 260 "applies": false, 261 "answer": false, 262 "justification": "No human participants." 263 }, 264 "randomization_described": { 265 "applies": false, 266 "answer": false, 267 "justification": "No human participants." 268 }, 269 "blinding_described": { 270 "applies": false, 271 "answer": false, 272 "justification": "No human participants." 273 }, 274 "attrition_reported": { 275 "applies": false, 276 "answer": false, 277 "justification": "No human participants." 278 } 279 }, 280 "cost_and_practicality": { 281 "inference_cost_reported": { 282 "applies": false, 283 "answer": false, 284 "justification": "Survey paper — no method with inference costs." 285 }, 286 "compute_budget_stated": { 287 "applies": false, 288 "answer": false, 289 "justification": "Survey paper — no computational experiments." 290 } 291 }, 292 "survey_methodology": { 293 "prisma_or_structured_protocol": { 294 "applies": true, 295 "answer": false, 296 "justification": "No structured review protocol is followed. No PRISMA diagram, no registered protocol, no systematic search strategy with reproducible queries. The paper is a narrative review with ad-hoc paper selection." 297 }, 298 "quality_assessment_of_sources": { 299 "applies": true, 300 "answer": false, 301 "justification": "The survey does not assess the methodological quality of the papers it cites. All sources are treated equally regardless of their rigor." 302 }, 303 "publication_bias_discussed": { 304 "applies": true, 305 "answer": false, 306 "justification": "No discussion of publication bias in the reviewed literature. The survey does not consider whether its sources skew toward positive results about AI4EO." 307 } 308 } 309 }, 310 "claims": [ 311 { 312 "claim": "AI4EO publications in IEEE TGRS have surged dramatically since 2020, growing from ~500 in 2019 to ~2500 in 2023.", 313 "evidence": "Fig. 1 shows publication counts from Google Scholar advanced search using keywords 'machine learning' or 'deep learning' and 'remote sensing' in IEEE TGRS from 2014-2023.", 314 "supported": "moderate" 315 }, 316 { 317 "claim": "Spatial autocorrelation between training and testing samples causes overestimation of model accuracy in geospatial applications.", 318 "evidence": "Cites Karasiak et al. (2022) [28] who demonstrated this effect. Section 2.3.2.", 319 "supported": "strong" 320 }, 321 { 322 "claim": "Graph-based ensemble neural network approaches can deliver robust hindcasting and forecasting of mass movement impacts at local, regional, and national scales.", 323 "evidence": "Section 6.1 cites Dimasaka et al. (2023) [142] showing results over 68,000 incidents since 1957 across Norwegian territory.", 324 "supported": "weak" 325 }, 326 { 327 "claim": "The field has transitioned from singular focus on model-centric or data-centric approaches to a balanced data-model-centric paradigm.", 328 "evidence": "Fig. 2 and Section 1 present this as the authors' opinion ('we believe'), supported by the rise of foundation models. No systematic evidence is provided.", 329 "supported": "weak" 330 } 331 ], 332 "red_flags": [ 333 { 334 "flag": "No systematic review methodology", 335 "detail": "The paper claims to be a 'pioneering and thorough review' but follows no structured review protocol (PRISMA, etc.). Paper selection appears ad-hoc with no documented search strategy, inclusion/exclusion criteria, or screening process." 336 }, 337 { 338 "flag": "Undisclosed conflict of interest", 339 "detail": "Author Fabio Pacifici is affiliated with Maxar Technologies. Section 7 mentions Maxar favorably multiple times (SpaceNet co-founder, ESG reports). No competing interests statement addresses this." 340 }, 341 { 342 "flag": "No quality assessment of reviewed sources", 343 "detail": "The survey does not assess the methodological quality of cited works. All sources are treated as equally reliable, potentially laundering weak results alongside strong ones." 344 }, 345 { 346 "flag": "Claims outrun evidence", 347 "detail": "The paper calls itself 'a pioneering effort to systematically define the intersection of AI and EO' but it is a narrative review, not a systematic one. The word 'systematically' is not justified by the methodology." 348 } 349 ], 350 "cited_papers": [ 351 { 352 "title": "Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification", 353 "authors": ["Joy Buolamwini", "Timnit Gebru"], 354 "year": 2018, 355 "relevance": "Foundational work on AI bias in facial recognition, relevant to AI fairness and responsible AI evaluation." 356 }, 357 { 358 "title": "A framework for understanding sources of harm throughout the machine learning life cycle", 359 "authors": ["Harini Suresh", "John Guttag"], 360 "year": 2021, 361 "relevance": "Framework for understanding ML bias types (historical, representation, measurement, etc.) relevant to AI methodology quality." 362 }, 363 { 364 "title": "Are Emergent Abilities of Large Language Models a Mirage?", 365 "authors": ["Rylan Schaeffer", "Brando Miranda", "Sanmi Koyejo"], 366 "year": 2023, 367 "arxiv_id": "2304.15004", 368 "relevance": "Questions whether LLM emergent abilities are artifacts of evaluation metrics — directly relevant to AI evaluation methodology." 369 }, 370 { 371 "title": "On the Opportunities and Risks of Foundation Models", 372 "authors": ["Rishi Bommasani"], 373 "year": 2021, 374 "relevance": "Comprehensive analysis of foundation model risks and opportunities, relevant to AI safety and responsible deployment." 375 }, 376 { 377 "title": "Universal adversarial examples in remote sensing: Methodology and benchmark", 378 "authors": ["Yonghao Xu", "Pedram Ghamisi"], 379 "year": 2022, 380 "relevance": "Benchmark for adversarial robustness in remote sensing AI, relevant to AI security evaluation methodology." 381 }, 382 { 383 "title": "Tackling climate change with machine learning", 384 "authors": ["David Rolnick"], 385 "year": 2022, 386 "relevance": "Survey of ML applications for climate change, relevant to AI for social good evaluation." 387 }, 388 { 389 "title": "Large Language Models are Geographically Biased", 390 "authors": ["Rohin Manvi", "Samar Khanna", "Marshall Burke", "David Lobell", "Stefano Ermon"], 391 "year": 2024, 392 "relevance": "Documents geographic bias in LLMs, directly relevant to AI bias and fairness research methodology." 393 }, 394 { 395 "title": "Deep learning in remote sensing: A comprehensive review and list of resources", 396 "authors": ["Xiao Xiang Zhu"], 397 "year": 2017, 398 "relevance": "Major survey of deep learning in remote sensing, relevant as a methodological comparison for AI survey quality." 399 } 400 ] 401 }