scan-v5.json - ai-research-survey - Systematic scan of agentic development research. What's signal, what's noise.

scan-v5.json (26040B)
      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "Defense of Massive False Data Injection Attack via Sparse Attack Points Considering Uncertain Topological Changes",
      6     "authors": [
      7       "Xiaoge Huang",
      8       "Zhijun Qin",
      9       "Ming Xie",
     10       "Hui Liu",
     11       "Liang Meng"
     12     ],
     13     "year": 2022,
     14     "venue": "Journal of Modern Power Systems and Clean Energy",
     15     "arxiv_id": null,
     16     "doi": "10.35833/mpce.2020.000686"
     17   },
     18   "checklist": {
     19     "claims_and_evidence": {
     20       "abstract_claims_supported": {
     21         "applies": true,
     22         "answer": true,
     23         "justification": "The abstract claims 95% detection accuracy and 80% localization accuracy; Table V confirms 96.7–98.5% detection accuracy and Table IX shows 80.37–85.69% localization correct rate across all test systems.",
     24         "source": "haiku"
     25       },
     26       "causal_claims_justified": {
     27         "applies": true,
     28         "answer": true,
     29         "justification": "Comparative claims (AE-BCV outperforms SVM and ANN) are supported by training all three detectors on identical datasets and evaluating on identical held-out test sets, which is adequate for comparative inference.",
     30         "source": "haiku"
     31       },
     32       "generalization_bounded": {
     33         "applies": true,
     34         "answer": false,
     35         "justification": "The conclusion asserts the AE-BCV detector 'can be directly applied with AC power flow model,' but all experiments use only the DC power flow model; this generalization goes beyond the tested setting.",
     36         "source": "haiku"
     37       },
     38       "alternative_explanations_discussed": {
     39         "applies": true,
     40         "answer": false,
     41         "justification": "The paper does not consider alternative explanations for AE-BCV outperforming SVM/ANN, such as hyperparameter sensitivity of the baselines or the effect of architecture depth differences.",
     42         "source": "haiku"
     43       },
     44       "proxy_outcome_distinction": {
     45         "applies": true,
     46         "answer": true,
     47         "justification": "The paper clearly distinguishes detection accuracy, localization correct rate, and recovery mean error as separate metrics tied to three distinct claimed contributions, without conflating them.",
     48         "source": "haiku"
     49       }
     50     },
     51     "limitations_and_scope": {
     52       "limitations_section_present": {
     53         "applies": true,
     54         "answer": false,
     55         "justification": "There is no dedicated limitations or threats-to-validity section; the conclusion mentions future work directions (AC model, dynamic SE) but does not frame these as limitations of the current results.",
     56         "source": "haiku"
     57       },
     58       "threats_to_validity_specific": {
     59         "applies": true,
     60         "answer": false,
     61         "justification": "No specific threats to validity are discussed; the complete information assumption and DC-only model are stated as design choices rather than as validity threats affecting result interpretation.",
     62         "source": "haiku"
     63       },
     64       "scope_boundaries_stated": {
     65         "applies": true,
     66         "answer": false,
     67         "justification": "While assumptions (DC model, complete topology information, single-snapshot SE) are mentioned, the paper does not explicitly state what the results do NOT show or demarcate clear scope boundaries in a threats-to-validity sense.",
     68         "source": "haiku"
     69       }
     70     },
     71     "conflicts_of_interest": {
     72       "funding_disclosed": {
     73         "applies": true,
     74         "answer": true,
     75         "justification": "Funding is disclosed: 'This work was supported in part by the National Natural Science Foundation of China (No. 51767001).'",
     76         "source": "haiku"
     77       },
     78       "affiliations_disclosed": {
     79         "applies": true,
     80         "answer": true,
     81         "justification": "All author affiliations are disclosed: Guangxi University (academic) and Guangxi Power Grid Co. Ltd., China Southern Grid (industry co-authors).",
     82         "source": "haiku"
     83       },
     84       "funder_independent_of_outcome": {
     85         "applies": true,
     86         "answer": true,
     87         "justification": "The National Natural Science Foundation of China is a government funding agency with no commercial interest in the outcome of FDIA defense methodology research.",
     88         "source": "haiku"
     89       },
     90       "financial_interests_declared": {
     91         "applies": true,
     92         "answer": false,
     93         "justification": "No competing interests or financial interests statement (patents, equity, consulting) is provided anywhere in the paper.",
     94         "source": "haiku"
     95       }
     96     },
     97     "scope_and_framing": {
     98       "key_terms_defined": {
     99         "applies": true,
    100         "answer": true,
    101         "justification": "Key terms are precisely defined: FDIA, SE, BDD, DC power flow model (Eq. 1–3), state variables, attack intensity parameter k, and both attack models are formally specified with mathematical notation.",
    102         "source": "haiku"
    103       },
    104       "intended_contribution_clear": {
    105         "applies": true,
    106         "answer": true,
    107         "justification": "Four explicit numbered contributions are stated in the introduction: enhanced attack model, AE-BCV detector, AE-GAN generation, and pattern match recovery algorithm.",
    108         "source": "haiku"
    109       },
    110       "engagement_with_prior_work": {
    111         "applies": true,
    112         "answer": true,
    113         "justification": "Section I extensively compares against prior work [6]–[28], explicitly differentiating the proposed approach from [21], [26], [28] and explaining why prior methods fail to handle multi-modal measurement distributions.",
    114         "source": "haiku"
    115       }
    116     }
    117   },
    118   "type_checklist": {
    119     "empirical": {
    120       "artifacts": {
    121         "code_released": {
    122           "applies": true,
    123           "answer": false,
    124           "justification": "No source code is released or mentioned as available; only the hardware setup and PyTorch framework are noted.",
    125           "source": "haiku"
    126         },
    127         "data_released": {
    128           "applies": true,
    129           "answer": false,
    130           "justification": "Datasets are generated via MATPOWER simulations with FDIA overlays using specific configurations; they are not released or made publicly available.",
    131           "source": "haiku"
    132         },
    133         "environment_specified": {
    134           "applies": true,
    135           "answer": false,
    136           "justification": "Hardware (Intel i7-8750H, RTX 2070) and PyTorch are mentioned but no version numbers or reproducible environment files (requirements.txt, Dockerfile) are provided.",
    137           "source": "haiku"
    138         },
    139         "reproduction_instructions": {
    140           "applies": true,
    141           "answer": false,
    142           "justification": "Appendix A provides neural network architecture parameters but no step-by-step instructions exist to reproduce experiments from scratch without guessing implementation details.",
    143           "source": "haiku"
    144         }
    145       },
    146       "statistical_methodology": {
    147         "confidence_intervals_or_error_bars": {
    148           "applies": true,
    149           "answer": false,
    150           "justification": "No confidence intervals or error bars are reported for any accuracy metrics; all results are single percentage values without uncertainty estimates.",
    151           "source": "haiku"
    152         },
    153         "significance_tests": {
    154           "applies": true,
    155           "answer": false,
    156           "justification": "No statistical significance tests are performed for comparative accuracy claims between AE-BCV, SVM, and ANN.",
    157           "source": "haiku"
    158         },
    159         "effect_sizes_reported": {
    160           "applies": true,
    161           "answer": true,
    162           "justification": "Accuracy differences are quantified with baselines (e.g., AE-BCV 95.2% vs SVM 80.0% for 118-bus WA); recovery errors are reported with before/after context (16.50 → 0.85 mean |a/z| for SA on 118-bus).",
    163           "source": "haiku"
    164         },
    165         "sample_size_justified": {
    166           "applies": true,
    167           "answer": false,
    168           "justification": "1100 simulations per attack level are used but not justified; the 80/10/10 split is stated without statistical power analysis.",
    169           "source": "haiku"
    170         },
    171         "variance_reported": {
    172           "applies": true,
    173           "answer": false,
    174           "justification": "No variance, standard deviation, or spread is reported for any accuracy result; all metrics are single-point estimates.",
    175           "source": "haiku"
    176         }
    177       },
    178       "evaluation_design": {
    179         "baselines_included": {
    180           "applies": true,
    181           "answer": true,
    182           "justification": "ANN and SVM detectors are trained on identical datasets and compared against AE-BCV across all test systems and attack levels.",
    183           "source": "haiku"
    184         },
    185         "baselines_contemporary": {
    186           "applies": true,
    187           "answer": false,
    188           "justification": "SVM and plain ANN are weak baselines for a 2022 paper; contemporary deep learning alternatives (CNN, LSTM, attention-based detectors) are absent as direct comparisons, and comparison with [13] (2017) and [14] (2018) is acknowledged as 'rough.'",
    189           "source": "haiku"
    190         },
    191         "ablation_study": {
    192           "applies": true,
    193           "answer": false,
    194           "justification": "No ablation study isolates contributions of AE vs BCV in the detector or standard GAN vs AE-GAN in the generator, making it unclear which components drive performance.",
    195           "source": "haiku"
    196         },
    197         "multiple_metrics": {
    198           "applies": true,
    199           "answer": true,
    200           "justification": "Multiple metrics are used: accuracy, false positive rate, and false negative rate for detection; correct rate, positive/negative false rates for localization; mean recovery error before and after for recovery.",
    201           "source": "haiku"
    202         },
    203         "human_evaluation": {
    204           "applies": false,
    205           "answer": false,
    206           "justification": "Human evaluation is clearly irrelevant for automated power system FDIA detection using simulated data.",
    207           "source": "haiku"
    208         },
    209         "held_out_test_set": {
    210           "applies": true,
    211           "answer": true,
    212           "justification": "An explicit 10% held-out test set is used, with a deliberately higher topology change rate (8% line outages) than training (5%) to test generalization to unseen conditions.",
    213           "source": "haiku"
    214         },
    215         "per_category_breakdown": {
    216           "applies": true,
    217           "answer": true,
    218           "justification": "Results are broken down by attack intensity (SA/MA/WA), attack type (targeted/untargeted), and power system (57-bus, 118-bus, 415-bus) across Tables V–X.",
    219           "source": "haiku"
    220         },
    221         "failure_cases_discussed": {
    222           "applies": true,
    223           "answer": false,
    224           "justification": "Performance variation by attack intensity is quantified but not discussed as failure cases; no dedicated analysis of misclassification patterns or conditions where the methodology breaks down is provided.",
    225           "source": "haiku"
    226         },
    227         "negative_results_reported": {
    228           "applies": true,
    229           "answer": false,
    230           "justification": "All results are framed positively; performance degradation for weak attacks is reported in tables but not interpreted as a negative finding or limitation.",
    231           "source": "haiku"
    232         }
    233       },
    234       "setup_transparency": {
    235         "model_versions_specified": {
    236           "applies": true,
    237           "answer": false,
    238           "justification": "PyTorch is mentioned as the implementation framework but no version number is given; MATPOWER and CVX versions are also unspecified.",
    239           "source": "haiku"
    240         },
    241         "prompts_provided": {
    242           "applies": false,
    243           "answer": false,
    244           "justification": "This is not an LLM/prompt-based paper; no prompts or system instructions are relevant.",
    245           "source": "haiku"
    246         },
    247         "hyperparameters_reported": {
    248           "applies": true,
    249           "answer": true,
    250           "justification": "Appendix A (Tables AI and AII) provides detailed neural network parameters including number of hidden layers, neuron counts, and learning rates for all models.",
    251           "source": "haiku"
    252         },
    253         "scaffolding_described": {
    254           "applies": false,
    255           "answer": false,
    256           "justification": "This paper does not involve agentic AI scaffolding; deep learning models are used for classification and generation tasks.",
    257           "source": "haiku"
    258         },
    259         "data_preprocessing_documented": {
    260           "applies": true,
    261           "answer": true,
    262           "justification": "Section VI.B documents Monte Carlo line switching (5% train / 8% test), power injection variation (50–150% ± 1% noise), per-unit representation without normalization, and separate dataset configurations for AE vs AE-GAN.",
    263           "source": "haiku"
    264         }
    265       },
    266       "data_integrity": {
    267         "raw_data_available": {
    268           "applies": true,
    269           "answer": false,
    270           "justification": "Generated datasets (FDIA samples from MATPOWER simulations with CVX-optimized attack vectors) are not publicly released for independent verification.",
    271           "source": "haiku"
    272         },
    273         "data_collection_described": {
    274           "applies": true,
    275           "answer": true,
    276           "justification": "Section VI.B describes the data generation procedure including normal case diversification (Monte Carlo simulations, line switching, injection variation) and FDIA case generation using the proposed optimization models.",
    277           "source": "haiku"
    278         },
    279         "recruitment_methods_described": {
    280           "applies": false,
    281           "answer": false,
    282           "justification": "No human participants; data is entirely simulated from power system models.",
    283           "source": "haiku"
    284         },
    285         "data_pipeline_documented": {
    286           "applies": true,
    287           "answer": true,
    288           "justification": "The pipeline from MATPOWER base cases → Monte Carlo diversification → FDIA overlay (CVX optimization) → 80/10/10 train/val/test split is described with sufficient detail to understand the process.",
    289           "source": "haiku"
    290         }
    291       },
    292       "contamination": {
    293         "training_cutoff_stated": {
    294           "applies": false,
    295           "answer": false,
    296           "justification": "Not applicable; this paper trains deep learning models on synthetically generated power system data, not on pre-trained LLM benchmarks.",
    297           "source": "haiku"
    298         },
    299         "train_test_overlap_discussed": {
    300           "applies": false,
    301           "answer": false,
    302           "justification": "Not applicable; data is synthetically generated with controlled topology-based train/test splits.",
    303           "source": "haiku"
    304         },
    305         "benchmark_contamination_addressed": {
    306           "applies": false,
    307           "answer": false,
    308           "justification": "Not applicable; IEEE bus systems are simulation substrates, not benchmark datasets for evaluating pre-trained model knowledge.",
    309           "source": "haiku"
    310         }
    311       },
    312       "human_studies": {
    313         "pre_registered": {
    314           "applies": false,
    315           "answer": false,
    316           "justification": "No human participants in this study.",
    317           "source": "haiku"
    318         },
    319         "irb_or_ethics_approval": {
    320           "applies": false,
    321           "answer": false,
    322           "justification": "No human participants in this study.",
    323           "source": "haiku"
    324         },
    325         "demographics_reported": {
    326           "applies": false,
    327           "answer": false,
    328           "justification": "No human participants in this study.",
    329           "source": "haiku"
    330         },
    331         "inclusion_exclusion_criteria": {
    332           "applies": false,
    333           "answer": false,
    334           "justification": "No human participants in this study.",
    335           "source": "haiku"
    336         },
    337         "randomization_described": {
    338           "applies": false,
    339           "answer": false,
    340           "justification": "No human participants in this study.",
    341           "source": "haiku"
    342         },
    343         "blinding_described": {
    344           "applies": false,
    345           "answer": false,
    346           "justification": "No human participants in this study.",
    347           "source": "haiku"
    348         },
    349         "attrition_reported": {
    350           "applies": false,
    351           "answer": false,
    352           "justification": "No human participants in this study.",
    353           "source": "haiku"
    354         }
    355       },
    356       "cost_and_practicality": {
    357         "inference_cost_reported": {
    358           "applies": true,
    359           "answer": true,
    360           "justification": "Table XI reports online classification time (0.011–0.013 seconds) and localization/recovery time (14.69–25.47 seconds) for IEEE 118-bus and CSG 415-bus systems.",
    361           "source": "haiku"
    362         },
    363         "compute_budget_stated": {
    364           "applies": true,
    365           "answer": true,
    366           "justification": "Hardware is specified (Intel i7-8750H CPU, RTX 2070 GPU, 16 GB RAM) and offline training times are reported (441–594s for AE-BCV detection, 324–406s for AE-GAN).",
    367           "source": "haiku"
    368         }
    369       }
    370     }
    371   },
    372   "claims": [
    373     {
    374       "claim": "AE-BCV achieves over 95% FDIA detection accuracy including under unseen topological changes",
    375       "evidence": "Table V shows 96.7–98.5% accuracy on IEEE 57-bus, 118-bus, and 415-bus; Tables VII–VIII confirm 90.8–99.2% for unseen moderate and weak attacks",
    376       "supported": "strong"
    377     },
    378     {
    379       "claim": "Proposed attack models affect far more state variables with fewer compromised meters than the conventional model",
    380       "evidence": "Table IV: conventional model affects 10 states with 60–140 compromised meters on 118-bus; proposed untargeted model affects 117 states with only 33–34 compromised meters",
    381       "supported": "strong"
    382     },
    383     {
    384       "claim": "AE-GAN avoids model collapse for multi-modal power system measurement distributions",
    385       "evidence": "Figure 5 shows discriminator and generator training losses converging to Nash-equilibrium after ~200 steps; theoretical argument provided that single-modal encoder intermediate prevents GAN collapse",
    386       "supported": "moderate"
    387     },
    388     {
    389       "claim": "FDIA localization achieves 80–86% correct rate across attack intensities and test systems",
    390       "evidence": "Table IX shows correct rates of 80.37–85.69% for IEEE 118-bus and CSG 415-bus across SA, MA, and WA intensity levels",
    391       "supported": "strong"
    392     },
    393     {
    394       "claim": "Recovery reduces mean measurement error by approximately 95% across attack intensities",
    395       "evidence": "Table X: error drops from 16.50 to 0.85 (SA) and 3.15 to 0.46 (WA) on IEEE 118-bus; similar reductions on CSG 415-bus",
    396       "supported": "strong"
    397     },
    398     {
    399       "claim": "AE-BCV advantage over SVM/ANN grows substantially at lower attack intensities",
    400       "evidence": "Table VIII: AE-BCV achieves 90.8–95.2% for weak attacks vs SVM 50.8–80.0% and ANN 60.4–78.8%",
    401       "supported": "strong"
    402     }
    403   ],
    404   "methodology_tags": [
    405     "benchmark-eval",
    406     "case-study"
    407   ],
    408   "key_findings": "The paper proposes a three-stage deep learning defense against false data injection attacks in power grids: an AE-BCV detector achieving >95% detection accuracy that generalizes to unseen network topologies; an AE-GAN that generates diverse normal measurement distributions without model collapse; and a pattern match algorithm achieving 80–86% localization accuracy with ~95% recovery of falsified measurements. A secondary contribution demonstrates that the proposed enhanced attack model can affect 10× more state variables using fewer compromised meters than prior methods, motivating the need for more sophisticated defense.",
    409   "red_flags": [
    410     {
    411       "flag": "Simulated data only",
    412       "detail": "All experiments use synthetically generated data from MATPOWER simulations; no validation on real power grid operational data or real FDIA incident data is performed, making real-world generalization unverified."
    413     },
    414     {
    415       "flag": "Complete information assumption",
    416       "detail": "Both attacker and defender are assumed to have complete knowledge of the power grid topology, a strong and often unrealistic assumption; results may not transfer to partial-information scenarios, which are not discussed as a threat."
    417     },
    418     {
    419       "flag": "No statistical significance testing",
    420       "detail": "Accuracy differences between AE-BCV, SVM, and ANN are reported as single percentages without confidence intervals or significance tests, making it unclear whether observed differences are statistically meaningful."
    421     },
    422     {
    423       "flag": "Weak baselines for 2022",
    424       "detail": "SVM and plain ANN are outdated baselines for a 2022 deep learning paper; contemporary alternatives such as CNN, LSTM, or attention-based FDIA detectors are not included as direct comparisons."
    425     },
    426     {
    427       "flag": "No reproducibility artifacts",
    428       "detail": "No source code, datasets, or step-by-step reproduction instructions are released; independent replication is not feasible despite the neural network architecture tables in Appendix A."
    429     },
    430     {
    431       "flag": "DC model only with unsupported AC claim",
    432       "detail": "All results use the DC power flow model, yet the conclusion claims the methodology 'can be directly applied with AC power flow model' without any empirical support for this assertion."
    433     },
    434     {
    435       "flag": "No ablation study",
    436       "detail": "No ablation study isolates the contributions of AE vs BCV in the detector, or the AE component vs standard GAN in the generator, leaving unclear which components are essential for reported performance."
    437     }
    438   ],
    439   "cited_papers": [
    440     {
    441       "title": "False data injection attacks against state estimation in electric power grids (Liu et al., 2011)",
    442       "relevance": "Foundational paper proposing the original FDIA concept and showing attacks can bypass bad data detection; the proposed attack models in this paper extend and compare against this work."
    443     },
    444     {
    445       "title": "A survey on the detection algorithms for false data injection attacks in smart grids (Musleh et al., 2020)",
    446       "relevance": "Comprehensive survey providing context for state-of-the-art FDIA detection methods and situating the AE-BCV contribution."
    447     },
    448     {
    449       "title": "Real-time detection of false data injection attacks in smart grid: a deep learning-based intelligent mechanism (He et al., 2017)",
    450       "relevance": "Prior deep learning FDIA detector achieving 92% on IEEE 118-bus; used as a reference performance benchmark for comparison."
    451     },
    452     {
    453       "title": "Online false data injection attack detection with wavelet transform and deep neural networks (Yu et al., 2018)",
    454       "relevance": "Deep learning FDIA detector achieving up to 98% on IEEE 118-bus; used as reference performance for comparison with the proposed detector."
    455     },
    456     {
    457       "title": "Online generative adversary network based measurement recovery in false data injection attacks (Li et al., 2020)",
    458       "relevance": "Prior GAN-based measurement recovery approach that the proposed AE-GAN improves upon by avoiding model collapse with multi-modal distributions."
    459     },
    460     {
    461       "title": "Generative adversarial nets (Goodfellow et al., 2014)",
    462       "relevance": "Foundational GAN paper; the AE-GAN methodology and training objective in this paper are built directly on this framework."
    463     },
    464     {
    465       "title": "Identification of false data injection attacks with considering the impact of wind generation and topology reconfigurations (Mohammadpourfard et al., 2018)",
    466       "relevance": "Prior FDIA localization work that the proposed method explicitly differentiates from by addressing multi-modal distributions via AE-GAN rather than predefined candidate sets."
    467     },
    468     {
    469       "title": "False data injection on state estimation in power systems — attacks, impacts, and defense: a survey (Deng et al., 2017)",
    470       "relevance": "Survey of FDIA attacks, impacts, and defenses providing context for the attack model formulation and the baseline convex optimization model."
    471     }
    472   ],
    473   "engagement_factors": {
    474     "practical_relevance": {
    475       "score": 2,
    476       "justification": "Power grid security is a high-stakes applied domain with real incidents (Ukraine 2015 blackout), but the DC-only model, complete information assumption, and absence of real-world validation limit immediate deployment."
    477     },
    478     "surprise_contrarian": {
    479       "score": 1,
    480       "justification": "The multi-modal distribution insight is a genuine contribution but not counterintuitive; using AE-GAN to solve it is a predictable application of generative models to the problem."
    481     },
    482     "fear_safety": {
    483       "score": 2,
    484       "justification": "References the 2015 Ukraine power grid attack affecting 80,000+ users as direct motivation; power grid security failures carry direct physical safety consequences."
    485     },
    486     "drama_conflict": {
    487       "score": 1,
    488       "justification": "The Ukraine blackout example adds urgency but the paper is straightforwardly technical without controversial claims or adversarial framing beyond standard attacker-defender setup."
    489     },
    490     "demo_ability": {
    491       "score": 0,
    492       "justification": "No code released, no public demo, and results require specialized power system simulation tools (MATPOWER, CVX, PyTorch) to replicate without provided artifacts."
    493     },
    494     "brand_recognition": {
    495       "score": 0,
    496       "justification": "Guangxi University and Guangxi Power Grid Co. Ltd. are not internationally recognized brand names in AI/ML or cybersecurity research."
    497     }
    498   },
    499   "hn_data": {
    500     "threads": [],
    501     "top_points": 0,
    502     "total_points": 0,
    503     "total_comments": 0
    504   }
    505 }
	ai-research-survey Systematic scan of agentic development research. What's signal, what's noise.
	git clone https://git.shiptheloop.com/ai-research-survey.git
	Log \| Files \| Refs