ai-research-survey

Systematic scan of agentic development research. What's signal, what's noise.
git clone https://git.shiptheloop.com/ai-research-survey.git
Log | Files | Refs

scan-v5.json (25048B)


      1 {
      2   "scan_version": 5,
      3   "paper_type": "empirical",
      4   "paper": {
      5     "title": "GSPR: Aligning LLM Safeguards as Generalizable Safety Policy Reasoners",
      6     "authors": [
      7       "Haoran Li",
      8       "Yulin Chen",
      9       "Jingru Zeng",
     10       "Hao Peng",
     11       "Huihao Jing",
     12       "Wenbin Hu",
     13       "Xi Yang",
     14       "Ziqian Zeng",
     15       "Sirui Han",
     16       "Yangqiu Song"
     17     ],
     18     "year": 2025,
     19     "venue": "arXiv.org",
     20     "arxiv_id": "2509.24418",
     21     "doi": "10.48550/arXiv.2509.24418"
     22   },
     23   "checklist": {
     24     "claims_and_evidence": {
     25       "abstract_claims_supported": {
     26         "applies": true,
     27         "answer": true,
     28         "justification": "Claims of improved accuracy and least inference token cost are backed by Tables 2–4: GSPR w/ Cold-start leads all baselines on S-Acc/C-Acc and generates only 34.10 average words vs 172+ for other explanation-providing models.",
     29         "source": "haiku"
     30       },
     31       "causal_claims_justified": {
     32         "applies": true,
     33         "answer": true,
     34         "justification": "Section 4.3 ablates cold-start SFT and category reward via controlled variants (GSPR safety-only, w/o Cold-start, w/ Cold-start), providing adequate basis for causal claims about each component's contribution.",
     35         "source": "haiku"
     36       },
     37       "generalization_bounded": {
     38         "applies": true,
     39         "answer": false,
     40         "justification": "The abstract claims GSPR 'naturally exhibits powerful generalization ability' broadly, but out-of-domain testing covers only 4 specific curated datasets; the paper makes no explicit scope statements about where generalization may not hold.",
     41         "source": "haiku"
     42       },
     43       "alternative_explanations_discussed": {
     44         "applies": true,
     45         "answer": false,
     46         "justification": "The paper does not discuss whether performance gains stem from training data policy scale (167 policies vs RSafe's 18) rather than the flexible taxonomy design; this key confound is never analyzed.",
     47         "source": "haiku"
     48       },
     49       "proxy_outcome_distinction": {
     50         "applies": true,
     51         "answer": true,
     52         "justification": "Claims are about safety prediction accuracy and category classification; S-Acc, S-F1, and C-Acc directly measure exactly those outcomes with no proxy mismatch.",
     53         "source": "haiku"
     54       }
     55     },
     56     "limitations_and_scope": {
     57       "limitations_section_present": {
     58         "applies": true,
     59         "answer": false,
     60         "justification": "There is no dedicated limitations section; Section 5 (Conclusion) only mentions adding more safety benchmarks as future work without identifying limitations of the current approach.",
     61         "source": "haiku"
     62       },
     63       "threats_to_validity_specific": {
     64         "applies": true,
     65         "answer": false,
     66         "justification": "No threats-to-validity are discussed anywhere; issues such as base model contamination, benchmark label quality, or class imbalance effects on evaluation go unacknowledged.",
     67         "source": "haiku"
     68       },
     69       "scope_boundaries_stated": {
     70         "applies": true,
     71         "answer": false,
     72         "justification": "The paper makes no explicit statements about what its results do not show or contexts where GSPR would not be expected to generalize.",
     73         "source": "haiku"
     74       }
     75     },
     76     "conflicts_of_interest": {
     77       "funding_disclosed": {
     78         "applies": true,
     79         "answer": false,
     80         "justification": "No acknowledgment section or funding disclosure appears anywhere in the paper.",
     81         "source": "haiku"
     82       },
     83       "affiliations_disclosed": {
     84         "applies": true,
     85         "answer": true,
     86         "justification": "Author affiliations (HKUST, NUS, South China University of Technology, Beihang University) are disclosed on the first page.",
     87         "source": "haiku"
     88       },
     89       "funder_independent_of_outcome": {
     90         "applies": false,
     91         "answer": false,
     92         "justification": "No funding is disclosed, making this criterion not applicable.",
     93         "source": "haiku"
     94       },
     95       "financial_interests_declared": {
     96         "applies": true,
     97         "answer": false,
     98         "justification": "No competing interests or financial interests statement appears in the paper.",
     99         "source": "haiku"
    100       }
    101     },
    102     "scope_and_framing": {
    103       "key_terms_defined": {
    104         "applies": true,
    105         "answer": true,
    106         "justification": "Core terms are formally defined: guardrail model G, safety taxonomy S, safety indicator yi, fine-grained category ci, and task formulation are given in Equation 1 of Section 2.1.",
    107         "source": "haiku"
    108       },
    109       "intended_contribution_clear": {
    110         "applies": true,
    111         "answer": true,
    112         "justification": "Three numbered contributions are explicitly enumerated at the end of the introduction: flexibility/generalization, fine-grained safety evaluation with explainability, and superior content moderation performance.",
    113         "source": "haiku"
    114       },
    115       "engagement_with_prior_work": {
    116         "applies": true,
    117         "answer": true,
    118         "justification": "Table 1 systematically compares GSPR against prior guardrails; Appendix A reviews safety threats and defenses; the paper explicitly contrasts GSPR's flexible taxonomy against fixed-taxonomy approaches in LlamaGuard, ShieldGemma, RSafe, and GuardReasoner.",
    119         "source": "haiku"
    120       }
    121     }
    122   },
    123   "type_checklist": {
    124     "empirical": {
    125       "artifacts": {
    126         "code_released": {
    127           "applies": true,
    128           "answer": false,
    129           "justification": "The paper states 'Our reproducible data, code, and model weights will be open-sourced' — this is a promise of future release, not an actual release at submission time.",
    130           "source": "haiku"
    131         },
    132         "data_released": {
    133           "applies": true,
    134           "answer": true,
    135           "justification": "All evaluation uses standard public benchmarks (WildGuard, Aegis, SafeRLHF, BeaverTails, OpenAI Moderation, HEx-PHI, T2T, Do-Not-Answer) that are publicly available; the 1,383 cold-start annotations are not released.",
    136           "source": "haiku"
    137         },
    138         "environment_specified": {
    139           "applies": true,
    140           "answer": false,
    141           "justification": "Hardware (8× NVIDIA H800) and software packages (VERL, vLLM) are named, but no requirements file, Dockerfile, or versioned dependency specification is provided.",
    142           "source": "haiku"
    143         },
    144         "reproduction_instructions": {
    145           "applies": true,
    146           "answer": false,
    147           "justification": "Hyperparameters are listed in Appendix C.2, but no runnable scripts exist and code is not available, making reproduction impossible without guessing implementation details.",
    148           "source": "haiku"
    149         }
    150       },
    151       "statistical_methodology": {
    152         "confidence_intervals_or_error_bars": {
    153           "applies": true,
    154           "answer": false,
    155           "justification": "Tables 2 and 3 report only point-estimate accuracy values; no confidence intervals or error bars appear anywhere in the paper.",
    156           "source": "haiku"
    157         },
    158         "significance_tests": {
    159           "applies": true,
    160           "answer": false,
    161           "justification": "No statistical significance tests are applied to any comparative results in Tables 2 and 3.",
    162           "source": "haiku"
    163         },
    164         "effect_sizes_reported": {
    165           "applies": true,
    166           "answer": true,
    167           "justification": "Percentage improvements are reported with baseline context (e.g., '>45% accuracy improvement in fine-grained category prediction' over RSafe's 30.17% baseline, visible in Table 2).",
    168           "source": "haiku"
    169         },
    170         "sample_size_justified": {
    171           "applies": true,
    172           "answer": false,
    173           "justification": "Test sets are used as provided by benchmarks (Table 6) without any sample size justification or discussion of statistical power.",
    174           "source": "haiku"
    175         },
    176         "variance_reported": {
    177           "applies": true,
    178           "answer": false,
    179           "justification": "Inference uses temperature=0.0 for a single run; no repeated experiments or variance across runs is reported anywhere.",
    180           "source": "haiku"
    181         }
    182       },
    183       "evaluation_design": {
    184         "baselines_included": {
    185           "applies": true,
    186           "answer": true,
    187           "justification": "Multiple baselines included: closed-source APIs (o3-mini, Gemini-2.5-Flash), open-source guardrails (ShieldGemma-9B, LlamaGuard3-8B, GuardReasoner-8B), general LLMs (Qwen2.5, Qwen3), and RL-aligned RSafe.",
    188           "source": "haiku"
    189         },
    190         "baselines_contemporary": {
    191           "applies": true,
    192           "answer": true,
    193           "justification": "Baselines include 2025 models: Gemini-2.5-Flash, o3-mini, Qwen3-8B, RSafe, and GuardReasoner — all contemporary with this submission.",
    194           "source": "haiku"
    195         },
    196         "ablation_study": {
    197           "applies": true,
    198           "answer": true,
    199           "justification": "Section 4.3 provides explicit ablations with 'GSPR (safety only)', 'GSPR w/o Cold-start', and 'GSPR w/ Cold-start' variants to isolate contributions of flexible prompt template, cold-start SFT, and category reward.",
    200           "source": "haiku"
    201         },
    202         "multiple_metrics": {
    203           "applies": true,
    204           "answer": true,
    205           "justification": "Evaluation uses S-Acc, S-F1, and C-Acc for moderation performance (Tables 2–3), plus Avg Word #, Mix %, and Repeat % for response quality analysis (Table 4).",
    206           "source": "haiku"
    207         },
    208         "human_evaluation": {
    209           "applies": false,
    210           "answer": false,
    211           "justification": "All evaluation uses automated benchmark labels; no human evaluation of GSPR's generated outputs is performed.",
    212           "source": "haiku"
    213         },
    214         "held_out_test_set": {
    215           "applies": true,
    216           "answer": true,
    217           "justification": "In-domain evaluation uses official held-out test splits (Table 6); out-of-domain evaluation uses entirely separate datasets not present during training.",
    218           "source": "haiku"
    219         },
    220         "per_category_breakdown": {
    221           "applies": true,
    222           "answer": true,
    223           "justification": "Results are broken down per dataset in Tables 2 and 3 (Wildguard, Aegis, SafeRLHF, BeaverTails for in-domain; 4 out-of-domain sets), though not per individual safety policy category.",
    224           "source": "haiku"
    225         },
    226         "failure_cases_discussed": {
    227           "applies": true,
    228           "answer": true,
    229           "justification": "Appendix D presents two case studies showing RSafe producing contradictory reasoning traces and Cold-start SFT making incorrect safety predictions, with qualitative analysis of why each fails.",
    230           "source": "haiku"
    231         },
    232         "negative_results_reported": {
    233           "applies": true,
    234           "answer": true,
    235           "justification": "GSPR w/o Cold-start shows dramatically worse category prediction (17.54% C-Acc on WildGuard); GSPR (safety only) on Qwen3 produces 31.63% language mixing — both reported without downplaying.",
    236           "source": "haiku"
    237         }
    238       },
    239       "setup_transparency": {
    240         "model_versions_specified": {
    241           "applies": true,
    242           "answer": true,
    243           "justification": "Exact model identifiers are provided: Qwen2.5-7B-Instruct, Qwen3-8B, Gemini-2.5-Flash, o3-mini, ShieldGemma-9B, LlamaGuard3-8B, GuardReasoner-8B.",
    244           "source": "haiku"
    245         },
    246         "prompts_provided": {
    247           "applies": true,
    248           "answer": true,
    249           "justification": "Full verbatim prompt templates for input prompt moderation, response moderation, and cold-start annotation are provided in Tables 7 and 8.",
    250           "source": "haiku"
    251         },
    252         "hyperparameters_reported": {
    253           "applies": true,
    254           "answer": true,
    255           "justification": "Appendix C.2 reports all key hyperparameters: lr=1e-7, batch_size=128, 1 epoch, rollouts=5, temperature=0.7, top_p=0.8, repetition_penalty=1.2, α1=0.55, α2=0.45.",
    256           "source": "haiku"
    257         },
    258         "scaffolding_described": {
    259           "applies": false,
    260           "answer": false,
    261           "justification": "GSPR is a guardrail training system, not an agentic scaffolded system; this criterion is not applicable.",
    262           "source": "haiku"
    263         },
    264         "data_preprocessing_documented": {
    265           "applies": true,
    266           "answer": true,
    267           "justification": "Section 3.1 and Appendix C.4 describe preprocessing steps: random sampling of 3,000 safe/unsafe per dataset, Gemini-2.5-Flash annotation with ground-truth labels shown, regex filtering yielding 1,383 cold-start samples.",
    268           "source": "haiku"
    269         }
    270       },
    271       "data_integrity": {
    272         "raw_data_available": {
    273           "applies": true,
    274           "answer": true,
    275           "justification": "All evaluation benchmark test sets (WildGuard, Aegis, SafeRLHF, BeaverTails, OpenAI Moderation, HEx-PHI, T2T, Do-Not-Answer) are publicly available; the cold-start annotations are not.",
    276           "source": "haiku"
    277         },
    278         "data_collection_described": {
    279           "applies": true,
    280           "answer": true,
    281           "justification": "Appendix B.1 and B.2 describe all training and testing datasets with full statistics in Tables 5 and 6, including split sizes, safe/unsafe counts, and policy counts.",
    282           "source": "haiku"
    283         },
    284         "recruitment_methods_described": {
    285           "applies": false,
    286           "answer": false,
    287           "justification": "Only standard public benchmarks are used; no participant recruitment is involved.",
    288           "source": "haiku"
    289         },
    290         "data_pipeline_documented": {
    291           "applies": true,
    292           "answer": true,
    293           "justification": "The full data pipeline from benchmark selection through cold-start annotation (Gemini-2.5-Flash with ground-truth labels, regex filtering, SFT) is described in Sections 3.1 and C.4.",
    294           "source": "haiku"
    295         }
    296       },
    297       "contamination": {
    298         "training_cutoff_stated": {
    299           "applies": true,
    300           "answer": false,
    301           "justification": "The training data cutoffs for base models Qwen2.5-7B-Instruct and Qwen3-8B are never stated or discussed.",
    302           "source": "haiku"
    303         },
    304         "train_test_overlap_discussed": {
    305           "applies": true,
    306           "answer": false,
    307           "justification": "No discussion of whether evaluation benchmark data (e.g., WildGuard test, Aegis test) may have been present in the pretraining corpora of the Qwen base models.",
    308           "source": "haiku"
    309         },
    310         "benchmark_contamination_addressed": {
    311           "applies": true,
    312           "answer": false,
    313           "justification": "The paper does not address whether safety benchmark examples were available before base model training cutoffs, which is especially relevant for benchmarks like BeaverTails (2023) evaluated on a 2025 model.",
    314           "source": "haiku"
    315         }
    316       },
    317       "human_studies": {
    318         "pre_registered": {
    319           "applies": false,
    320           "answer": false,
    321           "justification": "No human subjects study is conducted.",
    322           "source": "haiku"
    323         },
    324         "irb_or_ethics_approval": {
    325           "applies": false,
    326           "answer": false,
    327           "justification": "No human subjects study is conducted.",
    328           "source": "haiku"
    329         },
    330         "demographics_reported": {
    331           "applies": false,
    332           "answer": false,
    333           "justification": "No human participants.",
    334           "source": "haiku"
    335         },
    336         "inclusion_exclusion_criteria": {
    337           "applies": false,
    338           "answer": false,
    339           "justification": "No human participants.",
    340           "source": "haiku"
    341         },
    342         "randomization_described": {
    343           "applies": false,
    344           "answer": false,
    345           "justification": "No human participants.",
    346           "source": "haiku"
    347         },
    348         "blinding_described": {
    349           "applies": false,
    350           "answer": false,
    351           "justification": "No human participants.",
    352           "source": "haiku"
    353         },
    354         "attrition_reported": {
    355           "applies": false,
    356           "answer": false,
    357           "justification": "No human participants.",
    358           "source": "haiku"
    359         }
    360       },
    361       "cost_and_practicality": {
    362         "inference_cost_reported": {
    363           "applies": true,
    364           "answer": true,
    365           "justification": "Table 4 explicitly reports average word count per response as an inference cost proxy, and Section 4.4 is dedicated to efficiency analysis comparing GSPR against all baselines.",
    366           "source": "haiku"
    367         },
    368         "compute_budget_stated": {
    369           "applies": true,
    370           "answer": true,
    371           "justification": "Section 4.1 states all experiments use 8 NVIDIA H800 GPUs and take approximately 40 GPU-days total.",
    372           "source": "haiku"
    373         }
    374       }
    375     }
    376   },
    377   "claims": [
    378     {
    379       "claim": "GSPR achieves state-of-the-art safety prediction accuracy on in-domain benchmarks, surpassing closed-source APIs.",
    380       "evidence": "Table 2: GSPR w/ Cold-start (Qwen3) achieves 86.36% overall S-Acc vs 74.81% for o3-mini and 73.02% for Gemini-2.5-Flash.",
    381       "supported": "strong"
    382     },
    383     {
    384       "claim": "GSPR achieves more than 45% improvement in fine-grained category prediction accuracy over RSafe.",
    385       "evidence": "Table 2: GSPR w/ Cold-start (Qwen2.5) achieves 78.32% overall C-Acc vs RSafe's 30.17% — a 48 percentage point improvement.",
    386       "supported": "strong"
    387     },
    388     {
    389       "claim": "The cold-start strategy brings more than 20% C-Acc gains over direct RL alignment from the base model.",
    390       "evidence": "Table 2: GSPR w/ Cold-start (Qwen2.5) achieves 78.32% C-Acc vs GSPR w/o Cold-start's 54.06% — a 24.26pp gain on in-domain sets.",
    391       "supported": "strong"
    392     },
    393     {
    394       "claim": "GSPR generates the most efficient safety reasoning traces (fewest tokens) among all explanation-providing models.",
    395       "evidence": "Table 4: GSPR w/ Cold-start (Qwen2.5) averages 34.10 words vs 187.98 for RSafe, 211.04 for GuardReasoner, and 172.89 for o3-mini.",
    396       "supported": "strong"
    397     },
    398     {
    399       "claim": "GSPR's flexible prompt template alone substantially improves category prediction over RSafe without requiring category rewards.",
    400       "evidence": "Table 2: 'GSPR (safety only)' achieves 67.34% C-Acc vs RSafe's 30.17%, despite both using only safety rewards — attributed to the prompt template design.",
    401       "supported": "moderate"
    402     },
    403     {
    404       "claim": "GSPR demonstrates robust generalization to out-of-domain safety taxonomies with unseen policies.",
    405       "evidence": "Table 3: GSPR w/ Cold-start achieves 79.70% overall C-Acc on out-of-domain sets vs RSafe's 25.23%; 6% S-Acc and 25% C-Acc improvement over Qwen2.5 base model.",
    406       "supported": "moderate"
    407     }
    408   ],
    409   "methodology_tags": [
    410     "benchmark-eval"
    411   ],
    412   "key_findings": "GSPR is an RL-aligned (GRPO) safety guardrail that uses flexible safety taxonomy variables in prompt templates, enabling training across 19 taxonomies with 167 policies from six public benchmarks. It achieves state-of-the-art performance on both in-domain and out-of-domain content moderation benchmarks, with over 45 percentage points improvement in fine-grained category prediction over the closest RL-aligned baseline (RSafe). The cold-start SFT strategy — using Gemini-2.5-Flash to distill per-policy reasoning traces — is critical: it improves category accuracy by 20+ points and reduces language mixing to near zero across both Qwen2.5 and Qwen3 base models. Notably, GSPR generates the fewest tokens of any explanation-providing guardrail (34 avg words vs 172+ for competitors), suggesting the category reward encourages concise reasoning as a side effect.",
    413   "red_flags": [
    414     {
    415       "flag": "Code and weights not yet released",
    416       "detail": "Paper promises future open-sourcing of code, data, and model weights but nothing is available at submission time — reproducibility is blocked."
    417     },
    418     {
    419       "flag": "No variance or statistical testing",
    420       "detail": "All results are single-run point estimates (temperature=0.0, one run per model); no repeated experiments, confidence intervals, or significance tests are reported."
    421     },
    422     {
    423       "flag": "Training scale confound unaddressed",
    424       "detail": "GSPR trains on 167 policies vs RSafe's 18 — performance gains could partly reflect training data coverage, not just the flexible taxonomy mechanism; this confound is never analyzed."
    425     },
    426     {
    427       "flag": "No contamination analysis",
    428       "detail": "No discussion of whether safety benchmark test data (BeaverTails 2023, WildGuard 2024) was present in Qwen2.5 or Qwen3 pretraining, which could inflate base model comparisons."
    429     },
    430     {
    431       "flag": "No limitations section",
    432       "detail": "Zero discussion of failure modes, scope boundaries, or threats to validity; the conclusion only mentions adding more benchmarks as future work."
    433     },
    434     {
    435       "flag": "Cold-start annotations not released",
    436       "detail": "The 1,383 Gemini-2.5-Flash-distilled cold-start samples are a key training component but are not released, making the cold-start procedure non-reproducible."
    437     }
    438   ],
    439   "cited_papers": [
    440     {
    441       "title": "Llama Guard: LLM-based Input-Output Safeguard for Human-AI Conversations",
    442       "relevance": "Key baseline guardrail system with fixed 14-policy taxonomy, evaluated against GSPR"
    443     },
    444     {
    445       "title": "WildGuard: Open One-Stop Moderation Tools for Safety Risks, Jailbreaks, and Refusals of LLMs",
    446       "relevance": "Baseline guardrail and primary training/evaluation benchmark dataset"
    447     },
    448     {
    449       "title": "GuardReasoner: Towards Reasoning-based LLM Safeguards",
    450       "relevance": "Most similar prior work — reasoning-enabled guardrail trained with SFT+DPO; key baseline"
    451     },
    452     {
    453       "title": "RSafe: Incentivizing Proactive Reasoning to Build Robust and Adaptive LLM Safeguards",
    454       "relevance": "Primary RL-aligned safety guardrail baseline that GSPR directly extends and outperforms"
    455     },
    456     {
    457       "title": "DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models",
    458       "relevance": "Source of the GRPO algorithm used for GSPR's RL alignment stage"
    459     },
    460     {
    461       "title": "BeaverTails: Towards Improved Safety Alignment of LLM via a Human-Preference Dataset",
    462       "relevance": "Training and evaluation dataset with 14 harm categories and 333K QA samples"
    463     },
    464     {
    465       "title": "PKU-SafeRLHF: Towards Multi-Level Safety Alignment for LLMs with Human Preference",
    466       "relevance": "Training and evaluation dataset with 19 harm categories under 3 severity levels"
    467     },
    468     {
    469       "title": "ShieldGemma: Generative AI Content Moderation Based on Gemma",
    470       "relevance": "Open-source baseline guardrail with fixed 4-policy taxonomy"
    471     }
    472   ],
    473   "engagement_factors": {
    474     "practical_relevance": {
    475       "score": 2,
    476       "justification": "GSPR addresses a real production need (LLM content moderation) with efficient inference and flexible policy coverage, but code/weights aren't yet released limiting adoption."
    477     },
    478     "surprise_contrarian": {
    479       "score": 1,
    480       "justification": "The finding that flexible prompt templates alone (without category rewards) dramatically improve fine-grained category prediction vs RSafe is a somewhat counterintuitive result."
    481     },
    482     "fear_safety": {
    483       "score": 3,
    484       "justification": "Paper directly addresses LLM safety/content moderation with results showing most existing guardrails fail at fine-grained safety policy classification — a practical concern for deployed AI systems."
    485     },
    486     "drama_conflict": {
    487       "score": 1,
    488       "justification": "RSafe's dramatic failure with 25% language mixing on Qwen3 vs near-0% for GSPR provides a concrete demonstration of prior work fragility across base models."
    489     },
    490     "demo_ability": {
    491       "score": 1,
    492       "justification": "Model weights and code promised as future open-source but not currently available, preventing live demonstrations."
    493     },
    494     "brand_recognition": {
    495       "score": 1,
    496       "justification": "HKUST and NUS are respected institutions but not top-tier AI labs; paper is an arXiv preprint without venue affiliation."
    497     }
    498   },
    499   "hn_data": {
    500     "threads": [
    501       {
    502         "hn_id": "44169594",
    503         "title": "Show HN: Cognee – Open-Source AI Memory Layer That Remembers Context",
    504         "points": 9,
    505         "comments": 2,
    506         "url": "https://news.ycombinator.com/item?id=44169594",
    507         "created_at": "2025-06-03T13:05:15Z"
    508       }
    509     ],
    510     "top_points": 9,
    511     "total_points": 9,
    512     "total_comments": 2
    513   }
    514 }

Impressum · Datenschutz