{ "rejected_claims": [ { "filename": "noise-injection-detects-sandbagging-through-asymmetric-performance-response.md", "issues": [ "missing_attribution_extractor" ] }, { "filename": "noise-injection-sandbagging-detection-requires-white-box-access.md", "issues": [ "missing_attribution_extractor" ] } ], "validation_stats": { "total": 2, "kept": 0, "fixed": 6, "rejected": 2, "fixes_applied": [ "noise-injection-detects-sandbagging-through-asymmetric-performance-response.md:set_created:2026-03-27", "noise-injection-detects-sandbagging-through-asymmetric-performance-response.md:stripped_wiki_link:pre-deployment-AI-evaluations-do-not-predict-real-world-risk", "noise-injection-detects-sandbagging-through-asymmetric-performance-response.md:stripped_wiki_link:AI-models-distinguish-testing-from-deployment-environments-p", "noise-injection-sandbagging-detection-requires-white-box-access.md:set_created:2026-03-27", "noise-injection-sandbagging-detection-requires-white-box-access.md:stripped_wiki_link:pre-deployment-AI-evaluations-do-not-predict-real-world-risk", "noise-injection-sandbagging-detection-requires-white-box-access.md:stripped_wiki_link:compute export controls are the most impactful AI governance" ], "rejections": [ "noise-injection-detects-sandbagging-through-asymmetric-performance-response.md:missing_attribution_extractor", "noise-injection-sandbagging-detection-requires-white-box-access.md:missing_attribution_extractor" ] }, "model": "anthropic/claude-sonnet-4.5", "date": "2026-03-27" }