{ "rejected_claims": [ { "filename": "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md", "issues": [ "missing_attribution_extractor" ] }, { "filename": "interpretability-informed-alignment-assessment-first-planned-integration-into-formal-safety-thresholds.md", "issues": [ "missing_attribution_extractor" ] } ], "validation_stats": { "total": 2, "kept": 0, "fixed": 7, "rejected": 2, "fixes_applied": [ "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md:set_created:2026-03-26", "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md:stripped_wiki_link:voluntary-safety-pledges-cannot-survive-competitive-pressure", "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md:stripped_wiki_link:government-designation-of-safety-conscious-AI-labs-as-supply", "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md:stripped_wiki_link:Anthropics-RSP-rollback-under-commercial-pressure-is-the-fir", "interpretability-informed-alignment-assessment-first-planned-integration-into-formal-safety-thresholds.md:set_created:2026-03-26", "interpretability-informed-alignment-assessment-first-planned-integration-into-formal-safety-thresholds.md:stripped_wiki_link:formal-verification-of-AI-generated-proofs-provides-scalable", "interpretability-informed-alignment-assessment-first-planned-integration-into-formal-safety-thresholds.md:stripped_wiki_link:an-aligned-seeming-AI-may-be-strategically-deceptive-because" ], "rejections": [ "rsp-v3-weakens-binding-commitments-while-adding-transparency-infrastructure.md:missing_attribution_extractor", "interpretability-informed-alignment-assessment-first-planned-integration-into-formal-safety-thresholds.md:missing_attribution_extractor" ] }, "model": "anthropic/claude-sonnet-4.5", "date": "2026-03-26" }