teleo-codex/inbox/queue/.extraction-debug/2026-03-25-aisi-replibench-methodology-component-tasks-simulated.json
Teleo Agents e855a6d7a6 extract: 2026-03-25-aisi-replibench-methodology-component-tasks-simulated
Pentagon-Agent: Epimetheus <3D35839A-7722-4740-B93D-51157F7D5E70>
2026-03-25 00:16:53 +00:00

32 lines
No EOL
1.2 KiB
JSON

{
"rejected_claims": [
{
"filename": "replibench-measures-component-tasks-in-simulated-environments-not-operational-self-replication.md",
"issues": [
"missing_attribution_extractor"
]
},
{
"filename": "evaluation-awareness-causes-models-to-refuse-simulated-tasks-creating-bidirectional-capability-uncertainty.md",
"issues": [
"missing_attribution_extractor"
]
}
],
"validation_stats": {
"total": 2,
"kept": 0,
"fixed": 2,
"rejected": 2,
"fixes_applied": [
"replibench-measures-component-tasks-in-simulated-environments-not-operational-self-replication.md:set_created:2026-03-25",
"evaluation-awareness-causes-models-to-refuse-simulated-tasks-creating-bidirectional-capability-uncertainty.md:set_created:2026-03-25"
],
"rejections": [
"replibench-measures-component-tasks-in-simulated-environments-not-operational-self-replication.md:missing_attribution_extractor",
"evaluation-awareness-causes-models-to-refuse-simulated-tasks-creating-bidirectional-capability-uncertainty.md:missing_attribution_extractor"
]
},
"model": "anthropic/claude-sonnet-4.5",
"date": "2026-03-25"
}