teleo-codex/inbox/archive/.extraction-debug/2025-00-00-em-dpo-heterogeneous-preferences.json
Teleo Agents f44d100882 extract: 2025-00-00-em-dpo-heterogeneous-preferences
Pentagon-Agent: Ganymede <F99EBFA6-547B-4096-BEEA-1D59C3E4028A>
2026-03-16 14:02:09 +00:00

38 lines
No EOL
2.5 KiB
JSON

{
"rejected_claims": [
{
"filename": "binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md",
"issues": [
"missing_attribution_extractor"
]
},
{
"filename": "em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md",
"issues": [
"missing_attribution_extractor"
]
}
],
"validation_stats": {
"total": 2,
"kept": 0,
"fixed": 8,
"rejected": 2,
"fixes_applied": [
"binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md:set_created:2026-03-16",
"binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md:stripped_wiki_link:single-reward-rlhf-cannot-align-diverse-preferences-because-",
"binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md:stripped_wiki_link:rlhf-is-implicit-social-choice-without-normative-scrutiny.md",
"binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md:stripped_wiki_link:modeling preference sensitivity as a learned distribution ra",
"em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md:set_created:2026-03-16",
"em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md:stripped_wiki_link:pluralistic alignment must accommodate irreducibly diverse v",
"em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md:stripped_wiki_link:maxmin-rlhf-applies-egalitarian-social-choice-to-alignment-b",
"em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md:stripped_wiki_link:minority-preference-alignment-improves-33-percent-without-ma"
],
"rejections": [
"binary-preference-comparisons-cannot-identify-latent-preference-types-requiring-rankings-over-three-plus-responses.md:missing_attribution_extractor",
"em-algorithm-discovers-latent-preference-subpopulations-enabling-ensemble-alignment-without-demographic-labels.md:missing_attribution_extractor"
]
},
"model": "anthropic/claude-sonnet-4.5",
"date": "2026-03-16"
}