From e2acc4dadfeb77d3c452edd0bb5e9c6c3ff749a9 Mon Sep 17 00:00:00 2001 From: Teleo Agents Date: Wed, 18 Mar 2026 09:17:57 +0000 Subject: [PATCH 1/2] extract: 2024-12-01-vaccaro-human-ai-combinations-meta-analysis Pentagon-Agent: Epimetheus <968B2991-E2DF-4006-B962-F5B0A0CC8ACA> --- ...o-human-ai-combinations-meta-analysis.json | 35 +++++++++++++++++++ ...aro-human-ai-combinations-meta-analysis.md | 15 +++++++- 2 files changed, 49 insertions(+), 1 deletion(-) create mode 100644 inbox/archive/.extraction-debug/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.json diff --git a/inbox/archive/.extraction-debug/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.json b/inbox/archive/.extraction-debug/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.json new file mode 100644 index 00000000..3a83e179 --- /dev/null +++ b/inbox/archive/.extraction-debug/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.json @@ -0,0 +1,35 @@ +{ + "rejected_claims": [ + { + "filename": "human-ai-teams-underperform-best-individual-performer-on-average.md", + "issues": [ + "missing_attribution_extractor" + ] + }, + { + "filename": "decision-tasks-versus-content-creation-determines-human-ai-combination-value.md", + "issues": [ + "missing_attribution_extractor" + ] + } + ], + "validation_stats": { + "total": 2, + "kept": 0, + "fixed": 5, + "rejected": 2, + "fixes_applied": [ + "human-ai-teams-underperform-best-individual-performer-on-average.md:set_created:2026-03-18", + "human-ai-teams-underperform-best-individual-performer-on-average.md:stripped_wiki_link:centaur-teams-succeed-only-when-role-boundaries-prevent-huma", + "human-ai-teams-underperform-best-individual-performer-on-average.md:stripped_wiki_link:economic-forces-push-humans-out-of-every-cognitive-loop-wher", + "decision-tasks-versus-content-creation-determines-human-ai-combination-value.md:set_created:2026-03-18", + "decision-tasks-versus-content-creation-determines-human-ai-combination-value.md:stripped_wiki_link:economic-forces-push-humans-out-of-every-cognitive-loop-wher" + ], + "rejections": [ + "human-ai-teams-underperform-best-individual-performer-on-average.md:missing_attribution_extractor", + "decision-tasks-versus-content-creation-determines-human-ai-combination-value.md:missing_attribution_extractor" + ] + }, + "model": "anthropic/claude-sonnet-4.5", + "date": "2026-03-18" +} \ No newline at end of file diff --git a/inbox/archive/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.md b/inbox/archive/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.md index c219ce1b..fa6eb996 100644 --- a/inbox/archive/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.md +++ b/inbox/archive/2024-12-01-vaccaro-human-ai-combinations-meta-analysis.md @@ -7,10 +7,14 @@ date: 2024-12-01 domain: ai-alignment secondary_domains: [collective-intelligence] format: paper -status: unprocessed +status: null-result priority: high triage_tag: claim tags: [human-ai-teams, meta-analysis, decision-making, content-creation, oversight, performance] +processed_by: theseus +processed_date: 2026-03-18 +extraction_model: "anthropic/claude-sonnet-4.5" +extraction_notes: "LLM returned 2 claims, 2 rejected by validator" --- ## Content @@ -40,3 +44,12 @@ Systematic review and meta-analysis of 106 experimental studies reporting 370 ef ## Curator Notes PRIMARY CONNECTION: centaur team performance depends on role complementarity not mere human-AI combination WHY ARCHIVED: This is the strongest empirical evidence (370 effect sizes, Nature HB) that human-AI combination is NOT automatically beneficial — it depends on relative capability and task type. Directly relevant to the automation overshoot question. + + +## Key Facts +- Meta-analysis covered 106 experimental studies published between January 2020 and June 2023 +- 370 effect sizes were analyzed across the studies +- Overall effect size: Hedges' g = -0.23 (95% CI: -0.39 to -0.07) +- Published in Nature Human Behaviour, December 2024 +- Task types showing losses: deepfake classification, demand forecasting, medical diagnosis +- Task types showing gains: summarizing social media, chatbot responses, generating new content -- 2.45.2 From 73c69b08c919f26f9a5e301715cd71ab97611442 Mon Sep 17 00:00:00 2001 From: Teleo Agents Date: Wed, 18 Mar 2026 09:18:48 +0000 Subject: [PATCH 2/2] extract: 2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct Pentagon-Agent: Epimetheus <968B2991-E2DF-4006-B962-F5B0A0CC8ACA> --- ...-economics-health-nudges-defaults-rct.json | 34 +++++++++++++++++++ ...al-economics-health-nudges-defaults-rct.md | 14 +++++++- 2 files changed, 47 insertions(+), 1 deletion(-) create mode 100644 inbox/archive/.extraction-debug/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.json diff --git a/inbox/archive/.extraction-debug/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.json b/inbox/archive/.extraction-debug/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.json new file mode 100644 index 00000000..6c0059b2 --- /dev/null +++ b/inbox/archive/.extraction-debug/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.json @@ -0,0 +1,34 @@ +{ + "rejected_claims": [ + { + "filename": "ehr-default-effects-are-highest-leverage-behavioral-health-intervention-because-they-scale-at-near-zero-marginal-cost-and-reduce-disparities.md", + "issues": [ + "missing_attribution_extractor" + ] + }, + { + "filename": "healthcare-appointments-function-as-effective-commitment-devices-doubling-testing-rates-among-patients-with-self-control-problems.md", + "issues": [ + "missing_attribution_extractor" + ] + } + ], + "validation_stats": { + "total": 2, + "kept": 0, + "fixed": 4, + "rejected": 2, + "fixes_applied": [ + "ehr-default-effects-are-highest-leverage-behavioral-health-intervention-because-they-scale-at-near-zero-marginal-cost-and-reduce-disparities.md:set_created:2026-03-18", + "ehr-default-effects-are-highest-leverage-behavioral-health-intervention-because-they-scale-at-near-zero-marginal-cost-and-reduce-disparities.md:stripped_wiki_link:SDOH interventions show strong ROI but adoption stalls becau", + "ehr-default-effects-are-highest-leverage-behavioral-health-intervention-because-they-scale-at-near-zero-marginal-cost-and-reduce-disparities.md:stripped_wiki_link:medical care explains only 10 20 percent of health outcomes ", + "healthcare-appointments-function-as-effective-commitment-devices-doubling-testing-rates-among-patients-with-self-control-problems.md:set_created:2026-03-18" + ], + "rejections": [ + "ehr-default-effects-are-highest-leverage-behavioral-health-intervention-because-they-scale-at-near-zero-marginal-cost-and-reduce-disparities.md:missing_attribution_extractor", + "healthcare-appointments-function-as-effective-commitment-devices-doubling-testing-rates-among-patients-with-self-control-problems.md:missing_attribution_extractor" + ] + }, + "model": "anthropic/claude-sonnet-4.5", + "date": "2026-03-18" +} \ No newline at end of file diff --git a/inbox/archive/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.md b/inbox/archive/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.md index f9c67c61..6ca43bb2 100644 --- a/inbox/archive/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.md +++ b/inbox/archive/2025-01-01-chibe-behavioral-economics-health-nudges-defaults-rct.md @@ -7,11 +7,15 @@ date: 2025-01-01 domain: health secondary_domains: [] format: report -status: unprocessed +status: null-result priority: medium triage_tag: claim tags: [behavioral-economics, nudges, default-effects, medication-adherence, health-disparities, EHR] flagged_for_rio: ["Behavioral economics mechanisms (commitment devices, default effects) are directly relevant to mechanism design in health contexts"] +processed_by: vida +processed_date: 2026-03-18 +extraction_model: "anthropic/claude-sonnet-4.5" +extraction_notes: "LLM returned 2 claims, 2 rejected by validator" --- ## Content @@ -58,3 +62,11 @@ Additional context: ## Curator Notes PRIMARY CONNECTION: healthcare is a complex adaptive system requiring simple enabling rules not complicated management because standardized processes erode the clinical autonomy needed for value creation WHY ARCHIVED: Default effects are the "simple enabling rules" the complex adaptive system claim describes. The CHIBE evidence makes this concrete: change the EHR default → change prescribing behavior → reduce disparities. This is the behavioral economics bridge between the KB's structural claims and operational interventions. + + +## Key Facts +- CHIBE had $49M in total grant activity in FY2025 +- Penn Medicine Healthy Heart trial enrolled 2,000 patients in West/Southwest Philadelphia and Lancaster County (2024-2025) +- Opioid prescribing guidelines adherence increased from 57.2% to 71.8% with peer comparison + patient-reported outcomes feedback +- Game-based physical activity intervention increased step counts by 1,700 steps/day (equivalent to 70+ miles over intervention period) +- Penn Medicine is now funding scaled implementation of automated pharmacy referral program that increased statin prescribing -- 2.45.2