diff --git a/inbox/queue/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md b/inbox/archive/ai-alignment/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md similarity index 97% rename from inbox/queue/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md rename to inbox/archive/ai-alignment/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md index c32bfb38..0e254a9c 100644 --- a/inbox/queue/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md +++ b/inbox/archive/ai-alignment/2026-04-02-deepmind-negative-sae-results-pragmatic-interpretability.md @@ -7,9 +7,12 @@ date: 2025-06-01 domain: ai-alignment secondary_domains: [] format: institutional-blog-post -status: unprocessed +status: processed +processed_by: theseus +processed_date: 2026-04-02 priority: high tags: [sparse-autoencoders, mechanistic-interpretability, deepmind, harmful-intent-detection, pragmatic-interpretability, negative-results] +extraction_model: "anthropic/claude-sonnet-4.5" --- ## Content