diff --git a/inbox/queue/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md b/inbox/archive/ai-alignment/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md
similarity index 97%
rename from inbox/queue/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md
rename to inbox/archive/ai-alignment/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md
index 3d2a1107e..dbde2dbea 100644
--- a/inbox/queue/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md
+++ b/inbox/archive/ai-alignment/2025-07-00-nguyen-probing-evaluation-awareness-earlier-layers.md
@@ -7,9 +7,12 @@ date: 2025-07-01
 domain: ai-alignment
 secondary_domains: []
 format: paper
-status: unprocessed
+status: processed
+processed_by: theseus
+processed_date: 2026-04-21
 priority: medium
 tags: [evaluation-awareness, linear-probing, interpretability, safety-evaluation, ERI, activations]
+extraction_model: "anthropic/claude-sonnet-4.5"
 ---
 
 ## Content