hack-ink · yvette-carlisle · Jun 11, 2026 · Jun 11, 2026 · Jun 11, 2026 · Jun 11, 2026
diff --git a/Makefile.toml b/Makefile.toml
@@ -428,6 +428,9 @@ args = [
 # | real-world-memory-production-ops        | composite |     |
 # | real-world-memory-production-ops-json   | command   |     |
 # | real-world-memory-production-ops-report | command   |     |
+# | real-world-memory-core-archival         | composite |     |
+# | real-world-memory-core-archival-json    | command   |     |
+# | real-world-memory-core-archival-report  | command   |     |
 # | real-world-memory-live-adapters         | command   |     |
 
 [tasks.real-world-job-smoke]
@@ -824,6 +827,55 @@ args = [
 	"tmp/real-world-memory/consolidation/report.md",
 ]
 
+[tasks.real-world-memory-core-archival]
+workspace = false
+dependencies = [
+	"real-world-memory-core-archival-report",
+]
+
+[tasks.real-world-memory-core-archival-json]
+workspace = false
+command = "cargo"
+args = [
+	"run",
+	"-p",
+	"elf-eval",
+	"--bin",
+	"real_world_job_benchmark",
+	"--",
+	"run",
+	"--fixtures",
+	"apps/elf-eval/fixtures/real_world_memory/core_archival_memory",
+	"--out",
+	"tmp/real-world-memory/core-archival/report.json",
+	"--run-id",
+	"real-world-memory-core-archival",
+	"--adapter-id",
+	"fixture_core_archival_memory",
+	"--adapter-name",
+	"ELF core and archival memory fixture",
+]
+
+[tasks.real-world-memory-core-archival-report]
+workspace = false
+dependencies = [
+	"real-world-memory-core-archival-json",
+]
+command = "cargo"
+args = [
+	"run",
+	"-p",
+	"elf-eval",
+	"--bin",
+	"real_world_job_benchmark",
+	"--",
+	"publish",
+	"--report",
+	"tmp/real-world-memory/core-archival/report.json",
+	"--out",
+	"tmp/real-world-memory/core-archival/report.md",
+]
+
 [tasks.real-world-memory-live-adapters]
 workspace = false
 command = "bash"

diff --git a/README.md b/README.md
@@ -145,15 +145,22 @@ provider-backed ELF evidence was required.
   rebuild returned `rebuilt_count=1`, `missing_vector_count=0`, `error_count=0`, and
   search recovered the restored note.
 - Fresh all-project smoke run: ELF and qmd passed every encoded check. agentmemory
-  passed same-corpus retrieval but failed lifecycle/cold-start coverage. memsearch,
-  mem0, OpenViking, and claude-mem remained typed non-pass states. OpenViking now
-  reaches its pinned Docker local embedding path and is reported as `wrong_result`
-  when same-corpus evidence terms are missed; setup failures remain `incomplete`.
-- Real-world agent memory aggregate after XY-928: 43 fixture-backed jobs across
-  12 suites, 38 pass, 0 incomplete, 5 blocked, 0 wrong-result, 0 not-encoded, and
-  0 unsupported-claim results. The remaining non-pass jobs are production-ops
-  operator boundaries plus blocked OpenViking staged trajectory, hierarchy selection,
-  and recursive/context expansion measurement gates, not hidden benchmark wins.
+  passed same-corpus retrieval but failed lifecycle/cold-start coverage. mem0/OpenMemory
+  and memsearch now pass their scoped local baseline smokes, while OpenMemory
+  UI/export, hosted mem0 Platform, optional graph memory, and broader memsearch prompt
+  and TTL coverage remain blocked, unsupported, or not encoded. OpenViking now reaches
+  its pinned Docker local embedding path and is reported as `wrong_result` when
+  same-corpus evidence terms are missed; claude-mem and OpenViking non-retrieval
+  coverage remain typed non-pass states.
+- Real-world agent memory aggregate after XY-927 and XY-928: 49 fixture-backed
+  jobs across 13 suites, 44 pass, 0 incomplete, 5 blocked, 0 wrong-result,
+  0 not-encoded, and 0 unsupported-claim results. The remaining non-pass jobs are
+  production-ops operator boundaries plus blocked OpenViking staged trajectory,
+  hierarchy selection, and recursive/context expansion measurement gates, not
+  hidden benchmark wins. The new `core_archival_memory` suite passes 6 fixture
+  jobs for core block attachment, scope, provenance, stale-core detection,
+  archival fallback, and project-decision recovery; it does not create an
+  ELF-over-Letta claim.
 - Full-suite live real-world adapter sweep after XY-899: ELF and qmd emit
   Docker-isolated `live_real_world` records for all 40 encoded jobs across 11 suites
   through `cargo make real-world-memory-live-adapters`. Both keep the original

diff --git a/apps/elf-eval/fixtures/real_world_external_adapters/memory_projects_manifest.json b/apps/elf-eval/fixtures/real_world_external_adapters/memory_projects_manifest.json
@@ -29,7 +29,7 @@
       },
       "run": {
         "status": "blocked",
-        "evidence": "The current fixture set reports 43 jobs, 38 pass, 0 incomplete, 5 blocked, 0 wrong_result, 0 not_encoded, and 0 unsupported_claim.",
+        "evidence": "The current fixture set reports 49 jobs across 13 suites: 44 pass, 0 incomplete, 5 blocked, 0 wrong_result, 0 not_encoded, and 0 unsupported_claim. The six core_archival_memory jobs pass as ELF fixture evidence, not as live Letta comparison evidence; context_trajectory remains blocked behind OpenViking staged-artifact materialization.",
         "command": "cargo make real-world-memory",
         "artifact": "tmp/real-world-memory/real-world-memory-report.json"
       },
@@ -101,6 +101,11 @@
           "status": "pass",
           "evidence": "Four redaction, exclusion, source-id, evidence-binding, and capture-boundary fixtures are encoded and passing."
         },
+        {
+          "suite_id": "core_archival_memory",
+          "status": "pass",
+          "evidence": "Six fixture jobs score core block attachment, scope, provenance, stale-core detection, archival fallback, and project-decision recovery separately from archival note search."
+        },
         {
           "suite_id": "production_ops",
           "status": "blocked",
@@ -2212,24 +2217,24 @@
       "evidence_class": "research_gate",
       "docker_default": true,
       "host_global_installs_required": false,
-      "overall_status": "not_encoded",
+      "overall_status": "blocked",
       "setup": {
-        "status": "not_encoded",
-        "evidence": "Letta is D1 reviewed as a core/archival memory reference, but no Docker real_world_job adapter is implemented."
+        "status": "blocked",
+        "evidence": "Letta is D1 reviewed as a core/archival memory reference. The contained comparison contract is a Docker-only benchmark-created agent export that must return core block JSON, archival search readback, and source ids before any scenario claim is scored."
       },
       "run": {
         "status": "not_encoded",
-        "evidence": "No Letta core block, archival memory, or shared-memory job is encoded."
+        "evidence": "No Letta materializer currently creates the benchmark agent, imports the ELF core_archival_memory fixture corpus, or exports comparable core and archival evidence."
       },
       "result": {
         "status": "not_encoded",
-        "evidence": "No Letta personalization or project-decision suite result is claimed."
+        "evidence": "No Letta core block, archival fallback, stale-core, scope, provenance, or project-decision result is claimed."
       },
       "capabilities": [
         {
           "capability": "core_archival_memory",
-          "status": "not_encoded",
-          "evidence": "Core blocks and archival memory are reference semantics but not scored."
+          "status": "blocked",
+          "evidence": "ELF fixture jobs now score core block attachment, scope, provenance, stale-core detection, archival fallback, and project-decision recovery separately from archival note search; Letta remains blocked until its export maps equivalent source ids."
         },
         {
           "capability": "docker_embedding_configuration",
@@ -2257,6 +2262,67 @@
           "suite_id": "work_resume",
           "status": "not_encoded",
           "evidence": "Agent resumption through Letta memory blocks is not encoded."
+        },
+        {
+          "suite_id": "core_archival_memory",
+          "status": "blocked",
+          "evidence": "ELF fixture coverage exists, but Letta has no contained export/readback artifact for the same core-vs-archival jobs."
+        }
+      ],
+      "scenarios": [
+        {
+          "scenario_id": "core_block_attachment_readback",
+          "suite_id": "core_archival_memory",
+          "status": "not_encoded",
+          "elf_position": "untested",
+          "comparison_outcome": "not_tested",
+          "evidence": "ELF fixture core-archival-core-block-attachment-001 scores exact core block attachment and keeps core readback out of Qdrant-backed archival search. Letta has no comparable exported core block attachment evidence.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/core_block_attachment.json"
+        },
+        {
+          "scenario_id": "core_block_scope_readback",
+          "suite_id": "core_archival_memory",
+          "status": "not_encoded",
+          "elf_position": "untested",
+          "comparison_outcome": "not_tested",
+          "evidence": "ELF fixture core-archival-core-block-scope-001 scores read_profile, shared scope, and private-owner boundaries. Letta scope behavior remains unscored without a contained export of agent, block, and visibility metadata.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/core_block_scope.json"
+        },
+        {
+          "scenario_id": "core_block_provenance_readback",
+          "suite_id": "core_archival_memory",
+          "status": "not_encoded",
+          "elf_position": "untested",
+          "comparison_outcome": "not_tested",
+          "evidence": "ELF fixture core-archival-core-block-provenance-001 scores source_ref and audit_history readback. Letta provenance remains not_tested until exported core memory includes stable source ids and audit-equivalent events.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/core_block_provenance.json"
+        },
+        {
+          "scenario_id": "stale_core_detection",
+          "suite_id": "core_archival_memory",
+          "status": "blocked",
+          "elf_position": "untested",
+          "comparison_outcome": "blocked",
+          "evidence": "ELF fixture core-archival-stale-core-detection-001 scores archival evidence superseding a stale core block. Letta stale-core comparison is blocked until core export and archival readback can be joined by source ids.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/stale_core_detection.json"
+        },
+        {
+          "scenario_id": "archival_fallback_readback",
+          "suite_id": "core_archival_memory",
+          "status": "blocked",
+          "elf_position": "untested",
+          "comparison_outcome": "blocked",
+          "evidence": "ELF fixture core-archival-archival-fallback-001 scores fallback from insufficient core memory to archival note search. Letta fallback comparison is blocked until archival search output can be exported with source ids.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/archival_fallback.json"
+        },
+        {
+          "scenario_id": "core_archival_project_decision_recovery",
+          "suite_id": "core_archival_memory",
+          "status": "not_encoded",
+          "elf_position": "untested",
+          "comparison_outcome": "not_tested",
+          "evidence": "ELF fixture core-archival-project-decision-recovery-001 scores core routing plus archival decision rationale. Letta project-decision recovery remains not_tested until the contained export/readback contract exists.",
+          "artifact": "apps/elf-eval/fixtures/real_world_memory/core_archival_memory/project_decision_recovery.json"
         }
       ],
       "evidence": [
@@ -2284,14 +2350,15 @@
             "evidence": "Official Docker deployment guide and embedding configuration boundary."
           }
         ],
-        "setup_path": "Define Docker server setup, embedding model configuration, and a core/archival memory fixture flow.",
-        "runtime_boundary": "Docker-only Letta server or CLI flow with benchmark-created agents and no host-global state.",
-        "resource_expectation": "Embedding model and agent server state must be explicit; record storage and provider boundaries.",
+        "setup_path": "Use a Docker-only Letta server or CLI flow that creates a benchmark-owned agent, loads the checked-in core_archival_memory fixture corpus, writes core memory and archival memory with fixture source ids, then exports core block JSON plus archival search/readback JSON.",
+        "runtime_boundary": "Docker-only Letta server or CLI flow with benchmark-created agents, benchmark-owned storage, no host-global state, and no unstated hosted service dependency.",
+        "resource_expectation": "Embedding model, agent server state, exported core memory, archival search output, and provider boundaries must be explicit in the artifact.",
         "retry_guidance": [
-          "Create a tiny Docker agent with archival memory search.",
-          "Score core-versus-archival retrieval only after source evidence can be exported."
+          "Create a tiny Docker agent with core memory and archival memory loaded from the ELF core_archival_memory fixtures.",
+          "Export core block readback, archival search results, source ids, and any audit-equivalent metadata as JSON before scoring.",
+          "Score core-versus-archival scenarios only after source evidence can be exported and mapped to the fixture evidence ids."
         ],
-        "research_depth": "D1 feasibility verdict: research_only (XY-882); core/archival reference, adapter not encoded"
+        "research_depth": "D1 feasibility verdict: research_only (XY-882); XY-927 selects the contained export/readback contract, but the Letta adapter remains blocked until that artifact exists"
       }
     },
     {