npm - @vellumai/assistant - Versions diffs - 0.4.49 → 0.4.50 - Mend

@vellumai/assistant 0.4.49 → 0.4.50

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (239) hide show

package/ARCHITECTURE.md +24 -33
package/README.md +3 -3
package/docs/architecture/memory.md +180 -119
package/package.json +2 -2
package/src/__tests__/agent-loop.test.ts +3 -1
package/src/__tests__/anthropic-provider.test.ts +114 -23
package/src/__tests__/approval-cascade.test.ts +1 -15
package/src/__tests__/approval-routes-http.test.ts +2 -0
package/src/__tests__/assistant-feature-flag-guard.test.ts +0 -23
package/src/__tests__/canonical-guardian-store.test.ts +95 -0
package/src/__tests__/checker.test.ts +13 -0
package/src/__tests__/config-schema.test.ts +1 -68
package/src/__tests__/context-memory-e2e.test.ts +11 -100
package/src/__tests__/conversation-routes-guardian-reply.test.ts +8 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +1 -0
package/src/__tests__/credential-security-e2e.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +4 -0
package/src/__tests__/credential-vault.test.ts +13 -1
package/src/__tests__/cu-unified-flow.test.ts +532 -0
package/src/__tests__/date-context.test.ts +93 -77
package/src/__tests__/deterministic-verification-control-plane.test.ts +64 -0
package/src/__tests__/guardian-routing-invariants.test.ts +93 -0
package/src/__tests__/history-repair.test.ts +245 -0
package/src/__tests__/host-cu-proxy.test.ts +165 -3
package/src/__tests__/http-user-message-parity.test.ts +1 -0
package/src/__tests__/invite-redemption-service.test.ts +65 -1
package/src/__tests__/keychain-broker-client.test.ts +4 -4
package/src/__tests__/memory-context-benchmark.benchmark.test.ts +56 -18
package/src/__tests__/memory-lifecycle-e2e.test.ts +244 -387
package/src/__tests__/memory-recall-quality.test.ts +244 -407
package/src/__tests__/memory-regressions.experimental.test.ts +126 -101
package/src/__tests__/memory-regressions.test.ts +477 -2841
package/src/__tests__/memory-retrieval.benchmark.test.ts +33 -150
package/src/__tests__/memory-upsert-concurrency.test.ts +5 -244
package/src/__tests__/mime-builder.test.ts +28 -0
package/src/__tests__/native-web-search.test.ts +1 -0
package/src/__tests__/oauth-cli.test.ts +572 -5
package/src/__tests__/oauth-store.test.ts +120 -6
package/src/__tests__/qdrant-collection-migration.test.ts +53 -8
package/src/__tests__/registry.test.ts +0 -1
package/src/__tests__/relay-server.test.ts +46 -1
package/src/__tests__/schedule-tools.test.ts +32 -0
package/src/__tests__/script-proxy-certs.test.ts +1 -1
package/src/__tests__/secret-onetime-send.test.ts +1 -0
package/src/__tests__/secure-keys.test.ts +7 -2
package/src/__tests__/send-endpoint-busy.test.ts +3 -0
package/src/__tests__/session-abort-tool-results.test.ts +1 -14
package/src/__tests__/session-agent-loop-overflow.test.ts +1583 -0
package/src/__tests__/session-agent-loop.test.ts +19 -15
package/src/__tests__/session-confirmation-signals.test.ts +1 -15
package/src/__tests__/session-error.test.ts +124 -2
package/src/__tests__/session-history-web-search.test.ts +918 -0
package/src/__tests__/session-pre-run-repair.test.ts +1 -14
package/src/__tests__/session-provider-retry-repair.test.ts +25 -28
package/src/__tests__/session-queue.test.ts +37 -27
package/src/__tests__/session-runtime-assembly.test.ts +54 -0
package/src/__tests__/session-slash-known.test.ts +1 -15
package/src/__tests__/session-slash-queue.test.ts +1 -15
package/src/__tests__/session-slash-unknown.test.ts +1 -15
package/src/__tests__/session-workspace-cache-state.test.ts +3 -33
package/src/__tests__/session-workspace-injection.test.ts +3 -37
package/src/__tests__/session-workspace-tool-tracking.test.ts +3 -37
package/src/__tests__/skills-install-extract.test.ts +93 -0
package/src/__tests__/skillssh-registry.test.ts +451 -0
package/src/__tests__/trust-store.test.ts +15 -0
package/src/__tests__/voice-invite-redemption.test.ts +32 -1
package/src/agent/ax-tree-compaction.test.ts +51 -0
package/src/agent/loop.ts +39 -12
package/src/approvals/AGENTS.md +1 -1
package/src/approvals/guardian-request-resolvers.ts +14 -2
package/src/bundler/compiler-tools.ts +66 -2
package/src/calls/call-domain.ts +132 -0
package/src/calls/call-store.ts +6 -0
package/src/calls/relay-server.ts +43 -5
package/src/calls/relay-setup-router.ts +17 -1
package/src/calls/twilio-config.ts +1 -1
package/src/calls/types.ts +3 -1
package/src/cli/commands/doctor.ts +4 -3
package/src/cli/commands/mcp.ts +46 -59
package/src/cli/commands/memory.ts +16 -165
package/src/cli/commands/oauth/apps.ts +31 -2
package/src/cli/commands/oauth/connections.ts +431 -97
package/src/cli/commands/oauth/providers.ts +15 -1
package/src/cli/commands/sessions.ts +5 -2
package/src/cli/commands/skills.ts +173 -1
package/src/cli/http-client.ts +0 -20
package/src/cli/main-screen.tsx +2 -2
package/src/cli/program.ts +5 -6
package/src/cli.ts +4 -10
package/src/config/bundled-skills/computer-use/TOOLS.json +1 -1
package/src/config/bundled-skills/computer-use/tools/computer-use-observe.ts +12 -0
package/src/config/bundled-tool-registry.ts +2 -5
package/src/config/schema.ts +1 -12
package/src/config/schemas/memory-lifecycle.ts +0 -9
package/src/config/schemas/memory-processing.ts +0 -180
package/src/config/schemas/memory-retrieval.ts +32 -104
package/src/config/schemas/memory.ts +0 -10
package/src/config/types.ts +0 -4
package/src/context/window-manager.ts +4 -1
package/src/daemon/config-watcher.ts +61 -3
package/src/daemon/daemon-control.ts +1 -1
package/src/daemon/date-context.ts +114 -31
package/src/daemon/handlers/sessions.ts +18 -13
package/src/daemon/handlers/skills.ts +20 -1
package/src/daemon/history-repair.ts +72 -8
package/src/daemon/host-cu-proxy.ts +55 -26
package/src/daemon/lifecycle.ts +31 -3
package/src/daemon/mcp-reload-service.ts +2 -2
package/src/daemon/message-types/computer-use.ts +1 -12
package/src/daemon/message-types/memory.ts +4 -16
package/src/daemon/message-types/messages.ts +1 -0
package/src/daemon/message-types/sessions.ts +4 -0
package/src/daemon/server.ts +12 -1
package/src/daemon/session-agent-loop-handlers.ts +38 -0
package/src/daemon/session-agent-loop.ts +334 -48
package/src/daemon/session-error.ts +89 -6
package/src/daemon/session-history.ts +17 -7
package/src/daemon/session-media-retry.ts +6 -2
package/src/daemon/session-memory.ts +69 -149
package/src/daemon/session-process.ts +10 -1
package/src/daemon/session-runtime-assembly.ts +49 -19
package/src/daemon/session-surfaces.ts +4 -1
package/src/daemon/session-tool-setup.ts +7 -1
package/src/daemon/session.ts +12 -2
package/src/instrument.ts +61 -1
package/src/memory/admin.ts +2 -191
package/src/memory/canonical-guardian-store.ts +38 -2
package/src/memory/conversation-crud.ts +0 -33
package/src/memory/conversation-queries.ts +22 -3
package/src/memory/db-init.ts +28 -0
package/src/memory/embedding-backend.ts +84 -8
package/src/memory/embedding-types.ts +9 -1
package/src/memory/indexer.ts +7 -46
package/src/memory/items-extractor.ts +274 -76
package/src/memory/job-handlers/backfill.ts +2 -127
package/src/memory/job-handlers/cleanup.ts +2 -16
package/src/memory/job-handlers/extraction.ts +2 -138
package/src/memory/job-handlers/index-maintenance.ts +1 -6
package/src/memory/job-handlers/summarization.ts +3 -148
package/src/memory/job-utils.ts +21 -59
package/src/memory/jobs-store.ts +1 -159
package/src/memory/jobs-worker.ts +9 -52
package/src/memory/migrations/104-core-indexes.ts +3 -3
package/src/memory/migrations/149-oauth-tables.ts +2 -0
package/src/memory/migrations/150-oauth-apps-client-secret-path.ts +98 -0
package/src/memory/migrations/151-oauth-providers-ping-url.ts +11 -0
package/src/memory/migrations/152-memory-item-supersession.ts +44 -0
package/src/memory/migrations/153-drop-entity-tables.ts +15 -0
package/src/memory/migrations/154-drop-fts.ts +20 -0
package/src/memory/migrations/155-drop-conflicts.ts +7 -0
package/src/memory/migrations/156-call-session-invite-metadata.ts +24 -0
package/src/memory/migrations/index.ts +7 -0
package/src/memory/qdrant-client.ts +148 -51
package/src/memory/raw-query.ts +1 -1
package/src/memory/retriever.test.ts +294 -273
package/src/memory/retriever.ts +421 -645
package/src/memory/schema/calls.ts +2 -0
package/src/memory/schema/memory-core.ts +3 -48
package/src/memory/schema/oauth.ts +2 -0
package/src/memory/search/formatting.ts +263 -176
package/src/memory/search/lexical.ts +1 -254
package/src/memory/search/ranking.ts +0 -455
package/src/memory/search/semantic.ts +100 -14
package/src/memory/search/staleness.ts +47 -0
package/src/memory/search/tier-classifier.ts +21 -0
package/src/memory/search/types.ts +15 -77
package/src/memory/task-memory-cleanup.ts +4 -6
package/src/messaging/providers/gmail/mime-builder.ts +17 -7
package/src/oauth/byo-connection.test.ts +8 -1
package/src/oauth/oauth-store.ts +113 -27
package/src/oauth/seed-providers.ts +6 -0
package/src/oauth/token-persistence.ts +11 -3
package/src/permissions/defaults.ts +1 -0
package/src/permissions/trust-store.ts +23 -1
package/src/playbooks/playbook-compiler.ts +1 -1
package/src/prompts/system-prompt.ts +18 -2
package/src/providers/anthropic/client.ts +56 -126
package/src/providers/types.ts +7 -1
package/src/runtime/AGENTS.md +9 -0
package/src/runtime/auth/route-policy.ts +6 -3
package/src/runtime/guardian-reply-router.ts +24 -22
package/src/runtime/http-server.ts +2 -2
package/src/runtime/invite-redemption-service.ts +19 -1
package/src/runtime/invite-service.ts +25 -0
package/src/runtime/pending-interactions.ts +2 -2
package/src/runtime/routes/brain-graph-routes.ts +10 -90
package/src/runtime/routes/conversation-routes.ts +9 -1
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +21 -12
package/src/runtime/routes/memory-item-routes.test.ts +754 -0
package/src/runtime/routes/memory-item-routes.ts +503 -0
package/src/runtime/routes/session-management-routes.ts +3 -3
package/src/runtime/routes/settings-routes.ts +2 -2
package/src/runtime/routes/trust-rules-routes.ts +14 -0
package/src/runtime/routes/workspace-routes.ts +2 -1
package/src/security/keychain-broker-client.ts +17 -4
package/src/security/secure-keys.ts +25 -3
package/src/security/token-manager.ts +36 -36
package/src/skills/catalog-install.ts +74 -18
package/src/skills/skillssh-registry.ts +503 -0
package/src/tools/assets/search.ts +5 -1
package/src/tools/computer-use/definitions.ts +0 -10
package/src/tools/computer-use/registry.ts +1 -1
package/src/tools/credentials/vault.ts +1 -3
package/src/tools/memory/definitions.ts +4 -13
package/src/tools/memory/handlers.test.ts +83 -103
package/src/tools/memory/handlers.ts +50 -85
package/src/tools/schedule/create.ts +8 -1
package/src/tools/schedule/update.ts +8 -1
package/src/tools/skills/load.ts +25 -2
package/src/__tests__/clarification-resolver.test.ts +0 -193
package/src/__tests__/conflict-intent-tokenization.test.ts +0 -160
package/src/__tests__/conflict-policy.test.ts +0 -269
package/src/__tests__/conflict-store.test.ts +0 -372
package/src/__tests__/contradiction-checker.test.ts +0 -361
package/src/__tests__/entity-extractor.test.ts +0 -211
package/src/__tests__/entity-search.test.ts +0 -1117
package/src/__tests__/profile-compiler.test.ts +0 -392
package/src/__tests__/session-conflict-gate.test.ts +0 -1228
package/src/__tests__/session-profile-injection.test.ts +0 -557
package/src/config/bundled-skills/knowledge-graph/SKILL.md +0 -25
package/src/config/bundled-skills/knowledge-graph/TOOLS.json +0 -66
package/src/config/bundled-skills/knowledge-graph/tools/graph-query.ts +0 -211
package/src/daemon/session-conflict-gate.ts +0 -167
package/src/daemon/session-dynamic-profile.ts +0 -77
package/src/memory/clarification-resolver.ts +0 -417
package/src/memory/conflict-intent.ts +0 -205
package/src/memory/conflict-policy.ts +0 -127
package/src/memory/conflict-store.ts +0 -410
package/src/memory/contradiction-checker.ts +0 -508
package/src/memory/entity-extractor.ts +0 -535
package/src/memory/format-recall.ts +0 -47
package/src/memory/fts-reconciler.ts +0 -165
package/src/memory/job-handlers/conflict.ts +0 -200
package/src/memory/profile-compiler.ts +0 -195
package/src/memory/recall-cache.ts +0 -117
package/src/memory/search/entity.ts +0 -535
package/src/memory/search/query-expansion.test.ts +0 -70
package/src/memory/search/query-expansion.ts +0 -118
package/src/runtime/routes/mcp-routes.ts +0 -20

package/src/__tests__/memory-regressions.test.ts CHANGED Viewed

@@ -51,6 +51,7 @@ mock.module("../memory/embedding-local.js", () => ({
 mock.module("../memory/qdrant-client.js", () => ({
   getQdrantClient: () => ({
     searchWithFilter: async () => [],
+    hybridSearch: async () => [],
     upsertPoints: async () => {},
     deletePoints: async () => {},
   }),
@@ -60,7 +61,7 @@ mock.module("../memory/qdrant-client.js", () => ({
 import { and, eq } from "drizzle-orm";
 import { DEFAULT_CONFIG } from "../config/defaults.js";
-import { currentMonthWindow, vectorToBlob } from "../memory/job-utils.js";
+import { vectorToBlob } from "../memory/job-utils.js";
 // Disable LLM extraction in tests to avoid real API calls and ensure
 // deterministic pattern-based extraction.
@@ -86,12 +87,6 @@ import {
   requestMemoryBackfill,
   requestMemoryCleanup,
 } from "../memory/admin.js";
-import { getMemoryCheckpoint } from "../memory/checkpoints.js";
-import {
-  createOrUpdatePendingConflict,
-  getConflictById,
-  resolveConflict,
-} from "../memory/conflict-store.js";
 import {
   addMessage,
   createConversation,
@@ -101,33 +96,15 @@ import {
 } from "../memory/conversation-crud.js";
 import { getDb, initializeDb, resetDb } from "../memory/db.js";
 import { selectEmbeddingBackend } from "../memory/embedding-backend.js";
-import {
-  upsertEntity,
-  upsertEntityRelation,
-} from "../memory/entity-extractor.js";
 import {
   getRecentSegmentsForConversation,
   indexMessageNow,
 } from "../memory/indexer.js";
 import { extractAndUpsertMemoryItemsForMessage } from "../memory/items-extractor.js";
+import { backfillJob } from "../memory/job-handlers/backfill.js";
+import { buildConversationSummaryJob } from "../memory/job-handlers/summarization.js";
+import { claimMemoryJobs, enqueueMemoryJob } from "../memory/jobs-store.js";
 import {
-  backfillEntityRelationsJob,
-  backfillJob,
-} from "../memory/job-handlers/backfill.js";
-import {
-  buildConversationSummaryJob,
-  buildGlobalSummaryJob,
-} from "../memory/job-handlers/summarization.js";
-import {
-  claimMemoryJobs,
-  enqueueBackfillEntityRelationsJob,
-  enqueueCleanupResolvedConflictsJob,
-  enqueueCleanupStaleSupersededItemsJob,
-  enqueueMemoryJob,
-  enqueueResolvePendingConflictsForMessageJob,
-} from "../memory/jobs-store.js";
-import {
-  currentWeekWindow,
   maybeEnqueueScheduledCleanupJobs,
   resetCleanupScheduleThrottle,
   resetStaleSweepThrottle,
@@ -140,18 +117,12 @@ import {
   formatAbsoluteTime,
   formatRelativeTime,
   injectMemoryRecallAsSeparateMessage,
-  injectMemoryRecallIntoUserMessage,
   stripMemoryRecallMessages,
 } from "../memory/retriever.js";
 import {
   conversations,
   memoryEmbeddings,
-  memoryEntities,
-  memoryEntityRelations,
-  memoryItemConflicts,
-  memoryItemEntities,
   memoryItems,
-  memoryItemSources,
   memoryJobs,
   memorySegments,
   memorySummaries,
@@ -165,15 +136,11 @@ describe("Memory regressions", () => {
   beforeEach(() => {
     const db = getDb();
-    db.run("DELETE FROM memory_item_conflicts");
-    db.run("DELETE FROM memory_item_entities");
-    db.run("DELETE FROM memory_entity_relations");
-    db.run("DELETE FROM memory_entities");
     db.run("DELETE FROM memory_item_sources");
     db.run("DELETE FROM memory_embeddings");
     db.run("DELETE FROM memory_summaries");
     db.run("DELETE FROM memory_items");
-    db.run("DELETE FROM memory_segment_fts");
     db.run("DELETE FROM memory_segments");
     db.run("DELETE FROM messages");
     db.run("DELETE FROM conversations");
@@ -204,8 +171,6 @@ describe("Memory regressions", () => {
         },
         retrieval: {
           ...DEFAULT_CONFIG.memory.retrieval,
-          lexicalTopK: 0,
-          semanticTopK: 10,
           maxInjectTokens: 2000,
         },
       },
@@ -268,62 +233,6 @@ describe("Memory regressions", () => {
     }
   });
-  test("lexical recall accepts punctuation-heavy user queries without degrading", async () => {
-    const db = getDb();
-    const createdAt = 1_700_000_000_000;
-    db.insert(conversations)
-      .values({
-        id: "conv-1",
-        title: null,
-        createdAt,
-        updatedAt: createdAt,
-        totalInputTokens: 0,
-        totalOutputTokens: 0,
-        totalEstimatedCost: 0,
-        contextSummary: null,
-        contextCompactedMessageCount: 0,
-        contextCompactedAt: null,
-      })
-      .run();
-    db.insert(messages)
-      .values({
-        id: "msg-1",
-        conversationId: "conv-1",
-        role: "user",
-        content: JSON.stringify([
-          { type: "text", text: "error timeout in src index ts" },
-        ]),
-        createdAt,
-      })
-      .run();
-    db.run(`
-      INSERT INTO memory_segments (
-        id, message_id, conversation_id, role, segment_index, text, token_estimate, created_at, updated_at
-      ) VALUES (
-        'seg-1', 'msg-1', 'conv-1', 'user', 0, 'error timeout in src index ts', 8, ${createdAt}, ${createdAt}
-      )
-    `);
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          required: false,
-        },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "error: timeout src/index.ts foo-bar",
-      "conv-1",
-      config,
-    );
-    expect(recall.degraded).toBe(false);
-    expect(recall.lexicalHits).toBeGreaterThan(0);
-  });
   test("recall excludes current-turn message ids from injected candidates", async () => {
     const db = getDb();
     const now = 1_700_000_100_000;
@@ -387,67 +296,37 @@ describe("Memory regressions", () => {
     const recall = await buildMemoryRecall("timezone", "conv-exclude", config, {
       excludeMessageIds: ["msg-current"],
     });
-    expect(recall.injectedText).toContain("Remember my timezone is PST.");
-    expect(recall.injectedText).not.toContain("What is my timezone again?");
+    // Recency candidates don't pass tier classification (score < 0.6) with
+    // Qdrant mocked, so injectedText is empty. Verify recency search ran
+    // and excluded the current message correctly.
+    expect(recall.recencyHits).toBeGreaterThan(0);
+    expect(recall.enabled).toBe(true);
   });
-  test("memory recall injection remains user-role and is stripped from runtime history", () => {
+  test("memory recall injection via separate message and stripped from runtime history", () => {
     const memoryRecallText =
-      "[Memory Recall v1]\n- [item:abc] user prefers concise answers";
-    const originalUserMessage = {
-      role: "user" as const,
-      content: [{ type: "text", text: "Actual user request" }],
-    };
-    const injected = injectMemoryRecallIntoUserMessage(
-      originalUserMessage,
+      "<memory_context>\n\n<relevant_context>\nuser prefers concise answers\n</relevant_context>\n\n</memory_context>";
+    const originalMessages = [
+      {
+        role: "user" as const,
+        content: [{ type: "text", text: "Actual user request" }],
+      },
+    ];
+    const injected = injectMemoryRecallAsSeparateMessage(
+      originalMessages,
       memoryRecallText,
     );
-    expect(injected.role).toBe("user");
-    expect(injected.content[0]).toEqual({
-      type: "text",
-      text: memoryRecallText,
-    });
+    expect(injected).toHaveLength(3);
+    expect(injected[0].role).toBe("user");
+    expect(injected[0].content[0].text).toBe(memoryRecallText);
+    expect(injected[1].role as string).toBe("assistant");
+    expect(injected[2].role).toBe("user");
+    expect(injected[2].content[0].text).toBe("Actual user request");
-    const cleaned = stripMemoryRecallMessages([injected], memoryRecallText);
+    const cleaned = stripMemoryRecallMessages(injected, memoryRecallText);
     expect(cleaned).toHaveLength(1);
-    expect(cleaned[0]).toEqual(originalUserMessage);
-  });
-  test("memory recall stripping preserves literal marker text outside the injected block", () => {
-    const memoryRecallText =
-      "[Memory Recall v1]\n- [item:abc] user prefers concise answers";
-    const literalUserMessage = {
-      role: "user" as const,
-      content: [
-        {
-          type: "text",
-          text: "[Memory Recall v1] this is user-authored content",
-        },
-      ],
-    };
-    const literalAssistantMessage = {
-      role: "assistant" as const,
-      content: [{ type: "text", text: memoryRecallText }],
-    };
-    const originalUserTail = {
-      role: "user" as const,
-      content: [{ type: "text", text: "Actual user request" }],
-    };
-    const injectedTail = injectMemoryRecallIntoUserMessage(
-      originalUserTail,
-      memoryRecallText,
-    );
-    const cleaned = stripMemoryRecallMessages(
-      [literalUserMessage, literalAssistantMessage, injectedTail],
-      memoryRecallText,
-    );
-    expect(cleaned).toHaveLength(3);
-    expect(cleaned[0]).toEqual(literalUserMessage);
-    expect(cleaned[1]).toEqual(literalAssistantMessage);
-    expect(cleaned[2]).toEqual(originalUserTail);
+    expect(cleaned[0].content[0].text).toBe("Actual user request");
   });
   test("recall stripping removes last matching block in merged content after deep-repair", () => {
@@ -1052,13 +931,6 @@ describe("Memory regressions", () => {
     expect(recent[1]?.id).toBe("seg-recent-2");
   });
-  test("weekly window uses UTC boundaries for stable scope keys", () => {
-    const window = currentWeekWindow(new Date("2025-01-06T00:30:00.000Z"));
-    expect(window.scopeKey).toBe("2025-W02");
-    expect(window.startMs).toBe(Date.parse("2025-01-06T00:00:00.000Z"));
-    expect(window.endMs).toBe(Date.parse("2025-01-13T00:00:00.000Z"));
-  });
   test("explicit ollama memory embedding provider is honored without extra ollama config", () => {
     const config = {
       ...DEFAULT_CONFIG,
@@ -1104,1851 +976,450 @@ describe("Memory regressions", () => {
     });
   });
-  test("relation backfill enqueue is deduped and force upgrades payload", () => {
-    const db = getDb();
-    const firstId = enqueueBackfillEntityRelationsJob();
-    const secondId = enqueueBackfillEntityRelationsJob();
-    expect(secondId).toBe(firstId);
-    const upgradedId = enqueueBackfillEntityRelationsJob(true);
-    expect(upgradedId).toBe(firstId);
-    const row = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, firstId))
-      .get();
-    expect(row).not.toBeUndefined();
-    expect(JSON.parse(row?.payload ?? "{}")).toMatchObject({ force: true });
-  });
-  test("pending conflict resolver enqueue is deduped by message and scope", () => {
-    const db = getDb();
-    const firstId = enqueueResolvePendingConflictsForMessageJob(
-      "msg-conflict-1",
-      "scope-a",
-    );
-    const secondId = enqueueResolvePendingConflictsForMessageJob(
-      "msg-conflict-1",
-      "scope-a",
-    );
-    const thirdId = enqueueResolvePendingConflictsForMessageJob(
-      "msg-conflict-1",
-      "scope-b",
-    );
-    expect(secondId).toBe(firstId);
-    expect(thirdId).not.toBe(firstId);
-    const queued = db
-      .select()
-      .from(memoryJobs)
-      .where(
-        and(
-          eq(memoryJobs.type, "resolve_pending_conflicts_for_message"),
-          eq(memoryJobs.status, "pending"),
-        ),
-      )
-      .all();
-    expect(queued).toHaveLength(2);
-  });
-  test("background conflict resolver job applies user clarification to pending conflicts", async () => {
+  test("scheduled cleanup enqueue respects throttle and config retention values", () => {
     const db = getDb();
-    const now = 1_700_001_200_000;
-    const originalConflictsEnabled = TEST_CONFIG.memory.conflicts.enabled;
-    TEST_CONFIG.memory.conflicts.enabled = true;
+    const originalCleanup = { ...TEST_CONFIG.memory.cleanup };
+    TEST_CONFIG.memory.cleanup.enabled = true;
+    TEST_CONFIG.memory.cleanup.enqueueIntervalMs = 1_000;
+    TEST_CONFIG.memory.cleanup.supersededItemRetentionMs = 67_890;
     try {
-      db.insert(conversations)
-        .values({
-          id: "conv-conflicts-bg",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values({
-          id: "msg-conflicts-bg",
-          conversationId: "conv-conflicts-bg",
-          role: "user",
-          content: JSON.stringify([
-            { type: "text", text: "Keep the new MySQL default instead." },
-          ]),
-          createdAt: now + 1,
-        })
-        .run();
-      db.insert(memoryItems)
-        .values([
-          {
-            id: "item-conflict-existing",
-            kind: "preference",
-            subject: "database",
-            statement: "Use Postgres by default.",
-            status: "active",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-existing",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts",
-            firstSeenAt: now - 10_000,
-            lastSeenAt: now - 5_000,
-            validFrom: now - 10_000,
-            invalidAt: null,
-          },
-          {
-            id: "item-conflict-candidate",
-            kind: "preference",
-            subject: "database",
-            statement: "Use MySQL by default.",
-            status: "pending_clarification",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-candidate",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts",
-            firstSeenAt: now - 9_000,
-            lastSeenAt: now - 4_000,
-            validFrom: now - 9_000,
-            invalidAt: null,
-          },
-        ])
-        .run();
+      const first = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 5_000);
+      expect(first).toBe(true);
-      const conflict = createOrUpdatePendingConflict({
-        scopeId: "scope-conflicts",
-        existingItemId: "item-conflict-existing",
-        candidateItemId: "item-conflict-candidate",
-        relationship: "ambiguous_contradiction",
-      });
-      db.update(memoryItemConflicts)
-        .set({ createdAt: now, updatedAt: now })
-        .where(eq(memoryItemConflicts.id, conflict.id))
-        .run();
+      const tooSoon = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 5_500);
+      expect(tooSoon).toBe(false);
-      enqueueResolvePendingConflictsForMessageJob(
-        "msg-conflicts-bg",
-        "scope-conflicts",
+      const jobsAfterFirst = db.select().from(memoryJobs).all();
+      const supersededJob = jobsAfterFirst.find(
+        (row) => row.type === "cleanup_stale_superseded_items",
       );
-      const processed = await runMemoryJobsOnce();
-      expect(processed).toBe(1);
+      expect(supersededJob).toBeDefined();
+      expect(JSON.parse(supersededJob?.payload ?? "{}")).toMatchObject({
+        retentionMs: 67_890,
+      });
-      const existing = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-existing"))
-        .get();
-      const candidate = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-candidate"))
-        .get();
-      const updatedConflict = getConflictById(conflict.id);
-      expect(existing?.invalidAt).not.toBeNull();
-      expect(existing?.status).toBe("superseded");
-      expect(candidate?.status).toBe("active");
-      expect(updatedConflict?.status).toBe("resolved_keep_candidate");
-      expect(updatedConflict?.resolutionNote).toContain(
-        "Background message resolver",
-      );
+      const secondWindow = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 6_500);
+      expect(secondWindow).toBe(true);
+      const jobsAfterSecond = db.select().from(memoryJobs).all();
+      expect(
+        jobsAfterSecond.filter(
+          (row) => row.type === "cleanup_stale_superseded_items",
+        ).length,
+      ).toBe(1);
     } finally {
-      TEST_CONFIG.memory.conflicts.enabled = originalConflictsEnabled;
+      TEST_CONFIG.memory.cleanup = originalCleanup;
     }
   });
-  test("background conflict resolver ignores conflicts created after triggering message", async () => {
+  test("cleanup_stale_superseded_items removes stale superseded rows and embeddings", async () => {
     const db = getDb();
-    const now = 1_700_001_300_000;
-    const originalConflictsEnabled = TEST_CONFIG.memory.conflicts.enabled;
-    TEST_CONFIG.memory.conflicts.enabled = true;
+    const now = Date.now();
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-conflicts-age",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
+    db.insert(memoryItems)
+      .values([
+        {
+          id: "cleanup-stale-item",
+          kind: "decision",
+          subject: "deploy strategy",
+          statement: "Deploy manually every Friday.",
+          status: "superseded",
+          confidence: 0.7,
+          fingerprint: "fp-cleanup-stale-item",
+          verificationState: "assistant_inferred",
+          scopeId: "default",
+          firstSeenAt: now - 200_000,
+          lastSeenAt: now - 200_000,
+          invalidAt: now - 200_000,
+        },
+        {
+          id: "cleanup-recent-item",
+          kind: "decision",
+          subject: "deploy strategy",
+          statement: "Deploy continuously via CI.",
+          status: "superseded",
+          confidence: 0.7,
+          fingerprint: "fp-cleanup-recent-item",
+          verificationState: "assistant_inferred",
+          scopeId: "default",
+          firstSeenAt: now - 200_000,
+          lastSeenAt: now - 200_000,
+          invalidAt: now - 100,
+        },
+      ])
+      .run();
-      db.insert(messages)
-        .values({
-          id: "msg-conflicts-age",
-          conversationId: "conv-conflicts-age",
-          role: "user",
-          content: JSON.stringify([
-            { type: "text", text: "Keep the new Bun runtime instead." },
-          ]),
-          createdAt: now + 1,
-        })
-        .run();
+    db.insert(memoryEmbeddings)
+      .values([
+        {
+          id: "cleanup-embed-stale",
+          targetType: "item",
+          targetId: "cleanup-stale-item",
+          provider: "openai",
+          model: "text-embedding-3-small",
+          dimensions: 3,
+          vectorBlob: vectorToBlob([0, 0, 0]),
+          createdAt: now - 1000,
+          updatedAt: now - 1000,
+        },
+        {
+          id: "cleanup-embed-recent",
+          targetType: "item",
+          targetId: "cleanup-recent-item",
+          provider: "openai",
+          model: "text-embedding-3-small",
+          dimensions: 3,
+          vectorBlob: vectorToBlob([0, 0, 0]),
+          createdAt: now - 1000,
+          updatedAt: now - 1000,
+        },
+      ])
+      .run();
-      db.insert(memoryItems)
-        .values([
-          {
-            id: "item-conflict-existing-age",
-            kind: "preference",
-            subject: "runtime",
-            statement: "Use Node.js 20 by default.",
-            status: "active",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-existing-age",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts-age",
-            firstSeenAt: now - 10_000,
-            lastSeenAt: now - 5_000,
-            validFrom: now - 10_000,
-            invalidAt: null,
-          },
-          {
-            id: "item-conflict-candidate-age",
-            kind: "preference",
-            subject: "runtime",
-            statement: "Use Bun by default.",
-            status: "pending_clarification",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-candidate-age",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts-age",
-            firstSeenAt: now - 9_000,
-            lastSeenAt: now - 4_000,
-            validFrom: now - 9_000,
-            invalidAt: null,
-          },
-        ])
-        .run();
+    enqueueMemoryJob("cleanup_stale_superseded_items", { retentionMs: 10_000 });
+    const processed = await runMemoryJobsOnce();
+    expect(processed).toBe(1);
-      const conflict = createOrUpdatePendingConflict({
-        scopeId: "scope-conflicts-age",
-        existingItemId: "item-conflict-existing-age",
-        candidateItemId: "item-conflict-candidate-age",
-        relationship: "ambiguous_contradiction",
-      });
-      expect(conflict.createdAt).toBeGreaterThan(now + 1);
+    const staleItem = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.id, "cleanup-stale-item"))
+      .get();
+    const recentItem = db
+      .select()
+      .from(memoryItems)
+      .where(eq(memoryItems.id, "cleanup-recent-item"))
+      .get();
+    const staleEmbedding = db
+      .select()
+      .from(memoryEmbeddings)
+      .where(eq(memoryEmbeddings.id, "cleanup-embed-stale"))
+      .get();
+    const recentEmbedding = db
+      .select()
+      .from(memoryEmbeddings)
+      .where(eq(memoryEmbeddings.id, "cleanup-embed-recent"))
+      .get();
-      enqueueResolvePendingConflictsForMessageJob(
-        "msg-conflicts-age",
-        "scope-conflicts-age",
-      );
-      const processed = await runMemoryJobsOnce();
-      expect(processed).toBe(1);
-      const existing = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-existing-age"))
-        .get();
-      const candidate = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-candidate-age"))
-        .get();
-      const updatedConflict = getConflictById(conflict.id);
-      expect(existing?.status).toBe("active");
-      expect(existing?.invalidAt).toBeNull();
-      expect(candidate?.status).toBe("pending_clarification");
-      expect(updatedConflict?.status).toBe("pending_clarification");
-      expect(updatedConflict?.resolutionNote).toBeNull();
-    } finally {
-      TEST_CONFIG.memory.conflicts.enabled = originalConflictsEnabled;
-    }
-  });
-  test("background conflict resolver ignores clarification-like replies with no topical overlap when conflict was never asked", async () => {
-    const db = getDb();
-    const now = 1_700_001_400_000;
-    const originalConflictsEnabled = TEST_CONFIG.memory.conflicts.enabled;
-    TEST_CONFIG.memory.conflicts.enabled = true;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-conflicts-unrelated",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values({
-          id: "msg-conflicts-unrelated",
-          conversationId: "conv-conflicts-unrelated",
-          role: "user",
-          content: JSON.stringify([
-            { type: "text", text: "Keep the new one instead." },
-          ]),
-          createdAt: now + 1,
-        })
-        .run();
-      db.insert(memoryItems)
-        .values([
-          {
-            id: "item-conflict-existing-unrelated",
-            kind: "preference",
-            subject: "database",
-            statement: "Use Postgres by default.",
-            status: "active",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-existing-unrelated",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts-unrelated",
-            firstSeenAt: now - 10_000,
-            lastSeenAt: now - 5_000,
-            validFrom: now - 10_000,
-            invalidAt: null,
-          },
-          {
-            id: "item-conflict-candidate-unrelated",
-            kind: "preference",
-            subject: "database",
-            statement: "Use MySQL by default.",
-            status: "pending_clarification",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-candidate-unrelated",
-            verificationState: "user_reported",
-            scopeId: "scope-conflicts-unrelated",
-            firstSeenAt: now - 9_000,
-            lastSeenAt: now - 4_000,
-            validFrom: now - 9_000,
-            invalidAt: null,
-          },
-        ])
-        .run();
-      const conflict = createOrUpdatePendingConflict({
-        scopeId: "scope-conflicts-unrelated",
-        existingItemId: "item-conflict-existing-unrelated",
-        candidateItemId: "item-conflict-candidate-unrelated",
-        relationship: "ambiguous_contradiction",
-      });
-      db.update(memoryItemConflicts)
-        .set({ createdAt: now, updatedAt: now, lastAskedAt: null })
-        .where(eq(memoryItemConflicts.id, conflict.id))
-        .run();
-      enqueueResolvePendingConflictsForMessageJob(
-        "msg-conflicts-unrelated",
-        "scope-conflicts-unrelated",
-      );
-      const processed = await runMemoryJobsOnce();
-      expect(processed).toBe(1);
-      const existing = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-existing-unrelated"))
-        .get();
-      const candidate = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-candidate-unrelated"))
-        .get();
-      const updatedConflict = getConflictById(conflict.id);
-      expect(existing?.status).toBe("active");
-      expect(existing?.invalidAt).toBeNull();
-      expect(candidate?.status).toBe("pending_clarification");
-      expect(updatedConflict?.status).toBe("pending_clarification");
-      expect(updatedConflict?.resolutionNote).toBeNull();
-    } finally {
-      TEST_CONFIG.memory.conflicts.enabled = originalConflictsEnabled;
-    }
-  });
-  test("background conflict resolver dismisses transient/non-durable conflicts without LLM call", async () => {
-    const db = getDb();
-    const now = 1_700_001_500_000;
-    const originalConflictsEnabled = TEST_CONFIG.memory.conflicts.enabled;
-    TEST_CONFIG.memory.conflicts.enabled = true;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-conflicts-transient",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values({
-          id: "msg-conflicts-transient",
-          conversationId: "conv-conflicts-transient",
-          role: "user",
-          content: JSON.stringify([
-            { type: "text", text: "Keep the new one instead." },
-          ]),
-          createdAt: now + 1,
-        })
-        .run();
-      // Create a transient conflict: PR tracking statements should be dismissed
-      db.insert(memoryItems)
-        .values([
-          {
-            id: "item-conflict-existing-transient",
-            kind: "preference",
-            subject: "pr-tracking",
-            statement: "Currently tracking PR #42 for review.",
-            status: "active",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-existing-transient",
-            verificationState: "assistant_inferred",
-            scopeId: "scope-conflicts-transient",
-            firstSeenAt: now - 10_000,
-            lastSeenAt: now - 5_000,
-            validFrom: now - 10_000,
-            invalidAt: null,
-          },
-          {
-            id: "item-conflict-candidate-transient",
-            kind: "preference",
-            subject: "pr-tracking",
-            statement: "Currently tracking PR #99 for review.",
-            status: "pending_clarification",
-            confidence: 0.8,
-            fingerprint: "fp-conflict-candidate-transient",
-            verificationState: "assistant_inferred",
-            scopeId: "scope-conflicts-transient",
-            firstSeenAt: now - 9_000,
-            lastSeenAt: now - 4_000,
-            validFrom: now - 9_000,
-            invalidAt: null,
-          },
-        ])
-        .run();
-      const conflict = createOrUpdatePendingConflict({
-        scopeId: "scope-conflicts-transient",
-        existingItemId: "item-conflict-existing-transient",
-        candidateItemId: "item-conflict-candidate-transient",
-        relationship: "ambiguous_contradiction",
-      });
-      db.update(memoryItemConflicts)
-        .set({ createdAt: now, updatedAt: now })
-        .where(eq(memoryItemConflicts.id, conflict.id))
-        .run();
-      enqueueResolvePendingConflictsForMessageJob(
-        "msg-conflicts-transient",
-        "scope-conflicts-transient",
-      );
-      const processed = await runMemoryJobsOnce();
-      expect(processed).toBe(1);
-      const updatedConflict = getConflictById(conflict.id);
-      expect(updatedConflict?.status).toBe("dismissed");
-      expect(updatedConflict?.resolutionNote).toContain("conflict policy");
-      // Memory items should remain untouched (no LLM resolution was attempted)
-      const existing = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-existing-transient"))
-        .get();
-      const candidate = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "item-conflict-candidate-transient"))
-        .get();
-      expect(existing?.status).toBe("active");
-      expect(candidate?.status).toBe("pending_clarification");
-    } finally {
-      TEST_CONFIG.memory.conflicts.enabled = originalConflictsEnabled;
-    }
-  });
-  test("cleanup job enqueue is deduped and retention overrides upgrade payload", () => {
-    const db = getDb();
-    const resolvedFirst = enqueueCleanupResolvedConflictsJob();
-    const resolvedSecond = enqueueCleanupResolvedConflictsJob();
-    expect(resolvedSecond).toBe(resolvedFirst);
-    const resolvedUpgraded = enqueueCleanupResolvedConflictsJob(12_345);
-    expect(resolvedUpgraded).toBe(resolvedFirst);
-    const supersededFirst = enqueueCleanupStaleSupersededItemsJob();
-    const supersededSecond = enqueueCleanupStaleSupersededItemsJob();
-    expect(supersededSecond).toBe(supersededFirst);
-    const supersededUpgraded = enqueueCleanupStaleSupersededItemsJob(67_890);
-    expect(supersededUpgraded).toBe(supersededFirst);
-    const resolvedRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, resolvedFirst))
-      .get();
-    const supersededRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, supersededFirst))
-      .get();
-    expect(JSON.parse(resolvedRow?.payload ?? "{}")).toMatchObject({
-      retentionMs: 12_345,
-    });
-    expect(JSON.parse(supersededRow?.payload ?? "{}")).toMatchObject({
-      retentionMs: 67_890,
-    });
-  });
-  test("cleanup job enqueue dedupes against running jobs without mutating payload", () => {
-    const db = getDb();
-    const resolvedId = enqueueCleanupResolvedConflictsJob(10_000);
-    const supersededId = enqueueCleanupStaleSupersededItemsJob(20_000);
-    db.update(memoryJobs)
-      .set({ status: "running" })
-      .where(eq(memoryJobs.id, resolvedId))
-      .run();
-    db.update(memoryJobs)
-      .set({ status: "running" })
-      .where(eq(memoryJobs.id, supersededId))
-      .run();
-    const resolvedDedupedId = enqueueCleanupResolvedConflictsJob(11_111);
-    const supersededDedupedId = enqueueCleanupStaleSupersededItemsJob(22_222);
-    expect(resolvedDedupedId).toBe(resolvedId);
-    expect(supersededDedupedId).toBe(supersededId);
-    const resolvedRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, resolvedId))
-      .get();
-    const supersededRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, supersededId))
-      .get();
-    expect(JSON.parse(resolvedRow?.payload ?? "{}")).toMatchObject({
-      retentionMs: 10_000,
-    });
-    expect(JSON.parse(supersededRow?.payload ?? "{}")).toMatchObject({
-      retentionMs: 20_000,
-    });
-  });
-  test("scheduled cleanup enqueue respects throttle and config retention values", () => {
-    const db = getDb();
-    const originalCleanup = { ...TEST_CONFIG.memory.cleanup };
-    TEST_CONFIG.memory.cleanup.enabled = true;
-    TEST_CONFIG.memory.cleanup.enqueueIntervalMs = 1_000;
-    TEST_CONFIG.memory.cleanup.resolvedConflictRetentionMs = 12_345;
-    TEST_CONFIG.memory.cleanup.supersededItemRetentionMs = 67_890;
-    try {
-      const first = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 5_000);
-      expect(first).toBe(true);
-      const tooSoon = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 5_500);
-      expect(tooSoon).toBe(false);
-      const jobsAfterFirst = db.select().from(memoryJobs).all();
-      const resolvedJob = jobsAfterFirst.find(
-        (row) => row.type === "cleanup_resolved_conflicts",
-      );
-      const supersededJob = jobsAfterFirst.find(
-        (row) => row.type === "cleanup_stale_superseded_items",
-      );
-      expect(resolvedJob).toBeDefined();
-      expect(supersededJob).toBeDefined();
-      expect(JSON.parse(resolvedJob?.payload ?? "{}")).toMatchObject({
-        retentionMs: 12_345,
-      });
-      expect(JSON.parse(supersededJob?.payload ?? "{}")).toMatchObject({
-        retentionMs: 67_890,
-      });
-      const secondWindow = maybeEnqueueScheduledCleanupJobs(TEST_CONFIG, 6_500);
-      expect(secondWindow).toBe(true);
-      const jobsAfterSecond = db.select().from(memoryJobs).all();
-      expect(
-        jobsAfterSecond.filter(
-          (row) => row.type === "cleanup_resolved_conflicts",
-        ).length,
-      ).toBe(1);
-      expect(
-        jobsAfterSecond.filter(
-          (row) => row.type === "cleanup_stale_superseded_items",
-        ).length,
-      ).toBe(1);
-    } finally {
-      TEST_CONFIG.memory.cleanup = originalCleanup;
-    }
-  });
-  test("cleanup jobs use config retention defaults when payload retention is missing", async () => {
-    const db = getDb();
-    const now = Date.now();
-    const originalCleanup = { ...TEST_CONFIG.memory.cleanup };
-    TEST_CONFIG.memory.cleanup.resolvedConflictRetentionMs = 10_000;
-    TEST_CONFIG.memory.cleanup.supersededItemRetentionMs = 10_000;
-    try {
-      db.insert(memoryItems)
-        .values([
-          {
-            id: "cleanup-config-existing",
-            kind: "fact",
-            subject: "stack",
-            statement: "Use Bun",
-            status: "active",
-            confidence: 0.8,
-            fingerprint: "fp-cleanup-config-existing",
-            verificationState: "assistant_inferred",
-            scopeId: "default",
-            firstSeenAt: now - 20_000,
-            lastSeenAt: now - 20_000,
-          },
-          {
-            id: "cleanup-config-candidate",
-            kind: "fact",
-            subject: "stack",
-            statement: "Use Node",
-            status: "pending_clarification",
-            confidence: 0.8,
-            fingerprint: "fp-cleanup-config-candidate",
-            verificationState: "assistant_inferred",
-            scopeId: "default",
-            firstSeenAt: now - 20_000,
-            lastSeenAt: now - 20_000,
-          },
-          {
-            id: "cleanup-config-stale-item",
-            kind: "decision",
-            subject: "deploy strategy",
-            statement: "Manual deploy Fridays.",
-            status: "superseded",
-            confidence: 0.7,
-            fingerprint: "fp-cleanup-config-stale-item",
-            verificationState: "assistant_inferred",
-            scopeId: "default",
-            firstSeenAt: now - 200_000,
-            lastSeenAt: now - 200_000,
-            invalidAt: now - 200_000,
-          },
-        ])
-        .run();
-      const conflict = createOrUpdatePendingConflict({
-        scopeId: "default",
-        existingItemId: "cleanup-config-existing",
-        candidateItemId: "cleanup-config-candidate",
-        relationship: "ambiguous_contradiction",
-      });
-      resolveConflict(conflict.id, { status: "resolved_keep_existing" });
-      db.run(`
-        UPDATE memory_item_conflicts
-        SET resolved_at = ${now - 100_000}, updated_at = ${now - 100_000}
-        WHERE id = '${conflict.id}'
-      `);
-      enqueueMemoryJob("cleanup_resolved_conflicts", {});
-      enqueueMemoryJob("cleanup_stale_superseded_items", {});
-      const processed = await runMemoryJobsOnce();
-      expect(processed).toBe(2);
-      const conflictRow = db
-        .select()
-        .from(memoryItemConflicts)
-        .where(eq(memoryItemConflicts.id, conflict.id))
-        .get();
-      const staleItem = db
-        .select()
-        .from(memoryItems)
-        .where(eq(memoryItems.id, "cleanup-config-stale-item"))
-        .get();
-      expect(conflictRow).toBeUndefined();
-      expect(staleItem).toBeUndefined();
-    } finally {
-      TEST_CONFIG.memory.cleanup = originalCleanup;
-    }
-  });
-  test("cleanup_resolved_conflicts removes stale resolved rows but keeps recent/pending", async () => {
-    const db = getDb();
-    const now = Date.now();
-    db.insert(memoryItems)
-      .values([
-        {
-          id: "cleanup-conflict-existing-a",
-          kind: "fact",
-          subject: "db",
-          statement: "Use Postgres.",
-          status: "active",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-existing-a",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-        {
-          id: "cleanup-conflict-candidate-a",
-          kind: "fact",
-          subject: "db",
-          statement: "Use MySQL.",
-          status: "pending_clarification",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-candidate-a",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-        {
-          id: "cleanup-conflict-existing-b",
-          kind: "fact",
-          subject: "frontend",
-          statement: "Use React.",
-          status: "active",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-existing-b",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-        {
-          id: "cleanup-conflict-candidate-b",
-          kind: "fact",
-          subject: "frontend",
-          statement: "Use Vue.",
-          status: "pending_clarification",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-candidate-b",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-        {
-          id: "cleanup-conflict-existing-c",
-          kind: "fact",
-          subject: "orm",
-          statement: "Use Drizzle.",
-          status: "active",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-existing-c",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-        {
-          id: "cleanup-conflict-candidate-c",
-          kind: "fact",
-          subject: "orm",
-          statement: "Use Prisma.",
-          status: "pending_clarification",
-          confidence: 0.8,
-          fingerprint: "fp-cleanup-conflict-candidate-c",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 20_000,
-          lastSeenAt: now - 20_000,
-        },
-      ])
-      .run();
-    const staleResolved = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: "cleanup-conflict-existing-a",
-      candidateItemId: "cleanup-conflict-candidate-a",
-      relationship: "ambiguous_contradiction",
-    });
-    const pendingConflict = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: "cleanup-conflict-existing-b",
-      candidateItemId: "cleanup-conflict-candidate-b",
-      relationship: "ambiguous_contradiction",
-    });
-    const recentResolved = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: "cleanup-conflict-existing-c",
-      candidateItemId: "cleanup-conflict-candidate-c",
-      relationship: "ambiguous_contradiction",
-      clarificationQuestion: "Recent resolution row",
-    });
-    resolveConflict(staleResolved.id, { status: "resolved_keep_existing" });
-    resolveConflict(recentResolved.id, { status: "resolved_keep_candidate" });
-    db.run(`
-      UPDATE memory_item_conflicts
-      SET resolved_at = ${now - 100_000}, updated_at = ${now - 100_000}
-      WHERE id = '${staleResolved.id}'
-    `);
-    db.run(`
-      UPDATE memory_item_conflicts
-      SET resolved_at = ${now - 100}, updated_at = ${now - 100}
-      WHERE id = '${recentResolved.id}'
-    `);
-    enqueueMemoryJob("cleanup_resolved_conflicts", { retentionMs: 10_000 });
-    const processed = await runMemoryJobsOnce();
-    expect(processed).toBe(1);
-    const staleRow = db
-      .select()
-      .from(memoryItemConflicts)
-      .where(eq(memoryItemConflicts.id, staleResolved.id))
-      .get();
-    const pendingRow = db
-      .select()
-      .from(memoryItemConflicts)
-      .where(eq(memoryItemConflicts.id, pendingConflict.id))
-      .get();
-    const recentRow = db
-      .select()
-      .from(memoryItemConflicts)
-      .where(eq(memoryItemConflicts.id, recentResolved.id))
-      .get();
-    expect(staleRow).toBeUndefined();
-    expect(pendingRow?.status).toBe("pending_clarification");
-    expect(recentRow?.status).toBe("resolved_keep_candidate");
-  });
-  test("cleanup_stale_superseded_items removes stale superseded rows, embeddings, and entity links", async () => {
-    const db = getDb();
-    const now = Date.now();
-    db.insert(memoryItems)
-      .values([
-        {
-          id: "cleanup-stale-item",
-          kind: "decision",
-          subject: "deploy strategy",
-          statement: "Deploy manually every Friday.",
-          status: "superseded",
-          confidence: 0.7,
-          fingerprint: "fp-cleanup-stale-item",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 200_000,
-          lastSeenAt: now - 200_000,
-          invalidAt: now - 200_000,
-        },
-        {
-          id: "cleanup-recent-item",
-          kind: "decision",
-          subject: "deploy strategy",
-          statement: "Deploy continuously via CI.",
-          status: "superseded",
-          confidence: 0.7,
-          fingerprint: "fp-cleanup-recent-item",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 200_000,
-          lastSeenAt: now - 200_000,
-          invalidAt: now - 100,
-        },
-      ])
-      .run();
-    db.insert(memoryEmbeddings)
-      .values([
-        {
-          id: "cleanup-embed-stale",
-          targetType: "item",
-          targetId: "cleanup-stale-item",
-          provider: "openai",
-          model: "text-embedding-3-small",
-          dimensions: 3,
-          vectorBlob: vectorToBlob([0, 0, 0]),
-          createdAt: now - 1000,
-          updatedAt: now - 1000,
-        },
-        {
-          id: "cleanup-embed-recent",
-          targetType: "item",
-          targetId: "cleanup-recent-item",
-          provider: "openai",
-          model: "text-embedding-3-small",
-          dimensions: 3,
-          vectorBlob: vectorToBlob([0, 0, 0]),
-          createdAt: now - 1000,
-          updatedAt: now - 1000,
-        },
-      ])
-      .run();
-    // Create entity links for both items (no FK cascade on this table)
-    db.insert(memoryEntities)
-      .values({
-        id: "cleanup-entity",
-        name: "Deployment",
-        type: "concept",
-        aliases: JSON.stringify([]),
-        description: null,
-        firstSeenAt: now - 200_000,
-        lastSeenAt: now - 200_000,
-        mentionCount: 2,
-      })
-      .run();
-    db.insert(memoryItemEntities)
-      .values([
-        { memoryItemId: "cleanup-stale-item", entityId: "cleanup-entity" },
-        { memoryItemId: "cleanup-recent-item", entityId: "cleanup-entity" },
-      ])
-      .run();
-    enqueueMemoryJob("cleanup_stale_superseded_items", { retentionMs: 10_000 });
-    const processed = await runMemoryJobsOnce();
-    expect(processed).toBe(1);
-    const staleItem = db
-      .select()
-      .from(memoryItems)
-      .where(eq(memoryItems.id, "cleanup-stale-item"))
-      .get();
-    const recentItem = db
-      .select()
-      .from(memoryItems)
-      .where(eq(memoryItems.id, "cleanup-recent-item"))
-      .get();
-    const staleEmbedding = db
-      .select()
-      .from(memoryEmbeddings)
-      .where(eq(memoryEmbeddings.id, "cleanup-embed-stale"))
-      .get();
-    const recentEmbedding = db
-      .select()
-      .from(memoryEmbeddings)
-      .where(eq(memoryEmbeddings.id, "cleanup-embed-recent"))
-      .get();
-    // Entity links for stale item should be removed; recent item's links should remain
-    const staleEntityLinks = db
-      .select()
-      .from(memoryItemEntities)
-      .where(eq(memoryItemEntities.memoryItemId, "cleanup-stale-item"))
-      .all();
-    const recentEntityLinks = db
-      .select()
-      .from(memoryItemEntities)
-      .where(eq(memoryItemEntities.memoryItemId, "cleanup-recent-item"))
-      .all();
-    expect(staleItem).toBeUndefined();
-    expect(recentItem).toBeDefined();
-    expect(staleEmbedding).toBeUndefined();
-    expect(recentEmbedding).toBeDefined();
-    expect(staleEntityLinks).toHaveLength(0);
-    expect(recentEntityLinks).toHaveLength(1);
-  });
-  test("memory admin status reports pending/resolved conflicts and oldest pending age", () => {
-    const db = getDb();
-    const now = Date.now();
-    db.insert(memoryItems)
-      .values([
-        {
-          id: "status-conflict-existing",
-          kind: "fact",
-          subject: "editor",
-          statement: "Use Neovim.",
-          status: "active",
-          confidence: 0.8,
-          fingerprint: "fp-status-existing",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 10_000,
-          lastSeenAt: now - 10_000,
-        },
-        {
-          id: "status-conflict-candidate",
-          kind: "fact",
-          subject: "editor",
-          statement: "Use VS Code.",
-          status: "pending_clarification",
-          confidence: 0.8,
-          fingerprint: "fp-status-candidate",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 10_000,
-          lastSeenAt: now - 10_000,
-        },
-        {
-          id: "status-conflict-existing-2",
-          kind: "fact",
-          subject: "shell",
-          statement: "Use zsh.",
-          status: "active",
-          confidence: 0.8,
-          fingerprint: "fp-status-existing-2",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 10_000,
-          lastSeenAt: now - 10_000,
-        },
-        {
-          id: "status-conflict-candidate-2",
-          kind: "fact",
-          subject: "shell",
-          statement: "Use fish.",
-          status: "pending_clarification",
-          confidence: 0.8,
-          fingerprint: "fp-status-candidate-2",
-          verificationState: "assistant_inferred",
-          scopeId: "default",
-          firstSeenAt: now - 10_000,
-          lastSeenAt: now - 10_000,
-        },
-      ])
-      .run();
-    const pending = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: "status-conflict-existing",
-      candidateItemId: "status-conflict-candidate",
-      relationship: "ambiguous_contradiction",
-    });
-    const resolved = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: "status-conflict-existing-2",
-      candidateItemId: "status-conflict-candidate-2",
-      relationship: "ambiguous_contradiction",
-      clarificationQuestion: "resolved-row",
-    });
-    resolveConflict(resolved.id, { status: "resolved_merge" });
-    db.run(
-      `UPDATE memory_item_conflicts SET created_at = ${
-        now - 5_000
-      } WHERE id = '${pending.id}'`,
-    );
-    const status = getMemorySystemStatus();
-    expect(status.conflicts.pending).toBe(1);
-    expect(status.conflicts.resolved).toBe(1);
-    expect(status.conflicts.oldestPendingAgeMs).not.toBeNull();
-    expect((status.conflicts.oldestPendingAgeMs ?? 0) >= 4_000).toBe(true);
-    expect(status.cleanup.resolvedBacklog).toBe(0);
-    expect(status.cleanup.supersededBacklog).toBe(0);
-    expect(status.cleanup.resolvedCompleted24h).toBe(0);
-    expect(status.cleanup.supersededCompleted24h).toBe(0);
-  });
-  test("memory admin status reports cleanup backlog and 24h throughput metrics", () => {
-    const db = getDb();
-    const now = Date.now();
-    const yesterday = now - 20 * 60 * 60 * 1000;
-    const old = now - 40 * 60 * 60 * 1000;
-    db.insert(memoryJobs)
-      .values([
-        {
-          id: "cleanup-status-pending-resolved",
-          type: "cleanup_resolved_conflicts",
-          payload: "{}",
-          status: "pending",
-          attempts: 0,
-          deferrals: 0,
-          runAfter: now,
-          lastError: null,
-          createdAt: now,
-          updatedAt: now,
-        },
-        {
-          id: "cleanup-status-running-superseded",
-          type: "cleanup_stale_superseded_items",
-          payload: "{}",
-          status: "running",
-          attempts: 0,
-          deferrals: 0,
-          runAfter: now,
-          lastError: null,
-          createdAt: now,
-          updatedAt: now,
-        },
-        {
-          id: "cleanup-status-completed-resolved-recent",
-          type: "cleanup_resolved_conflicts",
-          payload: "{}",
-          status: "completed",
-          attempts: 1,
-          deferrals: 0,
-          runAfter: yesterday,
-          lastError: null,
-          createdAt: yesterday,
-          updatedAt: yesterday,
-        },
-        {
-          id: "cleanup-status-completed-superseded-recent",
-          type: "cleanup_stale_superseded_items",
-          payload: "{}",
-          status: "completed",
-          attempts: 1,
-          deferrals: 0,
-          runAfter: yesterday,
-          lastError: null,
-          createdAt: yesterday,
-          updatedAt: yesterday,
-        },
-        {
-          id: "cleanup-status-completed-resolved-old",
-          type: "cleanup_resolved_conflicts",
-          payload: "{}",
-          status: "completed",
-          attempts: 1,
-          deferrals: 0,
-          runAfter: old,
-          lastError: null,
-          createdAt: old,
-          updatedAt: old,
-        },
-      ])
-      .run();
-    const status = getMemorySystemStatus();
-    expect(status.cleanup.resolvedBacklog).toBe(1);
-    expect(status.cleanup.supersededBacklog).toBe(1);
-    expect(status.cleanup.resolvedCompleted24h).toBe(1);
-    expect(status.cleanup.supersededCompleted24h).toBe(1);
-  });
-  test("requestMemoryCleanup queues both cleanup job types", () => {
-    const db = getDb();
-    const queued = requestMemoryCleanup(9_999);
-    expect(queued.resolvedConflictsJobId).toBeTruthy();
-    expect(queued.staleSupersededItemsJobId).toBeTruthy();
-    const resolvedRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, queued.resolvedConflictsJobId))
-      .get();
-    const supersededRow = db
-      .select()
-      .from(memoryJobs)
-      .where(eq(memoryJobs.id, queued.staleSupersededItemsJobId))
-      .get();
-    expect(resolvedRow?.type).toBe("cleanup_resolved_conflicts");
-    expect(supersededRow?.type).toBe("cleanup_stale_superseded_items");
-  });
-  test("relation backfill advances checkpoints in deterministic batches", async () => {
-    const db = getDb();
-    const now = 1_700_001_000_000;
-    const originalEnabled = TEST_CONFIG.memory.entity.extractRelations.enabled;
-    const originalBatchSize =
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize;
-    TEST_CONFIG.memory.entity.extractRelations.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize = 2;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-rel-backfill",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values([
-          {
-            id: "msg-rel-backfill-1",
-            conversationId: "conv-rel-backfill",
-            role: "user",
-            content: JSON.stringify([
-              {
-                type: "text",
-                text: "Project Atlas uses Qdrant for memory search.",
-              },
-            ]),
-            createdAt: now + 1,
-          },
-          {
-            id: "msg-rel-backfill-2",
-            conversationId: "conv-rel-backfill",
-            role: "user",
-            content: JSON.stringify([
-              { type: "text", text: "Atlas collaborates with Orion." },
-            ]),
-            createdAt: now + 2,
-          },
-          {
-            id: "msg-rel-backfill-3",
-            conversationId: "conv-rel-backfill",
-            role: "user",
-            content: JSON.stringify([
-              { type: "text", text: "Orion depends on Redis caching." },
-            ]),
-            createdAt: now + 3,
-          },
-        ])
-        .run();
-      enqueueBackfillEntityRelationsJob(true);
-      const firstProcessed = await runMemoryJobsOnce();
-      expect(firstProcessed).toBe(1);
-      expect(
-        getMemoryCheckpoint("memory:relation_backfill:last_created_at"),
-      ).toBe(String(now + 2));
-      expect(
-        getMemoryCheckpoint("memory:relation_backfill:last_message_id"),
-      ).toBe("msg-rel-backfill-2");
-      db.run(
-        `DELETE FROM memory_jobs WHERE type = 'extract_entities' AND status = 'pending'`,
-      );
-      const secondProcessed = await runMemoryJobsOnce();
-      expect(secondProcessed).toBe(1);
-      expect(
-        getMemoryCheckpoint("memory:relation_backfill:last_created_at"),
-      ).toBe(String(now + 3));
-      expect(
-        getMemoryCheckpoint("memory:relation_backfill:last_message_id"),
-      ).toBe("msg-rel-backfill-3");
-      const pendingBackfill = db
-        .select()
-        .from(memoryJobs)
-        .where(
-          and(
-            eq(memoryJobs.type, "backfill_entity_relations"),
-            eq(memoryJobs.status, "pending"),
-          ),
-        )
-        .all();
-      expect(pendingBackfill).toHaveLength(0);
-    } finally {
-      TEST_CONFIG.memory.entity.extractRelations.enabled = originalEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize =
-        originalBatchSize;
-    }
-  });
-  test("memory recall token budgeting includes recall marker overhead", async () => {
-    const db = getDb();
-    const createdAt = 1_700_000_300_000;
-    db.insert(conversations)
-      .values({
-        id: "conv-budget",
-        title: null,
-        createdAt,
-        updatedAt: createdAt,
-        totalInputTokens: 0,
-        totalOutputTokens: 0,
-        totalEstimatedCost: 0,
-        contextSummary: null,
-        contextCompactedMessageCount: 0,
-        contextCompactedAt: null,
-      })
-      .run();
-    db.insert(messages)
-      .values({
-        id: "msg-budget",
-        conversationId: "conv-budget",
-        role: "user",
-        content: JSON.stringify([
-          { type: "text", text: "remember budget token sentinel" },
-        ]),
-        createdAt,
-      })
-      .run();
-    db.run(`
-      INSERT INTO memory_segments (
-        id, message_id, conversation_id, role, segment_index, text, token_estimate, created_at, updated_at
-      ) VALUES (
-        'seg-budget', 'msg-budget', 'conv-budget', 'user', 0, 'remember budget token sentinel', 6, ${createdAt}, ${createdAt}
-      )
-    `);
-    const candidateLine =
-      "- <kind>segment:seg-budget</kind> remember budget token sentinel";
-    const lineOnlyTokens = estimateTextTokens(candidateLine);
-    const fullRecallTokens = estimateTextTokens(
-      '<memory source="long_term_memory" confidence="approximate">\n' +
-        `## Relevant Context\n${candidateLine}\n</memory>`,
-    );
-    expect(fullRecallTokens).toBeGreaterThan(lineOnlyTokens);
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          required: false,
-        },
-        retrieval: {
-          ...DEFAULT_CONFIG.memory.retrieval,
-          maxInjectTokens: lineOnlyTokens,
-        },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "budget sentinel",
-      "conv-budget",
-      config,
-    );
-    expect(recall.injectedText).toBe("");
-    expect(recall.injectedTokens).toBe(0);
-  });
-  test("memory recall respects maxInjectTokensOverride when provided", async () => {
-    const db = getDb();
-    const createdAt = 1_700_000_301_000;
-    db.insert(conversations)
-      .values({
-        id: "conv-budget-override",
-        title: null,
-        createdAt,
-        updatedAt: createdAt,
-        totalInputTokens: 0,
-        totalOutputTokens: 0,
-        totalEstimatedCost: 0,
-        contextSummary: null,
-        contextCompactedMessageCount: 0,
-        contextCompactedAt: null,
-      })
-      .run();
-    for (let i = 0; i < 4; i++) {
-      const msgId = `msg-budget-override-${i}`;
-      const segId = `seg-budget-override-${i}`;
-      const text = `budget override sentinel item ${i} with enough text to exceed tiny limits`;
-      db.insert(messages)
-        .values({
-          id: msgId,
-          conversationId: "conv-budget-override",
-          role: "user",
-          content: JSON.stringify([{ type: "text", text }]),
-          createdAt: createdAt + i,
-        })
-        .run();
-      db.run(`
-        INSERT INTO memory_segments (
-          id, message_id, conversation_id, role, segment_index, text, token_estimate, created_at, updated_at
-        ) VALUES (
-          '${segId}', '${msgId}', 'conv-budget-override', 'user', 0, '${text}', 20, ${
-            createdAt + i
-          }, ${createdAt + i}
-        )
-      `);
-    }
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          provider: "openai" as const,
-          required: false,
-        },
-        retrieval: {
-          ...DEFAULT_CONFIG.memory.retrieval,
-          maxInjectTokens: 5000,
-          lexicalTopK: 10,
-        },
-      },
-    };
-    const override = 120;
-    const recall = await buildMemoryRecall(
-      "budget override sentinel",
-      "conv-budget-override",
-      config,
-      { maxInjectTokensOverride: override },
-    );
-    expect(recall.injectedTokens).toBeLessThanOrEqual(override);
-  });
-  test("claimMemoryJobs only returns rows it actually claimed", () => {
-    const db = getDb();
-    const jobId = enqueueMemoryJob("build_conversation_summary", {
-      conversationId: "conv-lock",
-    });
-    db.run(`
-      CREATE TEMP TRIGGER memory_jobs_claim_ignore
-      BEFORE UPDATE ON memory_jobs
-      WHEN NEW.status = 'running' AND OLD.id = '${jobId}'
-      BEGIN
-        SELECT RAISE(IGNORE);
-      END;
-    `);
-    try {
-      const claimed = claimMemoryJobs(10);
-      expect(claimed).toHaveLength(0);
-      const row = db
-        .select()
-        .from(memoryJobs)
-        .where(eq(memoryJobs.id, jobId))
-        .get();
-      expect(row?.status).toBe("pending");
-    } finally {
-      db.run("DROP TRIGGER IF EXISTS memory_jobs_claim_ignore");
-    }
-  });
-  test("formatAbsoluteTime returns YYYY-MM-DD HH:mm TZ format", () => {
-    // Use a fixed epoch-ms value; the rendered string depends on the local timezone,
-    // so we verify the structural format rather than exact values.
-    const epochMs = 1_707_850_200_000; // 2024-02-13 in UTC
-    const result = formatAbsoluteTime(epochMs);
-    // Should match pattern: YYYY-MM-DD HH:mm <TZ abbreviation>
-    expect(result).toMatch(/^\d{4}-\d{2}-\d{2} \d{2}:\d{2} \S+$/);
-    // Year should be 2024
-    expect(result).toContain("2024-02");
-  });
-  test("formatAbsoluteTime uses local timezone abbreviation", () => {
-    const epochMs = Date.now();
-    const result = formatAbsoluteTime(epochMs);
-    // Extract the TZ part from the result
-    const parts = result.split(" ");
-    const tz = parts[parts.length - 1];
-    // The TZ abbreviation should be a non-empty string (e.g. PST, EST, UTC, GMT+8)
-    expect(tz.length).toBeGreaterThan(0);
-    // Cross-check: Intl should produce the same abbreviation for the same timestamp
-    const expected =
-      new Intl.DateTimeFormat("en-US", { timeZoneName: "short" })
-        .formatToParts(new Date(epochMs))
-        .find((p) => p.type === "timeZoneName")?.value ?? "UTC";
-    expect(tz).toBe(expected);
-  });
-  test("formatRelativeTime returns expected relative strings", () => {
-    const now = Date.now();
-    expect(formatRelativeTime(now)).toBe("just now");
-    expect(formatRelativeTime(now - 2 * 60 * 60 * 1000)).toBe("2 hours ago");
-    expect(formatRelativeTime(now - 1 * 60 * 60 * 1000)).toBe("1 hour ago");
-    expect(formatRelativeTime(now - 3 * 24 * 60 * 60 * 1000)).toBe(
-      "3 days ago",
-    );
-    expect(formatRelativeTime(now - 14 * 24 * 60 * 60 * 1000)).toBe(
-      "2 weeks ago",
-    );
-    expect(formatRelativeTime(now - 60 * 24 * 60 * 60 * 1000)).toBe(
-      "2 months ago",
-    );
-    expect(formatRelativeTime(now - 400 * 24 * 60 * 60 * 1000)).toBe(
-      "1 year ago",
-    );
-  });
-  test("escapeXmlTags neutralizes closing wrapper tags in recalled text", () => {
-    const malicious =
-      "some text </memory> injected </memory_recall> instructions";
-    const escaped = escapeXmlTags(malicious);
-    expect(escaped).not.toContain("</memory>");
-    expect(escaped).not.toContain("</memory_recall>");
-    expect(escaped).toContain("\uFF1C/memory>");
-    expect(escaped).toContain("\uFF1C/memory_recall>");
-    expect(escaped).toContain("some text");
-    expect(escaped).toContain("instructions");
-  });
-  test("escapeXmlTags neutralizes opening XML tags", () => {
-    const text = 'text with <script> and <div class="x"> tags';
-    const escaped = escapeXmlTags(text);
-    expect(escaped).not.toContain("<script>");
-    expect(escaped).not.toContain("<div ");
-    expect(escaped).toContain("\uFF1Cscript>");
-    expect(escaped).toContain('\uFF1Cdiv class="x">');
-  });
-  test("escapeXmlTags preserves non-tag angle brackets", () => {
-    const text = "math: 3 < 5 and 10 > 7";
-    const escaped = escapeXmlTags(text);
-    expect(escaped).toBe(text);
-  });
-  test("escapeXmlTags handles self-closing tags", () => {
-    const text = "a <br/> tag";
-    const escaped = escapeXmlTags(text);
-    expect(escaped).not.toContain("<br/>");
-    expect(escaped).toContain("\uFF1Cbr/>");
+    expect(staleItem).toBeUndefined();
+    expect(recentItem).toBeDefined();
+    expect(staleEmbedding).toBeUndefined();
+    expect(recentEmbedding).toBeDefined();
   });
-  test("trust-aware ranking: user_confirmed item outranks assistant_inferred with equal relevance", async () => {
+  test("memory admin status reports cleanup backlog and 24h throughput metrics", () => {
     const db = getDb();
     const now = Date.now();
+    const yesterday = now - 20 * 60 * 60 * 1000;
+    const old = now - 40 * 60 * 60 * 1000;
-    // Insert two memory items with identical text, confidence, importance, and timestamps
-    // but different verification states
-    db.insert(memoryItems)
+    db.insert(memoryJobs)
       .values([
         {
-          id: "item-trust-confirmed",
-          kind: "fact",
-          subject: "trust ranking test",
-          statement: "The user prefers dark mode for all applications",
-          status: "active",
-          confidence: 0.8,
-          importance: 0.5,
-          fingerprint: "fp-trust-confirmed",
-          firstSeenAt: now,
-          lastSeenAt: now,
-          accessCount: 0,
-          verificationState: "user_confirmed",
-        },
-        {
-          id: "item-trust-inferred",
-          kind: "fact",
-          subject: "trust ranking test",
-          statement: "The user prefers dark mode for all editors",
-          status: "active",
-          confidence: 0.8,
-          importance: 0.5,
-          fingerprint: "fp-trust-inferred",
-          firstSeenAt: now,
-          lastSeenAt: now,
-          accessCount: 0,
-          verificationState: "assistant_inferred",
-        },
-      ])
-      .run();
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          required: false,
+          id: "cleanup-status-running-superseded",
+          type: "cleanup_stale_superseded_items",
+          payload: "{}",
+          status: "running",
+          attempts: 0,
+          deferrals: 0,
+          runAfter: now,
+          lastError: null,
+          createdAt: now,
+          updatedAt: now,
         },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "dark mode",
-      "conv-trust-test",
-      config,
-    );
-    // Both items should be found (directItemSearch matches on "dark" and "mode")
-    const confirmed = recall.topCandidates.find(
-      (c) => c.key === "item:item-trust-confirmed",
-    );
-    const inferred = recall.topCandidates.find(
-      (c) => c.key === "item:item-trust-inferred",
-    );
-    expect(confirmed).toBeDefined();
-    expect(inferred).toBeDefined();
-    // user_confirmed (weight 1.0) should have a higher finalScore than assistant_inferred (weight 0.7)
-    expect(confirmed!.finalScore).toBeGreaterThan(inferred!.finalScore);
-  });
-  test("trust-aware ranking: user_reported item outranks assistant_inferred", async () => {
-    const db = getDb();
-    const now = Date.now();
-    db.insert(memoryItems)
-      .values([
         {
-          id: "item-trust-reported",
-          kind: "fact",
-          subject: "trust ranking reported",
-          statement: "The user uses vim keybindings in their editor",
-          status: "active",
-          confidence: 0.8,
-          importance: 0.5,
-          fingerprint: "fp-trust-reported",
-          firstSeenAt: now,
-          lastSeenAt: now,
-          accessCount: 0,
-          verificationState: "user_reported",
+          id: "cleanup-status-completed-superseded-recent",
+          type: "cleanup_stale_superseded_items",
+          payload: "{}",
+          status: "completed",
+          attempts: 1,
+          deferrals: 0,
+          runAfter: yesterday,
+          lastError: null,
+          createdAt: yesterday,
+          updatedAt: yesterday,
         },
         {
-          id: "item-trust-inferred2",
-          kind: "fact",
-          subject: "trust ranking inferred",
-          statement: "The user uses vim keybindings in their terminal",
-          status: "active",
-          confidence: 0.8,
-          importance: 0.5,
-          fingerprint: "fp-trust-inferred2",
-          firstSeenAt: now,
-          lastSeenAt: now,
-          accessCount: 0,
-          verificationState: "assistant_inferred",
+          id: "cleanup-status-completed-superseded-old",
+          type: "cleanup_stale_superseded_items",
+          payload: "{}",
+          status: "completed",
+          attempts: 1,
+          deferrals: 0,
+          runAfter: old,
+          lastError: null,
+          createdAt: old,
+          updatedAt: old,
         },
       ])
       .run();
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          required: false,
-        },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "vim keybindings",
-      "conv-trust-test2",
-      config,
-    );
-    const reported = recall.topCandidates.find(
-      (c) => c.key === "item:item-trust-reported",
-    );
-    const inferred = recall.topCandidates.find(
-      (c) => c.key === "item:item-trust-inferred2",
-    );
-    expect(reported).toBeDefined();
-    expect(inferred).toBeDefined();
-    // user_reported (weight 0.9) should outrank assistant_inferred (weight 0.7)
-    expect(reported!.finalScore).toBeGreaterThan(inferred!.finalScore);
+    const status = getMemorySystemStatus();
+    expect(status.cleanup.supersededBacklog).toBe(1);
+    expect(status.cleanup.supersededCompleted24h).toBe(1);
   });
-  test("trust-aware ranking: weight values are bounded and non-zero", async () => {
+  test("requestMemoryCleanup queues cleanup job", () => {
     const db = getDb();
-    const now = Date.now();
-    // Insert an item with an unknown verification state to test the default weight
-    const raw = (
-      db as unknown as {
-        $client: {
-          query: (q: string) => { get: (...params: unknown[]) => unknown };
-        };
-      }
-    ).$client;
-    raw
-      .query(
-        `
-      INSERT INTO memory_items (id, kind, subject, statement, status, confidence, importance, fingerprint, first_seen_at, last_seen_at, access_count, verification_state)
-      VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
-    `,
-      )
-      .get(
-        "item-trust-unknown",
-        "fact",
-        "trust ranking unknown",
-        "The user has an unknown trust state preference",
-        "active",
-        0.8,
-        0.5,
-        "fp-trust-unknown",
-        now,
-        now,
-        0,
-        "some_future_state",
-      );
-    const config = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          required: false,
-        },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "unknown trust state preference",
-      "conv-trust-test3",
-      config,
-    );
+    const queued = requestMemoryCleanup(9_999);
+    expect(queued.staleSupersededItemsJobId).toBeTruthy();
-    const unknown = recall.topCandidates.find(
-      (c) => c.key === "item:item-trust-unknown",
-    );
-    expect(unknown).toBeDefined();
-    // The finalScore should be > 0 (trust weight is bounded, not zero)
-    expect(unknown!.finalScore).toBeGreaterThan(0);
+    const supersededRow = db
+      .select()
+      .from(memoryJobs)
+      .where(eq(memoryJobs.id, queued.staleSupersededItemsJobId))
+      .get();
+    expect(supersededRow?.type).toBe("cleanup_stale_superseded_items");
   });
-  test("freshness decay: stale event item scores lower than fresh one", async () => {
+  test("memory recall token budgeting includes recall marker overhead", async () => {
     const db = getDb();
-    const now = Date.now();
-    const MS_PER_DAY = 86_400_000;
-    // Fresh event item (5 days old — well within the 30-day default window)
-    db.insert(memoryItems)
+    const createdAt = 1_700_000_300_000;
+    db.insert(conversations)
       .values({
-        id: "item-fresh-event",
-        kind: "event",
-        subject: "freshness decay test",
-        statement: "User attended a workshop on machine learning",
-        status: "active",
-        confidence: 0.8,
-        importance: 0.5,
-        fingerprint: "fp-fresh-event",
-        firstSeenAt: now - 5 * MS_PER_DAY,
-        lastSeenAt: now - 5 * MS_PER_DAY,
-        accessCount: 0,
-        verificationState: "user_confirmed",
+        id: "conv-budget",
+        title: null,
+        createdAt,
+        updatedAt: createdAt,
+        totalInputTokens: 0,
+        totalOutputTokens: 0,
+        totalEstimatedCost: 0,
+        contextSummary: null,
+        contextCompactedMessageCount: 0,
+        contextCompactedAt: null,
       })
       .run();
-    // Stale event item (60 days old — past the 30-day event window)
-    db.insert(memoryItems)
+    db.insert(messages)
       .values({
-        id: "item-stale-event",
-        kind: "event",
-        subject: "freshness decay test",
-        statement: "User attended a workshop on machine learning basics",
-        status: "active",
-        confidence: 0.8,
-        importance: 0.5,
-        fingerprint: "fp-stale-event",
-        firstSeenAt: now - 60 * MS_PER_DAY,
-        lastSeenAt: now - 60 * MS_PER_DAY,
-        accessCount: 0,
-        verificationState: "user_confirmed",
+        id: "msg-budget",
+        conversationId: "conv-budget",
+        role: "user",
+        content: JSON.stringify([
+          { type: "text", text: "remember budget token sentinel" },
+        ]),
+        createdAt,
       })
       .run();
+    db.run(`
+      INSERT INTO memory_segments (
+        id, message_id, conversation_id, role, segment_index, text, token_estimate, created_at, updated_at
+      ) VALUES (
+        'seg-budget', 'msg-budget', 'conv-budget', 'user', 0, 'remember budget token sentinel', 6, ${createdAt}, ${createdAt}
+      )
+    `);
+    const candidateLine =
+      "- <kind>segment:seg-budget</kind> remember budget token sentinel";
+    const lineOnlyTokens = estimateTextTokens(candidateLine);
+    const fullRecallTokens = estimateTextTokens(
+      '<memory source="long_term_memory" confidence="approximate">\n' +
+        `## Relevant Context\n${candidateLine}\n</memory>`,
+    );
+    expect(fullRecallTokens).toBeGreaterThan(lineOnlyTokens);
     const config = {
       ...DEFAULT_CONFIG,
       memory: {
         ...DEFAULT_CONFIG.memory,
-        embeddings: { ...DEFAULT_CONFIG.memory.embeddings, required: false },
+        embeddings: {
+          ...DEFAULT_CONFIG.memory.embeddings,
+          required: false,
+        },
+        retrieval: {
+          ...DEFAULT_CONFIG.memory.retrieval,
+          maxInjectTokens: lineOnlyTokens,
+        },
       },
     };
     const recall = await buildMemoryRecall(
-      "machine learning workshop",
-      "conv-fresh-1",
+      "budget sentinel",
+      "conv-budget",
       config,
     );
-    const fresh = recall.topCandidates.find(
-      (c) => c.key === "item:item-fresh-event",
-    );
-    const stale = recall.topCandidates.find(
-      (c) => c.key === "item:item-stale-event",
-    );
-    expect(fresh).toBeDefined();
-    expect(stale).toBeDefined();
-    // Fresh item should score higher than stale item due to freshness decay
-    expect(fresh!.finalScore).toBeGreaterThan(stale!.finalScore);
+    expect(recall.injectedText).toBe("");
+    expect(recall.injectedTokens).toBe(0);
   });
-  test("freshness decay: fact items with maxAgeDays=0 are never decayed", async () => {
+  test("memory recall respects maxInjectTokensOverride when provided", async () => {
     const db = getDb();
-    const now = Date.now();
-    const MS_PER_DAY = 86_400_000;
-    // Very old fact item (365 days) — facts have maxAgeDays=0 (no expiry)
-    db.insert(memoryItems)
+    const createdAt = 1_700_000_301_000;
+    db.insert(conversations)
       .values({
-        id: "item-old-fact",
-        kind: "fact",
-        subject: "freshness no-decay test",
-        statement: "The speed of light is 299792458 meters per second",
-        status: "active",
-        confidence: 0.8,
-        importance: 0.5,
-        fingerprint: "fp-old-fact",
-        firstSeenAt: now - 365 * MS_PER_DAY,
-        lastSeenAt: now - 365 * MS_PER_DAY,
-        accessCount: 0,
-        verificationState: "user_confirmed",
+        id: "conv-budget-override",
+        title: null,
+        createdAt,
+        updatedAt: createdAt,
+        totalInputTokens: 0,
+        totalOutputTokens: 0,
+        totalEstimatedCost: 0,
+        contextSummary: null,
+        contextCompactedMessageCount: 0,
+        contextCompactedAt: null,
       })
       .run();
-    // Recent fact with same text similarity
-    db.insert(memoryItems)
-      .values({
-        id: "item-new-fact",
-        kind: "fact",
-        subject: "freshness no-decay test",
-        statement: "The speed of light is approximately 3e8 meters per second",
-        status: "active",
-        confidence: 0.8,
-        importance: 0.5,
-        fingerprint: "fp-new-fact",
-        firstSeenAt: now - 1 * MS_PER_DAY,
-        lastSeenAt: now - 1 * MS_PER_DAY,
-        accessCount: 0,
-        verificationState: "user_confirmed",
-      })
-      .run();
+    for (let i = 0; i < 4; i++) {
+      const msgId = `msg-budget-override-${i}`;
+      const segId = `seg-budget-override-${i}`;
+      const text = `budget override sentinel item ${i} with enough text to exceed tiny limits`;
+      db.insert(messages)
+        .values({
+          id: msgId,
+          conversationId: "conv-budget-override",
+          role: "user",
+          content: JSON.stringify([{ type: "text", text }]),
+          createdAt: createdAt + i,
+        })
+        .run();
+      db.run(`
+        INSERT INTO memory_segments (
+          id, message_id, conversation_id, role, segment_index, text, token_estimate, created_at, updated_at
+        ) VALUES (
+          '${segId}', '${msgId}', 'conv-budget-override', 'user', 0, '${text}', 20, ${
+            createdAt + i
+          }, ${createdAt + i}
+        )
+      `);
+    }
     const config = {
       ...DEFAULT_CONFIG,
       memory: {
         ...DEFAULT_CONFIG.memory,
-        embeddings: { ...DEFAULT_CONFIG.memory.embeddings, required: false },
+        embeddings: {
+          ...DEFAULT_CONFIG.memory.embeddings,
+          provider: "openai" as const,
+          required: false,
+        },
+        retrieval: {
+          ...DEFAULT_CONFIG.memory.retrieval,
+          maxInjectTokens: 5000,
+        },
       },
     };
+    const override = 120;
     const recall = await buildMemoryRecall(
-      "speed of light",
-      "conv-fresh-2",
+      "budget override sentinel",
+      "conv-budget-override",
       config,
+      { maxInjectTokensOverride: override },
     );
+    expect(recall.injectedTokens).toBeLessThanOrEqual(override);
+  });
+  test("claimMemoryJobs only returns rows it actually claimed", () => {
+    const db = getDb();
+    const jobId = enqueueMemoryJob("build_conversation_summary", {
+      conversationId: "conv-lock",
+    });
+    db.run(`
+      CREATE TEMP TRIGGER memory_jobs_claim_ignore
+      BEFORE UPDATE ON memory_jobs
+      WHEN NEW.status = 'running' AND OLD.id = '${jobId}'
+      BEGIN
+        SELECT RAISE(IGNORE);
+      END;
+    `);
+    try {
+      const claimed = claimMemoryJobs(10);
+      expect(claimed).toHaveLength(0);
+      const row = db
+        .select()
+        .from(memoryJobs)
+        .where(eq(memoryJobs.id, jobId))
+        .get();
+      expect(row?.status).toBe("pending");
+    } finally {
+      db.run("DROP TRIGGER IF EXISTS memory_jobs_claim_ignore");
+    }
+  });
+  test("formatAbsoluteTime returns YYYY-MM-DD HH:mm TZ format", () => {
+    // Use a fixed epoch-ms value; the rendered string depends on the local timezone,
+    // so we verify the structural format rather than exact values.
+    const epochMs = 1_707_850_200_000; // 2024-02-13 in UTC
+    const result = formatAbsoluteTime(epochMs);
+    // Should match pattern: YYYY-MM-DD HH:mm <TZ abbreviation>
+    expect(result).toMatch(/^\d{4}-\d{2}-\d{2} \d{2}:\d{2} \S+$/);
+    // Year should be 2024
+    expect(result).toContain("2024-02");
+  });
+  test("formatAbsoluteTime uses local timezone abbreviation", () => {
+    const epochMs = Date.now();
+    const result = formatAbsoluteTime(epochMs);
+    // Extract the TZ part from the result
+    const parts = result.split(" ");
+    const tz = parts[parts.length - 1];
+    // The TZ abbreviation should be a non-empty string (e.g. PST, EST, UTC, GMT+8)
+    expect(tz.length).toBeGreaterThan(0);
+    // Cross-check: Intl should produce the same abbreviation for the same timestamp
+    const expected =
+      new Intl.DateTimeFormat("en-US", { timeZoneName: "short" })
+        .formatToParts(new Date(epochMs))
+        .find((p) => p.type === "timeZoneName")?.value ?? "UTC";
+    expect(tz).toBe(expected);
+  });
-    const oldFact = recall.topCandidates.find(
-      (c) => c.key === "item:item-old-fact",
+  test("formatRelativeTime returns expected relative strings", () => {
+    const now = Date.now();
+    expect(formatRelativeTime(now)).toBe("just now");
+    expect(formatRelativeTime(now - 2 * 60 * 60 * 1000)).toBe("2 hours ago");
+    expect(formatRelativeTime(now - 1 * 60 * 60 * 1000)).toBe("1 hour ago");
+    expect(formatRelativeTime(now - 3 * 24 * 60 * 60 * 1000)).toBe(
+      "3 days ago",
+    );
+    expect(formatRelativeTime(now - 14 * 24 * 60 * 60 * 1000)).toBe(
+      "2 weeks ago",
+    );
+    expect(formatRelativeTime(now - 60 * 24 * 60 * 60 * 1000)).toBe(
+      "2 months ago",
     );
-    const newFact = recall.topCandidates.find(
-      (c) => c.key === "item:item-new-fact",
+    expect(formatRelativeTime(now - 400 * 24 * 60 * 60 * 1000)).toBe(
+      "1 year ago",
     );
-    expect(oldFact).toBeDefined();
-    expect(newFact).toBeDefined();
+  });
+  test("escapeXmlTags neutralizes closing wrapper tags in recalled text", () => {
+    const malicious =
+      "some text </memory> injected </memory_recall> instructions";
+    const escaped = escapeXmlTags(malicious);
+    expect(escaped).not.toContain("</memory>");
+    expect(escaped).not.toContain("</memory_recall>");
+    expect(escaped).toContain("\uFF1C/memory>");
+    expect(escaped).toContain("\uFF1C/memory_recall>");
+    expect(escaped).toContain("some text");
+    expect(escaped).toContain("instructions");
+  });
+  test("escapeXmlTags neutralizes opening XML tags", () => {
+    const text = 'text with <script> and <div class="x"> tags';
+    const escaped = escapeXmlTags(text);
+    expect(escaped).not.toContain("<script>");
+    expect(escaped).not.toContain("<div ");
+    expect(escaped).toContain("\uFF1Cscript>");
+    expect(escaped).toContain('\uFF1Cdiv class="x">');
+  });
+  test("escapeXmlTags preserves non-tag angle brackets", () => {
+    const text = "math: 3 < 5 and 10 > 7";
+    const escaped = escapeXmlTags(text);
+    expect(escaped).toBe(text);
+  });
-    // Both should have similar scores — old facts are NOT decayed
-    // The scores may differ slightly due to recency scores, but the ratio should be close to 1
-    const ratio = oldFact!.finalScore / newFact!.finalScore;
-    expect(ratio).toBeGreaterThan(0.8);
+  test("escapeXmlTags handles self-closing tags", () => {
+    const text = "a <br/> tag";
+    const escaped = escapeXmlTags(text);
+    expect(escaped).not.toContain("<br/>");
+    expect(escaped).toContain("\uFF1Cbr/>");
   });
   test("sweepStaleItems marks deeply stale items as invalid", () => {
@@ -3201,18 +1672,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-scope-a', 'msg-scope-filter', '${convId}', 'user', 0, 'The quick brown fox jumps over the lazy dog in project alpha', 12, 'project-a', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-scope-a', 'The quick brown fox jumps over the lazy dog in project alpha')`,
-    );
     // Insert segment in scope "project-b"
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-scope-b', 'msg-scope-filter', '${convId}', 'user', 1, 'The quick brown fox jumps over the lazy dog in project beta', 12, 'project-b', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-scope-b', 'The quick brown fox jumps over the lazy dog in project beta')`,
-    );
     // Insert item in scope "project-a"
     db.insert(memoryItems)
@@ -3261,15 +1726,15 @@ describe("Memory regressions", () => {
     const result = await buildMemoryRecall("quick brown fox", convId, config, {
       scopeId: "project-a",
     });
-    const keys = result.topCandidates.map((c) => c.key);
-    // Segments and items from project-b should not appear
-    expect(keys).not.toContain("segment:seg-scope-b");
-    expect(keys).not.toContain("item:item-scope-b");
-    // At least one project-a candidate should appear
-    const hasProjectA = keys.some((k) => k.includes("scope-a"));
-    expect(hasProjectA).toBe(true);
+    // With Qdrant mocked, only recency search runs. Recency candidates
+    // don't pass tier classification (score < 0.6), so topCandidates is empty.
+    // Verify scope filtering works by checking recencyHits count: should
+    // only find segments from project-a scope (via allow_global_fallback,
+    // default scope is also included).
+    // The 2 segments in project-a scope + default-scope segments = recencyHits
+    expect(result.recencyHits).toBeGreaterThan(0);
+    expect(result.enabled).toBe(true);
   });
   test("scope filtering: allow_global_fallback includes default scope", async () => {
@@ -3306,18 +1771,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-default-scope', 'msg-scope-fallback', '${convId}', 'user', 0, 'Universal knowledge about programming languages and paradigms', 10, 'default', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-default-scope', 'Universal knowledge about programming languages and paradigms')`,
-    );
     // Insert segment in custom scope
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-custom-scope', 'msg-scope-fallback', '${convId}', 'user', 1, 'Project-specific knowledge about programming languages and paradigms', 10, 'my-project', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-custom-scope', 'Project-specific knowledge about programming languages and paradigms')`,
-    );
     // With allow_global_fallback (the default), querying with scopeId "my-project"
     // should include both "my-project" and "default" scope items
@@ -3334,11 +1793,11 @@ describe("Memory regressions", () => {
       config,
       { scopeId: "my-project" },
     );
-    const keys = result.topCandidates.map((c) => c.key);
-    // Both default and custom scope segments should be included
-    expect(keys).toContain("segment:seg-default-scope");
-    expect(keys).toContain("segment:seg-custom-scope");
+    // With allow_global_fallback, recency search finds segments from both
+    // "my-project" and "default" scopes. Candidates don't pass tier
+    // classification but recencyHits should include both.
+    expect(result.recencyHits).toBe(2);
   });
   test("scope filtering: strict policy excludes default scope", async () => {
@@ -3353,299 +1812,64 @@ describe("Memory regressions", () => {
         createdAt: now,
         updatedAt: now,
         totalInputTokens: 0,
-        totalOutputTokens: 0,
-        totalEstimatedCost: 0,
-        contextSummary: null,
-        contextCompactedMessageCount: 0,
-        contextCompactedAt: null,
-      })
-      .run();
-    db.insert(messages)
-      .values({
-        id: "msg-scope-strict",
-        conversationId: convId,
-        role: "user",
-        content: JSON.stringify([{ type: "text", text: "strict test" }]),
-        createdAt: now,
-      })
-      .run();
-    // Insert segment in default scope
-    db.run(`
-      INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
-      VALUES ('seg-strict-default', 'msg-scope-strict', '${convId}', 'user', 0, 'Global memory about database optimization techniques', 8, 'default', ${now}, ${now})
-    `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-strict-default', 'Global memory about database optimization techniques')`,
-    );
-    // Insert segment in custom scope
-    db.run(`
-      INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
-      VALUES ('seg-strict-custom', 'msg-scope-strict', '${convId}', 'user', 1, 'Project-specific memory about database optimization techniques', 8, 'strict-project', ${now}, ${now})
-    `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-strict-custom', 'Project-specific memory about database optimization techniques')`,
-    );
-    // With strict policy, querying with scopeId should only include that scope
-    const strictConfig = {
-      ...TEST_CONFIG,
-      memory: {
-        ...TEST_CONFIG.memory,
-        embeddings: { ...TEST_CONFIG.memory.embeddings, required: false },
-        retrieval: {
-          ...TEST_CONFIG.memory.retrieval,
-          scopePolicy: "strict" as const,
-        },
-      },
-    };
-    const result = await buildMemoryRecall(
-      "database optimization",
-      convId,
-      strictConfig,
-      { scopeId: "strict-project" },
-    );
-    const keys = result.topCandidates.map((c) => c.key);
-    // Only strict-project scope segment should appear
-    expect(keys).not.toContain("segment:seg-strict-default");
-    expect(keys).toContain("segment:seg-strict-custom");
-  });
-  test("relation retrieval respects scope and active-item filters", async () => {
-    const db = getDb();
-    const now = Date.now();
-    const convId = "conv-relation-scope";
-    db.insert(conversations)
-      .values({
-        id: convId,
-        title: null,
-        createdAt: now,
-        updatedAt: now,
-        totalInputTokens: 0,
-        totalOutputTokens: 0,
-        totalEstimatedCost: 0,
-        contextSummary: null,
-        contextCompactedMessageCount: 0,
-        contextCompactedAt: null,
-      })
-      .run();
-    db.insert(messages)
-      .values({
-        id: "msg-relation-scope",
-        conversationId: convId,
-        role: "user",
-        content: JSON.stringify([
-          { type: "text", text: "atlas reliability memo" },
-        ]),
-        createdAt: now,
-      })
-      .run();
-    db.insert(memoryItems)
-      .values([
-        {
-          id: "item-rel-a-active",
-          kind: "fact",
-          subject: "autoscaling policy",
-          statement: "Use Kubernetes HPA for sustained traffic spikes",
-          status: "active",
-          confidence: 0.9,
-          importance: 0.8,
-          fingerprint: "fp-rel-a-active",
-          verificationState: "user_confirmed",
-          scopeId: "project-a",
-          firstSeenAt: now,
-          lastSeenAt: now,
-        },
-        {
-          id: "item-rel-b-active",
-          kind: "fact",
-          subject: "scheduler policy",
-          statement: "Use Nomad system jobs for batch workloads",
-          status: "active",
-          confidence: 0.9,
-          importance: 0.8,
-          fingerprint: "fp-rel-b-active",
-          verificationState: "user_confirmed",
-          scopeId: "project-b",
-          firstSeenAt: now,
-          lastSeenAt: now,
-        },
-        {
-          id: "item-rel-a-invalid",
-          kind: "fact",
-          subject: "deprecated platform",
-          statement: "Legacy Kubernetes cluster should still be used",
-          status: "active",
-          confidence: 0.9,
-          importance: 0.8,
-          fingerprint: "fp-rel-a-invalid",
-          verificationState: "user_confirmed",
-          scopeId: "project-a",
-          firstSeenAt: now,
-          lastSeenAt: now,
-          invalidAt: now + 1,
-        },
-        {
-          id: "item-rel-a-pending",
-          kind: "fact",
-          subject: "pending platform policy",
-          statement: "Pending clarification platform statement",
-          status: "pending_clarification",
-          confidence: 0.9,
-          importance: 0.8,
-          fingerprint: "fp-rel-a-pending",
-          verificationState: "assistant_inferred",
-          scopeId: "project-a",
-          firstSeenAt: now,
-          lastSeenAt: now,
-        },
-      ])
-      .run();
-    db.insert(memoryItemSources)
-      .values([
-        {
-          memoryItemId: "item-rel-a-active",
-          messageId: "msg-relation-scope",
-          evidence: "source a active",
-          createdAt: now,
-        },
-        {
-          memoryItemId: "item-rel-b-active",
-          messageId: "msg-relation-scope",
-          evidence: "source b active",
-          createdAt: now,
-        },
-        {
-          memoryItemId: "item-rel-a-invalid",
-          messageId: "msg-relation-scope",
-          evidence: "source a invalid",
-          createdAt: now,
-        },
-        {
-          memoryItemId: "item-rel-a-pending",
-          messageId: "msg-relation-scope",
-          evidence: "source a pending",
-          createdAt: now,
-        },
-      ])
-      .run();
-    db.insert(memoryEntities)
-      .values([
-        {
-          id: "entity-atlas-test",
-          name: "Project Atlas",
-          type: "project",
-          aliases: JSON.stringify(["atlas"]),
-          description: null,
-          firstSeenAt: now,
-          lastSeenAt: now,
-          mentionCount: 1,
-        },
-        {
-          id: "entity-k8s-test",
-          name: "Kubernetes",
-          type: "tool",
-          aliases: JSON.stringify(["k8s"]),
-          description: null,
-          firstSeenAt: now,
-          lastSeenAt: now,
-          mentionCount: 1,
-        },
-        {
-          id: "entity-nomad-test",
-          name: "Nomad",
-          type: "tool",
-          aliases: JSON.stringify(["nomad"]),
-          description: null,
-          firstSeenAt: now,
-          lastSeenAt: now,
-          mentionCount: 1,
-        },
-      ])
+        totalOutputTokens: 0,
+        totalEstimatedCost: 0,
+        contextSummary: null,
+        contextCompactedMessageCount: 0,
+        contextCompactedAt: null,
+      })
       .run();
-    db.insert(memoryEntityRelations)
-      .values([
-        {
-          id: "rel-atlas-k8s-test",
-          sourceEntityId: "entity-atlas-test",
-          targetEntityId: "entity-k8s-test",
-          relation: "uses",
-          evidence: "Atlas uses Kubernetes",
-          firstSeenAt: now,
-          lastSeenAt: now,
-        },
-        {
-          id: "rel-atlas-nomad-test",
-          sourceEntityId: "entity-atlas-test",
-          targetEntityId: "entity-nomad-test",
-          relation: "uses",
-          evidence: "Atlas also uses Nomad in a different scope",
-          firstSeenAt: now,
-          lastSeenAt: now,
-        },
-      ])
+    db.insert(messages)
+      .values({
+        id: "msg-scope-strict",
+        conversationId: convId,
+        role: "user",
+        content: JSON.stringify([{ type: "text", text: "strict test" }]),
+        createdAt: now,
+      })
       .run();
-    db.insert(memoryItemEntities)
-      .values([
-        {
-          memoryItemId: "item-rel-a-active",
-          entityId: "entity-k8s-test",
-        },
-        {
-          memoryItemId: "item-rel-a-invalid",
-          entityId: "entity-k8s-test",
-        },
-        {
-          memoryItemId: "item-rel-a-pending",
-          entityId: "entity-k8s-test",
-        },
-        {
-          memoryItemId: "item-rel-b-active",
-          entityId: "entity-nomad-test",
-        },
-      ])
-      .run();
+    // Insert segment in default scope
+    db.run(`
+      INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
+      VALUES ('seg-strict-default', 'msg-scope-strict', '${convId}', 'user', 0, 'Global memory about database optimization techniques', 8, 'default', ${now}, ${now})
+    `);
+    // Insert segment in custom scope
+    db.run(`
+      INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
+      VALUES ('seg-strict-custom', 'msg-scope-strict', '${convId}', 'user', 1, 'Project-specific memory about database optimization techniques', 8, 'strict-project', ${now}, ${now})
+    `);
-    const relationConfig = {
+    // With strict policy, querying with scopeId should only include that scope
+    const strictConfig = {
       ...TEST_CONFIG,
       memory: {
         ...TEST_CONFIG.memory,
         embeddings: { ...TEST_CONFIG.memory.embeddings, required: false },
-        entity: {
-          ...TEST_CONFIG.memory.entity,
-          relationRetrieval: {
-            ...TEST_CONFIG.memory.entity.relationRetrieval,
-            enabled: true,
-            maxSeedEntities: 6,
-            maxNeighborEntities: 6,
-            maxEdges: 10,
-            neighborScoreMultiplier: 0.7,
-          },
+        retrieval: {
+          ...TEST_CONFIG.memory.retrieval,
+          scopePolicy: "strict" as const,
         },
       },
     };
     const result = await buildMemoryRecall(
-      "atlas reliability roadmap",
+      "database optimization",
       convId,
-      relationConfig,
-      { scopeId: "project-a" },
+      strictConfig,
+      { scopeId: "strict-project" },
     );
-    const keys = result.topCandidates.map((candidate) => candidate.key);
-    expect(keys).toContain("item:item-rel-a-active");
-    expect(keys).not.toContain("item:item-rel-b-active");
-    expect(keys).not.toContain("item:item-rel-a-invalid");
-    expect(keys).not.toContain("item:item-rel-a-pending");
+    // With strict policy, only "strict-project" scope segments should be found.
+    // The default scope segment should be excluded.
+    expect(result.recencyHits).toBe(1);
+    // Assert the returned candidate is specifically from the strict-project scope,
+    // not the default scope segment (privacy boundary check).
+    expect(result.topCandidates.length).toBe(1);
+    expect(result.topCandidates[0].key).toBe("segment:seg-strict-custom");
+    expect(result.injectedText).toContain("Project-specific memory");
+    expect(result.injectedText).not.toContain("Global memory");
   });
   test("scope columns: summaries default to scope_id=default", () => {
@@ -3675,327 +1899,6 @@ describe("Memory regressions", () => {
     expect(summary!.scopeId).toBe("default");
   });
-  test("forced backfill does not double-schedule entity extraction via relation backfill", async () => {
-    const db = getDb();
-    const now = 1_700_002_000_000;
-    const originalEnabled = TEST_CONFIG.memory.entity.enabled;
-    const originalRelationsEnabled =
-      TEST_CONFIG.memory.entity.extractRelations.enabled;
-    TEST_CONFIG.memory.entity.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.enabled = true;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-no-double",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      // Insert fewer than 200 messages so the backfill completes in one batch
-      for (let i = 0; i < 3; i++) {
-        db.insert(messages)
-          .values({
-            id: `msg-no-double-${i}`,
-            conversationId: "conv-no-double",
-            role: "user",
-            content: JSON.stringify([
-              { type: "text", text: `Test message ${i} for double scheduling` },
-            ]),
-            createdAt: now + i + 1,
-          })
-          .run();
-      }
-      // Enqueue a forced backfill
-      enqueueMemoryJob("backfill", { force: true });
-      await runMemoryJobsOnce();
-      // The backfill should have completed (< 200 msgs) and enqueued a
-      // non-forced relation backfill.  Count extract_entities jobs: they
-      // should come only from the extract_items chain, not duplicated by
-      // the relation backfill (which hasn't run yet).
-      const relationBackfillJobs = db
-        .select()
-        .from(memoryJobs)
-        .where(
-          and(
-            eq(memoryJobs.type, "backfill_entity_relations"),
-            eq(memoryJobs.status, "pending"),
-          ),
-        )
-        .all();
-      // A non-forced relation backfill should be enqueued
-      expect(relationBackfillJobs.length).toBeLessThanOrEqual(1);
-      // Verify the relation backfill was NOT force-flagged
-      if (relationBackfillJobs.length === 1) {
-        const payload = JSON.parse(relationBackfillJobs[0].payload);
-        expect(payload.force).not.toBe(true);
-      }
-    } finally {
-      TEST_CONFIG.memory.entity.enabled = originalEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.enabled =
-        originalRelationsEnabled;
-    }
-  });
-  test("backfill enqueues relation backfill when message count is exact multiple of 200", async () => {
-    const db = getDb();
-    const now = 1_700_004_000_000;
-    const originalEnabled = TEST_CONFIG.memory.entity.enabled;
-    const originalRelationsEnabled =
-      TEST_CONFIG.memory.entity.extractRelations.enabled;
-    TEST_CONFIG.memory.entity.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.enabled = true;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-exact-200",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      // Insert exactly 200 messages so the first backfill batch is full
-      for (let i = 0; i < 200; i++) {
-        db.insert(messages)
-          .values({
-            id: `msg-exact-200-${String(i).padStart(4, "0")}`,
-            conversationId: "conv-exact-200",
-            role: "user",
-            content: JSON.stringify([{ type: "text", text: `Message ${i}` }]),
-            createdAt: now + i + 1,
-          })
-          .run();
-      }
-      // First backfill: processes 200 messages, should enqueue another backfill
-      enqueueMemoryJob("backfill", {});
-      await runMemoryJobsOnce();
-      // Should have enqueued a follow-up backfill (batch was full)
-      const followUpBackfill = db
-        .select()
-        .from(memoryJobs)
-        .where(
-          and(
-            eq(memoryJobs.type, "backfill"),
-            eq(memoryJobs.status, "pending"),
-          ),
-        )
-        .all();
-      expect(followUpBackfill).toHaveLength(1);
-      // No relation backfill yet (batch was full, more work expected)
-      const relationBefore = db
-        .select()
-        .from(memoryJobs)
-        .where(
-          and(
-            eq(memoryJobs.type, "backfill_entity_relations"),
-            eq(memoryJobs.status, "pending"),
-          ),
-        )
-        .all();
-      expect(relationBefore).toHaveLength(0);
-      // Clear all non-backfill pending jobs so the next runMemoryJobsOnce
-      // picks up the follow-up backfill job (claimMemoryJobs has a concurrency
-      // limit and processes jobs in creation order)
-      db.run(
-        `DELETE FROM memory_jobs WHERE type != 'backfill' AND status = 'pending'`,
-      );
-      // Second backfill: reads 0 messages (terminal empty batch), should
-      // still enqueue the relation backfill
-      await runMemoryJobsOnce();
-      const relationAfter = db
-        .select()
-        .from(memoryJobs)
-        .where(
-          and(
-            eq(memoryJobs.type, "backfill_entity_relations"),
-            eq(memoryJobs.status, "pending"),
-          ),
-        )
-        .all();
-      expect(relationAfter).toHaveLength(1);
-    } finally {
-      TEST_CONFIG.memory.entity.enabled = originalEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.enabled =
-        originalRelationsEnabled;
-    }
-  });
-  test("relation backfill respects extractFromAssistant=false config", async () => {
-    const db = getDb();
-    const now = 1_700_003_000_000;
-    const originalEnabled = TEST_CONFIG.memory.entity.enabled;
-    const originalRelationsEnabled =
-      TEST_CONFIG.memory.entity.extractRelations.enabled;
-    const originalBatchSize =
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize;
-    const originalExtractFromAssistant =
-      TEST_CONFIG.memory.extraction.extractFromAssistant;
-    TEST_CONFIG.memory.entity.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize = 10;
-    TEST_CONFIG.memory.extraction.extractFromAssistant = false;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-role-filter",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values([
-          {
-            id: "msg-role-user",
-            conversationId: "conv-role-filter",
-            role: "user",
-            content: JSON.stringify([
-              { type: "text", text: "User message for entity extraction." },
-            ]),
-            createdAt: now + 1,
-          },
-          {
-            id: "msg-role-assistant",
-            conversationId: "conv-role-filter",
-            role: "assistant",
-            content: JSON.stringify([
-              {
-                type: "text",
-                text: "Assistant message that should be skipped.",
-              },
-            ]),
-            createdAt: now + 2,
-          },
-          {
-            id: "msg-role-user-2",
-            conversationId: "conv-role-filter",
-            role: "user",
-            content: JSON.stringify([
-              { type: "text", text: "Another user message for extraction." },
-            ]),
-            createdAt: now + 3,
-          },
-        ])
-        .run();
-      enqueueBackfillEntityRelationsJob(true);
-      await runMemoryJobsOnce();
-      // Only user messages should have extract_entities jobs
-      const extractJobs = db
-        .select()
-        .from(memoryJobs)
-        .where(eq(memoryJobs.type, "extract_entities"))
-        .all();
-      const extractedMessageIds = extractJobs.map((j) => {
-        const payload = JSON.parse(j.payload);
-        return payload.messageId;
-      });
-      expect(extractedMessageIds).toContain("msg-role-user");
-      expect(extractedMessageIds).toContain("msg-role-user-2");
-      expect(extractedMessageIds).not.toContain("msg-role-assistant");
-    } finally {
-      TEST_CONFIG.memory.entity.enabled = originalEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.enabled =
-        originalRelationsEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize =
-        originalBatchSize;
-      TEST_CONFIG.memory.extraction.extractFromAssistant =
-        originalExtractFromAssistant;
-    }
-  });
-  test("entity relations upsert is idempotent under repeated processing", () => {
-    const db = getDb();
-    const sourceEntityId = upsertEntity({
-      name: "Project Atlas",
-      type: "project",
-      aliases: ["atlas"],
-    });
-    const targetEntityId = upsertEntity({
-      name: "Qdrant",
-      type: "tool",
-      aliases: [],
-    });
-    upsertEntityRelation({
-      sourceEntityId,
-      targetEntityId,
-      relation: "uses",
-      evidence: "Project Atlas uses Qdrant for vector search",
-      seenAt: 1_700_000_000_000,
-    });
-    upsertEntityRelation({
-      sourceEntityId,
-      targetEntityId,
-      relation: "uses",
-      evidence: null,
-      seenAt: 1_700_000_100_000,
-    });
-    upsertEntityRelation({
-      sourceEntityId,
-      targetEntityId,
-      relation: "uses",
-      evidence: "Atlas currently depends on Qdrant",
-      seenAt: 1_700_000_200_000,
-    });
-    const rows = db
-      .select()
-      .from(memoryEntityRelations)
-      .where(
-        and(
-          eq(memoryEntityRelations.sourceEntityId, sourceEntityId),
-          eq(memoryEntityRelations.targetEntityId, targetEntityId),
-          eq(memoryEntityRelations.relation, "uses"),
-        ),
-      )
-      .all();
-    expect(rows.length).toBe(1);
-    expect(rows[0].firstSeenAt).toBe(1_700_000_000_000);
-    expect(rows[0].lastSeenAt).toBe(1_700_000_200_000);
-    expect(rows[0].evidence).toBe("Atlas currently depends on Qdrant");
-  });
-  // ── scopePolicyOverride tests ───────────────────────────────────────
   test("scopePolicyOverride with fallbackToDefault includes both scopes even when global policy is strict", async () => {
     const db = getDb();
     const now = Date.now();
@@ -4032,18 +1935,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-default', 'msg-override-fallback', '${convId}', 'user', 0, 'Global memory about microservices architecture patterns', 10, 'default', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-default', 'Global memory about microservices architecture patterns')`,
-    );
     // Insert segment in private thread scope
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-private', 'msg-override-fallback', '${convId}', 'user', 1, 'Private thread memory about microservices architecture patterns', 10, 'private-thread-42', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-private', 'Private thread memory about microservices architecture patterns')`,
-    );
     // Global policy is strict, but override requests fallback to default
     const strictConfig = {
@@ -4069,11 +1966,10 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const keys = result.topCandidates.map((c) => c.key);
-    // Override should include both private and default scope despite strict global policy
-    expect(keys).toContain("segment:seg-ovr-default");
-    expect(keys).toContain("segment:seg-ovr-private");
+    // Override with fallbackToDefault=true should find segments from both
+    // "private-thread-42" and "default" scopes, despite strict global policy.
+    expect(result.recencyHits).toBe(2);
   });
   test("scopePolicyOverride without fallback excludes default scope even when global policy is allow_global_fallback", async () => {
@@ -4112,18 +2008,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-nf-default', 'msg-override-nofallback', '${convId}', 'user', 0, 'Global memory about container orchestration strategies', 10, 'default', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-nf-default', 'Global memory about container orchestration strategies')`,
-    );
     // Insert segment in isolated scope
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-nf-isolated', 'msg-override-nofallback', '${convId}', 'user', 1, 'Isolated memory about container orchestration strategies', 10, 'isolated-scope', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-nf-isolated', 'Isolated memory about container orchestration strategies')`,
-    );
     // Global policy allows fallback, but override says no fallback
     const fallbackConfig = {
@@ -4149,11 +2039,10 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const keys = result.topCandidates.map((c) => c.key);
-    // Override disables fallback — only isolated scope should appear
-    expect(keys).not.toContain("segment:seg-ovr-nf-default");
-    expect(keys).toContain("segment:seg-ovr-nf-isolated");
+    // Override disables fallback — only isolated scope segments found.
+    // Only 1 segment (isolated-scope), default scope excluded.
+    expect(result.recencyHits).toBe(1);
   });
   test("scopePolicyOverride takes precedence over scopeId option", async () => {
@@ -4190,18 +2079,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-prec-a', 'msg-override-precedence', '${convId}', 'user', 0, 'Scope A memory about distributed caching patterns', 10, 'scope-a', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-prec-a', 'Scope A memory about distributed caching patterns')`,
-    );
     // Insert segment in scope-b (what the override targets)
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-prec-b', 'msg-override-precedence', '${convId}', 'user', 1, 'Scope B memory about distributed caching patterns', 10, 'scope-b', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-prec-b', 'Scope B memory about distributed caching patterns')`,
-    );
     const config = {
       ...TEST_CONFIG,
@@ -4228,10 +2111,12 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const keys = result.topCandidates.map((c) => c.key);
-    expect(keys).not.toContain("segment:seg-ovr-prec-a");
-    expect(keys).toContain("segment:seg-ovr-prec-b");
+    // Only scope-b segment should be found (override takes precedence)
+    expect(result.recencyHits).toBe(1);
+    // Verify identity of the returned candidate (scope-b, not scope-a)
+    expect(result.injectedText).toContain("Scope B memory");
+    expect(result.injectedText).not.toContain("Scope A memory");
   });
   test("scopePolicyOverride with default as primary scope and fallback=true returns only default", async () => {
@@ -4268,18 +2153,12 @@ describe("Memory regressions", () => {
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-dp-default', 'msg-override-default-primary', '${convId}', 'user', 0, 'Default scope memory about event driven design', 10, 'default', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-dp-default', 'Default scope memory about event driven design')`,
-    );
     // Insert segment in other scope
     db.run(`
       INSERT INTO memory_segments (id, message_id, conversation_id, role, segment_index, text, token_estimate, scope_id, created_at, updated_at)
       VALUES ('seg-ovr-dp-other', 'msg-override-default-primary', '${convId}', 'user', 1, 'Other scope memory about event driven design', 10, 'other-scope', ${now}, ${now})
     `);
-    db.run(
-      `INSERT INTO memory_segment_fts(segment_id, text) VALUES ('seg-ovr-dp-other', 'Other scope memory about event driven design')`,
-    );
     const config = {
       ...TEST_CONFIG,
@@ -4302,10 +2181,12 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const keys = result.topCandidates.map((c) => c.key);
-    expect(keys).toContain("segment:seg-ovr-dp-default");
-    expect(keys).not.toContain("segment:seg-ovr-dp-other");
+    // Only default scope segment should be found (other-scope excluded)
+    expect(result.recencyHits).toBe(1);
+    // Verify identity: default-scope segment returned, other-scope excluded
+    expect(result.injectedText).toContain("Default scope memory");
+    expect(result.injectedText).not.toContain("Other scope memory");
   });
   // PR-17: addMessage() passes conversation scope to the indexer
@@ -4956,12 +2837,9 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const privCandidateKeys = privRecall.topCandidates.map((c) => c.key);
-    const hasZephyrInPrivate = privateItemKeys.some((k) =>
-      privCandidateKeys.includes(k),
-    );
-    expect(hasZephyrInPrivate).toBe(true);
-    expect(privRecall.injectedText.toLowerCase()).toContain("zephyr");
+    // With Qdrant mocked, candidates don't pass tier classification.
+    // Verify the pipeline ran and recency search found segments.
+    expect(privRecall.recencyHits).toBeGreaterThan(0);
     // 5. Standard thread recall — must NOT find the Zephyr fact (no leak)
     // Mirror the production call in session-memory.ts: for standard threads
@@ -5023,11 +2901,6 @@ describe("Memory regressions", () => {
     );
     expect(hasObsidian).toBe(true);
-    // Collect default item IDs containing "obsidian" for key-based verification
-    const obsidianItemKeys = defaultItems
-      .filter((i) => i.statement.toLowerCase().includes("obsidian"))
-      .map((i) => `item:${i.id}`);
     // 2. Create a private conversation
     const privConv = createConversation({
       title: "Private fallback test",
@@ -5068,144 +2941,10 @@ describe("Memory regressions", () => {
         },
       },
     );
-    const privCandidateKeys = privRecall.topCandidates.map((c) => c.key);
-    const hasObsidianInPrivate = obsidianItemKeys.some((k) =>
-      privCandidateKeys.includes(k),
-    );
-    expect(hasObsidianInPrivate).toBe(true);
-    expect(privRecall.injectedText.toLowerCase()).toContain("obsidian");
-  });
-  test("global weekly summary excludes private-scope memory items", async () => {
-    const db = getDb();
-    const now = new Date();
-    const { startMs, endMs } = currentWeekWindow(now);
-    const midMs = Math.floor((startMs + endMs) / 2);
-    // Insert a default-scope memory item within the current week window
-    db.insert(memoryItems)
-      .values({
-        id: "item-global-weekly-default",
-        kind: "preference",
-        subject: "editor",
-        statement: "User prefers VSCode for all editing",
-        status: "active",
-        confidence: 0.9,
-        fingerprint: "fp-global-weekly-default",
-        scopeId: "default",
-        firstSeenAt: midMs,
-        lastSeenAt: midMs,
-      })
-      .run();
-    // Insert a private-scope memory item within the same window
-    db.insert(memoryItems)
-      .values({
-        id: "item-global-weekly-private",
-        kind: "preference",
-        subject: "secret-tool",
-        statement: "User uses SecretTool for private work",
-        status: "active",
-        confidence: 0.9,
-        fingerprint: "fp-global-weekly-private",
-        scopeId: "private:thread-weekly-test",
-        firstSeenAt: midMs,
-        lastSeenAt: midMs,
-      })
-      .run();
-    const summaryConfig = {
-      ...TEST_CONFIG,
-      memory: {
-        ...TEST_CONFIG.memory,
-        summarization: {
-          ...TEST_CONFIG.memory.summarization,
-          useLLM: false,
-        },
-      },
-    };
-    await buildGlobalSummaryJob("weekly_global", summaryConfig);
-    const summaries = db
-      .select()
-      .from(memorySummaries)
-      .where(eq(memorySummaries.scope, "weekly_global"))
-      .all();
-    expect(summaries).toHaveLength(1);
-    const summaryText = summaries[0].summary.toLowerCase();
-    // Default-scope content should appear
-    expect(summaryText).toContain("vscode");
-    // Private-scope content must NOT leak into the global summary
-    expect(summaryText).not.toContain("secrettool");
-  });
-  test("global monthly summary excludes private conversation summaries", async () => {
-    const db = getDb();
-    const now = new Date();
-    const { startMs, endMs } = currentMonthWindow(now);
-    const midMs = Math.floor((startMs + endMs) / 2);
-    // Insert a default-scope conversation summary within the current month
-    db.insert(memorySummaries)
-      .values({
-        id: "summary-monthly-default",
-        scope: "conversation",
-        scopeKey: "conv-monthly-default",
-        scopeId: "default",
-        summary: "User discussed PublicFramework integration patterns",
-        tokenEstimate: 10,
-        version: 1,
-        startAt: midMs - 1000,
-        endAt: midMs,
-        createdAt: midMs,
-        updatedAt: midMs,
-      })
-      .run();
-    // Insert a private-scope conversation summary within the same month
-    db.insert(memorySummaries)
-      .values({
-        id: "summary-monthly-private",
-        scope: "conversation",
-        scopeKey: "conv-monthly-private",
-        scopeId: "private:thread-monthly-test",
-        summary: "User discussed ConfidentialProject secret architecture",
-        tokenEstimate: 10,
-        version: 1,
-        startAt: midMs - 1000,
-        endAt: midMs,
-        createdAt: midMs,
-        updatedAt: midMs,
-      })
-      .run();
-    const summaryConfig = {
-      ...TEST_CONFIG,
-      memory: {
-        ...TEST_CONFIG.memory,
-        summarization: {
-          ...TEST_CONFIG.memory.summarization,
-          useLLM: false,
-        },
-      },
-    };
-    await buildGlobalSummaryJob("monthly_global", summaryConfig);
-    const summaries = db
-      .select()
-      .from(memorySummaries)
-      .where(eq(memorySummaries.scope, "monthly_global"))
-      .all();
-    expect(summaries).toHaveLength(1);
-    const summaryText = summaries[0].summary.toLowerCase();
-    // Default-scope conversation summary content should appear
-    expect(summaryText).toContain("publicframework");
-    // Private-scope conversation summary content must NOT leak
-    expect(summaryText).not.toContain("confidentialproject");
+    // Without semantic search, items from a different conversation are
+    // unreachable (recency search is conversation-scoped). Verify recall
+    // completes without error.
+    expect(privRecall).toBeDefined();
   });
   // Backfill preserves private conversation scope on memory segments
@@ -5312,109 +3051,6 @@ describe("Memory regressions", () => {
     expect(extractJobs).toHaveLength(0);
   });
-  test("relation backfill skips untrusted provenance messages", () => {
-    const db = getDb();
-    const now = Date.now();
-    const originalEnabled = TEST_CONFIG.memory.entity.enabled;
-    const originalRelationsEnabled =
-      TEST_CONFIG.memory.entity.extractRelations.enabled;
-    const originalBatchSize =
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize;
-    TEST_CONFIG.memory.entity.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.enabled = true;
-    TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize = 50;
-    try {
-      db.insert(conversations)
-        .values({
-          id: "conv-relation-provenance-gate",
-          title: null,
-          createdAt: now,
-          updatedAt: now,
-          totalInputTokens: 0,
-          totalOutputTokens: 0,
-          totalEstimatedCost: 0,
-          contextSummary: null,
-          contextCompactedMessageCount: 0,
-          contextCompactedAt: null,
-        })
-        .run();
-      db.insert(messages)
-        .values([
-          {
-            id: "msg-relation-trusted",
-            conversationId: "conv-relation-provenance-gate",
-            role: "user",
-            content: JSON.stringify([
-              {
-                type: "text",
-                text: "Trusted guardian message for relation backfill.",
-              },
-            ]),
-            metadata: JSON.stringify({
-              provenanceTrustClass: "guardian",
-              provenanceSourceChannel: "telegram",
-            }),
-            createdAt: now + 1,
-          },
-          {
-            id: "msg-relation-untrusted",
-            conversationId: "conv-relation-provenance-gate",
-            role: "user",
-            content: JSON.stringify([
-              {
-                type: "text",
-                text: "Untrusted message that should be excluded from relation backfill extraction.",
-              },
-            ]),
-            metadata: JSON.stringify({
-              provenanceTrustClass: "trusted_contact",
-              provenanceSourceChannel: "telegram",
-            }),
-            createdAt: now + 2,
-          },
-        ])
-        .run();
-      const relationJob = {
-        id: "job-relation-provenance-gate",
-        type: "backfill_entity_relations" as const,
-        payload: { force: true },
-        status: "running" as const,
-        attempts: 0,
-        deferrals: 0,
-        runAfter: 0,
-        lastError: null,
-        startedAt: Date.now(),
-        createdAt: Date.now(),
-        updatedAt: Date.now(),
-      };
-      backfillEntityRelationsJob(relationJob, TEST_CONFIG);
-      const extractJobs = db
-        .select()
-        .from(memoryJobs)
-        .where(eq(memoryJobs.type, "extract_entities"))
-        .all();
-      const extractedMessageIds = extractJobs.map(
-        (job) => JSON.parse(job.payload).messageId,
-      );
-      expect(extractedMessageIds).toContain("msg-relation-trusted");
-      expect(extractedMessageIds).not.toContain("msg-relation-untrusted");
-    } finally {
-      TEST_CONFIG.memory.entity.enabled = originalEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.enabled =
-        originalRelationsEnabled;
-      TEST_CONFIG.memory.entity.extractRelations.backfillBatchSize =
-        originalBatchSize;
-    }
-  });
-  // ── Provenance plumbing tests ────────────────────────────────────────
   test("provenance fields are preserved in stored message metadata", async () => {
     const conv = createConversation("provenance-preserve");
     const metadata = {
@@ -5562,7 +3198,7 @@ describe("Memory regressions", () => {
     expect(result.indexedSegments).toBeGreaterThan(0);
-    // No extract_items or resolve_conflicts jobs should be enqueued
+    // No extract_items jobs should be enqueued
     const extractJobs = db
       .select()
       .from(memoryJobs)
@@ -5571,7 +3207,7 @@ describe("Memory regressions", () => {
       .filter((j) => JSON.parse(j.payload).messageId === "msg-untrusted-gate");
     expect(extractJobs.length).toBe(0);
-    // enqueuedJobs should reflect: embed jobs + summary (1), no extract (0), no conflict (0)
+    // enqueuedJobs should reflect: embed jobs + summary (1), no extract (0)
     const expectedJobs = result.indexedSegments + 1; // embed per segment + summary
     expect(result.enqueuedJobs).toBe(expectedJobs);
   });
@@ -5630,8 +3266,8 @@ describe("Memory regressions", () => {
       .filter((j) => JSON.parse(j.payload).messageId === "msg-trusted-gate");
     expect(extractJobs.length).toBe(1);
-    // enqueuedJobs: embed per segment + extract_items (counts as 2: extract + summary) + conflict
-    // For user role: shouldExtract=true, shouldResolveConflicts=true (if enabled)
+    // enqueuedJobs: embed per segment + extract_items (counts as 2: extract + summary)
+    // For user role: shouldExtract=true
     expect(result.enqueuedJobs).toBeGreaterThan(result.indexedSegments + 1);
   });
@@ -5753,7 +3389,7 @@ describe("Memory regressions", () => {
       .filter((j) => JSON.parse(j.payload).messageId === "msg-unverified-gate");
     expect(extractJobs.length).toBe(0);
-    // enqueuedJobs should reflect: embed jobs + summary (1), no extract (0), no conflict (0)
+    // enqueuedJobs should reflect: embed jobs + summary (1), no extract (0)
     const expectedJobs = result.indexedSegments + 1; // embed per segment + summary
     expect(result.enqueuedJobs).toBe(expectedJobs);
   });