npm - @vellumai/assistant - Versions diffs - 0.4.49 → 0.4.50 - Mend

@vellumai/assistant 0.4.49 → 0.4.50

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (239)

package/ARCHITECTURE.md +24 -33
package/README.md +3 -3
package/docs/architecture/memory.md +180 -119
package/package.json +2 -2
package/src/__tests__/agent-loop.test.ts +3 -1
package/src/__tests__/anthropic-provider.test.ts +114 -23
package/src/__tests__/approval-cascade.test.ts +1 -15
package/src/__tests__/approval-routes-http.test.ts +2 -0
package/src/__tests__/assistant-feature-flag-guard.test.ts +0 -23
package/src/__tests__/canonical-guardian-store.test.ts +95 -0
package/src/__tests__/checker.test.ts +13 -0
package/src/__tests__/config-schema.test.ts +1 -68
package/src/__tests__/context-memory-e2e.test.ts +11 -100
package/src/__tests__/conversation-routes-guardian-reply.test.ts +8 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +1 -0
package/src/__tests__/credential-security-e2e.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +4 -0
package/src/__tests__/credential-vault.test.ts +13 -1
package/src/__tests__/cu-unified-flow.test.ts +532 -0
package/src/__tests__/date-context.test.ts +93 -77
package/src/__tests__/deterministic-verification-control-plane.test.ts +64 -0
package/src/__tests__/guardian-routing-invariants.test.ts +93 -0
package/src/__tests__/history-repair.test.ts +245 -0
package/src/__tests__/host-cu-proxy.test.ts +165 -3
package/src/__tests__/http-user-message-parity.test.ts +1 -0
package/src/__tests__/invite-redemption-service.test.ts +65 -1
package/src/__tests__/keychain-broker-client.test.ts +4 -4
package/src/__tests__/memory-context-benchmark.benchmark.test.ts +56 -18
package/src/__tests__/memory-lifecycle-e2e.test.ts +244 -387
package/src/__tests__/memory-recall-quality.test.ts +244 -407
package/src/__tests__/memory-regressions.experimental.test.ts +126 -101
package/src/__tests__/memory-regressions.test.ts +477 -2841
package/src/__tests__/memory-retrieval.benchmark.test.ts +33 -150
package/src/__tests__/memory-upsert-concurrency.test.ts +5 -244
package/src/__tests__/mime-builder.test.ts +28 -0
package/src/__tests__/native-web-search.test.ts +1 -0
package/src/__tests__/oauth-cli.test.ts +572 -5
package/src/__tests__/oauth-store.test.ts +120 -6
package/src/__tests__/qdrant-collection-migration.test.ts +53 -8
package/src/__tests__/registry.test.ts +0 -1
package/src/__tests__/relay-server.test.ts +46 -1
package/src/__tests__/schedule-tools.test.ts +32 -0
package/src/__tests__/script-proxy-certs.test.ts +1 -1
package/src/__tests__/secret-onetime-send.test.ts +1 -0
package/src/__tests__/secure-keys.test.ts +7 -2
package/src/__tests__/send-endpoint-busy.test.ts +3 -0
package/src/__tests__/session-abort-tool-results.test.ts +1 -14
package/src/__tests__/session-agent-loop-overflow.test.ts +1583 -0
package/src/__tests__/session-agent-loop.test.ts +19 -15
package/src/__tests__/session-confirmation-signals.test.ts +1 -15
package/src/__tests__/session-error.test.ts +124 -2
package/src/__tests__/session-history-web-search.test.ts +918 -0
package/src/__tests__/session-pre-run-repair.test.ts +1 -14
package/src/__tests__/session-provider-retry-repair.test.ts +25 -28
package/src/__tests__/session-queue.test.ts +37 -27
package/src/__tests__/session-runtime-assembly.test.ts +54 -0
package/src/__tests__/session-slash-known.test.ts +1 -15
package/src/__tests__/session-slash-queue.test.ts +1 -15
package/src/__tests__/session-slash-unknown.test.ts +1 -15
package/src/__tests__/session-workspace-cache-state.test.ts +3 -33
package/src/__tests__/session-workspace-injection.test.ts +3 -37
package/src/__tests__/session-workspace-tool-tracking.test.ts +3 -37
package/src/__tests__/skills-install-extract.test.ts +93 -0
package/src/__tests__/skillssh-registry.test.ts +451 -0
package/src/__tests__/trust-store.test.ts +15 -0
package/src/__tests__/voice-invite-redemption.test.ts +32 -1
package/src/agent/ax-tree-compaction.test.ts +51 -0
package/src/agent/loop.ts +39 -12
package/src/approvals/AGENTS.md +1 -1
package/src/approvals/guardian-request-resolvers.ts +14 -2
package/src/bundler/compiler-tools.ts +66 -2
package/src/calls/call-domain.ts +132 -0
package/src/calls/call-store.ts +6 -0
package/src/calls/relay-server.ts +43 -5
package/src/calls/relay-setup-router.ts +17 -1
package/src/calls/twilio-config.ts +1 -1
package/src/calls/types.ts +3 -1
package/src/cli/commands/doctor.ts +4 -3
package/src/cli/commands/mcp.ts +46 -59
package/src/cli/commands/memory.ts +16 -165
package/src/cli/commands/oauth/apps.ts +31 -2
package/src/cli/commands/oauth/connections.ts +431 -97
package/src/cli/commands/oauth/providers.ts +15 -1
package/src/cli/commands/sessions.ts +5 -2
package/src/cli/commands/skills.ts +173 -1
package/src/cli/http-client.ts +0 -20
package/src/cli/main-screen.tsx +2 -2
package/src/cli/program.ts +5 -6
package/src/cli.ts +4 -10
package/src/config/bundled-skills/computer-use/TOOLS.json +1 -1
package/src/config/bundled-skills/computer-use/tools/computer-use-observe.ts +12 -0
package/src/config/bundled-tool-registry.ts +2 -5
package/src/config/schema.ts +1 -12
package/src/config/schemas/memory-lifecycle.ts +0 -9
package/src/config/schemas/memory-processing.ts +0 -180
package/src/config/schemas/memory-retrieval.ts +32 -104
package/src/config/schemas/memory.ts +0 -10
package/src/config/types.ts +0 -4
package/src/context/window-manager.ts +4 -1
package/src/daemon/config-watcher.ts +61 -3
package/src/daemon/daemon-control.ts +1 -1
package/src/daemon/date-context.ts +114 -31
package/src/daemon/handlers/sessions.ts +18 -13
package/src/daemon/handlers/skills.ts +20 -1
package/src/daemon/history-repair.ts +72 -8
package/src/daemon/host-cu-proxy.ts +55 -26
package/src/daemon/lifecycle.ts +31 -3
package/src/daemon/mcp-reload-service.ts +2 -2
package/src/daemon/message-types/computer-use.ts +1 -12
package/src/daemon/message-types/memory.ts +4 -16
package/src/daemon/message-types/messages.ts +1 -0
package/src/daemon/message-types/sessions.ts +4 -0
package/src/daemon/server.ts +12 -1
package/src/daemon/session-agent-loop-handlers.ts +38 -0
package/src/daemon/session-agent-loop.ts +334 -48
package/src/daemon/session-error.ts +89 -6
package/src/daemon/session-history.ts +17 -7
package/src/daemon/session-media-retry.ts +6 -2
package/src/daemon/session-memory.ts +69 -149
package/src/daemon/session-process.ts +10 -1
package/src/daemon/session-runtime-assembly.ts +49 -19
package/src/daemon/session-surfaces.ts +4 -1
package/src/daemon/session-tool-setup.ts +7 -1
package/src/daemon/session.ts +12 -2
package/src/instrument.ts +61 -1
package/src/memory/admin.ts +2 -191
package/src/memory/canonical-guardian-store.ts +38 -2
package/src/memory/conversation-crud.ts +0 -33
package/src/memory/conversation-queries.ts +22 -3
package/src/memory/db-init.ts +28 -0
package/src/memory/embedding-backend.ts +84 -8
package/src/memory/embedding-types.ts +9 -1
package/src/memory/indexer.ts +7 -46
package/src/memory/items-extractor.ts +274 -76
package/src/memory/job-handlers/backfill.ts +2 -127
package/src/memory/job-handlers/cleanup.ts +2 -16
package/src/memory/job-handlers/extraction.ts +2 -138
package/src/memory/job-handlers/index-maintenance.ts +1 -6
package/src/memory/job-handlers/summarization.ts +3 -148
package/src/memory/job-utils.ts +21 -59
package/src/memory/jobs-store.ts +1 -159
package/src/memory/jobs-worker.ts +9 -52
package/src/memory/migrations/104-core-indexes.ts +3 -3
package/src/memory/migrations/149-oauth-tables.ts +2 -0
package/src/memory/migrations/150-oauth-apps-client-secret-path.ts +98 -0
package/src/memory/migrations/151-oauth-providers-ping-url.ts +11 -0
package/src/memory/migrations/152-memory-item-supersession.ts +44 -0
package/src/memory/migrations/153-drop-entity-tables.ts +15 -0
package/src/memory/migrations/154-drop-fts.ts +20 -0
package/src/memory/migrations/155-drop-conflicts.ts +7 -0
package/src/memory/migrations/156-call-session-invite-metadata.ts +24 -0
package/src/memory/migrations/index.ts +7 -0
package/src/memory/qdrant-client.ts +148 -51
package/src/memory/raw-query.ts +1 -1
package/src/memory/retriever.test.ts +294 -273
package/src/memory/retriever.ts +421 -645
package/src/memory/schema/calls.ts +2 -0
package/src/memory/schema/memory-core.ts +3 -48
package/src/memory/schema/oauth.ts +2 -0
package/src/memory/search/formatting.ts +263 -176
package/src/memory/search/lexical.ts +1 -254
package/src/memory/search/ranking.ts +0 -455
package/src/memory/search/semantic.ts +100 -14
package/src/memory/search/staleness.ts +47 -0
package/src/memory/search/tier-classifier.ts +21 -0
package/src/memory/search/types.ts +15 -77
package/src/memory/task-memory-cleanup.ts +4 -6
package/src/messaging/providers/gmail/mime-builder.ts +17 -7
package/src/oauth/byo-connection.test.ts +8 -1
package/src/oauth/oauth-store.ts +113 -27
package/src/oauth/seed-providers.ts +6 -0
package/src/oauth/token-persistence.ts +11 -3
package/src/permissions/defaults.ts +1 -0
package/src/permissions/trust-store.ts +23 -1
package/src/playbooks/playbook-compiler.ts +1 -1
package/src/prompts/system-prompt.ts +18 -2
package/src/providers/anthropic/client.ts +56 -126
package/src/providers/types.ts +7 -1
package/src/runtime/AGENTS.md +9 -0
package/src/runtime/auth/route-policy.ts +6 -3
package/src/runtime/guardian-reply-router.ts +24 -22
package/src/runtime/http-server.ts +2 -2
package/src/runtime/invite-redemption-service.ts +19 -1
package/src/runtime/invite-service.ts +25 -0
package/src/runtime/pending-interactions.ts +2 -2
package/src/runtime/routes/brain-graph-routes.ts +10 -90
package/src/runtime/routes/conversation-routes.ts +9 -1
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +21 -12
package/src/runtime/routes/memory-item-routes.test.ts +754 -0
package/src/runtime/routes/memory-item-routes.ts +503 -0
package/src/runtime/routes/session-management-routes.ts +3 -3
package/src/runtime/routes/settings-routes.ts +2 -2
package/src/runtime/routes/trust-rules-routes.ts +14 -0
package/src/runtime/routes/workspace-routes.ts +2 -1
package/src/security/keychain-broker-client.ts +17 -4
package/src/security/secure-keys.ts +25 -3
package/src/security/token-manager.ts +36 -36
package/src/skills/catalog-install.ts +74 -18
package/src/skills/skillssh-registry.ts +503 -0
package/src/tools/assets/search.ts +5 -1
package/src/tools/computer-use/definitions.ts +0 -10
package/src/tools/computer-use/registry.ts +1 -1
package/src/tools/credentials/vault.ts +1 -3
package/src/tools/memory/definitions.ts +4 -13
package/src/tools/memory/handlers.test.ts +83 -103
package/src/tools/memory/handlers.ts +50 -85
package/src/tools/schedule/create.ts +8 -1
package/src/tools/schedule/update.ts +8 -1
package/src/tools/skills/load.ts +25 -2
package/src/__tests__/clarification-resolver.test.ts +0 -193
package/src/__tests__/conflict-intent-tokenization.test.ts +0 -160
package/src/__tests__/conflict-policy.test.ts +0 -269
package/src/__tests__/conflict-store.test.ts +0 -372
package/src/__tests__/contradiction-checker.test.ts +0 -361
package/src/__tests__/entity-extractor.test.ts +0 -211
package/src/__tests__/entity-search.test.ts +0 -1117
package/src/__tests__/profile-compiler.test.ts +0 -392
package/src/__tests__/session-conflict-gate.test.ts +0 -1228
package/src/__tests__/session-profile-injection.test.ts +0 -557
package/src/config/bundled-skills/knowledge-graph/SKILL.md +0 -25
package/src/config/bundled-skills/knowledge-graph/TOOLS.json +0 -66
package/src/config/bundled-skills/knowledge-graph/tools/graph-query.ts +0 -211
package/src/daemon/session-conflict-gate.ts +0 -167
package/src/daemon/session-dynamic-profile.ts +0 -77
package/src/memory/clarification-resolver.ts +0 -417
package/src/memory/conflict-intent.ts +0 -205
package/src/memory/conflict-policy.ts +0 -127
package/src/memory/conflict-store.ts +0 -410
package/src/memory/contradiction-checker.ts +0 -508
package/src/memory/entity-extractor.ts +0 -535
package/src/memory/format-recall.ts +0 -47
package/src/memory/fts-reconciler.ts +0 -165
package/src/memory/job-handlers/conflict.ts +0 -200
package/src/memory/profile-compiler.ts +0 -195
package/src/memory/recall-cache.ts +0 -117
package/src/memory/search/entity.ts +0 -535
package/src/memory/search/query-expansion.test.ts +0 -70
package/src/memory/search/query-expansion.ts +0 -118
package/src/runtime/routes/mcp-routes.ts +0 -20

package/src/__tests__/memory-retrieval.benchmark.test.ts CHANGED Viewed

@@ -4,6 +4,13 @@
  * Measures end-to-end memory recall time with varying database sizes.
  * Validates latency stays within acceptable bounds and token budget
  * enforcement works correctly.
+ *
+ * The new pipeline uses hybrid search (Qdrant) + recency search.
+ * With Qdrant mocked and semanticSearch returning empty, only recency
+ * search provides candidates. These recency-only candidates have
+ * low finalScore (< 0.6) and are filtered out by tier classification,
+ * so injectedText is empty. The tests verify pipeline completion,
+ * latency bounds, and correct handling of recency hits.
  */
 import { mkdtempSync, rmSync } from "node:fs";
 import { tmpdir } from "node:os";
@@ -38,8 +45,7 @@ mock.module("../util/logger.js", () => ({
     }),
 }));
-// Counter for semantic search invocations — used to verify early termination
-// skips the call entirely rather than relying on flaky wall-clock comparisons.
+// Counter for semantic search invocations
 let semanticSearchCallCount = 0;
 mock.module("../memory/search/semantic.js", () => ({
@@ -63,6 +69,8 @@ mock.module("../memory/embedding-backend.js", () => ({
     model: "mock-embedding",
     vectors: [new Array(1536).fill(0)],
   }),
+  generateSparseEmbedding: () => ({ indices: [], values: [] }),
+  logMemoryEmbeddingWarning: () => {},
 }));
 import { DEFAULT_CONFIG } from "../config/defaults.js";
@@ -135,13 +143,7 @@ function makeConfig(overrides?: { maxInjectTokens?: number }): AssistantConfig {
       },
       retrieval: {
         ...DEFAULT_CONFIG.memory.retrieval,
-        lexicalTopK: 50,
-        semanticTopK: 20,
         maxInjectTokens: overrides?.maxInjectTokens ?? 750,
-        reranking: {
-          ...DEFAULT_CONFIG.memory.retrieval.reranking,
-          enabled: false,
-        },
         dynamicBudget: {
           enabled: false,
           minInjectTokens: 160,
@@ -161,13 +163,9 @@ describe("Memory retrieval benchmark", () => {
   beforeEach(() => {
     const db = getDb();
     db.run("DELETE FROM memory_item_sources");
-    db.run("DELETE FROM memory_item_entities");
-    db.run("DELETE FROM memory_entity_relations");
-    db.run("DELETE FROM memory_entities");
     db.run("DELETE FROM memory_embeddings");
-    db.run("DELETE FROM memory_summaries");
     db.run("DELETE FROM memory_items");
-    db.run("DELETE FROM memory_segment_fts");
     db.run("DELETE FROM memory_segments");
     db.run("DELETE FROM messages");
     db.run("DELETE FROM conversations");
@@ -198,8 +196,8 @@ describe("Memory retrieval benchmark", () => {
     expect(recall.enabled).toBe(true);
     expect(recall.degraded).toBe(false);
-    expect(recall.lexicalHits).toBeGreaterThan(0);
-    expect(recall.selectedCount).toBeGreaterThan(0);
+    // Recency search finds conversation-scoped segments
+    expect(recall.recencyHits).toBeGreaterThan(0);
     // Relaxed threshold — guards against severe regressions, not precise benchmarking
     expect(recall.latencyMs).toBeLessThan(500);
   });
@@ -218,8 +216,7 @@ describe("Memory retrieval benchmark", () => {
     expect(recall.enabled).toBe(true);
     expect(recall.degraded).toBe(false);
-    expect(recall.lexicalHits).toBeGreaterThan(0);
-    expect(recall.selectedCount).toBeGreaterThan(0);
+    expect(recall.recencyHits).toBeGreaterThan(0);
     expect(recall.latencyMs).toBeLessThan(1000);
   });
@@ -237,8 +234,7 @@ describe("Memory retrieval benchmark", () => {
     expect(recall.enabled).toBe(true);
     expect(recall.degraded).toBe(false);
-    expect(recall.lexicalHits).toBeGreaterThan(0);
-    expect(recall.selectedCount).toBeGreaterThan(0);
+    expect(recall.recencyHits).toBeGreaterThan(0);
     expect(recall.latencyMs).toBeLessThan(2000);
   });
@@ -256,10 +252,11 @@ describe("Memory retrieval benchmark", () => {
     );
     expect(recall.enabled).toBe(true);
+    // With Qdrant mocked empty and recency-only candidates below tier threshold,
+    // injectedTokens is 0. Verify the budget cap is still respected.
     expect(recall.injectedTokens).toBeLessThanOrEqual(smallBudget);
-    expect(recall.injectedTokens).toBeGreaterThan(0);
-    // Compare against a larger budget to verify the cap actually constrains
+    // Compare against a larger budget
     const largeBudget = 2000;
     const largeConfig = makeConfig({ maxInjectTokens: largeBudget });
     const largeRecall = await buildMemoryRecall(
@@ -275,137 +272,20 @@ describe("Memory retrieval benchmark", () => {
     );
   });
-  test("early termination reduces latency when applicable", async () => {
-    const conversationId = "conv-bench-et";
-    const now = 1_700_500_000_000;
-    // Seed enough items that early termination can trigger
-    seedMemoryItems(conversationId, 500, now);
-    // Config with early termination enabled and low thresholds to trigger it
-    const etConfig: AssistantConfig = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          provider: "local" as const,
-          required: false,
-        },
-        retrieval: {
-          ...DEFAULT_CONFIG.memory.retrieval,
-          lexicalTopK: 50,
-          semanticTopK: 20,
-          maxInjectTokens: 750,
-          reranking: {
-            ...DEFAULT_CONFIG.memory.retrieval.reranking,
-            enabled: false,
-          },
-          dynamicBudget: {
-            enabled: false,
-            minInjectTokens: 160,
-            maxInjectTokens: 750,
-            targetHeadroomTokens: 900,
-          },
-          earlyTermination: {
-            enabled: true,
-            minCandidates: 5,
-            minHighConfidence: 3,
-            confidenceThreshold: 0.3,
-          },
-        },
-      },
-    };
-    const recall = await buildMemoryRecall(
-      "What do we know about topic-5 and keyword-3?",
-      conversationId,
-      etConfig,
-    );
-    expect(recall.enabled).toBe(true);
-    expect(recall.earlyTerminated).toBe(true);
-    // Semantic search should be skipped when early termination fires
-    expect(recall.semanticHits).toBe(0);
-    expect(recall.selectedCount).toBeGreaterThan(0);
-  });
-  test("early termination skips semantic search entirely", async () => {
-    const conversationId = "conv-bench-et-skip";
+  test("semantic search is invoked when not early terminated", async () => {
+    const conversationId = "conv-bench-semantic";
     const now = 1_700_500_000_000;
-    seedMemoryItems(conversationId, 500, now);
+    seedMemoryItems(conversationId, 100, now);
     const query = "What do we know about topic-5 and keyword-3?";
-    const etConfig: AssistantConfig = {
-      ...DEFAULT_CONFIG,
-      memory: {
-        ...DEFAULT_CONFIG.memory,
-        embeddings: {
-          ...DEFAULT_CONFIG.memory.embeddings,
-          provider: "local" as const,
-          required: false,
-        },
-        retrieval: {
-          ...DEFAULT_CONFIG.memory.retrieval,
-          lexicalTopK: 50,
-          semanticTopK: 20,
-          maxInjectTokens: 750,
-          reranking: {
-            ...DEFAULT_CONFIG.memory.retrieval.reranking,
-            enabled: false,
-          },
-          dynamicBudget: {
-            enabled: false,
-            minInjectTokens: 160,
-            maxInjectTokens: 750,
-            targetHeadroomTokens: 900,
-          },
-          earlyTermination: {
-            enabled: true,
-            minCandidates: 5,
-            minHighConfidence: 3,
-            confidenceThreshold: 0.3,
-          },
-        },
-      },
-    };
-    const noEtConfig: AssistantConfig = {
-      ...etConfig,
-      memory: {
-        ...etConfig.memory,
-        retrieval: {
-          ...etConfig.memory.retrieval,
-          earlyTermination: {
-            enabled: false,
-            minCandidates: 5,
-            minHighConfidence: 3,
-            confidenceThreshold: 0.3,
-          },
-        },
-      },
-    };
-    // Run with ET enabled — semantic search should be skipped
-    semanticSearchCallCount = 0;
-    const etRecall = await buildMemoryRecall(query, conversationId, etConfig);
-    const etCalls = semanticSearchCallCount;
-    expect(etRecall.earlyTerminated).toBe(true);
-    expect(etRecall.semanticHits).toBe(0);
-    expect(etCalls).toBe(0);
-    // Run without ET — semantic search should be invoked
+    // earlyTermination is always false in the new pipeline, so semantic
+    // search should always be invoked when a query vector is available.
     semanticSearchCallCount = 0;
-    const baselineRecall = await buildMemoryRecall(
-      query,
-      conversationId,
-      noEtConfig,
-    );
-    const baselineCalls = semanticSearchCallCount;
+    const config = makeConfig();
+    await buildMemoryRecall(query, conversationId, config);
-    expect(baselineRecall.earlyTerminated).toBe(false);
-    expect(baselineCalls).toBeGreaterThan(0);
+    expect(semanticSearchCallCount).toBeGreaterThan(0);
   });
   test("recall.latencyMs tracks wall-clock within 50% tolerance", async () => {
@@ -427,14 +307,17 @@ describe("Memory retrieval benchmark", () => {
     const wallMs = Date.now() - wallStart;
     expect(recall.enabled).toBe(true);
-    expect(recall.latencyMs).toBeGreaterThan(0);
+    // latencyMs may be 0 when the pipeline runs very fast (< 1ms granularity)
+    expect(recall.latencyMs).toBeGreaterThanOrEqual(0);
     // Self-reported latencyMs should agree with wall-clock within 50%.
     // Tolerance is wide because both sides use Date.now() (integer ms),
     // so on fast runs the quantization error can be large relative to
     // total elapsed time.
-    const ratio = recall.latencyMs / Math.max(wallMs, 1);
-    expect(ratio).toBeGreaterThanOrEqual(0.5);
-    expect(ratio).toBeLessThanOrEqual(1.5);
+    if (wallMs > 0) {
+      const ratio = recall.latencyMs / wallMs;
+      expect(ratio).toBeGreaterThanOrEqual(0.5);
+      expect(ratio).toBeLessThanOrEqual(1.5);
+    }
   });
 });

package/src/__tests__/memory-upsert-concurrency.test.ts CHANGED Viewed

@@ -1,11 +1,10 @@
 /**
  * Atomicity tests for memory UPSERT paths.
  *
- * SQLite is single-writer, and indexMessageNow / createOrUpdatePendingConflict
- * are synchronous functions.  Because every call runs to completion before the
- * next microtask starts, the Promise.all / Promise.resolve().then() pattern
- * used here does NOT create true concurrent execution — calls still run
- * sequentially.
+ * SQLite is single-writer, and indexMessageNow is a synchronous function.
+ * Because every call runs to completion before the next microtask starts, the
+ * Promise.all / Promise.resolve().then() pattern used here does NOT create
+ * true concurrent execution — calls still run sequentially.
  *
  * What these tests DO verify is the correctness of the ON CONFLICT /
  * IMMEDIATE-transaction logic when the same logical operation is repeated many
@@ -47,6 +46,7 @@ mock.module("../util/logger.js", () => ({
 mock.module("../memory/qdrant-client.js", () => ({
   getQdrantClient: () => ({
     searchWithFilter: async () => [],
+    hybridSearch: async () => [],
     upsertPoints: async () => {},
     deletePoints: async () => {},
   }),
@@ -75,10 +75,6 @@ mock.module("../config/loader.js", () => ({
   invalidateConfigCache: () => {},
 }));
-import {
-  createOrUpdatePendingConflict,
-  listPendingConflicts,
-} from "../memory/conflict-store.js";
 import { getDb, initializeDb, resetDb } from "../memory/db.js";
 import { indexMessageNow } from "../memory/indexer.js";
 import {
@@ -102,15 +98,9 @@ afterAll(() => {
 function resetTables() {
   const db = getDb();
-  db.run("DELETE FROM memory_item_conflicts");
-  db.run("DELETE FROM memory_item_entities");
-  db.run("DELETE FROM memory_entity_relations");
-  db.run("DELETE FROM memory_entities");
   db.run("DELETE FROM memory_item_sources");
   db.run("DELETE FROM memory_embeddings");
-  db.run("DELETE FROM memory_summaries");
   db.run("DELETE FROM memory_items");
-  db.run("DELETE FROM memory_segment_fts");
   db.run("DELETE FROM memory_segments");
   db.run("DELETE FROM memory_jobs");
   db.run("DELETE FROM messages");
@@ -151,50 +141,6 @@ function seedConversationAndMessage(
     .run();
 }
-/** Insert a pair of memory items that can serve as conflict participants. */
-function seedItemPair(
-  suffix: string,
-  scopeId = "default",
-): { existingItemId: string; candidateItemId: string } {
-  const db = getDb();
-  const now = Date.now();
-  const existingItemId = `existing-${suffix}`;
-  const candidateItemId = `candidate-${suffix}`;
-  db.insert(memoryItems)
-    .values([
-      {
-        id: existingItemId,
-        kind: "preference",
-        subject: "framework preference",
-        statement: `Existing statement ${suffix}`,
-        status: "active",
-        confidence: 0.8,
-        importance: 0.7,
-        fingerprint: `fp-existing-${suffix}`,
-        verificationState: "assistant_inferred",
-        scopeId,
-        firstSeenAt: now,
-        lastSeenAt: now,
-      },
-      {
-        id: candidateItemId,
-        kind: "preference",
-        subject: "framework preference",
-        statement: `Candidate statement ${suffix}`,
-        status: "pending_clarification",
-        confidence: 0.8,
-        importance: 0.7,
-        fingerprint: `fp-candidate-${suffix}`,
-        verificationState: "assistant_inferred",
-        scopeId,
-        firstSeenAt: now,
-        lastSeenAt: now,
-      },
-    ])
-    .run();
-  return { existingItemId, candidateItemId };
-}
 // ─────────────────────────────────────────────────────────────────────────────
 // Test suite: segment UPSERT atomicity under parallel indexer load
 // ─────────────────────────────────────────────────────────────────────────────
@@ -484,191 +430,6 @@ describe("segment UPSERT atomicity under repeated indexer invocations", () => {
   });
 });
-// ─────────────────────────────────────────────────────────────────────────────
-// Test suite: conflict creation UPSERT atomicity
-// ─────────────────────────────────────────────────────────────────────────────
-describe("conflict creation UPSERT atomicity", () => {
-  beforeEach(() => {
-    resetTables();
-  });
-  test("repeated createOrUpdatePendingConflict calls for the same pair produce exactly one conflict row", async () => {
-    // Critical UPSERT path: the same conflict pair inserted multiple times
-    // (e.g. duplicate worker dispatches, retries).  The IMMEDIATE transaction
-    // guard in createOrUpdatePendingConflict must ensure only one row exists.
-    const pair = seedItemPair("parallel-create");
-    // Call createOrUpdatePendingConflict N times for the same pair.  Calls run
-    // sequentially (synchronous); the test verifies that repeated calls produce
-    // exactly one conflict row — the IMMEDIATE transaction deduplication path.
-    const WORKERS = 10;
-    const results = await Promise.all(
-      Array.from({ length: WORKERS }, (_, i) =>
-        Promise.resolve().then(() =>
-          createOrUpdatePendingConflict({
-            scopeId: "default",
-            existingItemId: pair.existingItemId,
-            candidateItemId: pair.candidateItemId,
-            relationship: "ambiguous_contradiction",
-            clarificationQuestion: `Worker ${i} discovered a contradiction`,
-          }),
-        ),
-      ),
-    );
-    // All callers must receive the same conflict ID — the deduplication path
-    // returns the existing row on the second and subsequent calls.
-    const firstId = results[0].id;
-    for (const result of results) {
-      expect(result.id).toBe(firstId);
-    }
-    // Exactly one pending conflict row in the DB.
-    const pending = listPendingConflicts("default");
-    expect(pending).toHaveLength(1);
-    expect(pending[0].id).toBe(firstId);
-  });
-  test("conflict creation for different pairs produces distinct rows without cross-contamination", async () => {
-    // Each unique item pair must get its own conflict row — deduplication must
-    // be scoped to the pair, not global.  Also exercises the idempotent
-    // insert-then-update path within each pair.
-    const PAIR_COUNT = 6;
-    const pairs = Array.from({ length: PAIR_COUNT }, (_, i) =>
-      seedItemPair(`multi-pair-${i}`),
-    );
-    // For each pair, make two calls: one insert and one update.  All calls run
-    // sequentially.  The test verifies that each pair ends up with exactly one
-    // conflict row (no cross-pair contamination, idempotent update path works).
-    await Promise.all(
-      pairs.flatMap((pair) => [
-        // First call: insert with 'contradiction'.
-        Promise.resolve().then(() =>
-          createOrUpdatePendingConflict({
-            scopeId: "default",
-            existingItemId: pair.existingItemId,
-            candidateItemId: pair.candidateItemId,
-            relationship: "contradiction",
-          }),
-        ),
-        // Second call: update to 'ambiguous_contradiction' — tests the idempotent update path.
-        Promise.resolve().then(() =>
-          createOrUpdatePendingConflict({
-            scopeId: "default",
-            existingItemId: pair.existingItemId,
-            candidateItemId: pair.candidateItemId,
-            relationship: "ambiguous_contradiction",
-          }),
-        ),
-      ]),
-    );
-    // Each pair must have produced exactly one pending conflict.
-    const pending = listPendingConflicts("default");
-    expect(pending).toHaveLength(PAIR_COUNT);
-    // All conflict IDs must be unique.
-    const ids = pending.map((c) => c.id);
-    expect(new Set(ids).size).toBe(PAIR_COUNT);
-    // Each returned conflict must reference the correct item pair.
-    for (let i = 0; i < PAIR_COUNT; i++) {
-      const pair = pairs[i];
-      const found = pending.find(
-        (c) =>
-          c.existingItemId === pair.existingItemId &&
-          c.candidateItemId === pair.candidateItemId,
-      );
-      expect(found).toBeDefined();
-      // The update call ran after the insert, so relationship is ambiguous_contradiction.
-      expect(found!.relationship).toBe("ambiguous_contradiction");
-    }
-  });
-  test("repeated updates to the same conflict row converge to a consistent state", async () => {
-    // Multiple update calls for the same conflict (e.g. repeated worker runs).
-    // All updates must succeed (last writer wins is acceptable) and the row
-    // must remain internally consistent.
-    const pair = seedItemPair("concurrent-update");
-    const first = createOrUpdatePendingConflict({
-      scopeId: "default",
-      existingItemId: pair.existingItemId,
-      candidateItemId: pair.candidateItemId,
-      relationship: "contradiction",
-      clarificationQuestion: "Initial question",
-    });
-    // Call createOrUpdatePendingConflict N times against the same existing row.
-    // Calls are sequential; the test verifies the row stays consistent (one row,
-    // valid status/relationship) after repeated updates — last writer wins.
-    const UPDATES = 8;
-    const results = await Promise.all(
-      Array.from({ length: UPDATES }, (_, i) =>
-        Promise.resolve().then(() =>
-          createOrUpdatePendingConflict({
-            scopeId: "default",
-            existingItemId: pair.existingItemId,
-            candidateItemId: pair.candidateItemId,
-            relationship: "ambiguous_contradiction",
-            clarificationQuestion: `Updated question from worker ${i}`,
-          }),
-        ),
-      ),
-    );
-    // All calls must return the same conflict ID.
-    for (const result of results) {
-      expect(result.id).toBe(first.id);
-    }
-    // Still exactly one row in the DB.
-    const pending = listPendingConflicts("default");
-    expect(pending).toHaveLength(1);
-    // The row must be consistent: valid status, valid relationship.
-    const conflict = pending[0];
-    expect(conflict.status).toBe("pending_clarification");
-    expect(conflict.relationship).toBe("ambiguous_contradiction");
-  });
-  test("scope isolation ensures conflicts in different scopes do not interfere", async () => {
-    // Conflicts created in different scopes must not cross-contaminate each
-    // other's conflict sets — scopeId must be part of the deduplication key.
-    const SCOPES = ["scope-alpha", "scope-beta", "scope-gamma"];
-    const scopePairs = SCOPES.map((scope) => ({
-      scope,
-      pair: seedItemPair(`scope-${scope}`, scope),
-    }));
-    // Make 3 calls per scope for all scopes.  Calls run sequentially; the test
-    // verifies that each scope produces exactly one conflict row and that there
-    // is no cross-scope contamination from repeated same-scope calls.
-    await Promise.all(
-      scopePairs.flatMap(({ scope, pair }) =>
-        Array.from({ length: 3 }, () =>
-          Promise.resolve().then(() =>
-            createOrUpdatePendingConflict({
-              scopeId: scope,
-              existingItemId: pair.existingItemId,
-              candidateItemId: pair.candidateItemId,
-              relationship: "contradiction",
-            }),
-          ),
-        ),
-      ),
-    );
-    for (const scope of SCOPES) {
-      const pending = listPendingConflicts(scope);
-      // Exactly one conflict per scope, no cross-scope leakage.
-      expect(pending).toHaveLength(1);
-      expect(pending[0].scopeId).toBe(scope);
-    }
-  });
-});
 // ─────────────────────────────────────────────────────────────────────────────
 // Test suite: memory segment job atomicity
 // ─────────────────────────────────────────────────────────────────────────────

package/src/__tests__/mime-builder.test.ts CHANGED Viewed

@@ -81,4 +81,32 @@ describe("buildMultipartMime", () => {
     expect(decoded).toContain('filename="b.png"');
     expect(decoded).toContain("Content-Type: image/png");
   });
+  test("sanitizes CRLF from header values to prevent header injection", () => {
+    const result = buildMultipartMime({
+      to: "victim@example.com\r\nBcc: attacker@example.com",
+      subject: "Fwd: Hello\r\nCc: attacker@example.com",
+      body: "Body",
+      cc: "team@example.com\nX-Injected: yes",
+      bcc: "audit@example.com\r\nX-Another: value",
+      inReplyTo: "<id@example.com>\nReferences: <evil@example.com>",
+      attachments: [],
+    });
+    const decoded = Buffer.from(
+      result.replace(/-/g, "+").replace(/_/g, "/"),
+      "base64",
+    ).toString("utf-8");
+    expect(decoded).toContain("To: victim@example.com Bcc: attacker@example.com");
+    expect(decoded).toContain("Subject: Fwd: Hello Cc: attacker@example.com");
+    expect(decoded).toContain("Cc: team@example.com X-Injected: yes");
+    expect(decoded).toContain("Bcc: audit@example.com X-Another: value");
+    expect(decoded).toContain(
+      "In-Reply-To: <id@example.com> References: <evil@example.com>",
+    );
+    expect(decoded).not.toContain("\r\nBcc: attacker@example.com");
+    expect(decoded).not.toContain("\r\nCc: attacker@example.com");
+  });
 });

package/src/__tests__/native-web-search.test.ts CHANGED Viewed

@@ -431,6 +431,7 @@ describe("Native Web Search — Streaming Events", () => {
       type: "server_tool_start",
       name: "web_search",
       toolUseId: "stu_stream123",
+      input: {},
     });
   });