npm - @vellumai/assistant - Versions diffs - 0.5.7 → 0.5.9 - Mend

@vellumai/assistant 0.5.7 → 0.5.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (205) hide show

package/Dockerfile +2 -1
package/docker-entrypoint.sh +9 -0
package/docs/architecture/memory.md +13 -11
package/eslint.config.mjs +0 -31
package/node_modules/@vellumai/ces-contracts/src/error.ts +1 -1
package/node_modules/@vellumai/ces-contracts/src/grants.ts +1 -1
package/node_modules/@vellumai/ces-contracts/src/handles.ts +1 -1
package/node_modules/@vellumai/ces-contracts/src/index.ts +1 -1
package/node_modules/@vellumai/ces-contracts/src/rpc.ts +1 -1
package/package.json +1 -1
package/src/__tests__/approval-cascade.test.ts +0 -1
package/src/__tests__/browser-fill-credential.test.ts +1 -1
package/src/__tests__/call-controller.test.ts +0 -1
package/src/__tests__/ces-rpc-credential-backend.test.ts +3 -3
package/src/__tests__/ces-startup-timeout.test.ts +40 -0
package/src/__tests__/config-schema-cmd.test.ts +0 -1
package/src/__tests__/config-schema.test.ts +2 -0
package/src/__tests__/conversation-abort-tool-results.test.ts +0 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +0 -2
package/src/__tests__/conversation-agent-loop.test.ts +2 -4
package/src/__tests__/conversation-confirmation-signals.test.ts +0 -1
package/src/__tests__/conversation-error.test.ts +15 -1
package/src/__tests__/conversation-messaging-secret-redirect.test.ts +1 -1
package/src/__tests__/conversation-pre-run-repair.test.ts +0 -1
package/src/__tests__/conversation-provider-retry-repair.test.ts +0 -1
package/src/__tests__/conversation-queue.test.ts +0 -1
package/src/__tests__/conversation-runtime-assembly.test.ts +227 -0
package/src/__tests__/conversation-slash-queue.test.ts +0 -1
package/src/__tests__/conversation-slash-unknown.test.ts +0 -1
package/src/__tests__/conversation-workspace-injection.test.ts +0 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +0 -1
package/src/__tests__/credential-execution-client.test.ts +5 -2
package/src/__tests__/credential-execution-feature-gates.test.ts +31 -16
package/src/__tests__/credential-execution-managed-contract.test.ts +2 -2
package/src/__tests__/credential-security-e2e.test.ts +1 -1
package/src/__tests__/credential-security-invariants.test.ts +2 -5
package/src/__tests__/credentials-cli.test.ts +4 -3
package/src/__tests__/daemon-credential-client.test.ts +123 -0
package/src/__tests__/deterministic-verification-control-plane.test.ts +1 -0
package/src/__tests__/gateway-client-managed-outbound.test.ts +79 -1
package/src/__tests__/journal-context.test.ts +335 -0
package/src/__tests__/memory-context-benchmark.benchmark.test.ts +0 -3
package/src/__tests__/memory-lifecycle-e2e.test.ts +70 -25
package/src/__tests__/memory-recall-quality.test.ts +48 -17
package/src/__tests__/memory-regressions.test.ts +408 -363
package/src/__tests__/memory-retrieval.benchmark.test.ts +0 -3
package/src/__tests__/non-member-access-request.test.ts +2 -2
package/src/__tests__/notification-decision-strategy.test.ts +71 -0
package/src/__tests__/oauth-cli.test.ts +5 -1
package/src/__tests__/provider-commit-message-generator.test.ts +0 -37
package/src/__tests__/provider-error-scenarios.test.ts +0 -267
package/src/__tests__/provider-streaming.benchmark.test.ts +2 -81
package/src/__tests__/relay-server.test.ts +1 -2
package/src/__tests__/script-proxy-injection-runtime.test.ts +1 -1
package/src/__tests__/secret-onetime-send.test.ts +1 -1
package/src/__tests__/secure-keys.test.ts +18 -15
package/src/__tests__/skill-memory.test.ts +17 -3
package/src/__tests__/stale-approval-dedup.test.ts +171 -0
package/src/__tests__/stt-hints.test.ts +437 -0
package/src/__tests__/task-memory-cleanup.test.ts +14 -0
package/src/__tests__/twilio-routes-twiml.test.ts +139 -1
package/src/__tests__/voice-quality.test.ts +58 -0
package/src/__tests__/voice-scoped-grant-consumer.test.ts +0 -1
package/src/__tests__/workspace-migration-016-migrate-credentials-from-keychain.test.ts +5 -3
package/src/acp/agent-process.ts +9 -1
package/src/agent/loop.ts +1 -1
package/src/approvals/guardian-request-resolvers.ts +164 -38
package/src/calls/__tests__/tts-text-sanitizer.test.ts +254 -0
package/src/calls/call-controller.ts +9 -5
package/src/calls/fish-audio-client.ts +26 -14
package/src/calls/stt-hints.ts +189 -0
package/src/calls/tts-text-sanitizer.ts +61 -0
package/src/calls/twilio-routes.ts +32 -4
package/src/calls/voice-quality.ts +15 -3
package/src/calls/voice-session-bridge.ts +1 -0
package/src/cli/commands/avatar.ts +2 -2
package/src/cli/commands/credentials.ts +110 -94
package/src/cli/commands/doctor.ts +2 -2
package/src/cli/commands/keys.ts +7 -7
package/src/cli/commands/memory.ts +1 -1
package/src/cli/commands/oauth/connections.ts +11 -29
package/src/cli/commands/oauth/platform.ts +389 -43
package/src/cli/lib/daemon-credential-client.ts +284 -0
package/src/cli.ts +1 -1
package/src/config/bundled-skills/AGENTS.md +34 -0
package/src/config/bundled-skills/acp/SKILL.md +10 -0
package/src/config/bundled-skills/app-builder/SKILL.md +0 -4
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +1 -0
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +1 -0
package/src/config/bundled-skills/settings/SKILL.md +15 -2
package/src/config/bundled-skills/settings/TOOLS.json +46 -1
package/src/config/bundled-skills/settings/tools/avatar-remove.ts +59 -0
package/src/config/bundled-skills/settings/tools/avatar-update.ts +80 -0
package/src/config/bundled-skills/slack/SKILL.md +1 -1
package/src/config/bundled-tool-registry.ts +4 -0
package/src/config/defaults.ts +0 -2
package/src/config/env-registry.ts +4 -4
package/src/config/env.ts +14 -1
package/src/config/feature-flag-registry.json +1 -1
package/src/config/loader.ts +8 -11
package/src/config/schema.ts +5 -16
package/src/config/schemas/calls.ts +17 -0
package/src/config/schemas/inference.ts +2 -2
package/src/config/schemas/journal.ts +16 -0
package/src/config/schemas/memory-processing.ts +2 -2
package/src/config/types.ts +1 -0
package/src/contacts/contact-store.ts +2 -2
package/src/credential-execution/executable-discovery.ts +1 -1
package/src/credential-execution/startup-timeout.ts +36 -0
package/src/daemon/approval-generators.ts +3 -9
package/src/daemon/conversation-agent-loop.ts +6 -0
package/src/daemon/conversation-error.ts +13 -1
package/src/daemon/conversation-memory.ts +1 -2
package/src/daemon/conversation-process.ts +18 -1
package/src/daemon/conversation-runtime-assembly.ts +61 -1
package/src/daemon/conversation-surfaces.ts +30 -1
package/src/daemon/conversation.ts +20 -9
package/src/daemon/guardian-action-generators.ts +3 -9
package/src/daemon/lifecycle.ts +18 -11
package/src/daemon/message-types/conversations.ts +1 -0
package/src/daemon/server.ts +2 -3
package/src/memory/app-store.ts +31 -0
package/src/memory/db-init.ts +4 -0
package/src/memory/indexer.ts +19 -10
package/src/memory/items-extractor.ts +315 -322
package/src/memory/job-handlers/summarization.ts +26 -16
package/src/memory/jobs-store.ts +33 -1
package/src/memory/journal-memory.ts +214 -0
package/src/memory/migrations/193-add-source-type-columns.ts +81 -0
package/src/memory/migrations/index.ts +1 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/retriever.test.ts +37 -25
package/src/memory/retriever.ts +24 -49
package/src/memory/schema/memory-core.ts +2 -0
package/src/memory/search/formatting.ts +7 -44
package/src/memory/search/staleness.ts +4 -0
package/src/memory/search/tier-classifier.ts +10 -2
package/src/memory/search/types.ts +2 -5
package/src/memory/task-memory-cleanup.ts +4 -3
package/src/notifications/adapters/slack.ts +168 -6
package/src/notifications/broadcaster.ts +1 -0
package/src/notifications/copy-composer.ts +59 -2
package/src/notifications/signal.ts +2 -0
package/src/notifications/types.ts +2 -0
package/src/prompts/journal-context.ts +133 -0
package/src/prompts/persona-resolver.ts +80 -24
package/src/prompts/system-prompt.ts +30 -0
package/src/prompts/templates/NOW.md +26 -0
package/src/prompts/templates/SOUL.md +20 -0
package/src/prompts/update-bulletin-format.ts +0 -2
package/src/providers/provider-send-message.ts +3 -32
package/src/providers/registry.ts +2 -139
package/src/providers/types.ts +1 -1
package/src/runtime/access-request-helper.ts +4 -0
package/src/runtime/auth/__tests__/guard-tests.test.ts +9 -50
package/src/runtime/auth/route-policy.ts +2 -0
package/src/runtime/gateway-client.ts +47 -4
package/src/runtime/guardian-decision-types.ts +45 -4
package/src/runtime/http-server.ts +5 -2
package/src/runtime/routes/access-request-decision.ts +2 -2
package/src/runtime/routes/app-management-routes.ts +2 -1
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +219 -30
package/src/runtime/routes/approval-strategies/guardian-text-engine-strategy.ts +37 -14
package/src/runtime/routes/channel-readiness-routes.ts +9 -4
package/src/runtime/routes/debug-routes.ts +12 -9
package/src/runtime/routes/guardian-approval-interception.ts +168 -11
package/src/runtime/routes/guardian-approval-prompt.ts +6 -1
package/src/runtime/routes/guardian-approval-reply-helpers.ts +103 -21
package/src/runtime/routes/identity-routes.ts +1 -1
package/src/runtime/routes/inbound-message-handler.ts +31 -1
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +64 -5
package/src/runtime/routes/inbound-stages/background-dispatch.ts +52 -40
package/src/runtime/routes/integrations/twilio.ts +52 -10
package/src/runtime/routes/memory-item-routes.test.ts +3 -3
package/src/runtime/routes/memory-item-routes.ts +25 -11
package/src/runtime/routes/secret-routes.ts +141 -10
package/src/runtime/routes/tts-routes.ts +11 -1
package/src/security/ces-credential-client.ts +18 -9
package/src/security/ces-rpc-credential-backend.ts +4 -3
package/src/security/credential-backend.ts +10 -4
package/src/security/secure-keys.ts +21 -4
package/src/skills/catalog-install.ts +4 -36
package/src/skills/inline-command-expansions.ts +7 -7
package/src/skills/skill-memory.ts +1 -0
package/src/subagent/manager.ts +2 -5
package/src/tools/acp/spawn.ts +78 -1
package/src/tools/credentials/vault.ts +5 -3
package/src/tools/memory/definitions.ts +3 -2
package/src/tools/memory/handlers.ts +10 -7
package/src/tools/sensitive-output-placeholders.ts +2 -2
package/src/tools/terminal/safe-env.ts +1 -0
package/src/util/browser.ts +15 -0
package/src/util/platform.ts +1 -1
package/src/workspace/migrations/016-migrate-credentials-from-keychain.ts +4 -4
package/src/workspace/migrations/017-seed-persona-dirs.ts +2 -1
package/src/workspace/migrations/018-rekey-compound-credential-keys.ts +184 -0
package/src/workspace/migrations/019-scope-journal-to-guardian.ts +103 -0
package/src/workspace/migrations/migrate-to-workspace-volume.ts +4 -4
package/src/workspace/migrations/registry.ts +4 -0
package/src/workspace/provider-commit-message-generator.ts +12 -21
package/src/__tests__/provider-fail-open-selection.test.ts +0 -271
package/src/__tests__/provider-failover-actual-provider.test.ts +0 -66
package/src/memory/search/lexical.ts +0 -48
package/src/providers/failover.ts +0 -186

package/src/memory/items-extractor.ts CHANGED Viewed

@@ -1,22 +1,24 @@
-import { and, eq, like, sql } from "drizzle-orm";
+import { and, desc, eq, like, sql } from "drizzle-orm";
 import { v4 as uuid } from "uuid";
 import { getConfig } from "../config/loader.js";
 import type { MemoryExtractionConfig } from "../config/types.js";
+import { getAssistantName } from "../daemon/identity-helpers.js";
 import { resolveGuardianPersona } from "../prompts/persona-resolver.js";
 import { buildCoreIdentityContext } from "../prompts/system-prompt.js";
 import {
-  createTimeout,
   extractToolUse,
   getConfiguredProvider,
   userMessage,
 } from "../providers/provider-send-message.js";
+import { BackendUnavailableError } from "../util/errors.js";
 import { getLogger } from "../util/logger.js";
 import { truncate } from "../util/truncate.js";
 import { maybeEnqueueConversationStartersJob } from "./conversation-starters-cadence.js";
 import { getDb } from "./db.js";
 import { computeMemoryFingerprint } from "./fingerprint.js";
 import { enqueueMemoryJob } from "./jobs-store.js";
+import { upsertJournalMemoriesFromDisk } from "./journal-memory.js";
 import { extractTextFromStoredMessageContent } from "./message-content.js";
 import { withQdrantBreaker } from "./qdrant-circuit-breaker.js";
 import { getQdrantClient } from "./qdrant-client.js";
@@ -32,7 +34,8 @@ export type MemoryItemKind =
   | "project"
   | "decision"
   | "constraint"
-  | "event";
+  | "event"
+  | "journal";
 export type OverrideConfidence = "explicit" | "tentative" | "inferred";
@@ -56,8 +59,16 @@ const VALID_KINDS = new Set<string>([
   "decision",
   "constraint",
   "event",
+  "journal",
 ]);
+/**
+ * Kinds the LLM is allowed to produce during extraction. Excludes "journal"
+ * because journal memories are created directly from disk files — any
+ * LLM-produced journal items would be silently dropped, wasting tokens.
+ */
+const EXTRACTION_KINDS = [...VALID_KINDS].filter((k) => k !== "journal");
 /** Maps old kind names to their new equivalents for graceful migration. */
 const KIND_MIGRATION_MAP: Record<string, MemoryItemKind> = {
   profile: "identity",
@@ -184,17 +195,57 @@ For each item, provide:
 Rules:
 - Only extract genuinely memorable information. Skip pleasantries, filler, and transient discussion.
 - Do NOT extract information about what tools the assistant used or what files it read — only extract substantive facts about the user, their projects, and their preferences.
-- Do NOT extract claims about actions the assistant performed, outcomes it achieved, or progress it reported (e.g., "I booked an appointment", "I sent the email"). Only extract facts stated by the user or from external sources — the assistant's self-reports are not reliable memory material.
 - Do NOT extract raw code snippets, JSON fragments, YAML, configuration values, log output, or data structures. Only extract the human-readable meaning or intent behind such content, not the literal syntax.
 - Prefer fewer high-quality items over many low-quality ones.
-- If the message contains no memorable information, return an empty array.`;
+- If the message contains no memorable information, return an empty array.
+- The preceding conversation context (if provided) is for disambiguation only. Extract items ONLY from the final message after the --- separator, not from the context messages.`;
+  // Try to extract user name from persona text
+  let userName = "the user";
+  if (userPersona) {
+    const nameMatch = userPersona.match(/\*\*Name:\*\*\s*(.+)/);
+    if (nameMatch) {
+      userName = nameMatch[1].trim();
+    }
+  }
   if (messageRole === "assistant") {
     instructions += `
-IMPORTANT: The message below is from the ASSISTANT, not the user. Do NOT attribute the assistant's own statements, feelings, self-descriptions, or introspection to the user. Only extract facts about the user, the world, or the project that the assistant is referencing or relaying — NOT the assistant's own identity, uncertainty, or behavior. If the assistant is simply talking about itself (e.g., introducing itself, expressing uncertainty about its own purpose), extract nothing.`;
+IMPORTANT: The message below is from the ASSISTANT. You may extract facts about actions taken, decisions made, and outcomes achieved. However, do NOT attribute the assistant's own identity, personality, or self-descriptions to the user. If the assistant is just introducing itself or expressing uncertainty about its own nature, extract nothing.`;
   }
+  instructions += `
+## Examples
+Good extractions from user messages:
+- "I'm a backend engineer at Acme Corp, mostly working with Go and PostgreSQL"
+  → kind: identity, subject: "Role at Acme Corp", statement: "${userName} is a backend engineer at Acme Corp, works primarily with Go and PostgreSQL"
+- "Always use semantic commits in this repo. I hate squash merges."
+  → kind: constraint, subject: "Git conventions", statement: "${userName} requires semantic commit messages. Strongly dislikes squash merges."
+- "We decided to go with Redis for the cache layer because DynamoDB was too expensive at our read volume"
+  → kind: decision, subject: "Cache layer choice", statement: "${userName} chose Redis over DynamoDB for caching due to cost at high read volumes"
+Good extractions from assistant messages:
+- "Based on your earlier mention, I see you're using Next.js 14 with the app router for the dashboard project."
+  → kind: project, subject: "Dashboard tech stack", statement: "${userName}'s dashboard project uses Next.js 14 with the app router"
+- "Since you mentioned your team follows trunk-based development, I'll keep the changes in a single commit."
+  → kind: constraint, subject: "Team branching strategy", statement: "${userName}'s team follows trunk-based development"
+- "I've refactored the auth middleware to use JWT validation and added rate limiting to the login endpoint."
+  → kind: project, subject: "Auth middleware changes", statement: "Auth middleware was refactored to use JWT validation with rate limiting on the login endpoint"
+Do NOT extract:
+- "I'll check that file for you" → assistant operational statement with no lasting information
+- "I think the best approach would be to refactor this" → speculative, no action taken yet
+- "The tests passed" → transient status
+- "Sure, sounds good" → filler
+- "\`\`\`json {"key": "val"} \`\`\`" → raw code/data, extract meaning not syntax`;
   if (existingItems.length > 0) {
     instructions += `\n\nExisting memory items (use these to identify supersession targets — set \`supersedes\` to the item ID if the new information replaces one of these):\n`;
     for (const item of existingItems) {
@@ -206,8 +257,7 @@ IMPORTANT: The message below is from the ASSISTANT, not the user. Do NOT attribu
   // generic "User ..." labels. Budget is dynamically computed: whatever
   // remains after the fixed instructions fits within the system prompt
   // ceiling, preventing oversized prompts from exceeding the provider input
-  // window (which would cause sendMessage to error and fall back to
-  // lower-quality pattern-based extraction).
+  // window (which would cause sendMessage to error).
   const rawIdentityContext = buildCoreIdentityContext(
     userPersona ? { userPersona } : undefined,
   );
@@ -320,188 +370,200 @@ async function extractItemsWithLLM(
   extractionConfig: MemoryExtractionConfig,
   scopeId: string,
   messageRole: string,
+  precedingMessages: Array<{ role: string; content: string }>,
   userPersona?: string | null,
 ): Promise<ExtractedItem[]> {
   const provider = await getConfiguredProvider();
   if (!provider) {
-    log.debug(
-      "Configured provider unavailable for LLM extraction, falling back to pattern-based",
+    throw new BackendUnavailableError(
+      "Provider unavailable for memory extraction",
     );
-    return extractItemsPatternBased(text, scopeId);
   }
-  try {
-    const { signal, cleanup } = createTimeout(15000);
-    try {
-      // Query existing items to give the LLM supersession context
-      const existingItems = queryExistingItemsForContext(scopeId, text);
-      const systemPrompt = buildExtractionSystemPrompt(
-        existingItems,
-        messageRole,
-        userPersona,
-      );
+  // Query existing items to give the LLM supersession context
+  const existingItems = queryExistingItemsForContext(scopeId, text);
+  const systemPrompt = buildExtractionSystemPrompt(
+    existingItems,
+    messageRole,
+    userPersona,
+  );
+  const assistantName = getAssistantName() ?? "the assistant";
+  const messagePrefix =
+    messageRole === "assistant"
+      ? `[This message is from ${assistantName}]\n\n`
+      : `[This message is from the user]\n\n`;
+  // Build user content with optional preceding conversation context
+  const contextParts: string[] = [];
+  for (const msg of precedingMessages) {
+    const msgText = extractTextFromStoredMessageContent(msg.content);
+    if (msgText.length === 0) continue;
+    const roleLabel =
+      msg.role === "assistant"
+        ? (getAssistantName() ?? "assistant")
+        : "user";
+    contextParts.push(`[${roleLabel}]: ${msgText}`);
+  }
+  let userContent = `${messagePrefix}${text}`;
+  if (contextParts.length > 0) {
+    userContent = `Preceding conversation context:\n${contextParts.join("\n\n")}\n\n---\n\nMessage to extract from:\n${messagePrefix}${text}`;
+  }
-      const messagePrefix =
-        messageRole === "assistant"
-          ? "[This message is from the assistant]\n\n"
-          : "";
-      const response = await provider.sendMessage(
-        [userMessage(`${messagePrefix}${text}`)],
-        [
-          {
-            name: "store_memory_items",
-            description: "Store extracted memory items from the message",
-            input_schema: {
-              type: "object" as const,
-              properties: {
-                items: {
-                  type: "array",
-                  items: {
-                    type: "object",
-                    properties: {
-                      kind: {
-                        type: "string",
-                        enum: [...VALID_KINDS],
-                        description: "Category of memory item",
-                      },
-                      subject: {
-                        type: "string",
-                        description:
-                          "Short label (2-8 words) for what this is about",
-                      },
-                      statement: {
-                        type: "string",
-                        description:
-                          "Relationship-rich factual statement to remember (1-2 sentences). Include relational context.",
-                      },
-                      confidence: {
-                        type: "number",
-                        description:
-                          "Confidence that this is accurate (0.0-1.0)",
-                      },
-                      importance: {
-                        type: "number",
-                        description:
-                          "How valuable this is to remember (0.0-1.0)",
-                      },
-                      supersedes: {
-                        type: ["string", "null"],
-                        description:
-                          "ID of the existing memory item this replaces, or null if not replacing anything",
-                      },
-                      overrideConfidence: {
-                        type: "string",
-                        enum: ["explicit", "tentative", "inferred"],
-                        description:
-                          "How confident you are that this overrides an existing item: explicit (clear override), tentative (ambiguous), inferred (weak signal)",
-                      },
-                    },
-                    required: [
-                      "kind",
-                      "subject",
-                      "statement",
-                      "confidence",
-                      "importance",
-                      "supersedes",
-                      "overrideConfidence",
-                    ],
+  const response = await provider.sendMessage(
+    [userMessage(userContent)],
+    [
+      {
+        name: "store_memory_items",
+        description: "Store extracted memory items from the message",
+        input_schema: {
+          type: "object" as const,
+          properties: {
+            items: {
+              type: "array",
+              items: {
+                type: "object",
+                properties: {
+                  kind: {
+                    type: "string",
+                    enum: EXTRACTION_KINDS,
+                    description: "Category of memory item",
+                  },
+                  subject: {
+                    type: "string",
+                    description:
+                      "Short label (2-8 words) for what this is about",
+                  },
+                  statement: {
+                    type: "string",
+                    description:
+                      "Relationship-rich factual statement to remember (1-2 sentences). Include relational context.",
+                  },
+                  confidence: {
+                    type: "number",
+                    description: "Confidence that this is accurate (0.0-1.0)",
+                  },
+                  importance: {
+                    type: "number",
+                    description: "How valuable this is to remember (0.0-1.0)",
+                  },
+                  supersedes: {
+                    type: ["string", "null"],
+                    description:
+                      "ID of the existing memory item this replaces, or null if not replacing anything",
+                  },
+                  overrideConfidence: {
+                    type: "string",
+                    enum: ["explicit", "tentative", "inferred"],
+                    description:
+                      "How confident you are that this overrides an existing item: explicit (clear override), tentative (ambiguous), inferred (weak signal)",
                   },
                 },
+                required: [
+                  "kind",
+                  "subject",
+                  "statement",
+                  "confidence",
+                  "importance",
+                  "supersedes",
+                  "overrideConfidence",
+                ],
               },
-              required: ["items"],
             },
           },
-        ],
-        systemPrompt,
-        {
-          config: {
-            modelIntent: extractionConfig.modelIntent,
-            max_tokens: 1024,
-            tool_choice: { type: "tool" as const, name: "store_memory_items" },
-          },
-          signal,
+          required: ["items"],
         },
-      );
-      cleanup();
+      },
+    ],
+    systemPrompt,
+    {
+      config: {
+        modelIntent: extractionConfig.modelIntent,
+        tool_choice: { type: "tool" as const, name: "store_memory_items" },
+      },
+    },
+  );
-      const toolBlock = extractToolUse(response);
-      if (!toolBlock) {
-        log.warn(
-          "No tool_use block in LLM extraction response, falling back to pattern-based",
-        );
-        return extractItemsPatternBased(text, scopeId);
-      }
+  const toolBlock = extractToolUse(response);
+  if (!toolBlock) {
+    throw new Error("No tool_use block in LLM extraction response");
+  }
-      const input = toolBlock.input as { items?: LLMExtractedItem[] };
-      if (!Array.isArray(input.items)) {
-        log.warn(
-          "Invalid items in LLM extraction response, falling back to pattern-based",
-        );
-        return extractItemsPatternBased(text, scopeId);
-      }
+  const input = toolBlock.input as { items?: LLMExtractedItem[] };
+  if (!Array.isArray(input.items)) {
+    throw new Error("Invalid items structure in LLM extraction response");
+  }
-      // Build set of known existing item IDs for supersession validation
-      const existingItemIds = new Set(existingItems.map((e) => e.id));
-      const items: ExtractedItem[] = [];
-      for (const raw of input.items) {
-        // Apply kind migration map for old kind names, then validate
-        const resolvedKind = KIND_MIGRATION_MAP[raw.kind] ?? raw.kind;
-        if (!VALID_KINDS.has(resolvedKind)) continue;
-        if (!raw.subject || !raw.statement) continue;
-        const subject = truncate(String(raw.subject), 80, "");
-        const statement = truncate(String(raw.statement), 500, "");
-        const confidence = clampUnitInterval(parseScore(raw.confidence, 0.5));
-        const importance = clampUnitInterval(parseScore(raw.importance, 0.5));
-        const fingerprint = computeMemoryFingerprint(
-          scopeId,
-          resolvedKind,
-          subject,
-          statement,
-        );
+  // Build set of known existing item IDs for supersession validation
+  const existingItemIds = new Set(existingItems.map((e) => e.id));
-        // Validate supersedes: must reference a known existing item ID.
-        // Reject hallucinated IDs that don't match any item we showed the LLM.
-        const rawSupersedes =
-          typeof raw.supersedes === "string" && raw.supersedes.length > 0
-            ? raw.supersedes
-            : null;
-        const supersedes =
-          rawSupersedes && existingItemIds.has(rawSupersedes)
-            ? rawSupersedes
-            : null;
-        const supersedesRejected = !!rawSupersedes && !supersedes;
-        const overrideConfidence = VALID_OVERRIDE_CONFIDENCES.has(
-          raw.overrideConfidence,
-        )
-          ? (raw.overrideConfidence as OverrideConfidence)
-          : "inferred";
-        items.push({
-          kind: resolvedKind as MemoryItemKind,
-          subject,
-          statement,
-          confidence,
-          importance,
-          fingerprint,
-          supersedes,
-          overrideConfidence,
-          supersedesRejected,
-        });
-      }
+  const items: ExtractedItem[] = [];
+  for (const raw of input.items) {
+    // Apply kind migration map for old kind names, then validate
+    const resolvedKind = KIND_MIGRATION_MAP[raw.kind] ?? raw.kind;
+    if (resolvedKind === "journal") continue; // journal memories created directly from disk
+    if (!VALID_KINDS.has(resolvedKind)) continue;
+    if (!raw.subject || !raw.statement) continue;
+    const subject = String(raw.subject).trim();
+    const statement = String(raw.statement).trim();
+    const confidence = clampUnitInterval(parseScore(raw.confidence, 0.5));
+    const importance = clampUnitInterval(parseScore(raw.importance, 0.5));
+    const fingerprint = computeMemoryFingerprint(
+      scopeId,
+      resolvedKind,
+      subject,
+      statement,
+    );
-      return deduplicateItems(items);
-    } finally {
-      cleanup();
-    }
+    // Validate supersedes: must reference a known existing item ID.
+    // Reject hallucinated IDs that don't match any item we showed the LLM.
+    const rawSupersedes =
+      typeof raw.supersedes === "string" && raw.supersedes.length > 0
+        ? raw.supersedes
+        : null;
+    const supersedes =
+      rawSupersedes && existingItemIds.has(rawSupersedes)
+        ? rawSupersedes
+        : null;
+    const supersedesRejected = !!rawSupersedes && !supersedes;
+    const overrideConfidence = VALID_OVERRIDE_CONFIDENCES.has(
+      raw.overrideConfidence,
+    )
+      ? (raw.overrideConfidence as OverrideConfidence)
+      : "inferred";
+    items.push({
+      kind: resolvedKind as MemoryItemKind,
+      subject,
+      statement,
+      confidence,
+      importance,
+      fingerprint,
+      supersedes,
+      overrideConfidence,
+      supersedesRejected,
+    });
+  }
+  return deduplicateItems(items);
+}
+/**
+ * Fire conversation starters generation when journal memories were created.
+ * Wrapped in try/catch so failures never propagate to the caller.
+ */
+function triggerConversationStartersIfNeeded(
+  count: number,
+  scopeId: string,
+): void {
+  if (count <= 0) return;
+  try {
+    maybeEnqueueConversationStartersJob(scopeId);
   } catch (err) {
-    const message = err instanceof Error ? err.message : String(err);
     log.warn(
-      { err: message },
-      "LLM extraction failed, falling back to pattern-based",
+      { err: err instanceof Error ? err.message : String(err) },
+      "Failed to check conversation starters cadence",
     );
-    return extractItemsPatternBased(text, scopeId);
   }
 }
@@ -519,6 +581,7 @@ export async function extractAndUpsertMemoryItemsForMessage(
       role: messages.role,
       content: messages.content,
       createdAt: messages.createdAt,
+      conversationId: messages.conversationId,
     })
     .from(messages)
     .where(eq(messages.id, messageId))
@@ -526,18 +589,52 @@ export async function extractAndUpsertMemoryItemsForMessage(
   if (!message) return 0;
+  // Fetch up to 6 preceding messages from the same conversation for
+  // disambiguation context (e.g. resolving "that framework" or "yes, do it").
+  const effectiveConversationId = conversationId ?? message.conversationId;
+  const precedingMessages = effectiveConversationId
+    ? db
+        .select({ role: messages.role, content: messages.content })
+        .from(messages)
+        .where(
+          and(
+            eq(messages.conversationId, effectiveConversationId),
+            sql`${messages.createdAt} < ${message.createdAt}`,
+          ),
+        )
+        .orderBy(desc(messages.createdAt))
+        .limit(6)
+        .all()
+        .reverse()
+    : [];
+  const effectiveScopeId = scopeId ?? "default";
+  // Directly create journal memories from any journal files written during
+  // this message, bypassing LLM extraction (which would summarize/rewrite them).
+  // This must run before the extraction guards (semantic density, useLLM, etc.)
+  // because journal disk scanning is independent of LLM extraction.
+  let journalUpserted = 0;
+  if (message.role === "assistant") {
+    journalUpserted = upsertJournalMemoriesFromDisk(
+      message.createdAt,
+      effectiveScopeId,
+      messageId,
+    );
+  }
   const text = extractTextFromStoredMessageContent(message.content);
   if (!hasSemanticDensity(text)) {
     log.debug(
       { messageId },
       "Skipping extraction — message lacks semantic density",
     );
-    return 0;
+    triggerConversationStartersIfNeeded(journalUpserted, effectiveScopeId);
+    return journalUpserted;
   }
   const config = getConfig();
   const extractionConfig = config.memory.extraction;
-  const effectiveScopeId = scopeId ?? "default";
   // Resolve the guardian's persona to provide personality-aware extraction
   // context. Currently uses the guardian persona for all conversations —
@@ -545,17 +642,24 @@ export async function extractAndUpsertMemoryItemsForMessage(
   // better extraction context than none.
   const userPersona = resolveGuardianPersona();
-  const extracted = extractionConfig.useLLM
-    ? await extractItemsWithLLM(
-        text,
-        extractionConfig,
-        effectiveScopeId,
-        message.role,
-        userPersona,
-      )
-    : extractItemsPatternBased(text, effectiveScopeId);
+  if (!extractionConfig.useLLM) {
+    triggerConversationStartersIfNeeded(journalUpserted, effectiveScopeId);
+    return journalUpserted;
+  }
-  if (extracted.length === 0) return 0;
+  const extracted = await extractItemsWithLLM(
+    text,
+    extractionConfig,
+    effectiveScopeId,
+    message.role,
+    precedingMessages,
+    userPersona,
+  );
+  if (extracted.length === 0) {
+    triggerConversationStartersIfNeeded(journalUpserted, effectiveScopeId);
+    return journalUpserted;
+  }
   // Guard: re-check after the async LLM call. The event loop yields during
   // extractItemsWithLLM, so another task could have marked the conversation
@@ -565,13 +669,10 @@ export async function extractAndUpsertMemoryItemsForMessage(
       { messageId, conversationId },
       "Skipping upsert — conversation marked failed during extraction",
     );
-    return 0;
+    triggerConversationStartersIfNeeded(journalUpserted, effectiveScopeId);
+    return journalUpserted;
   }
-  // Determine verification state from message role
-  const verificationState =
-    message.role === "user" ? "user_reported" : "assistant_inferred";
   let upserted = 0;
   for (const item of extracted) {
     const now = Date.now();
@@ -591,13 +692,21 @@ export async function extractAndUpsertMemoryItemsForMessage(
     let effectiveStatus: string = "active";
     if (existing) {
       memoryItemId = existing.id;
-      // Promote verification state if re-seen from a more trusted source
-      const promotedState =
-        existing.verificationState === "assistant_inferred" &&
-        verificationState === "user_reported"
-          ? "user_reported"
-          : existing.verificationState;
       effectiveStatus = "active";
+      // Preserve sourceType for tool-sourced items — extraction should not
+      // demote items the user explicitly saved.
+      const effectiveSourceType =
+        existing.sourceType === "tool" ? "tool" : "extraction";
+      // Dual-write verificationState alongside sourceType for client compat.
+      // Promote from assistant_inferred → user_reported when re-seen from user.
+      const effectiveVerificationState =
+        message.role === "user" || existing.verificationState === "user_reported"
+          ? "user_reported"
+          : existing.verificationState === "user_confirmed"
+            ? "user_confirmed"
+            : "assistant_inferred";
       db.update(memoryItems)
         .set({
           status: effectiveStatus,
@@ -608,7 +717,9 @@ export async function extractAndUpsertMemoryItemsForMessage(
             Math.max(existing.importance ?? 0, item.importance),
           ),
           lastSeenAt: Math.max(existing.lastSeenAt, seenAt),
-          verificationState: promotedState,
+          sourceType: effectiveSourceType,
+          sourceMessageRole: message.role,
+          verificationState: effectiveVerificationState,
         })
         .where(eq(memoryItems.id, existing.id))
         .run();
@@ -624,7 +735,11 @@ export async function extractAndUpsertMemoryItemsForMessage(
           confidence: item.confidence,
           importance: item.importance,
           fingerprint: item.fingerprint,
-          verificationState,
+          sourceType: "extraction",
+          sourceMessageRole: message.role,
+          // Dual-write verificationState for client compat
+          verificationState:
+            message.role === "user" ? "user_reported" : "assistant_inferred",
           scopeId: effectiveScopeId,
           firstSeenAt: message.createdAt,
           lastSeenAt: seenAt,
@@ -715,11 +830,9 @@ export async function extractAndUpsertMemoryItemsForMessage(
     }
     // Fallback subject-match supersession: only when the LLM did not
-    // explicitly handle supersession for this item. This preserves the
-    // original behavior for pattern-based extraction and items without
-    // LLM-directed supersession. Skip items whose supersedes ID was
-    // rejected (hallucinated) — they should coexist, not trigger
-    // subject-based replacement.
+    // explicitly handle supersession for this item. Skip items whose
+    // supersedes ID was rejected (hallucinated) — they should coexist,
+    // not trigger subject-based replacement.
     if (
       !item.supersedes &&
       !item.supersedesRejected &&
@@ -744,7 +857,7 @@ export async function extractAndUpsertMemoryItemsForMessage(
       .values({
         memoryItemId,
         messageId,
-        evidence: truncate(item.statement, 500, ""),
+        evidence: item.statement,
         createdAt: now,
       })
       .onConflictDoNothing()
@@ -753,139 +866,19 @@ export async function extractAndUpsertMemoryItemsForMessage(
     enqueueMemoryJob("embed_item", { itemId: memoryItemId });
   }
+  upserted += journalUpserted;
   log.debug(
     { messageId, extracted: extracted.length, upserted },
     "Extracted memory items from message",
   );
   // Trigger conversation starters generation when new items are upserted
-  if (upserted > 0) {
-    try {
-      maybeEnqueueConversationStartersJob(effectiveScopeId);
-    } catch (err) {
-      log.warn(
-        { err: err instanceof Error ? err.message : String(err) },
-        "Failed to check conversation starters cadence",
-      );
-    }
-  }
+  triggerConversationStartersIfNeeded(upserted, effectiveScopeId);
   return upserted;
 }
-// ── Pattern-based extraction (fallback) ────────────────────────────────
-function extractItemsPatternBased(
-  text: string,
-  scopeId: string = "default",
-): ExtractedItem[] {
-  const sentences = text
-    .split(/[\n\r]+|(?<=[.!?])\s+/)
-    .map((s) => s.trim())
-    .filter((s) => s.length >= 20 && s.length <= 500);
-  const items: ExtractedItem[] = [];
-  for (const sentence of sentences) {
-    const lower = sentence.toLowerCase();
-    const classification = classifySentence(lower);
-    if (!classification) continue;
-    const subject = inferSubject(sentence, classification.kind);
-    const statement = sentence.replace(/\s+/g, " ").trim();
-    const fingerprint = computeMemoryFingerprint(
-      scopeId,
-      classification.kind,
-      subject,
-      statement,
-    );
-    items.push({
-      kind: classification.kind,
-      subject,
-      statement,
-      confidence: classification.confidence,
-      importance: classification.importance,
-      fingerprint,
-      supersedes: null,
-      overrideConfidence: "inferred" as OverrideConfidence,
-    });
-  }
-  return deduplicateItems(items);
-}
-function classifySentence(
-  lower: string,
-): { kind: MemoryItemKind; confidence: number; importance: number } | null {
-  if (
-    includesAny(lower, [
-      "i prefer",
-      "prefer to",
-      "favorite",
-      "i like",
-      "i dislike",
-    ])
-  ) {
-    return { kind: "preference", confidence: 0.78, importance: 0.7 };
-  }
-  if (
-    includesAny(lower, [
-      "my name is",
-      "i am ",
-      "i work as",
-      "i live in",
-      "timezone",
-    ])
-  ) {
-    return { kind: "identity", confidence: 0.72, importance: 0.8 };
-  }
-  if (includesAny(lower, ["project", "repository", "repo", "codebase"])) {
-    return { kind: "project", confidence: 0.68, importance: 0.6 };
-  }
-  if (
-    includesAny(lower, ["we decided", "decision", "chosen approach", "we will"])
-  ) {
-    return { kind: "decision", confidence: 0.75, importance: 0.7 };
-  }
-  if (
-    includesAny(lower, ["todo", "to do", "next step", "follow up", "need to"])
-  ) {
-    return { kind: "project", confidence: 0.74, importance: 0.6 };
-  }
-  if (
-    includesAny(lower, [
-      "must",
-      "cannot",
-      "should not",
-      "constraint",
-      "requirement",
-    ])
-  ) {
-    return { kind: "constraint", confidence: 0.7, importance: 0.7 };
-  }
-  if (includesAny(lower, ["remember", "important", "fact", "noted"])) {
-    return { kind: "identity", confidence: 0.62, importance: 0.5 };
-  }
-  return null;
-}
-function inferSubject(sentence: string, kind: MemoryItemKind): string {
-  const trimmed = sentence.trim();
-  if (kind === "project") {
-    const match = trimmed.match(
-      /(?:project|repo(?:sitory)?)\s+([A-Za-z0-9._/-]{2,80})/i,
-    );
-    if (match) return match[1];
-  }
-  const words = trimmed.split(/\s+/).slice(0, 6).join(" ");
-  return truncate(words, 80, "");
-}
-function includesAny(text: string, needles: string[]): boolean {
-  for (const needle of needles) {
-    if (text.includes(needle)) return true;
-  }
-  return false;
-}
 // ── Helpers ────────────────────────────────────────────────────────────
 function deduplicateItems(items: ExtractedItem[]): ExtractedItem[] {