npm - @vellumai/assistant - Versions diffs - 0.5.2 → 0.5.3 - Mend

@vellumai/assistant 0.5.2 → 0.5.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (108) hide show

package/ARCHITECTURE.md +109 -0
package/docs/skills.md +100 -0
package/package.json +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +7 -0
package/src/__tests__/conversation-agent-loop.test.ts +7 -0
package/src/__tests__/conversation-memory-dirty-tail.test.ts +150 -0
package/src/__tests__/conversation-provider-retry-repair.test.ts +7 -0
package/src/__tests__/conversation-wipe.test.ts +226 -0
package/src/__tests__/db-memory-archive-migration.test.ts +372 -0
package/src/__tests__/db-memory-brief-state-migration.test.ts +213 -0
package/src/__tests__/db-memory-reducer-checkpoints.test.ts +273 -0
package/src/__tests__/inline-command-runner.test.ts +311 -0
package/src/__tests__/inline-skill-authoring-guard.test.ts +220 -0
package/src/__tests__/inline-skill-load-permissions.test.ts +435 -0
package/src/__tests__/list-messages-attachments.test.ts +96 -0
package/src/__tests__/memory-brief-open-loops.test.ts +530 -0
package/src/__tests__/memory-brief-time.test.ts +285 -0
package/src/__tests__/memory-brief-wrapper.test.ts +311 -0
package/src/__tests__/memory-chunk-archive.test.ts +400 -0
package/src/__tests__/memory-chunk-dual-write.test.ts +453 -0
package/src/__tests__/memory-episode-archive.test.ts +370 -0
package/src/__tests__/memory-episode-dual-write.test.ts +626 -0
package/src/__tests__/memory-observation-archive.test.ts +375 -0
package/src/__tests__/memory-observation-dual-write.test.ts +318 -0
package/src/__tests__/memory-recall-quality.test.ts +2 -2
package/src/__tests__/memory-reducer-store.test.ts +728 -0
package/src/__tests__/memory-reducer-types.test.ts +699 -0
package/src/__tests__/memory-reducer.test.ts +698 -0
package/src/__tests__/memory-regressions.test.ts +6 -4
package/src/__tests__/memory-simplified-config.test.ts +281 -0
package/src/__tests__/parse-identity-fields.test.ts +129 -0
package/src/__tests__/skill-load-inline-command.test.ts +598 -0
package/src/__tests__/skill-load-inline-includes.test.ts +644 -0
package/src/__tests__/skills-inline-command-expansions.test.ts +301 -0
package/src/__tests__/skills-transitive-hash.test.ts +333 -0
package/src/__tests__/vellum-self-knowledge-inline-command.test.ts +320 -0
package/src/__tests__/workspace-migration-backfill-installation-id.test.ts +4 -4
package/src/config/bundled-skills/app-builder/SKILL.md +8 -8
package/src/config/bundled-skills/skill-management/SKILL.md +1 -1
package/src/config/bundled-skills/skill-management/TOOLS.json +2 -2
package/src/config/feature-flag-registry.json +16 -0
package/src/config/loader.ts +1 -0
package/src/config/raw-config-utils.ts +28 -0
package/src/config/schema.ts +12 -0
package/src/config/schemas/memory-simplified.ts +101 -0
package/src/config/schemas/memory.ts +4 -0
package/src/config/skills.ts +50 -4
package/src/daemon/conversation-agent-loop-handlers.ts +8 -3
package/src/daemon/conversation-agent-loop.ts +71 -1
package/src/daemon/conversation-lifecycle.ts +11 -1
package/src/daemon/conversation-runtime-assembly.ts +2 -1
package/src/daemon/conversation-surfaces.ts +31 -8
package/src/daemon/conversation.ts +40 -23
package/src/daemon/handlers/config-embeddings.ts +10 -2
package/src/daemon/handlers/config-model.ts +0 -9
package/src/daemon/handlers/identity.ts +12 -1
package/src/daemon/lifecycle.ts +9 -1
package/src/daemon/message-types/conversations.ts +0 -1
package/src/daemon/server.ts +1 -1
package/src/followups/followup-store.ts +47 -1
package/src/memory/archive-store.ts +400 -0
package/src/memory/brief-formatting.ts +33 -0
package/src/memory/brief-open-loops.ts +266 -0
package/src/memory/brief-time.ts +161 -0
package/src/memory/brief.ts +75 -0
package/src/memory/conversation-crud.ts +245 -101
package/src/memory/db-init.ts +12 -0
package/src/memory/indexer.ts +106 -15
package/src/memory/job-handlers/embedding.test.ts +1 -0
package/src/memory/job-handlers/embedding.ts +83 -0
package/src/memory/job-utils.ts +1 -1
package/src/memory/jobs-store.ts +6 -0
package/src/memory/jobs-worker.ts +12 -0
package/src/memory/migrations/185-memory-brief-state.ts +52 -0
package/src/memory/migrations/186-memory-archive.ts +109 -0
package/src/memory/migrations/187-memory-reducer-checkpoints.ts +19 -0
package/src/memory/migrations/index.ts +3 -0
package/src/memory/qdrant-client.ts +23 -4
package/src/memory/reducer-store.ts +271 -0
package/src/memory/reducer-types.ts +99 -0
package/src/memory/reducer.ts +453 -0
package/src/memory/schema/conversations.ts +3 -0
package/src/memory/schema/index.ts +2 -0
package/src/memory/schema/memory-archive.ts +121 -0
package/src/memory/schema/memory-brief.ts +55 -0
package/src/memory/search/semantic.ts +17 -4
package/src/oauth/oauth-store.ts +3 -1
package/src/permissions/checker.ts +89 -6
package/src/permissions/defaults.ts +14 -0
package/src/runtime/routes/conversation-management-routes.ts +6 -0
package/src/runtime/routes/conversation-query-routes.ts +7 -0
package/src/runtime/routes/conversation-routes.ts +52 -5
package/src/runtime/routes/identity-routes.ts +2 -35
package/src/runtime/routes/llm-context-normalization.ts +14 -1
package/src/runtime/routes/memory-item-routes.ts +90 -5
package/src/runtime/routes/secret-routes.ts +2 -0
package/src/runtime/routes/surface-action-routes.ts +68 -1
package/src/schedule/schedule-store.ts +21 -0
package/src/skills/inline-command-expansions.ts +204 -0
package/src/skills/inline-command-render.ts +127 -0
package/src/skills/inline-command-runner.ts +242 -0
package/src/skills/transitive-version-hash.ts +88 -0
package/src/tasks/task-store.ts +43 -1
package/src/tools/permission-checker.ts +8 -1
package/src/tools/skills/load.ts +140 -6
package/src/util/platform.ts +18 -0
package/src/workspace/migrations/{002-backfill-installation-id.ts → 011-backfill-installation-id.ts} +1 -1
package/src/workspace/migrations/registry.ts +1 -1

package/src/memory/reducer.ts ADDED Viewed

@@ -0,0 +1,453 @@
+/**
+ * Simplified memory reducer — provider-backed conversation turn processor.
+ *
+ * This module owns:
+ *   1. ReducerPromptInput — structured input for the provider call
+ *   2. runReducer — send the transcript span to the LLM and return a typed result
+ *   3. parseReducerOutput — raw string -> validated ReducerResult
+ *   4. Fallback to EMPTY_REDUCER_RESULT on any invalid output
+ *
+ * The reducer is intentionally side-effect-free: it never writes to the
+ * database. Callers are responsible for applying the returned ReducerResult.
+ */
+import {
+  createTimeout,
+  extractText,
+  getConfiguredProvider,
+} from "../providers/provider-send-message.js";
+import { getLogger } from "../util/logger.js";
+import {
+  type ArchiveEpisodeCandidate,
+  type ArchiveObservationCandidate,
+  EMPTY_REDUCER_RESULT,
+  type OpenLoopCreate,
+  type OpenLoopOp,
+  type OpenLoopUpdate,
+  type ReducerResult,
+  type TimeContextOp,
+  type TimeContextUpdate,
+} from "./reducer-types.js";
+/** Logger for this module, obtained under the name "memory-reducer". */
+const log = getLogger("memory-reducer");
+/**
+ * Timeout for the reducer provider call (ms). Passed to createTimeout in
+ * runReducer; the resulting signal is handed to the provider request.
+ */
+const REDUCER_TIMEOUT_MS = 30_000;
+// ── Prompt input type ──────────────────────────────────────────────────
+/**
+ * The structured input that will be fed to the reducer provider call.
+ *
+ * buildReducerUserMessage renders every field below into the plain-text user
+ * message; no field is sent to the provider in structured form.
+ */
+export interface ReducerPromptInput {
+  /** Conversation ID being reduced. Rendered on the "Conversation:" line. */
+  conversationId: string;
+  /**
+   * New messages since the last reduction checkpoint (role + content).
+   * Each one is rendered as a "[role]: content" line.
+   */
+  newMessages: Array<{ role: string; content: string }>;
+  /**
+   * Current time-context rows the model can reference for updates.
+   * The section is omitted from the prompt when this array is empty.
+   */
+  existingTimeContexts: Array<{ id: string; summary: string }>;
+  /**
+   * Current open-loop rows the model can reference for updates.
+   * The section is omitted from the prompt when this array is empty.
+   */
+  existingOpenLoops: Array<{ id: string; summary: string; status: string }>;
+  /**
+   * Current time as epoch ms — injected for deterministic tests. Rendered both
+   * as an ISO-8601 string and as the raw number.
+   */
+  nowMs: number;
+  /** Memory scope identifier (e.g. assistant instance ID). */
+  scopeId: string;
+}
+// ── System prompt ─────────────────────────────────────────────────────
+/**
+ * Assemble the system prompt that instructs the model how to act as the
+ * memory reducer.
+ *
+ * The prompt is organised into paragraphs (role, output shape, one paragraph
+ * per output array, rules). Lines within a paragraph are joined with a single
+ * newline and paragraphs are separated by one blank line. Kept as a named
+ * function so tests can assert on prompt content without duplicating the
+ * literals.
+ *
+ * @returns The complete system prompt text.
+ */
+export function buildReducerSystemPrompt(): string {
+  const role = [
+    "You are a memory reducer for a personal assistant. Your job is to analyze",
+    "a span of new conversation messages and produce structured JSON output that",
+    "captures important information for the assistant's long-term memory.",
+  ];
+  const outputShape = [
+    "You output a single JSON object with four optional arrays:",
+  ];
+  const timeContextSpec = [
+    "1. `timeContexts` — time-bounded situational context (e.g. 'user traveling next week').",
+    "   Each entry has: action ('create'|'update'|'resolve'), and fields depending on the action.",
+    "   - create: summary (string), source (string), activeFrom (epoch ms), activeUntil (epoch ms)",
+    "   - update: id (string), and at least one of: summary, activeFrom, activeUntil",
+    "   - resolve: id (string)",
+  ];
+  const openLoopSpec = [
+    "2. `openLoops` — unresolved items to track (e.g. 'waiting for Bob's reply').",
+    "   Each entry has: action ('create'|'update'|'resolve'), and fields depending on the action.",
+    "   - create: summary (string), source (string), optional dueAt (epoch ms)",
+    "   - update: id (string), and at least one of: summary, dueAt",
+    "   - resolve: id (string), status ('resolved'|'expired')",
+  ];
+  const observationSpec = [
+    "3. `archiveObservations` — factual statements extracted from the conversation.",
+    "   Each entry has: content (string), role (string), optional modality (string), optional source (string)",
+  ];
+  const episodeSpec = [
+    "4. `archiveEpisodes` — coherent narrative summaries of interaction spans.",
+    "   Each entry has: title (string), summary (string), optional source (string)",
+  ];
+  const rules = [
+    "Rules:",
+    "- Output ONLY valid JSON. No markdown, no explanation, no wrapping.",
+    "- Omit arrays that would be empty rather than including empty arrays.",
+    "- For updates and resolves, reference existing IDs from the provided context.",
+    "- Be selective: only extract genuinely important or actionable information.",
+    "- Timestamps are in epoch milliseconds.",
+    "- If there is nothing meaningful to extract, output: {}",
+  ];
+  const paragraphs = [
+    role,
+    outputShape,
+    timeContextSpec,
+    openLoopSpec,
+    observationSpec,
+    episodeSpec,
+    rules,
+  ];
+  return paragraphs.map((lines) => lines.join("\n")).join("\n\n");
+}
+/**
+ * Render the structured reducer input as the plain-text user message.
+ *
+ * Layout, one item per line: a header (current time as ISO string plus raw
+ * epoch ms, conversation ID, scope ID) followed by a blank line; an optional
+ * "Active time contexts" section; an optional "Active open loops" section;
+ * and finally the "New messages to process" section. The two optional
+ * sections are emitted only when their source array is non-empty, and each is
+ * followed by a blank line.
+ *
+ * @param input Structured reducer input.
+ * @returns The newline-joined message text.
+ */
+export function buildReducerUserMessage(input: ReducerPromptInput): string {
+  const header = [
+    `Current time: ${new Date(input.nowMs).toISOString()} (${input.nowMs}ms)`,
+    `Conversation: ${input.conversationId}`,
+    `Scope: ${input.scopeId}`,
+    "",
+  ];
+  // Existing state the model may reference by ID in update/resolve operations.
+  const timeContextSection =
+    input.existingTimeContexts.length === 0
+      ? []
+      : [
+          "## Active time contexts",
+          ...input.existingTimeContexts.map(
+            (ctx) => `- [${ctx.id}] ${ctx.summary}`,
+          ),
+          "",
+        ];
+  const openLoopSection =
+    input.existingOpenLoops.length === 0
+      ? []
+      : [
+          "## Active open loops",
+          ...input.existingOpenLoops.map(
+            (loop) => `- [${loop.id}] (${loop.status}) ${loop.summary}`,
+          ),
+          "",
+        ];
+  // The transcript span that has not been reduced yet.
+  const transcript = input.newMessages.map(
+    (message) => `[${message.role}]: ${message.content}`,
+  );
+  return [
+    ...header,
+    ...timeContextSection,
+    ...openLoopSection,
+    "## New messages to process",
+    ...transcript,
+  ].join("\n");
+}
+// ── Provider-backed reducer call ──────────────────────────────────────
+/**
+ * Run the memory reducer against a transcript span.
+ *
+ * Sends the unreduced messages, active time contexts, active open loops,
+ * current time, and scope metadata to the configured LLM provider. Parses
+ * the response into a typed {@link ReducerResult}.
+ *
+ * This function is **side-effect-free**: it never writes to the database.
+ * The caller is responsible for applying the returned result.
+ *
+ * Returns {@link EMPTY_REDUCER_RESULT} when:
+ * - No provider is configured/available (including when the provider lookup
+ *   itself fails)
+ * - The prompt cannot be built (e.g. `nowMs` is not a valid timestamp, which
+ *   makes `Date.prototype.toISOString` throw)
+ * - The provider call fails or times out
+ * - The model output is empty or unparseable
+ *
+ * Provider lookup and prompt construction run inside the guarded region so
+ * that the fallback contract above holds for every failure mode; the promise
+ * returned by this function is not expected to reject.
+ *
+ * @param input  Structured reducer input
+ * @param signal Optional external abort signal
+ * @returns The validated reducer result, or the empty result on any failure
+ */
+export async function runReducer(
+  input: ReducerPromptInput,
+  signal?: AbortSignal,
+): Promise<ReducerResult> {
+  // Both stay undefined until the timeout has been armed, which keeps the
+  // catch/finally paths safe when a failure happens before that point.
+  let combinedSignal: AbortSignal | undefined;
+  let cleanup: (() => void) | undefined;
+  try {
+    const provider = await getConfiguredProvider();
+    if (!provider) {
+      log.warn(
+        "No provider available for memory reducer — returning empty result",
+      );
+      return EMPTY_REDUCER_RESULT;
+    }
+    const systemPrompt = buildReducerSystemPrompt();
+    const userText = buildReducerUserMessage(input);
+    // Arm the timeout only once there is a request to send.
+    const timeout = createTimeout(REDUCER_TIMEOUT_MS);
+    cleanup = timeout.cleanup;
+    // Abort on whichever fires first: the caller's signal or the timeout.
+    combinedSignal = signal
+      ? AbortSignal.any([signal, timeout.signal])
+      : timeout.signal;
+    const response = await provider.sendMessage(
+      [{ role: "user", content: [{ type: "text", text: userText }] }],
+      undefined,
+      systemPrompt,
+      {
+        signal: combinedSignal,
+        config: {
+          modelIntent: "latency-optimized" as const,
+          max_tokens: 4096,
+        },
+      },
+    );
+    const rawText = extractText(response);
+    if (!rawText) {
+      log.warn("Reducer provider returned empty text — returning empty result");
+      return EMPTY_REDUCER_RESULT;
+    }
+    return parseReducerOutput(rawText);
+  } catch (err) {
+    if (combinedSignal?.aborted) {
+      log.warn("Memory reducer provider call timed out or was aborted");
+    } else {
+      log.warn({ err }, "Memory reducer provider call failed");
+    }
+    return EMPTY_REDUCER_RESULT;
+  } finally {
+    // Release the timeout if it was armed.
+    cleanup?.();
+  }
+}
+// ── Validation helpers ─────────────────────────────────────────────────
+/** Actions accepted on `timeContexts` entries; validateTimeContextOp rejects any other value. */
+const VALID_TIME_CONTEXT_ACTIONS = new Set(["create", "update", "resolve"]);
+/** Actions accepted on `openLoops` entries; validateOpenLoopOp rejects any other value. */
+const VALID_OPEN_LOOP_ACTIONS = new Set(["create", "update", "resolve"]);
+/** Terminal statuses an open-loop `resolve` operation may carry. */
+const VALID_OPEN_LOOP_RESOLVE_STATUSES = new Set(["resolved", "expired"]);
+/**
+ * Type guard: true only for string values containing at least one character.
+ * Whitespace-only strings count as non-empty.
+ */
+function isNonEmptyString(v: unknown): v is string {
+  return typeof v === "string" ? v !== "" : false;
+}
+/**
+ * Type guard: true only for finite numbers strictly greater than zero.
+ * NaN, ±Infinity, zero, negatives and non-number values all yield false.
+ */
+function isPositiveNumber(v: unknown): v is number {
+  if (typeof v !== "number") return false;
+  return v > 0 && Number.isFinite(v);
+}
+/**
+ * Type guard: true only for finite numbers greater than or equal to zero.
+ * NaN, ±Infinity, negatives and non-number values all yield false.
+ */
+function isNonNegativeNumber(v: unknown): v is number {
+  if (typeof v !== "number") return false;
+  return v >= 0 && Number.isFinite(v);
+}
+/**
+ * Validate one raw `timeContexts` entry from the model output.
+ *
+ * Accepted shapes, keyed by `action`:
+ * - `create`: non-empty `summary` and `source`, non-negative `activeFrom`,
+ *   positive `activeUntil`, and `activeUntil >= activeFrom`.
+ * - `update`: non-empty `id` plus at least one valid field among `summary`,
+ *   `activeFrom`, `activeUntil`. Fields that are present but invalid are
+ *   ignored. When both bounds are supplied they must satisfy
+ *   `activeUntil >= activeFrom`.
+ * - `resolve`: non-empty `id`.
+ *
+ * Inverted windows (end before start) are rejected because such a window can
+ * never be active.
+ *
+ * @param raw Untrusted value taken from the parsed JSON.
+ * @returns A normalized operation containing only the recognized fields, or
+ *          null when the entry is invalid.
+ */
+function validateTimeContextOp(raw: unknown): TimeContextOp | null {
+  if (raw == null || typeof raw !== "object") return null;
+  const obj = raw as Record<string, unknown>;
+  const action = obj.action;
+  if (!isNonEmptyString(action) || !VALID_TIME_CONTEXT_ACTIONS.has(action)) {
+    return null;
+  }
+  if (action === "create") {
+    if (
+      !isNonEmptyString(obj.summary) ||
+      !isNonEmptyString(obj.source) ||
+      !isNonNegativeNumber(obj.activeFrom) ||
+      !isPositiveNumber(obj.activeUntil)
+    ) {
+      return null;
+    }
+    // Reject windows that end before they start.
+    if (obj.activeUntil < obj.activeFrom) return null;
+    return {
+      action: "create",
+      summary: obj.summary,
+      source: obj.source,
+      activeFrom: obj.activeFrom,
+      activeUntil: obj.activeUntil,
+    };
+  }
+  if (action === "update") {
+    if (!isNonEmptyString(obj.id)) return null;
+    // Extract and narrow optional fields; invalid values are treated as absent.
+    const summary = isNonEmptyString(obj.summary) ? obj.summary : undefined;
+    const activeFrom = isNonNegativeNumber(obj.activeFrom)
+      ? obj.activeFrom
+      : undefined;
+    const activeUntil = isPositiveNumber(obj.activeUntil)
+      ? obj.activeUntil
+      : undefined;
+    // At least one field must be provided for the update to be meaningful
+    if (
+      summary === undefined &&
+      activeFrom === undefined &&
+      activeUntil === undefined
+    ) {
+      return null;
+    }
+    // Only checkable when the update carries both bounds; a single bound is
+    // accepted here because the other bound is not visible to this validator.
+    if (
+      activeFrom !== undefined &&
+      activeUntil !== undefined &&
+      activeUntil < activeFrom
+    ) {
+      return null;
+    }
+    const result: TimeContextUpdate = {
+      action: "update",
+      id: obj.id,
+    };
+    if (summary !== undefined) result.summary = summary;
+    if (activeFrom !== undefined) result.activeFrom = activeFrom;
+    if (activeUntil !== undefined) result.activeUntil = activeUntil;
+    return result;
+  }
+  // resolve
+  if (!isNonEmptyString(obj.id)) return null;
+  return { action: "resolve", id: obj.id };
+}
+/**
+ * Validate one raw `openLoops` entry from the model output.
+ *
+ * Accepted shapes, keyed by `action`:
+ * - `create`: non-empty `summary` and `source`; `dueAt` is kept only when it
+ *   is a finite, non-negative number.
+ * - `update`: non-empty `id` plus at least one valid field among `summary`
+ *   and `dueAt`.
+ * - `resolve`: non-empty `id` and a `status` of "resolved" or "expired".
+ *
+ * @param raw Untrusted value taken from the parsed JSON.
+ * @returns A normalized operation containing only the recognized fields, or
+ *          null when the entry is invalid.
+ */
+function validateOpenLoopOp(raw: unknown): OpenLoopOp | null {
+  if (typeof raw !== "object" || raw === null) return null;
+  const entry = raw as Record<string, unknown>;
+  const action = entry.action;
+  if (!isNonEmptyString(action)) return null;
+  if (!VALID_OPEN_LOOP_ACTIONS.has(action)) return null;
+  // Optional fields shared by create/update; invalid values count as absent.
+  const dueAt = isNonNegativeNumber(entry.dueAt) ? entry.dueAt : undefined;
+  switch (action) {
+    case "create": {
+      if (!(isNonEmptyString(entry.summary) && isNonEmptyString(entry.source))) {
+        return null;
+      }
+      const created: OpenLoopCreate = {
+        action: "create",
+        summary: entry.summary,
+        source: entry.source,
+      };
+      if (dueAt !== undefined) created.dueAt = dueAt;
+      return created;
+    }
+    case "update": {
+      if (!isNonEmptyString(entry.id)) return null;
+      const summary = isNonEmptyString(entry.summary)
+        ? entry.summary
+        : undefined;
+      // An update that changes nothing is dropped.
+      if (summary === undefined && dueAt === undefined) return null;
+      const updated: OpenLoopUpdate = {
+        action: "update",
+        id: entry.id,
+      };
+      if (summary !== undefined) updated.summary = summary;
+      if (dueAt !== undefined) updated.dueAt = dueAt;
+      return updated;
+    }
+    default: {
+      // The only remaining allowed action is "resolve".
+      if (!isNonEmptyString(entry.id)) return null;
+      const status = entry.status;
+      if (!isNonEmptyString(status)) return null;
+      if (!VALID_OPEN_LOOP_RESOLVE_STATUSES.has(status)) return null;
+      return {
+        action: "resolve",
+        id: entry.id,
+        status: status as "resolved" | "expired",
+      };
+    }
+  }
+}
+/**
+ * Validate one raw `archiveObservations` entry from the model output.
+ *
+ * `content` and `role` must be non-empty strings. `modality` and `source` are
+ * copied only when they are non-empty strings; any other field is discarded.
+ *
+ * @param raw Untrusted value taken from the parsed JSON.
+ * @returns The normalized candidate, or null when a required field is invalid.
+ */
+function validateArchiveObservation(
+  raw: unknown,
+): ArchiveObservationCandidate | null {
+  if (typeof raw !== "object" || raw === null) return null;
+  const { content, role, modality, source } = raw as Record<string, unknown>;
+  if (!(isNonEmptyString(content) && isNonEmptyString(role))) return null;
+  const candidate: ArchiveObservationCandidate = { content, role };
+  if (isNonEmptyString(modality)) candidate.modality = modality;
+  if (isNonEmptyString(source)) candidate.source = source;
+  return candidate;
+}
+/**
+ * Validate one raw `archiveEpisodes` entry from the model output.
+ *
+ * `title` and `summary` must be non-empty strings. `source` is copied only
+ * when it is a non-empty string; any other field is discarded.
+ *
+ * @param raw Untrusted value taken from the parsed JSON.
+ * @returns The normalized candidate, or null when a required field is invalid.
+ */
+function validateArchiveEpisode(raw: unknown): ArchiveEpisodeCandidate | null {
+  if (typeof raw !== "object" || raw === null) return null;
+  const { title, summary, source } = raw as Record<string, unknown>;
+  if (!(isNonEmptyString(title) && isNonEmptyString(summary))) return null;
+  const candidate: ArchiveEpisodeCandidate = { title, summary };
+  if (isNonEmptyString(source)) candidate.source = source;
+  return candidate;
+}
+// ── Public API ─────────────────────────────────────────────────────────
+/**
+ * Remove a single Markdown code fence wrapped around the whole text, if any.
+ * Accepts an optional `json` language tag (case-insensitive). Text that is not
+ * fenced is returned trimmed.
+ */
+function stripJsonFence(text: string): string {
+  const trimmed = text.trim();
+  const fenced = /^```(?:json)?\s*([\s\S]*?)\s*```$/i.exec(trimmed);
+  return fenced?.[1] ?? trimmed;
+}
+/**
+ * Run `validate` over every element of `value` and keep the non-null results.
+ * Returns an empty array when `value` is not an array.
+ */
+function collectValid<T>(
+  value: unknown,
+  validate: (item: unknown) => T | null,
+): T[] {
+  if (!Array.isArray(value)) return [];
+  const kept: T[] = [];
+  for (const item of value as unknown[]) {
+    const validated = validate(item);
+    if (validated !== null) kept.push(validated);
+  }
+  return kept;
+}
+/**
+ * Parse raw model output into a validated ReducerResult.
+ *
+ * On any structural error (non-JSON, not a JSON object, wrong types) the
+ * function returns EMPTY_REDUCER_RESULT rather than throwing. Individual
+ * invalid operations within an otherwise valid structure are silently dropped
+ * to preserve the rest of the result.
+ *
+ * Tolerated deviations from the prompt:
+ * - The JSON may be wrapped in one Markdown code fence (optionally tagged
+ *   `json`); the fence is stripped before parsing.
+ *
+ * Empty outcomes:
+ * - `{}` is the answer the system prompt requests when there is nothing to
+ *   extract, so it yields the empty result without a warning.
+ * - A non-empty object in which none of the four top-level keys is an array
+ *   is treated as invalid: a warning is logged and the empty result returned.
+ *
+ * @param raw Text returned by the provider.
+ * @returns The validated result; never throws.
+ */
+export function parseReducerOutput(raw: string): ReducerResult {
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(stripJsonFence(raw));
+  } catch {
+    log.warn("reducer output is not valid JSON — falling back to empty result");
+    return EMPTY_REDUCER_RESULT;
+  }
+  if (parsed == null || typeof parsed !== "object" || Array.isArray(parsed)) {
+    log.warn(
+      "reducer output is not a JSON object — falling back to empty result",
+    );
+    return EMPTY_REDUCER_RESULT;
+  }
+  const obj = parsed as Record<string, unknown>;
+  // `{}` is the documented "nothing to extract" answer, not an error.
+  if (Object.keys(obj).length === 0) {
+    return EMPTY_REDUCER_RESULT;
+  }
+  // Check that at least one top-level array key exists
+  const hasRecognizedArray =
+    Array.isArray(obj.timeContexts) ||
+    Array.isArray(obj.openLoops) ||
+    Array.isArray(obj.archiveObservations) ||
+    Array.isArray(obj.archiveEpisodes);
+  if (!hasRecognizedArray) {
+    log.warn(
+      "reducer output has no recognized top-level arrays — falling back to empty result",
+    );
+    return EMPTY_REDUCER_RESULT;
+  }
+  return {
+    timeContexts: collectValid(obj.timeContexts, validateTimeContextOp),
+    openLoops: collectValid(obj.openLoops, validateOpenLoopOp),
+    archiveObservations: collectValid(
+      obj.archiveObservations,
+      validateArchiveObservation,
+    ),
+    archiveEpisodes: collectValid(obj.archiveEpisodes, validateArchiveEpisode),
+  };
+}

package/src/memory/schema/conversations.ts CHANGED Viewed

@@ -30,6 +30,9 @@ export const conversations = sqliteTable(
     forkParentMessageId: text("fork_parent_message_id"),
     isAutoTitle: integer("is_auto_title").notNull().default(1),
     scheduleJobId: text("schedule_job_id"),
+    memoryReducedThroughMessageId: text("memory_reduced_through_message_id"),
+    memoryDirtyTailSinceMessageId: text("memory_dirty_tail_since_message_id"),
+    memoryLastReducedAt: integer("memory_last_reduced_at"),
   },
   (table) => [
     index("idx_conversations_updated_at").on(table.updatedAt),

package/src/memory/schema/index.ts CHANGED Viewed

@@ -3,6 +3,8 @@ export * from "./contacts.js";
 export * from "./conversations.js";
 export * from "./guardian.js";
 export * from "./infrastructure.js";
+export * from "./memory-archive.js";
+export * from "./memory-brief.js";
 export * from "./memory-core.js";
 export * from "./notifications.js";
 export * from "./oauth.js";

package/src/memory/schema/memory-archive.ts ADDED Viewed

@@ -0,0 +1,121 @@
+import {
+  index,
+  integer,
+  sqliteTable,
+  text,
+  uniqueIndex,
+} from "drizzle-orm/sqlite-core";
+import { conversations, messages } from "./conversations.js";
+/**
+ * Raw observation records captured from conversation turns. Each observation
+ * is a single factual statement extracted from user or assistant messages,
+ * annotated with modality and source metadata for downstream recall.
+ *
+ * Referential behavior: deleting the parent conversation deletes its
+ * observations (cascade); deleting the linked message only clears
+ * `message_id` (set null), so the observation survives.
+ */
+export const memoryObservations = sqliteTable(
+  "memory_observations",
+  {
+    id: text("id").primaryKey(),
+    /** Memory scope the row belongs to; falls back to "default" when omitted. */
+    scopeId: text("scope_id").notNull().default("default"),
+    conversationId: text("conversation_id")
+      .notNull()
+      .references(() => conversations.id, { onDelete: "cascade" }),
+    /** Optional link to the originating message; nullable. */
+    messageId: text("message_id").references(() => messages.id, {
+      onDelete: "set null",
+    }),
+    /** The role that produced the observation (e.g. "user", "assistant"). */
+    role: text("role").notNull(),
+    /** Free-text statement capturing the observed fact. */
+    content: text("content").notNull(),
+    /**
+     * Modality of the source material: "text", "voice", "image", etc.
+     * Enables downstream filters for recall relevance.
+     */
+    modality: text("modality").notNull().default("text"),
+    /**
+     * Source channel or interface that produced the observation
+     * (e.g. "vellum", "telegram", "phone").
+     */
+    source: text("source"),
+    createdAt: integer("created_at").notNull(),
+  },
+  (table) => [
+    index("idx_memory_observations_scope_id").on(table.scopeId),
+    index("idx_memory_observations_conversation_id").on(table.conversationId),
+    index("idx_memory_observations_created_at").on(table.createdAt),
+  ],
+);
+/**
+ * Deduplicated content chunks derived from observations. Chunks are the unit
+ * of embedding and recall — each chunk carries a contentHash for idempotent
+ * dual-write safety so the same content is never stored twice.
+ *
+ * Uniqueness is enforced per scope: the unique index covers the pair
+ * (scope_id, content_hash), so identical content may exist in different
+ * scopes. Chunks are deleted together with their parent observation (cascade).
+ */
+export const memoryChunks = sqliteTable(
+  "memory_chunks",
+  {
+    id: text("id").primaryKey(),
+    /** Memory scope the row belongs to; falls back to "default" when omitted. */
+    scopeId: text("scope_id").notNull().default("default"),
+    observationId: text("observation_id")
+      .notNull()
+      .references(() => memoryObservations.id, { onDelete: "cascade" }),
+    /** The chunk text used for embedding and recall. */
+    content: text("content").notNull(),
+    /** Token count estimate for context-window budgeting. */
+    tokenEstimate: integer("token_estimate").notNull(),
+    /**
+     * SHA-256 hash of the normalized content, used to skip duplicate inserts
+     * during dual-write windows.
+     */
+    contentHash: text("content_hash").notNull(),
+    createdAt: integer("created_at").notNull(),
+  },
+  (table) => [
+    index("idx_memory_chunks_scope_id").on(table.scopeId),
+    index("idx_memory_chunks_observation_id").on(table.observationId),
+    // Composite unique key: one row per (scope, content hash).
+    uniqueIndex("idx_memory_chunks_content_hash").on(
+      table.scopeId,
+      table.contentHash,
+    ),
+    index("idx_memory_chunks_created_at").on(table.createdAt),
+  ],
+);
+/**
+ * Episode records that group related observations into coherent narrative
+ * units. An episode represents a meaningful interaction or topic span,
+ * with source-link metadata for provenance tracking.
+ *
+ * Note: this table holds no foreign key to individual observations; an
+ * episode is tied only to its conversation and is deleted with it (cascade).
+ */
+export const memoryEpisodes = sqliteTable(
+  "memory_episodes",
+  {
+    id: text("id").primaryKey(),
+    /** Memory scope the row belongs to; falls back to "default" when omitted. */
+    scopeId: text("scope_id").notNull().default("default"),
+    conversationId: text("conversation_id")
+      .notNull()
+      .references(() => conversations.id, { onDelete: "cascade" }),
+    /** Human-readable title summarizing the episode. */
+    title: text("title").notNull(),
+    /** Longer narrative summary of the episode content. */
+    summary: text("summary").notNull(),
+    /** Token count estimate for the summary. */
+    tokenEstimate: integer("token_estimate").notNull(),
+    /**
+     * Source channel or interface that produced the episode
+     * (mirrors observation.source for episode-level filtering).
+     */
+    source: text("source"),
+    /** Epoch-ms timestamp of the earliest observation in the episode. */
+    startAt: integer("start_at").notNull(),
+    /** Epoch-ms timestamp of the latest observation in the episode. */
+    endAt: integer("end_at").notNull(),
+    createdAt: integer("created_at").notNull(),
+    updatedAt: integer("updated_at").notNull(),
+  },
+  (table) => [
+    index("idx_memory_episodes_scope_id").on(table.scopeId),
+    index("idx_memory_episodes_conversation_id").on(table.conversationId),
+    index("idx_memory_episodes_created_at").on(table.createdAt),
+  ],
+);

package/src/memory/schema/memory-brief.ts ADDED Viewed

@@ -0,0 +1,55 @@
+import { index, integer, sqliteTable, text } from "drizzle-orm/sqlite-core";
+/**
+ * Time contexts represent bounded temporal windows that are relevant to the
+ * assistant's current awareness — e.g. "user is traveling next week",
+ * "quarterly planning period ends Friday".  Each row captures one window
+ * with an activation range and a human-readable summary the brief can surface.
+ *
+ * `scope_id` is required and has no default here. The single index is the
+ * composite (scope_id, active_until).
+ */
+export const timeContexts = sqliteTable(
+  "time_contexts",
+  {
+    id: text("id").primaryKey(),
+    scopeId: text("scope_id").notNull(),
+    summary: text("summary").notNull(),
+    source: text("source").notNull(), // e.g. 'conversation', 'schedule', 'manual'
+    activeFrom: integer("active_from").notNull(), // epoch ms — window start
+    activeUntil: integer("active_until").notNull(), // epoch ms — window end
+    createdAt: integer("created_at").notNull(),
+    updatedAt: integer("updated_at").notNull(),
+  },
+  (table) => [
+    // Composite index: scope first, then window end.
+    index("idx_time_contexts_scope_active_until").on(
+      table.scopeId,
+      table.activeUntil,
+    ),
+  ],
+);
+/**
+ * Open loops track unresolved items the assistant should follow up on —
+ * e.g. "waiting for Bob's reply", "need to file taxes before April 15".
+ * Each row carries a status and an optional due date so the brief can
+ * prioritise which loops to surface.
+ *
+ * `scope_id` is required and has no default here. New rows start with status
+ * 'open' unless a status is supplied. The single index is the composite
+ * (scope_id, status, due_at).
+ */
+export const openLoops = sqliteTable(
+  "open_loops",
+  {
+    id: text("id").primaryKey(),
+    scopeId: text("scope_id").notNull(),
+    summary: text("summary").notNull(),
+    status: text("status").notNull().default("open"), // 'open' | 'resolved' | 'expired'
+    source: text("source").notNull(), // e.g. 'conversation', 'followup', 'manual'
+    dueAt: integer("due_at"), // epoch ms — optional deadline
+    surfacedAt: integer("surfaced_at"), // epoch ms — last time shown in brief
+    createdAt: integer("created_at").notNull(),
+    updatedAt: integer("updated_at").notNull(),
+  },
+  (table) => [
+    // Composite index: scope, then status, then due date.
+    index("idx_open_loops_scope_status_due").on(
+      table.scopeId,
+      table.status,
+      table.dueAt,
+    ),
+  ],
+);

package/src/memory/search/semantic.ts CHANGED Viewed

@@ -61,6 +61,7 @@ export async function semanticSearch(
         fetchLimit,
         ["item", "summary", "segment", "media"],
         excludedMessageIds,
+        scopeIds,
       ),
     );
   }
@@ -277,13 +278,13 @@ export async function semanticSearch(
  * Build a Qdrant filter for hybrid search. Mirrors the logic in
  * `searchWithFilter` but as a standalone object for the query API.
  *
- * Scope filtering: items and media store `memory_scope_id` on the Qdrant
- * point payload, so we can filter at the Qdrant level. Segments and
- * summaries rely on post-query DB filtering (same as dense-only search).
+ * Scope filtering: points with a `memory_scope_id` payload field are
+ * filtered at the Qdrant level. Legacy points without the field pass
+ * through and are caught by post-query DB filtering.
  */
 function buildHybridFilter(
   excludeMessageIds: string[],
-  _scopeIds?: string[],
+  scopeIds?: string[],
 ): Record<string, unknown> {
   const mustConditions: Array<Record<string, unknown>> = [
     {
@@ -310,6 +311,18 @@ function buildHybridFilter(
     });
   }
+  // Scope filtering: accept points whose memory_scope_id matches one of the
+  // allowed scopes, OR points that lack the field entirely (legacy data).
+  // Post-query DB filtering remains as defense-in-depth for legacy points.
+  if (scopeIds && scopeIds.length > 0) {
+    mustConditions.push({
+      should: [
+        { key: "memory_scope_id", match: { any: scopeIds } },
+        { is_empty: { key: "memory_scope_id" } },
+      ],
+    });
+  }
   const mustNotConditions: Array<Record<string, unknown>> = [
     { key: "_meta", match: { value: true } },
   ];