npm - @vellumai/assistant - Versions diffs - 0.5.3 → 0.5.5 - Mend

@vellumai/assistant 0.5.3 → 0.5.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (111) hide show

package/Dockerfile +18 -27
package/docs/architecture/memory.md +105 -0
package/node_modules/@vellumai/ces-contracts/src/index.ts +1 -0
package/node_modules/@vellumai/ces-contracts/src/trust-rules.ts +42 -0
package/package.json +1 -1
package/src/__tests__/archive-recall.test.ts +560 -0
package/src/__tests__/conversation-clear-safety.test.ts +259 -0
package/src/__tests__/conversation-switch-memory-reduction.test.ts +474 -0
package/src/__tests__/credential-security-invariants.test.ts +2 -0
package/src/__tests__/db-schedule-syntax-migration.test.ts +3 -0
package/src/__tests__/memory-reducer-job.test.ts +538 -0
package/src/__tests__/memory-reducer-scheduling.test.ts +473 -0
package/src/__tests__/memory-reducer-types.test.ts +12 -4
package/src/__tests__/memory-reducer.test.ts +7 -1
package/src/__tests__/memory-regressions.test.ts +24 -4
package/src/__tests__/memory-simplified-config.test.ts +4 -4
package/src/__tests__/openai-whisper.test.ts +93 -0
package/src/__tests__/simplified-memory-e2e.test.ts +666 -0
package/src/__tests__/simplified-memory-runtime.test.ts +616 -0
package/src/__tests__/slack-messaging-token-resolution.test.ts +319 -0
package/src/__tests__/volume-security-guard.test.ts +155 -0
package/src/cli/commands/conversations.ts +18 -0
package/src/config/bundled-skills/messaging/tools/shared.ts +1 -0
package/src/config/bundled-skills/schedule/TOOLS.json +8 -0
package/src/config/bundled-skills/transcribe/tools/transcribe-media.ts +16 -37
package/src/config/env-registry.ts +9 -0
package/src/config/feature-flag-registry.json +8 -0
package/src/config/loader.ts +0 -1
package/src/config/schemas/memory-simplified.ts +1 -1
package/src/credential-execution/managed-catalog.ts +5 -15
package/src/daemon/config-watcher.ts +4 -1
package/src/daemon/conversation-memory.ts +117 -0
package/src/daemon/conversation-runtime-assembly.ts +1 -0
package/src/daemon/daemon-control.ts +7 -0
package/src/daemon/handlers/conversations.ts +11 -0
package/src/daemon/lifecycle.ts +51 -2
package/src/daemon/providers-setup.ts +2 -1
package/src/hooks/manager.ts +7 -0
package/src/instrument.ts +33 -1
package/src/memory/archive-recall.ts +516 -0
package/src/memory/brief-time.ts +5 -4
package/src/memory/conversation-crud.ts +210 -0
package/src/memory/conversation-key-store.ts +33 -4
package/src/memory/db-init.ts +4 -0
package/src/memory/embedding-local.ts +11 -5
package/src/memory/job-handlers/backfill-simplified-memory.ts +462 -0
package/src/memory/job-handlers/conversation-starters.ts +24 -30
package/src/memory/job-handlers/reduce-conversation-memory.ts +229 -0
package/src/memory/jobs-store.ts +2 -0
package/src/memory/jobs-worker.ts +8 -0
package/src/memory/migrations/036-normalize-phone-identities.ts +49 -14
package/src/memory/migrations/135-backfill-contact-interaction-stats.ts +9 -1
package/src/memory/migrations/141-rename-verification-table.ts +8 -0
package/src/memory/migrations/142-rename-verification-session-id-column.ts +7 -2
package/src/memory/migrations/174-rename-thread-starters-table.ts +8 -0
package/src/memory/migrations/188-schedule-quiet-flag.ts +13 -0
package/src/memory/migrations/index.ts +1 -0
package/src/memory/reducer-scheduler.ts +242 -0
package/src/memory/reducer-types.ts +9 -2
package/src/memory/reducer.ts +25 -11
package/src/memory/schema/infrastructure.ts +1 -0
package/src/messaging/provider.ts +9 -0
package/src/messaging/providers/slack/adapter.ts +29 -2
package/src/oauth/connection-resolver.test.ts +22 -18
package/src/oauth/connection-resolver.ts +92 -7
package/src/oauth/platform-connection.test.ts +78 -69
package/src/oauth/platform-connection.ts +12 -19
package/src/permissions/trust-client.ts +343 -0
package/src/permissions/trust-store-interface.ts +105 -0
package/src/permissions/trust-store.ts +523 -36
package/src/platform/client.test.ts +148 -0
package/src/platform/client.ts +71 -0
package/src/providers/speech-to-text/openai-whisper.test.ts +190 -0
package/src/providers/speech-to-text/openai-whisper.ts +68 -0
package/src/providers/speech-to-text/resolve.ts +9 -0
package/src/providers/speech-to-text/types.ts +17 -0
package/src/runtime/auth/route-policy.ts +10 -1
package/src/runtime/http-server.ts +2 -2
package/src/runtime/routes/conversation-management-routes.ts +88 -2
package/src/runtime/routes/guardian-bootstrap-routes.ts +19 -7
package/src/runtime/routes/inbound-message-handler.ts +27 -3
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +16 -1
package/src/runtime/routes/inbound-stages/transcribe-audio.test.ts +287 -0
package/src/runtime/routes/inbound-stages/transcribe-audio.ts +122 -0
package/src/runtime/routes/log-export-routes.ts +1 -0
package/src/runtime/routes/secret-routes.ts +5 -1
package/src/schedule/schedule-store.ts +7 -0
package/src/schedule/scheduler.ts +6 -2
package/src/security/ces-credential-client.ts +173 -0
package/src/security/secure-keys.ts +65 -22
package/src/signals/bash.ts +3 -0
package/src/signals/cancel.ts +3 -0
package/src/signals/confirm.ts +3 -0
package/src/signals/conversation-undo.ts +3 -0
package/src/signals/event-stream.ts +7 -0
package/src/signals/shotgun.ts +3 -0
package/src/signals/trust-rule.ts +3 -0
package/src/telemetry/usage-telemetry-reporter.test.ts +23 -36
package/src/telemetry/usage-telemetry-reporter.ts +22 -20
package/src/tools/filesystem/edit.ts +6 -1
package/src/tools/filesystem/read.ts +6 -1
package/src/tools/filesystem/write.ts +6 -1
package/src/tools/memory/handlers.ts +129 -1
package/src/tools/schedule/create.ts +3 -0
package/src/tools/schedule/list.ts +5 -1
package/src/tools/schedule/update.ts +6 -0
package/src/util/device-id.ts +70 -7
package/src/util/logger.ts +35 -9
package/src/util/platform.ts +29 -5
package/src/workspace/migrations/migrate-to-workspace-volume.ts +113 -0
package/src/workspace/migrations/registry.ts +2 -0

package/src/memory/job-handlers/backfill-simplified-memory.ts ADDED Viewed

@@ -0,0 +1,462 @@
+/**
+ * Backfill job handler: migrates legacy memory rows into the simplified memory
+ * system without deleting the old tables.
+ *
+ * Migration mapping:
+ *   - `memory_segments` -> `memory_chunks` (via `memory_observations`)
+ *   - `memory_summaries` -> `memory_episodes`
+ *   - Active/high-confidence `memory_items` -> `memory_observations`,
+ *     plus `time_contexts` or `open_loops` when the mapping is unambiguous.
+ *
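+ * Normal (non-forced) re-runs are idempotent: checkpoint tracking resumes each
+ * phase after the last processed row, and chunks are deduplicated by content
+ * hash. A forced run resets the checkpoints and reprocesses every legacy row.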
+ */
+import { eq } from "drizzle-orm";
+import { v4 as uuid } from "uuid";
+import { estimateTextTokens } from "../../context/token-estimator.js";
+import { getLogger } from "../../util/logger.js";
+import {
+  computeChunkContentHash,
+  insertObservation,
+} from "../archive-store.js";
+import { getMemoryCheckpoint, setMemoryCheckpoint } from "../checkpoints.js";
+import { getDb, rawAll } from "../db.js";
+import type { MemoryJob } from "../jobs-store.js";
+import { enqueueMemoryJob } from "../jobs-store.js";
+import {
+  conversations,
+  memoryChunks,
+  memoryEpisodes,
+  memoryObservations,
+  openLoops,
+  timeContexts,
+} from "../schema.js";
+const log = getLogger("backfill-simplified-memory");
+/**
+ * Checkpoint keys for tracking backfill progress.
+ *
+ * Each `*:last_id` key stores the id of the last legacy row handled by its
+ * phase; the next batch of that phase selects rows with a strictly greater id.
+ * The `complete` key is set to "true" once all three phases have finished and
+ * back to "false" when a forced run resets the backfill.
+ */
+const CHECKPOINT_SEGMENTS = "simplified_backfill:segments:last_id";
+const CHECKPOINT_SUMMARIES = "simplified_backfill:summaries:last_id";
+const CHECKPOINT_ITEMS = "simplified_backfill:items:last_id";
+const CHECKPOINT_COMPLETE = "simplified_backfill:complete";
+/**
+ * Batch size for each migration pass: the maximum number of legacy rows a
+ * phase reads per job run. A batch of exactly this size is treated as
+ * "more rows may remain" and causes the job to re-enqueue itself.
+ */
+const BATCH_SIZE = 200;
+// ── Legacy row types ──────────────────────────────────────────────────
+interface LegacySegment { // columns selected from `memory_segments` by migrateSegments
+  id: string; // ordering key of the batch query; the last id is stored as the segments checkpoint
+  message_id: string; // forwarded to insertObservation as messageId
+  conversation_id: string; // forwarded to insertObservation as conversationId
+  role: string; // forwarded to insertObservation unchanged
+  text: string; // becomes the observation content
+  token_estimate: number; // selected but not read by the migration
+  scope_id: string; // forwarded to insertObservation as scopeId
+  content_hash: string | null; // selected but not read by the migration
+  created_at: number; // selected but not read by the migration
+}
+interface LegacySummary { // columns selected from `memory_summaries` by migrateSummaries
+  id: string; // ordering key of the batch query; the last id is stored as the summaries checkpoint
+  scope: string; // used with scope_key to derive the conversation id and the episode title
+  scope_key: string; // see extractConversationId for the accepted forms
+  summary: string; // copied to the episode's summary
+  token_estimate: number; // copied to the episode's tokenEstimate
+  scope_id: string; // copied to the episode's scopeId
+  start_at: number; // copied to the episode's startAt
+  end_at: number; // copied to the episode's endAt
+  created_at: number; // selected but not read; episodes are stamped with the migration time instead
+}
+interface LegacyItem { // columns selected from `memory_items` by migrateItems
+  id: string; // ordering key of the batch query; the last id is stored as the items checkpoint
+  kind: string; // prefixes the observation content; "event" items may become open loops
+  subject: string; // part of the observation content and of brief-state summaries
+  statement: string; // part of the observation content and of brief-state summaries
+  status: string; // filtered in SQL (status = 'active'); not read afterwards
+  confidence: number; // filtered in SQL (confidence >= 0.5); not read afterwards
+  scope_id: string; // copied to every row written for this item
+  first_seen_at: number; // selected but not read by the migration
+  last_seen_at: number; // compared with Date.now() — presumably epoch milliseconds, TODO confirm
+  valid_from: number | null; // start of the validity window used for time_contexts
+  invalid_at: number | null; // end of the validity window; compared with Date.now() in mapItemToBriefState
+}
+// ── Entry point ───────────────────────────────────────────────────────
+/**
+ * Job entry point for the simplified-memory backfill.
+ *
+ * Runs the three migration phases in order (segments, summaries, items). Each
+ * phase processes at most one batch per invocation; as soon as a phase reports
+ * that more rows may remain, the job re-enqueues itself and returns, so a full
+ * backfill is spread over many job runs.
+ *
+ * @param job - The queued job. `payload.force === true` resets every
+ *   checkpoint and restarts the backfill from the beginning.
+ */
+export async function backfillSimplifiedMemoryJob(
+  job: MemoryJob,
+): Promise<void> {
+  if (job.payload.force === true) {
+    // Reset all checkpoints so the backfill restarts from scratch
+    setMemoryCheckpoint(CHECKPOINT_SEGMENTS, "");
+    setMemoryCheckpoint(CHECKPOINT_SUMMARIES, "");
+    setMemoryCheckpoint(CHECKPOINT_ITEMS, "");
+    setMemoryCheckpoint(CHECKPOINT_COMPLETE, "false");
+  } else if (getMemoryCheckpoint(CHECKPOINT_COMPLETE) === "true") {
+    log.debug("Simplified memory backfill already complete, skipping");
+    return;
+  }
+  // Phase order matters: a later phase only starts once the earlier ones
+  // report that they have no further rows.
+  //   1. memory_segments  -> memory_observations + memory_chunks
+  //   2. memory_summaries -> memory_episodes
+  //   3. memory_items     -> memory_observations (+ brief-state)
+  const phases = [migrateSegments, migrateSummaries, migrateItems];
+  for (const runPhase of phases) {
+    const moreRowsPending = runPhase();
+    if (moreRowsPending) {
+      // The follow-up job is enqueued without `force`, so it resumes from
+      // the checkpoints instead of resetting them again.
+      enqueueMemoryJob("backfill_simplified_memory", {});
+      return;
+    }
+  }
+  // All phases complete
+  setMemoryCheckpoint(CHECKPOINT_COMPLETE, "true");
+  log.info("Simplified memory backfill completed");
+}
+// ── Phase 1: Segments ─────────────────────────────────────────────────
+/**
+ * Phase 1: migrate one batch of legacy `memory_segments` rows by inserting
+ * each as an observation.
+ *
+ * A row that fails to insert is logged and skipped; the checkpoint still
+ * advances past it, so it is not retried on later runs.
+ *
+ * @returns true when the batch was full (more rows may remain), false when
+ *   the table is exhausted.
+ */
+function migrateSegments(): boolean {
+  const cursor = getMemoryCheckpoint(CHECKPOINT_SEGMENTS) ?? "";
+  const batch = rawAll<LegacySegment>(
+    `SELECT id, message_id, conversation_id, role, text, token_estimate,
+            scope_id, content_hash, created_at
+     FROM memory_segments
+     WHERE id > ?
+     ORDER BY id ASC
+     LIMIT ?`,
+    cursor,
+    BATCH_SIZE,
+  );
+  const batchCount = batch.length;
+  if (batchCount === 0) return false;
+  batch.forEach((row) => {
+    try {
+      // Insert as an observation — insertObservation handles chunk dedup
+      insertObservation({
+        conversationId: row.conversation_id,
+        messageId: row.message_id,
+        role: row.role,
+        content: row.text,
+        scopeId: row.scope_id,
+        modality: "text",
+        source: "backfill:segment",
+      });
+    } catch (err) {
+      // Best effort: one bad row must not block the rest of the batch.
+      log.warn(
+        { err, segmentId: row.id },
+        "Failed to migrate segment, skipping",
+      );
+    }
+  });
+  const finalId = batch[batchCount - 1].id;
+  setMemoryCheckpoint(CHECKPOINT_SEGMENTS, finalId);
+  log.debug(
+    { migrated: batchCount, lastId: finalId },
+    "Migrated segment batch",
+  );
+  return batchCount === BATCH_SIZE;
+}
+// ── Phase 2: Summaries ────────────────────────────────────────────────
+/**
+ * Phase 2: migrate one batch of legacy `memory_summaries` rows into
+ * `memory_episodes`.
+ *
+ * Only summaries that resolve to a conversation id are migrated; the rest are
+ * logged at debug level and skipped. Each inserted episode gets an
+ * `embed_episode` job. Per-row failures are logged and skipped, and the
+ * checkpoint advances past them.
+ *
+ * @returns true when the batch was full (more rows may remain), false when
+ *   the table is exhausted.
+ */
+function migrateSummaries(): boolean {
+  const cursor = getMemoryCheckpoint(CHECKPOINT_SUMMARIES) ?? "";
+  const batch = rawAll<LegacySummary>(
+    `SELECT id, scope, scope_key, summary, token_estimate, scope_id,
+            start_at, end_at, created_at
+     FROM memory_summaries
+     WHERE id > ?
+     ORDER BY id ASC
+     LIMIT ?`,
+    cursor,
+    BATCH_SIZE,
+  );
+  const batchCount = batch.length;
+  if (batchCount === 0) return false;
+  const db = getDb();
+  // Episodes are stamped with the migration time; the legacy created_at
+  // column is selected but not carried over.
+  const migratedAt = Date.now();
+  batch.forEach((row) => {
+    try {
+      // scope_key format: "conversation:<conversationId>" or "<scope>:<key>"
+      const conversationId = extractConversationId(row.scope, row.scope_key);
+      if (!conversationId) {
+        log.debug(
+          { summaryId: row.id, scope: row.scope, scopeKey: row.scope_key },
+          "Skipping non-conversation summary",
+        );
+        return;
+      }
+      const episodeId = uuid();
+      // NOTE(review): the id is freshly generated, so onConflictDoNothing only
+      // takes effect if memory_episodes has another unique constraint —
+      // confirm against the schema.
+      db.insert(memoryEpisodes)
+        .values({
+          id: episodeId,
+          scopeId: row.scope_id,
+          conversationId,
+          title: buildEpisodeTitle(row.scope, row.scope_key),
+          summary: row.summary,
+          tokenEstimate: row.token_estimate,
+          source: "backfill:summary",
+          startAt: row.start_at,
+          endAt: row.end_at,
+          createdAt: migratedAt,
+          updatedAt: migratedAt,
+        })
+        .onConflictDoNothing()
+        .run();
+      // Enqueue embedding for the new episode
+      enqueueMemoryJob("embed_episode", { episodeId });
+    } catch (err) {
+      log.warn(
+        { err, summaryId: row.id },
+        "Failed to migrate summary, skipping",
+      );
+    }
+  });
+  const finalId = batch[batchCount - 1].id;
+  setMemoryCheckpoint(CHECKPOINT_SUMMARIES, finalId);
+  log.debug(
+    { migrated: batchCount, lastId: finalId },
+    "Migrated summary batch",
+  );
+  return batchCount === BATCH_SIZE;
+}
+// ── Phase 3: Items ────────────────────────────────────────────────────
+/**
+ * Conversation id assigned to observations created from legacy items, which
+ * carry no conversation linkage of their own.
+ */
+const LEGACY_SENTINEL_CONVERSATION_ID = "__legacy_backfill__";
+/**
+ * Create the sentinel conversation row if it is not there yet.
+ *
+ * memory_observations has a FK constraint on conversation_id, so the row must
+ * exist before any item-derived observation is inserted.
+ */
+function ensureLegacySentinelConversation(): void {
+  const db = getDb();
+  const sentinelRow = db
+    .select({ id: conversations.id })
+    .from(conversations)
+    .where(eq(conversations.id, LEGACY_SENTINEL_CONVERSATION_ID))
+    .get();
+  if (!sentinelRow) {
+    const timestamp = Date.now();
+    db.insert(conversations)
+      .values({
+        id: LEGACY_SENTINEL_CONVERSATION_ID,
+        title: "[Legacy Memory Backfill]",
+        createdAt: timestamp,
+        updatedAt: timestamp,
+      })
+      .run();
+  }
+}
+/**
+ * Phase 3: migrate one batch of legacy `memory_items` rows.
+ *
+ * Every selected item becomes a `memory_observations` row attached to the
+ * legacy sentinel conversation, plus a content-hash-deduplicated
+ * `memory_chunks` row and an `embed_chunk` job. Items are then offered to
+ * mapItemToBriefState, which may add a `time_contexts` or `open_loops` row.
+ *
+ * Selection: active items with confidence >= 0.5 that are still valid, i.e.
+ * `invalid_at` is NULL or lies in the future. Items with a future
+ * `invalid_at` must be included because they are the only rows that
+ * mapItemToBriefState can turn into time contexts.
+ *
+ * Per-row failures are logged and skipped; the checkpoint advances past them.
+ *
+ * @returns true when the batch was full (more rows may remain), false when
+ *   no further matching rows exist.
+ */
+function migrateItems(): boolean {
+  const lastId = getMemoryCheckpoint(CHECKPOINT_ITEMS) ?? "";
+  // Taken before the query so the SQL validity filter and the brief-state
+  // mapping below compare against the same instant.
+  const now = Date.now();
+  const items = rawAll<LegacyItem>(
+    `SELECT id, kind, subject, statement, status, confidence, scope_id,
+            first_seen_at, last_seen_at, valid_from, invalid_at
+     FROM memory_items
+     WHERE id > ?
+       AND status = 'active'
+       AND confidence >= 0.5
+       AND (invalid_at IS NULL OR invalid_at > ?)
+     ORDER BY id ASC
+     LIMIT ?`,
+    lastId,
+    now,
+    BATCH_SIZE,
+  );
+  if (items.length === 0) return false;
+  // Ensure the sentinel conversation exists for items without conversation linkage
+  ensureLegacySentinelConversation();
+  const db = getDb();
+  for (const item of items) {
+    try {
+      // Every active item becomes an observation
+      const observationId = uuid();
+      const observationContent = `[${item.kind}] ${item.subject}: ${item.statement}`;
+      db.insert(memoryObservations)
+        .values({
+          id: observationId,
+          scopeId: item.scope_id,
+          conversationId: LEGACY_SENTINEL_CONVERSATION_ID,
+          role: "user",
+          content: observationContent,
+          modality: "text",
+          source: "backfill:item",
+          createdAt: now,
+        })
+        .run();
+      // Create a chunk for the observation (with dedup)
+      const contentHash = computeChunkContentHash(
+        item.scope_id,
+        observationContent,
+      );
+      const chunkId = uuid();
+      const tokenEstimate = estimateTextTokens(observationContent);
+      db.insert(memoryChunks)
+        .values({
+          id: chunkId,
+          scopeId: item.scope_id,
+          observationId,
+          content: observationContent,
+          tokenEstimate,
+          contentHash,
+          createdAt: now,
+        })
+        .onConflictDoNothing({
+          target: [memoryChunks.scopeId, memoryChunks.contentHash],
+        })
+        .run();
+      // Enqueue embedding for the observation's chunk.
+      // NOTE(review): when the insert above is skipped by the dedup conflict,
+      // no row with this chunkId exists — confirm the embed_chunk handler
+      // tolerates an unknown chunk id.
+      enqueueMemoryJob("embed_chunk", { chunkId, scopeId: item.scope_id });
+      // ── Brief-state: map unambiguous items to time_contexts or open_loops
+      mapItemToBriefState(item, now);
+    } catch (err) {
+      log.warn({ err, itemId: item.id }, "Failed to migrate item, skipping");
+    }
+  }
+  const lastItem = items[items.length - 1];
+  setMemoryCheckpoint(CHECKPOINT_ITEMS, lastItem.id);
+  log.debug(
+    { migrated: items.length, lastId: lastItem.id },
+    "Migrated item batch",
+  );
+  return items.length === BATCH_SIZE;
+}
+// ── Brief-state mapping ───────────────────────────────────────────────
+/**
+ * Derive at most one brief-state row from a legacy memory item, and only
+ * when the mapping is unambiguous.
+ *
+ * - `valid_from` set and `invalid_at` set to a time after `now`
+ *   -> one `time_contexts` row spanning that window
+ * - otherwise, kind `event` with `last_seen_at` after `now`
+ *   -> one `open_loops` row, status "open", due at `last_seen_at`
+ * - anything else -> nothing is written
+ *
+ * @param item - The legacy item being migrated.
+ * @param now - Reference time for the "in the future" checks; also used as
+ *   the created/updated timestamp of the inserted row.
+ */
+function mapItemToBriefState(item: LegacyItem, now: number): void {
+  const db = getDb();
+  const briefSummary = `${item.subject}: ${item.statement}`;
+  const windowStart = item.valid_from;
+  const windowEnd = item.invalid_at;
+  // The time-context check runs first, so an item matching both rules
+  // yields only a time context.
+  if (windowStart != null && windowEnd != null && windowEnd > now) {
+    db.insert(timeContexts)
+      .values({
+        id: uuid(),
+        scopeId: item.scope_id,
+        summary: briefSummary,
+        source: "backfill:item",
+        activeFrom: windowStart,
+        activeUntil: windowEnd,
+        createdAt: now,
+        updatedAt: now,
+      })
+      .run();
+    return;
+  }
+  const isUpcomingEvent = item.kind === "event" && item.last_seen_at > now;
+  if (!isUpcomingEvent) return;
+  db.insert(openLoops)
+    .values({
+      id: uuid(),
+      scopeId: item.scope_id,
+      summary: briefSummary,
+      source: "backfill:item",
+      status: "open",
+      dueAt: item.last_seen_at,
+      createdAt: now,
+      updatedAt: now,
+    })
+    .run();
+}
+// ── Helpers ───────────────────────────────────────────────────────────
+/**
+ * Extract a conversation ID from the summary's scope and scope_key.
+ *
+ * Accepted forms:
+ * - scope_key `conversation:<id>` (any scope) -> `<id>`
+ * - scope `conversation` with a bare, non-empty scope_key -> the scope_key
+ *
+ * The prefixed form is checked first so that a `conversation`-scoped summary
+ * whose key is written as `conversation:<id>` yields the bare id rather than
+ * the prefixed string.
+ *
+ * @param scope - The summary's scope column.
+ * @param scopeKey - The summary's scope_key column.
+ * @returns The conversation id, or null for non-conversation summaries and
+ *   for an empty scope_key.
+ */
+function extractConversationId(scope: string, scopeKey: string): string | null {
+  const prefixed = scopeKey.match(/^conversation:(.+)$/);
+  if (prefixed) return prefixed[1];
+  // Conversation summaries may also use the bare ID as scope_key
+  if (scope === "conversation" && scopeKey.length > 0) return scopeKey;
+  return null;
+}
+/**
+ * Produce the human-readable title stored on a migrated episode.
+ *
+ * @param scope - The summary's scope; `conversation`, `weekly` and `monthly`
+ *   get dedicated titles, any other value is used verbatim as a prefix.
+ * @param scopeKey - The summary's scope_key; shown in parentheses for weekly
+ *   and monthly titles only.
+ * @returns The episode title.
+ */
+function buildEpisodeTitle(scope: string, scopeKey: string): string {
+  switch (scope) {
+    case "conversation":
+      return "Conversation summary";
+    case "weekly":
+      return `Weekly summary (${scopeKey})`;
+    case "monthly":
+      return `Monthly summary (${scopeKey})`;
+    default:
+      return `${scope} summary`;
+  }
+}

package/src/memory/job-handlers/conversation-starters.ts CHANGED Viewed

@@ -176,11 +176,11 @@ async function generateStarters(scopeId: string): Promise<GeneratedStarter[]> {
     ? truncate(rawIdentityContext, 2000, "\n…[truncated]")
     : null;
-  const systemPrompt = `You are generating 4 conversation starters for a personal assistant app. These appear as clickable chips on the empty conversation page — the first thing the user sees when they open the app.
+  const systemPrompt = `You are generating 4 conversation starters for a personal assistant app. These appear as clickable chips on the empty conversation page — the first thing the user sees when they open the app. Clicking a chip sends its prompt as a message from the user.
 ${timeContext}
-Your goal: look at what's going on in this person's life right now and suggest the 4 most useful things they could ask you to do. Think about what a thoughtful chief of staff would proactively bring up in a 30-second check-in.
+Your goal: suggest the 4 most useful things this person could ask you to do right now.
 ${identityContext ? `## Assistant identity & user profile\n\n${identityContext}\n\n` : ""}## What you know
@@ -188,7 +188,9 @@ ${rollup}
 ${diff}
 ${skills}
-## How to think about this
+## Selection
+Generate exactly 4 starters, ranked #1 (best) to #4.
 Start from the user's situation, not from the skill list. Ask yourself:
 - What is this person likely dealing with right now (given the day/time and their context)?
@@ -197,11 +199,7 @@ Start from the user's situation, not from the skill list. Ask yourself:
 The skills list tells you what the assistant CAN do — use it to filter out suggestions the assistant can't actually help with, not as a menu to generate suggestions from.
-## Selection
-Generate exactly 4 starters, ranked #1 (best) to #4.
-For each, you must be able to clearly answer:
+For each starter, you must clearly answer:
 - Why now? (timing — day of week, recent activity, upcoming deadline)
 - Why this user? (grounded in their specific context, not generic)
 - Why would they be glad I suggested this? (genuine usefulness, not just relevance)
@@ -218,38 +216,34 @@ Favor what is live over what is merely true. Recent changes matter more than old
 ## Output format
-Return exactly 4 starters in rank order (best first).
 Each starter has:
-- label: 3-6 words, max 40 chars, starts with a verb. Should sound like a smart offer of help, not a feature name or task description. Must sound natural when read aloud.
-- prompt: 1-2 natural sentences, written as the user would actually say them — not templated.
+- label: 3-6 words, max 40 chars, starts with a verb. Written in the user's voice — something they'd want to do, not something the assistant is offering.
+- prompt: 1-2 natural sentences, as the user would actually say them.
 - category: one of ${CONVERSATION_STARTER_CATEGORIES.join(", ")}
-The 4 starters should feel like one coherent set of recommendations for this moment — similar abstraction level, no jarring mix of mundane chores and life strategy. Don't lift raw memory phrases, project names, or jargon into labels unless they already sound natural in conversation.
-Never include a chip whose primary meaning is configuration, setup, workflow creation, or "set up X for Y" unless it solves an urgent pain the user is actively feeling right now. Prefer the outcome over the mechanism — "Catch the emails that matter" beats "Set up a playbook for inbox."
+## Constraints
-## Topic diversity
+**Voice**: The user clicks these chips to send a message. Every label must read as something the user is asking to do, never something the assistant is saying to the user.
-Each chip should cover a distinct topic or concern. Never have two chips about the same tool, project, or theme — even if there are multiple related issues. Pick the single most impactful angle and give the other slot to something different. Four chips about three topics is too narrow; four chips about four topics is right.
+**Coherence**: The 4 starters should feel like one set — similar abstraction level, no jarring mix of mundane chores and life strategy.
-## User-facingness check
+**Diversity**: Each chip covers a distinct topic. Never two chips about the same tool, project, or theme. Four topics, four chips.
-If a label sounds like an issue title, project ticket, or implementation task, rewrite it. Prefer the user-visible payoff over the internal object name. The chip should feel inviting and useful, not merely accurate.
+**No setup chips**: Never include a chip whose primary meaning is configuration or "set up X for Y" unless it solves an urgent pain the user is actively feeling. Prefer the outcome over the mechanism.
-Prefer natural, flowing language over mechanical or operational phrasing. "Get Slack messages flowing" is better than "Restore outgoing Slack messages." The label should sound like something a helpful person would say, not a support ticket.
+**Natural language**: No jargon, project names, or raw memory phrases in labels unless they already sound natural in conversation. If a label sounds like a ticket title or backlog item, rewrite it as something the user would actually say.
-Before finalizing each label, ask yourself: would this feel good to click? Or does it sound like a backlog item? If it sounds like a backlog item, rewrite it.
+## Examples
-Examples of bad vs good:
-- BAD: "Fix Slack Socket Mode blocker" → GOOD: "Fix Slack so it just works"
-- BAD: "Rewire messaging for Socket Mode" → GOOD: "Get Socket Mode stable"
-- BAD: "Review this week's calendar" → GOOD: "Protect this week's focus"
-- BAD: "Model the coaching transition" → GOOD: "Plan the coaching transition"
-- BAD: "Restore outgoing Slack messages" → GOOD: "Get Slack messages flowing"
-- BAD: "Set up a playbook for inbox" → GOOD: "Catch the emails that matter"
+Bad → Good (ticket-speak → natural):
+- "Fix Slack Socket Mode blocker" → "Fix Slack so it just works"
+- "Restore outgoing Slack messages" → "Get Slack messages flowing"
+- "Review this week's calendar" → "Protect this week's focus"
+- "Set up a playbook for inbox" → "Triage my inbox"
-The good versions emphasize the user's payoff, not the internal mechanism.`;
+Bad → Good (assistant voice → user voice):
+- "You've got a busy week ahead" → "Plan my week ahead"
+- "Let me check your calendar" → "Check my Thursday schedule"`;
   const { signal, cleanup } = createTimeout(20000);
   try {
@@ -274,7 +268,7 @@ The good versions emphasize the user's payoff, not the internal mechanism.`;
                     label: {
                       type: "string",
                       description:
-                        "Concierge-quality chip text (2-7 words, max 40 chars, starts with a verb)",
+                        "User-voice chip label (2-7 words, max 40 chars, verb-first)",
                     },
                     prompt: {
                       type: "string",