npm - @vellumai/assistant - Versions diffs - 0.6.0 → 0.6.1 - Mend

@vellumai/assistant 0.6.0 → 0.6.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (285)

package/AGENTS.md +4 -0
package/ARCHITECTURE.md +68 -15
package/Dockerfile +2 -2
package/bun.lock +6 -2
package/docker-entrypoint.sh +32 -1
package/docs/architecture/integrations.md +1 -1
package/docs/architecture/memory.md +21 -24
package/openapi.yaml +538 -3
package/package.json +5 -1
package/src/__tests__/anthropic-provider.test.ts +160 -95
package/src/__tests__/app-dir-path-guard.test.ts +1 -0
package/src/__tests__/app-executors.test.ts +47 -1
package/src/__tests__/app-source-watcher.test.ts +159 -0
package/src/__tests__/checker.test.ts +38 -6
package/src/__tests__/config-schema.test.ts +5 -0
package/src/__tests__/conversation-agent-loop-overflow.test.ts +4 -6
package/src/__tests__/conversation-agent-loop.test.ts +4 -51
package/src/__tests__/conversation-history-web-search.test.ts +1 -1
package/src/__tests__/conversation-runtime-assembly.test.ts +653 -832
package/src/__tests__/conversation-runtime-workspace.test.ts +1 -93
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +17 -4
package/src/__tests__/conversation-wipe.test.ts +2 -6
package/src/__tests__/conversation-workspace-cache-state.test.ts +6 -12
package/src/__tests__/conversation-workspace-injection.test.ts +25 -26
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/copy-composer-tc-templates.test.ts +335 -0
package/src/__tests__/date-context.test.ts +76 -210
package/src/__tests__/db-schedule-syntax-migration.test.ts +16 -1
package/src/__tests__/file-list-tool.test.ts +219 -0
package/src/__tests__/first-greeting.test.ts +1 -1
package/src/__tests__/heartbeat-service.test.ts +180 -3
package/src/__tests__/identity-routes.test.ts +328 -0
package/src/__tests__/injection-block.test.ts +24 -0
package/src/__tests__/install-skill-routing.test.ts +7 -6
package/src/__tests__/jobs-store-qdrant-breaker.test.ts +15 -14
package/src/__tests__/list-messages-tool-merge.test.ts +300 -0
package/src/__tests__/llm-context-normalization.test.ts +18 -18
package/src/__tests__/llm-context-route-provider.test.ts +101 -0
package/src/__tests__/llm-request-log-turn-query.test.ts +162 -0
package/src/__tests__/log-export-workspace.test.ts +72 -105
package/src/__tests__/mcp-abort-signal.test.ts +5 -0
package/src/__tests__/mcp-client-auth.test.ts +5 -0
package/src/__tests__/memory-recall-log-store.test.ts +132 -0
package/src/__tests__/migration-export-streaming.test.ts +304 -0
package/src/__tests__/migration-import-commit-http.test.ts +11 -10
package/src/__tests__/mock-fetch.ts +87 -0
package/src/__tests__/notification-decision-recipient-context.test.ts +282 -0
package/src/__tests__/onboarding-template-contract.test.ts +62 -14
package/src/__tests__/parser.test.ts +32 -0
package/src/__tests__/permission-checker-host-gate.test.ts +452 -0
package/src/__tests__/permission-controls-v2-flag.test.ts +55 -0
package/src/__tests__/permission-mode-sse.test.ts +418 -0
package/src/__tests__/permission-mode-store.test.ts +277 -0
package/src/__tests__/permission-mode.test.ts +101 -0
package/src/__tests__/platform-bash-auto-approve.test.ts +359 -0
package/src/__tests__/profiler-routes.test.ts +502 -0
package/src/__tests__/profiler-run-store.test.ts +441 -0
package/src/__tests__/proxy-approval-callback.test.ts +4 -75
package/src/__tests__/registry.test.ts +1 -1
package/src/__tests__/sandbox-host-parity.test.ts +5 -4
package/src/__tests__/scheduler-reuse-conversation.test.ts +368 -0
package/src/__tests__/scrub-corrupted-image-attachments.test.ts +278 -0
package/src/__tests__/search-skills-unified.test.ts +4 -3
package/src/__tests__/send-endpoint-busy.test.ts +42 -3
package/src/__tests__/set-permission-mode.test.ts +274 -0
package/src/__tests__/skill-load-feature-flag.test.ts +12 -0
package/src/__tests__/skill-memory.test.ts +2 -783
package/src/__tests__/strip-memory-injections.test.ts +187 -0
package/src/__tests__/subagent-detail.test.ts +84 -0
package/src/__tests__/subagent-disposal.test.ts +308 -0
package/src/__tests__/subagent-manager-notify.test.ts +19 -10
package/src/__tests__/subagent-notify-parent.test.ts +390 -0
package/src/__tests__/subagent-role-registry.test.ts +108 -0
package/src/__tests__/subagent-tool-filtering.test.ts +71 -0
package/src/__tests__/subagent-tools.test.ts +464 -4
package/src/__tests__/system-prompt-ask-mode.test.ts +139 -0
package/src/__tests__/task-memory-cleanup.test.ts +12 -12
package/src/__tests__/terminal-tools.test.ts +17 -27
package/src/__tests__/test-preload.ts +4 -0
package/src/__tests__/tool-executor.test.ts +4 -26
package/src/__tests__/tool-side-effects-slack-dm.test.ts +1 -0
package/src/__tests__/top-level-renderer.test.ts +10 -13
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +116 -2
package/src/__tests__/workspace-migration-028-recover-conversations-from-disk-view.test.ts +387 -0
package/src/agent/loop.ts +6 -0
package/src/approvals/guardian-request-resolvers.ts +24 -0
package/src/avatar/traits-png-sync.ts +3 -3
package/src/cli/__tests__/run-assistant-command.ts +29 -0
package/src/cli/commands/__tests__/email-download.test.ts +245 -0
package/src/cli/commands/__tests__/email-list.test.ts +192 -0
package/src/cli/commands/__tests__/email-register.test.ts +186 -0
package/src/cli/commands/__tests__/email-send.test.ts +291 -0
package/src/cli/commands/__tests__/email-status.test.ts +181 -0
package/src/cli/commands/__tests__/email-unregister.test.ts +139 -0
package/src/cli/commands/__tests__/routes.test.ts +562 -0
package/src/cli/commands/conversations.ts +1 -8
package/src/cli/commands/email.ts +584 -835
package/src/cli/commands/memory.ts +1 -34
package/src/cli/commands/notifications.ts +7 -2
package/src/cli/commands/oauth/connect.ts +14 -5
package/src/cli/commands/routes.ts +396 -0
package/src/cli/commands/skills.ts +130 -20
package/src/cli/program.ts +2 -0
package/src/cli.ts +1 -120
package/src/config/bundled-skills/app-builder/SKILL.md +4 -1
package/src/config/bundled-skills/gmail/SKILL.md +2 -2
package/src/config/bundled-skills/messaging/SKILL.md +7 -0
package/src/config/bundled-skills/schedule/SKILL.md +22 -2
package/src/config/bundled-skills/schedule/TOOLS.json +8 -0
package/src/config/bundled-skills/settings/tools/avatar-get.ts +3 -13
package/src/config/bundled-skills/settings/tools/avatar-remove.ts +2 -4
package/src/config/bundled-skills/settings/tools/avatar-update.ts +5 -2
package/src/config/bundled-skills/slack/SKILL.md +2 -0
package/src/config/bundled-skills/subagent/SKILL.md +43 -3
package/src/config/bundled-skills/subagent/TOOLS.json +29 -4
package/src/config/env-registry.ts +63 -0
package/src/config/feature-flag-registry.json +17 -1
package/src/config/schema.ts +8 -0
package/src/config/schemas/filing.ts +51 -0
package/src/config/schemas/heartbeat.ts +15 -12
package/src/config/schemas/memory-lifecycle.ts +12 -0
package/src/config/schemas/security.ts +14 -0
package/src/daemon/app-source-watcher.ts +93 -0
package/src/daemon/config-watcher.ts +79 -1
package/src/daemon/conversation-agent-loop-handlers.ts +20 -0
package/src/daemon/conversation-agent-loop.ts +158 -65
package/src/daemon/conversation-history.ts +4 -19
package/src/daemon/conversation-lifecycle.ts +8 -14
package/src/daemon/conversation-process.ts +13 -7
package/src/daemon/conversation-runtime-assembly.ts +300 -306
package/src/daemon/conversation-tool-setup.ts +44 -14
package/src/daemon/conversation-workspace.ts +1 -2
package/src/daemon/conversation.ts +18 -0
package/src/daemon/date-context.ts +26 -53
package/src/daemon/first-greeting.ts +1 -1
package/src/daemon/handlers/conversations.ts +4 -7
package/src/daemon/handlers/shared.test.ts +143 -0
package/src/daemon/handlers/shared.ts +63 -5
package/src/daemon/handlers/skills.ts +11 -18
package/src/daemon/lifecycle.ts +199 -157
package/src/daemon/message-types/conversations.ts +25 -6
package/src/daemon/message-types/messages.ts +9 -1
package/src/daemon/message-types/schedules.ts +1 -0
package/src/daemon/message-types/settings.ts +6 -0
package/src/daemon/profiler-run-store.ts +557 -0
package/src/daemon/server.ts +89 -9
package/src/daemon/shutdown-handlers.ts +5 -0
package/src/daemon/tool-side-effects.ts +23 -3
package/src/export/transcript-formatter.ts +148 -0
package/src/filing/filing-service.ts +228 -0
package/src/heartbeat/heartbeat-service.ts +96 -7
package/src/mcp/client.ts +6 -0
package/src/mcp/mcp-oauth-provider.ts +149 -27
package/src/memory/admin.ts +33 -32
package/src/memory/app-store.ts +69 -0
package/src/memory/conversation-bootstrap.ts +1 -1
package/src/memory/conversation-crud.ts +136 -107
package/src/memory/conversation-group-migration.ts +1 -1
package/src/memory/conversation-queries.ts +58 -12
package/src/memory/conversation-title-service.ts +1 -0
package/src/memory/db-init.ts +182 -376
package/src/memory/graph/bootstrap.ts +75 -66
package/src/memory/graph/capability-seed.ts +167 -15
package/src/memory/graph/consolidation.ts +38 -4
package/src/memory/graph/conversation-graph-memory.ts +133 -104
package/src/memory/graph/extraction-job.ts +9 -4
package/src/memory/graph/extraction.ts +66 -23
package/src/memory/graph/graph-memory-state-store.ts +37 -0
package/src/memory/graph/graph-search.ts +29 -15
package/src/memory/graph/injection.ts +38 -8
package/src/memory/graph/inspect.ts +12 -3
package/src/memory/graph/retriever.ts +365 -262
package/src/memory/graph/store.test.ts +48 -0
package/src/memory/graph/store.ts +150 -11
package/src/memory/graph/tool-handlers.ts +84 -209
package/src/memory/graph/tools.ts +8 -52
package/src/memory/graph/types.ts +24 -0
package/src/memory/job-handlers/cleanup.ts +44 -1
package/src/memory/jobs-store.ts +70 -60
package/src/memory/jobs-worker.ts +44 -28
package/src/memory/llm-request-log-store.ts +96 -12
package/src/memory/memory-recall-log-store.ts +49 -5
package/src/memory/migrations/203-drop-memory-items-tables.ts +33 -1
package/src/memory/migrations/206-memory-graph-node-edits.ts +19 -0
package/src/memory/migrations/206-scrub-corrupted-image-attachments.ts +131 -0
package/src/memory/migrations/207-conversation-graph-memory-state.ts +20 -0
package/src/memory/migrations/208-conversations-last-message-at.ts +35 -0
package/src/memory/migrations/209-strip-thinking-from-consolidated.ts +85 -0
package/src/memory/migrations/210-schedule-reuse-conversation.ts +13 -0
package/src/memory/migrations/211-memory-recall-logs-query-context.ts +21 -0
package/src/memory/migrations/212-llm-request-logs-created-at-index.ts +19 -0
package/src/memory/migrations/index.ts +8 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/conversations.ts +14 -0
package/src/memory/schema/infrastructure.ts +8 -1
package/src/memory/schema/memory-core.ts +0 -51
package/src/memory/schema/memory-graph.ts +15 -0
package/src/memory/task-memory-cleanup.ts +30 -11
package/src/notifications/copy-composer.ts +86 -0
package/src/notifications/decision-engine.ts +35 -0
package/src/permissions/checker.ts +12 -1
package/src/permissions/permission-mode-store.ts +180 -0
package/src/permissions/permission-mode.ts +31 -0
package/src/permissions/workspace-policy.ts +9 -0
package/src/prompts/system-prompt.ts +59 -7
package/src/prompts/templates/BOOTSTRAP-REFERENCE.md +100 -0
package/src/prompts/templates/BOOTSTRAP.md +70 -165
package/src/prompts/templates/HEARTBEAT.md +3 -1
package/src/prompts/templates/SOUL.md +25 -4
package/src/prompts/templates/UPDATES.md +8 -0
package/src/providers/anthropic/client.ts +107 -219
package/src/runtime/auth/route-policy.ts +23 -0
package/src/runtime/http-server.ts +32 -2
package/src/runtime/http-types.ts +12 -1
package/src/runtime/migrations/vbundle-builder.ts +389 -3
package/src/runtime/migrations/vbundle-importer.ts +8 -6
package/src/runtime/routes/__tests__/user-route-dispatcher.test.ts +378 -0
package/src/runtime/routes/app-management-routes.ts +1 -11
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +26 -0
package/src/runtime/routes/archive-utils.ts +29 -0
package/src/runtime/routes/avatar-routes.ts +2 -9
package/src/runtime/routes/btw-routes.ts +14 -1
package/src/runtime/routes/conversation-analysis-routes.ts +173 -0
package/src/runtime/routes/conversation-management-routes.ts +1 -14
package/src/runtime/routes/conversation-query-routes.ts +49 -3
package/src/runtime/routes/conversation-routes.ts +264 -44
package/src/runtime/routes/heartbeat-routes.ts +4 -10
package/src/runtime/routes/identity-routes.ts +53 -18
package/src/runtime/routes/llm-context-normalization.ts +14 -10
package/src/runtime/routes/log-export-routes.ts +23 -275
package/src/runtime/routes/memory-item-routes.test.ts +168 -233
package/src/runtime/routes/migration-routes.ts +18 -7
package/src/runtime/routes/profiler-routes.ts +350 -0
package/src/runtime/routes/schedule-routes.ts +27 -12
package/src/runtime/routes/settings-routes.ts +95 -8
package/src/runtime/routes/subagents-routes.ts +28 -7
package/src/runtime/routes/user-route-dispatcher.ts +223 -0
package/src/runtime/routes/user-routes.ts +41 -0
package/src/runtime/routes/workspace-routes.ts +0 -1
package/src/schedule/schedule-store.ts +30 -0
package/src/schedule/scheduler.ts +45 -18
package/src/skills/catalog-install.ts +10 -2
package/src/skills/managed-store.ts +2 -2
package/src/skills/skill-memory.ts +1 -293
package/src/subagent/index.ts +13 -3
package/src/subagent/manager.ts +308 -29
package/src/subagent/types.ts +68 -0
package/src/tasks/task-runner.ts +4 -4
package/src/tools/apps/executors.ts +29 -4
package/src/tools/filesystem/list.ts +93 -0
package/src/tools/permission-checker.ts +78 -0
package/src/tools/registry.ts +4 -0
package/src/tools/schedule/create.ts +3 -0
package/src/tools/schedule/list.ts +1 -0
package/src/tools/schedule/update.ts +6 -0
package/src/tools/shared/filesystem/errors.ts +5 -0
package/src/tools/shared/filesystem/file-ops-service.ts +90 -2
package/src/tools/shared/filesystem/types.ts +17 -0
package/src/tools/shared/shell-output.ts +31 -2
package/src/tools/subagent/abort.ts +12 -2
package/src/tools/subagent/message.ts +9 -2
package/src/tools/subagent/notify-parent.ts +79 -0
package/src/tools/subagent/read.ts +29 -8
package/src/tools/subagent/resolve.ts +21 -0
package/src/tools/subagent/spawn.ts +2 -0
package/src/tools/subagent/status.ts +11 -1
package/src/tools/system/avatar-generator.ts +3 -3
package/src/tools/system/register.ts +23 -0
package/src/tools/system/set-permission-mode.ts +103 -0
package/src/tools/terminal/parser.ts +30 -5
package/src/tools/terminal/safe-env.ts +16 -1
package/src/tools/tool-manifest.ts +6 -0
package/src/tools/types.ts +2 -0
package/src/util/logger.ts +1 -1
package/src/util/platform.ts +50 -17
package/src/workspace/migrations/023-move-config-files-to-workspace.ts +2 -2
package/src/workspace/migrations/024-move-runtime-files-to-workspace.ts +2 -2
package/src/workspace/migrations/028-recover-conversations-from-disk-view.ts +270 -0
package/src/workspace/migrations/029-seed-pkb.ts +84 -0
package/src/workspace/migrations/registry.ts +4 -0
package/src/workspace/top-level-renderer.ts +5 -9
package/src/__tests__/cli-memory.test.ts +0 -377
package/src/__tests__/clipboard.test.ts +0 -88
package/src/cli/cli-memory.ts +0 -179
package/src/util/clipboard.ts +0 -34

package/src/prompts/templates/UPDATES.md CHANGED

@@ -28,3 +28,11 @@ If your user finds proactive check-ins unwanted, they can disable it by setting
 The default checklist focuses on your user relationship, not generic tasks like weather or news. You can customize it by editing HEARTBEAT.md in your workspace.
 <!-- /vellum-update-release:heartbeat-default -->
+<!-- vellum-update-release:corrupted-attachment-cleanup -->
+## Corrupted image attachments cleaned up
+Some Slack image attachments were stored incorrectly due to a missing OAuth scope — the files contained error pages instead of actual image data. This caused conversations with those images to fail with "The AI provider rejected the request" on every subsequent message.
+This has been fixed automatically: the corrupted attachments were removed from affected conversations during this update, and the OAuth scope issue has been resolved so new image uploads work correctly. If your user mentions missing images from earlier conversations, this is why — the images were never successfully received in the first place.
+<!-- /vellum-update-release:corrupted-attachment-cleanup -->

package/src/providers/anthropic/client.ts CHANGED

@@ -206,143 +206,6 @@ function hasOrderedToolResultPrefix(
  * regular content — they are self-paired within the assistant message and must
  * not be separated by the cross-message pairing logic.
  */
-/**
- * Expand collapsed multi-turn assistant messages. During agentic tool use, the
- * daemon stores multiple thinking→tool_use→tool_result cycles in a single
- * assistant message. The Anthropic API rejects thinking blocks between
- * tool_use blocks ("tool_use without tool_result immediately after") and
- * requires thinking blocks in the latest assistant message to remain exactly
- * as generated.
- *
- * This function splits collapsed messages at each "thinking/redacted_thinking
- * after tool_use" boundary, recreating the original multi-turn structure.
- * It also distributes tool_result blocks from the following user message to
- * match each segment's tool_use blocks, creating proper assistant→user pairs.
- */
-function expandCollapsedAssistantTurns(
-  messages: Anthropic.MessageParam[],
-): Anthropic.MessageParam[] {
-  const result: Anthropic.MessageParam[] = [];
-  for (let mi = 0; mi < messages.length; mi++) {
-    const msg = messages[mi];
-    if (msg.role !== "assistant") {
-      result.push(msg);
-      continue;
-    }
-    const content = Array.isArray(msg.content) ? msg.content : [];
-    // Check if this message has thinking blocks between tool_use blocks
-    let hasThinkingAfterToolUse = false;
-    let seenToolUse = false;
-    for (const block of content) {
-      if (isToolUseBlock(block)) {
-        seenToolUse = true;
-      } else if (seenToolUse) {
-        const type = (block as { type: string }).type;
-        if (type === "thinking" || type === "redacted_thinking") {
-          hasThinkingAfterToolUse = true;
-          break;
-        }
-      }
-    }
-    if (!hasThinkingAfterToolUse) {
-      result.push(msg);
-      continue;
-    }
-    // Split at each "thinking after tool_use" boundary into separate segments
-    const segments: Anthropic.ContentBlockParam[][] = [];
-    let current: Anthropic.ContentBlockParam[] = [];
-    let segmentHasToolUse = false;
-    for (const block of content) {
-      const type = (block as { type: string }).type;
-      const isThinking = type === "thinking" || type === "redacted_thinking";
-      if (isThinking && segmentHasToolUse) {
-        segments.push(current);
-        current = [block];
-        segmentHasToolUse = false;
-      } else {
-        current.push(block);
-        if (isToolUseBlock(block)) {
-          segmentHasToolUse = true;
-        }
-      }
-    }
-    if (current.length > 0) {
-      segments.push(current);
-    }
-    // Build a map of tool_results from the following user message (if any)
-    const nextMsg = messages[mi + 1];
-    const nextIsUser = nextMsg && nextMsg.role === "user";
-    const nextContent =
-      nextIsUser && Array.isArray(nextMsg.content) ? nextMsg.content : [];
-    const toolResultMap = new Map<string, Anthropic.ContentBlockParam>();
-    const nonToolResultContent: Anthropic.ContentBlockParam[] = [];
-    for (const block of nextContent) {
-      if (isToolResultBlock(block)) {
-        toolResultMap.set(block.tool_use_id, block);
-      } else {
-        nonToolResultContent.push(block);
-      }
-    }
-    // Emit each segment as assistant→user pairs, distributing tool_results
-    for (let si = 0; si < segments.length; si++) {
-      const segment = segments[si];
-      const segToolUseIds = getOrderedToolUseIds(segment);
-      const isLastSegment = si === segments.length - 1;
-      result.push({ role: "assistant" as const, content: segment });
-      if (segToolUseIds.length > 0 && !isLastSegment) {
-        // Intermediate segment: pair with matching tool_results
-        const segResults = segToolUseIds.map(
-          (id) => toolResultMap.get(id) ?? buildSyntheticToolResult(id),
-        );
-        // Remove matched results from the map
-        for (const id of segToolUseIds) toolResultMap.delete(id);
-        result.push({ role: "user" as const, content: segResults });
-      }
-    }
-    // For the last segment, let ensureToolPairing handle pairing with the
-    // (now reduced) user message. Rebuild the user message without the
-    // tool_results that were already distributed to intermediate segments.
-    if (nextIsUser) {
-      const remainingResults = Array.from(toolResultMap.values());
-      const rebuiltUserContent = [...remainingResults, ...nonToolResultContent];
-      // Replace the original user message with the rebuilt one. When all
-      // tool_results were distributed to intermediate segments (empty rebuilt
-      // content), skip the synthetic placeholder if the next message is already
-      // a user turn — ensureToolPairing will pair the last assistant segment
-      // with that next user message naturally.
-      if (rebuiltUserContent.length > 0) {
-        result.push({ role: "user" as const, content: rebuiltUserContent });
-      } else {
-        const nextAfterUser = messages[mi + 2];
-        if (!nextAfterUser || nextAfterUser.role !== "user") {
-          result.push({
-            role: "user" as const,
-            content: [
-              { type: "text" as const, text: SYNTHETIC_CONTINUATION_TEXT },
-            ],
-          });
-        }
-      }
-      mi++; // skip the original user message
-    }
-  }
-  return result;
-}
 function splitAssistantForToolPairing(content: Anthropic.ContentBlockParam[]): {
   pairedContent: Anthropic.ContentBlockParam[];
   carryoverContent: Anthropic.ContentBlockParam[];
@@ -716,6 +579,7 @@ export class AnthropicProvider implements Provider {
     options?: SendMessageOptions,
   ): Promise<ProviderResponse> {
     const { config, onEvent, signal } = options ?? {};
+    const cacheTtl: "5m" | "1h" = ((config as Record<string, unknown> | undefined)?.cacheTtl as "5m" | "1h") ?? "1h";
     let sentMessages: Anthropic.MessageParam[] | undefined;
     try {
       const formatted = messages
@@ -819,58 +683,13 @@ export class AnthropicProvider implements Provider {
         }
       }
-      // Strip thinking/redacted_thinking blocks from historical assistant
-      // messages. These blocks carry cryptographic signatures tied to their
-      // original API response. Consolidated messages (from multi-step tool use)
-      // combine thinking blocks from different responses, making signature
-      // validation fail with "thinking blocks cannot be modified". Stripping is
-      // safe: the API allows it for all historical messages, and new responses
-      // generate fresh thinking blocks.
-      //
-      // The latest assistant turn is preserved: the API requires the most recent
-      // assistant message's thinking blocks to be passed back unmodified when
-      // sending tool results during in-progress tool-use loops.
-      let lastAssistantIdx = -1;
-      for (let i = formatted.length - 1; i >= 0; i--) {
-        if (formatted[i].role === "assistant") {
-          lastAssistantIdx = i;
-          break;
-        }
-      }
-      for (let i = 0; i < formatted.length; i++) {
-        const msg = formatted[i];
-        if (msg.role !== "assistant" || !Array.isArray(msg.content)) continue;
-        if (i === lastAssistantIdx) continue;
-        const stripped = msg.content.filter(
-          (b) =>
-            (b as { type: string }).type !== "thinking" &&
-            (b as { type: string }).type !== "redacted_thinking",
-        );
-        if (stripped.length < msg.content.length) {
-          // Ensure the message isn't empty after stripping
-          msg.content =
-            stripped.length > 0
-              ? stripped
-              : [
-                  {
-                    type: "text" as const,
-                    text: PLACEHOLDER_BLOCKS_OMITTED,
-                  },
-                ];
-        }
-      }
+      // Thinking blocks are stripped at rest by DB migration 209 so
+      // historical messages are clean when loaded. Within a turn,
+      // assistant messages have original thinking with valid signatures
+      // — the API accepts them. No provider-side stripping needed.
-      // Expand collapsed multi-turn assistant messages. When agentic tool use
-      // produces multiple thinking→tool_use cycles in a single stored message,
-      // the API rejects thinking blocks between tool_use blocks. Split such
-      // messages at each "thinking after tool_use" boundary to recreate the
-      // original multi-turn structure. With thinking blocks stripped above, the
-      // expansion is typically a no-op, but is kept as a safety net for edge
-      // cases where stripping is incomplete.
-      const expanded = expandCollapsedAssistantTurns(formatted);
-      sentMessages = ensureToolPairing(repairOrphanedServerToolUse(expanded));
-      const { effort, speed, output_config, ...restConfig } = (config ??
+      sentMessages = ensureToolPairing(repairOrphanedServerToolUse(formatted));
+      const { effort, speed, output_config, cacheTtl: _cacheTtl, ...restConfig } = (config ??
         {}) as Record<string, unknown> & {
         effort?: Anthropic.OutputConfig["effort"];
         speed?: "standard" | "fast";
@@ -914,12 +733,12 @@ export class AnthropicProvider implements Provider {
             {
               type: "text" as const,
               text: staticBlock,
-              cache_control: { type: "ephemeral" as const, ttl: "1h" as const },
+              cache_control: { type: "ephemeral" as const, ttl: cacheTtl },
             },
             {
               type: "text" as const,
               text: dynamicBlock,
-              cache_control: { type: "ephemeral" as const, ttl: "1h" as const },
+              cache_control: { type: "ephemeral" as const, ttl: cacheTtl },
             },
           ];
         } else {
@@ -927,7 +746,7 @@ export class AnthropicProvider implements Provider {
             {
               type: "text" as const,
               text: systemPrompt,
-              cache_control: { type: "ephemeral" as const, ttl: "1h" as const },
+              cache_control: { type: "ephemeral" as const, ttl: cacheTtl },
             },
           ];
         }
@@ -944,7 +763,12 @@ export class AnthropicProvider implements Provider {
             description: t.description,
             input_schema: t.input_schema as Anthropic.Tool["input_schema"],
             ...(i === otherTools.length - 1
-              ? { cache_control: { type: "ephemeral" as const, ttl: "1h" as const } }
+              ? {
+                  cache_control: {
+                    type: "ephemeral" as const,
+                    ttl: cacheTtl,
+                  },
+                }
               : {}),
           }));
           const webSearchTool: Anthropic.WebSearchTool20250305 = {
@@ -959,41 +783,98 @@ export class AnthropicProvider implements Provider {
             description: t.description,
             input_schema: t.input_schema as Anthropic.Tool["input_schema"],
             ...(i === tools.length - 1
-              ? { cache_control: { type: "ephemeral" as const, ttl: "1h" as const } }
+              ? {
+                  cache_control: {
+                    type: "ephemeral" as const,
+                    ttl: cacheTtl,
+                  },
+                }
               : {}),
           }));
         }
       }
-      // Place a cache breakpoint on the second-to-last user turn so the
-      // conversation prefix is cached between agent-loop iterations.
-      //
-      // Why second-to-last, not last?  The last user message is always new
-      // (either the initial message with fresh temporal context, or a tool
-      // result appended by the agent loop) so its breakpoint never produces
-      // a cache hit.  The second-to-last user turn is stable between
-      // iterations and caching up to it saves re-processing the full
-      // conversation prefix.
-      //
-      // We use only 1 user-turn breakpoint to stay within the Anthropic
-      // API limit of 4 cache_control blocks total:
-      //   system-static (1) + system-dynamic (2) + last-tool (3) + user (4)
-      const userIndices: number[] = [];
-      for (let i = 0; i < params.messages.length; i++) {
-        if (params.messages[i].role === "user") userIndices.push(i);
+      // Manual cache breakpoint on the turn-starting user message.
+      // This is the stable anchor for the current turn — everything up to
+      // and including it won't change during tool-use iterations, so a long
+      // TTL is appropriate. Walk backwards to find the last user message
+      // with a real text block (skipping tool_result-only messages and
+      // synthetic continuation placeholders injected by ensureToolPairing).
+      let turnStartIdx = -1;
+      for (let i = sentMessages.length - 1; i >= 0; i--) {
+        const msg = sentMessages[i];
+        if (msg.role !== "user" || !Array.isArray(msg.content)) continue;
+        const hasText = msg.content.some(
+          (b) =>
+            typeof b !== "string" &&
+            b.type === "text" &&
+            b.text !== SYNTHETIC_CONTINUATION_TEXT,
+        );
+        if (!hasText) continue;
+        const lastBlock = msg.content[msg.content.length - 1];
+        if (typeof lastBlock !== "string") {
+          (lastBlock as unknown as Record<string, unknown>).cache_control = {
+            type: "ephemeral",
+            ttl: cacheTtl,
+          };
+        }
+        turnStartIdx = i;
+        break;
       }
-      // slice(-2, -1) gives the second-to-last; empty array if < 2 user turns.
-      for (const idx of userIndices.slice(-2, -1)) {
-        const content = params.messages[idx].content;
-        if (Array.isArray(content) && content.length > 0) {
-          (
-            content[content.length - 1] as unknown as {
-              cache_control?: { type: string; ttl?: string };
+      // Advancing tail: place a short-lived 5m cache breakpoint on the last
+      // block of the last message when it falls after the turn-starting user
+      // message (i.e. tool-use loop content). This caches the growing tail
+      // cheaply without conflicting with the 1h breakpoints above.
+      // Skip thinking/redacted_thinking blocks — Anthropic doesn't allow
+      // cache_control on those types.
+      let tailBreakpointApplied = false;
+      if (turnStartIdx >= 0 && turnStartIdx < sentMessages.length - 1) {
+        const lastMsg = sentMessages[sentMessages.length - 1];
+        if (Array.isArray(lastMsg.content) && lastMsg.content.length > 0) {
+          const NON_CACHEABLE_TYPES = new Set(["thinking", "redacted_thinking"]);
+          let tailBlock: (typeof lastMsg.content)[number] | undefined;
+          for (let j = lastMsg.content.length - 1; j >= 0; j--) {
+            const block = lastMsg.content[j];
+            if (
+              typeof block !== "string" &&
+              !NON_CACHEABLE_TYPES.has((block as { type: string }).type)
+            ) {
+              tailBlock = block;
+              break;
             }
-          ).cache_control = { type: "ephemeral", ttl: "1h" };
+          }
+          if (tailBlock && typeof tailBlock !== "string") {
+            (tailBlock as unknown as Record<string, unknown>).cache_control = {
+              type: "ephemeral",
+              ttl: "5m",
+            };
+            tailBreakpointApplied = true;
+          }
         }
       }
+      // Enforce Anthropic API maximum of 4 cache_control blocks.
+      // When the system prompt boundary splits into 2 cached blocks AND
+      // tools + turn-start + advancing-tail breakpoints are all present,
+      // we'd have 5.  Drop the static system block's breakpoint — it's
+      // small (<1K tokens) so the re-read cost is negligible, while the
+      // dynamic block (workspace context) rarely changes mid-session and
+      // benefits more from caching.
+      const hasTailBreakpoint = tailBreakpointApplied;
+      const hasToolCacheBreakpoint =
+        params.tools?.some(
+          (t) => "cache_control" in t && t.cache_control != null,
+        ) ?? false;
+      if (
+        hasTailBreakpoint &&
+        Array.isArray(params.system) &&
+        params.system.length === 2 &&
+        hasToolCacheBreakpoint
+      ) {
+        delete (params.system[0] as unknown as Record<string, unknown>).cache_control;
+      }
       const { signal: timeoutSignal, cleanup: cleanupTimeout } =
         createStreamTimeout(this.streamTimeoutMs, signal);
@@ -1010,8 +891,7 @@ export class AnthropicProvider implements Provider {
       }
       // Fast mode: use the beta endpoint with speed: "fast" for Opus 4.6
-      const useFastMode =
-        speed === "fast" && effectiveModel.includes("opus");
+      const useFastMode = speed === "fast" && effectiveModel.includes("opus");
       // Collect required betas: extended cache TTL for 1h system prompt caching,
       // 1M context window, and fast-mode when applicable.
@@ -1198,6 +1078,14 @@ export class AnthropicProvider implements Provider {
             "Anthropic 400: tool_use/tool_result pairing error — dumping message structure",
           );
         }
+        log.error(
+          {
+            status: error.status,
+            message: error.message,
+            headers: Object.fromEntries(error.headers?.entries() ?? []),
+          },
+          `Anthropic API error (${error.status})`,
+        );
         const retryAfterMs = extractRetryAfterMs(error.headers);
         throw new ProviderError(
           `Anthropic API error (${error.status}): ${error.message}`,

package/src/runtime/auth/route-policy.ts CHANGED Viewed

@@ -130,6 +130,7 @@ const ACTOR_ENDPOINTS: Array<{ endpoint: string; scopes: Scope[] }> = [
   { endpoint: "conversations", scopes: ["chat.read"] },
   { endpoint: "conversations:POST", scopes: ["chat.write"] },
   { endpoint: "conversations/fork", scopes: ["chat.write"] },
+  { endpoint: "conversations/analyze", scopes: ["chat.write"] },
   { endpoint: "conversations/switch", scopes: ["chat.write"] },
   { endpoint: "conversations/name", scopes: ["chat.write"] },
   { endpoint: "conversations/cancel", scopes: ["chat.write"] },
@@ -374,6 +375,7 @@ const ACTOR_ENDPOINTS: Array<{ endpoint: string; scopes: Scope[] }> = [
   // Message content
   { endpoint: "messages/content", scopes: ["chat.read"] },
   { endpoint: "messages/llm-context", scopes: ["chat.read"] },
+  { endpoint: "llm-request-logs/payload", scopes: ["chat.read"] },
   { endpoint: "messages/tts", scopes: ["chat.read"] },
   // Queued message deletion
@@ -479,6 +481,10 @@ const ACTOR_ENDPOINTS: Array<{ endpoint: string; scopes: Scope[] }> = [
   // Tools
   { endpoint: "tools", scopes: ["settings.read"] },
   { endpoint: "tools/simulate-permission", scopes: ["settings.read"] },
+  // Permission mode
+  { endpoint: "permission-mode:GET", scopes: ["settings.read"] },
+  { endpoint: "permission-mode", scopes: ["settings.write"] },
 ];
 for (const { endpoint, scopes } of ACTOR_ENDPOINTS) {
@@ -531,3 +537,20 @@ registerPolicy("admin/rollback-migrations", {
   requiredScopes: ["internal.write"],
   allowedPrincipalTypes: ["svc_gateway"],
 });
+// Profiler management: gateway-only control-plane endpoints
+registerPolicy("profiler/runs", {
+  requiredScopes: ["internal.write"],
+  allowedPrincipalTypes: ["svc_gateway"],
+});
+registerPolicy("profiler/runs/export", {
+  requiredScopes: ["internal.write"],
+  allowedPrincipalTypes: ["svc_gateway"],
+});
+// User-defined routes under /x/*
+registerPolicy("x", {
+  requiredScopes: ["settings.read"],
+  allowedPrincipalTypes: ["actor", "svc_gateway", "svc_daemon", "local"],
+});

package/src/runtime/http-server.ts CHANGED Viewed

@@ -52,6 +52,7 @@ import { resolveConversationId } from "../memory/conversation-key-store.js";
 import {
   countConversations,
   listConversations,
+  listPinnedConversations,
 } from "../memory/conversation-queries.js";
 import type { ExternalConversationBinding } from "../memory/external-conversation-store.js";
 import * as externalConversationStore from "../memory/external-conversation-store.js";
@@ -126,6 +127,7 @@ import {
   contactCatchAllRouteDefinitions,
   contactRouteDefinitions,
 } from "./routes/contact-routes.js";
+import { conversationAnalysisRouteDefinitions } from "./routes/conversation-analysis-routes.js";
 import { conversationAttentionRouteDefinitions } from "./routes/conversation-attention-routes.js";
 import {
   type ConversationManagementDeps,
@@ -171,6 +173,7 @@ import {
   handlePairingStatus,
   pairingRouteDefinitions,
 } from "./routes/pairing-routes.js";
+import { profilerRouteDefinitions } from "./routes/profiler-routes.js";
 import { recordingRouteDefinitions } from "./routes/recording-routes.js";
 import { scheduleRouteDefinitions } from "./routes/schedule-routes.js";
 import { secretRouteDefinitions } from "./routes/secret-routes.js";
@@ -185,6 +188,7 @@ import { trustRulesRouteDefinitions } from "./routes/trust-rules-routes.js";
 import { ttsRouteDefinitions } from "./routes/tts-routes.js";
 import { upgradeBroadcastRouteDefinitions } from "./routes/upgrade-broadcast-routes.js";
 import { usageRouteDefinitions } from "./routes/usage-routes.js";
+import { userRouteDefinitions } from "./routes/user-routes.js";
 import { watchRouteDefinitions } from "./routes/watch-routes.js";
 import { workItemRouteDefinitions } from "./routes/work-items-routes.js";
 import { workspaceCommitRouteDefinitions } from "./routes/workspace-commit-routes.js";
@@ -826,6 +830,7 @@ export class RuntimeHttpServer {
       title: conversation.title ?? "Untitled",
       createdAt: conversation.createdAt,
       updatedAt: conversation.updatedAt,
+      lastMessageAt: conversation.lastMessageAt,
       conversationType: conversation.conversationType ?? "standard",
       source: conversation.source ?? "user",
       ...(conversation.scheduleJobId
@@ -961,6 +966,7 @@ export class RuntimeHttpServer {
       ...notificationRouteDefinitions(),
       ...diagnosticsRouteDefinitions(),
       ...logExportRouteDefinitions(),
+      ...profilerRouteDefinitions(),
       ...documentRouteDefinitions(),
       ...workItemRouteDefinitions(
         this.sendMessageDeps
@@ -1025,8 +1031,18 @@ export class RuntimeHttpServer {
           const offset = Number(url.searchParams.get("offset") ?? 0);
           const backgroundOnly =
             url.searchParams.get("conversationType") === "background";
-          const rows = listConversations(limit, backgroundOnly, offset);
+          let rows = listConversations(limit, backgroundOnly, offset);
           const totalCount = countConversations(backgroundOnly);
+          // On the first page, ensure all pinned conversations are included
+          // even if they fall outside the paginated window.
+          if (offset === 0 && !backgroundOnly) {
+            const pinned = listPinnedConversations();
+            const seen = new Set(rows.map((c) => c.id));
+            const missing = pinned.filter((c) => !seen.has(c.id));
+            if (missing.length > 0) {
+              rows = [...rows, ...missing];
+            }
+          }
           const conversationIds = rows.map((c) => c.id);
           const displayMeta = getDisplayMetaForConversations(conversationIds);
           const bindings =
@@ -1036,6 +1052,7 @@ export class RuntimeHttpServer {
           const attentionStates =
             getAttentionStateByConversationIds(conversationIds);
           const parentCache = new Map<string, ConversationRow | null>();
+          const nextOffset = offset + limit;
           const response: Record<string, unknown> = {
             conversations: rows.map((conversation) =>
               this.serializeConversationSummary({
@@ -1046,7 +1063,8 @@ export class RuntimeHttpServer {
                 parentCache,
               }),
             ),
-            hasMore: offset + rows.length < totalCount,
+            nextOffset,
+            hasMore: nextOffset < totalCount,
           };
           // Include groups array on first page only
           if (offset === 0) {
@@ -1067,6 +1085,14 @@ export class RuntimeHttpServer {
         ? conversationManagementRouteDefinitions(conversationManagementDeps)
         : []),
+      ...(this.sendMessageDeps
+        ? conversationAnalysisRouteDefinitions({
+            sendMessageDeps: this.sendMessageDeps,
+            buildConversationDetailResponse: (id) =>
+              this.buildConversationDetailResponse(id),
+          })
+        : []),
       ...groupRouteDefinitions(),
       {
@@ -1305,6 +1331,10 @@ export class RuntimeHttpServer {
       ...traceEventRouteDefinitions(),
       ...migrationRouteDefinitions(),
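+      // User-defined routes under /x/* — must come after the built-in
+      // route groups above so built-in routes always take priority.
+      // NOTE(review): the internal OAuth callback route below is still
+      // registered after this spread — confirm that ordering is intended.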
+      ...userRouteDefinitions(),
       // Internal OAuth callback (gateway -> runtime)
       {
         endpoint: "internal/oauth/callback",

package/src/runtime/http-types.ts CHANGED Viewed

@@ -5,6 +5,7 @@ import type { ChannelId, InterfaceId } from "../channels/types.js";
 import type { CesClient } from "../credential-execution/client.js";
 import type { Conversation } from "../daemon/conversation.js";
 import type { TrustContext } from "../daemon/conversation-runtime-assembly.js";
+import type { ConversationCreateOptions } from "../daemon/handlers/shared.js";
 import type { SkillOperationContext } from "../daemon/handlers/skills.js";
 import type { ServerMessage } from "../daemon/message-protocol.js";
 import type {
@@ -150,7 +151,10 @@ export type MessageProcessor = (
  * Hub publishing wires outbound events to the SSE stream.
  */
 export interface SendMessageDeps {
-  getOrCreateConversation: (conversationId: string) => Promise<Conversation>;
+  getOrCreateConversation: (
+    conversationId: string,
+    options?: ConversationCreateOptions,
+  ) => Promise<Conversation>;
   assistantEventHub: AssistantEventHub;
   resolveAttachments: (attachmentIds: string[]) => Array<{
     id: string;
@@ -274,4 +278,11 @@ export interface RuntimeMessagePayload {
   textSegments?: string[];
   thinkingSegments?: string[];
   contentOrder?: string[];
+  subagentNotification?: {
+    subagentId: string;
+    label: string;
+    status: string;
+    error?: string;
+    conversationId?: string;
+  };
 }