npm - @vellumai/assistant - Versions diffs - 0.8.4 → 0.8.5 - Mend

@vellumai/assistant 0.8.4 → 0.8.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (438)

package/ARCHITECTURE.md +2 -2
package/docs/browser-use-architecture-phase2.md +1 -1
package/knip.json +2 -1
package/openapi.yaml +809 -11
package/package.json +1 -1
package/src/__tests__/anthropic-provider.test.ts +34 -37
package/src/__tests__/assistant-event-hub-self-exclusion.test.ts +293 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -3
package/src/__tests__/audit-log-rotation.test.ts +70 -16
package/src/__tests__/background-workers-disk-pressure.test.ts +3 -3
package/src/__tests__/btw-routes.test.ts +2 -3
package/src/__tests__/call-controller.test.ts +0 -1
package/src/__tests__/cancel-resolves-conversation-key.test.ts +1 -1
package/src/__tests__/channel-guardian.test.ts +3 -3
package/src/__tests__/checker.test.ts +6 -15
package/src/__tests__/compaction-events.test.ts +1 -0
package/src/__tests__/compactor-call-site-logging.test.ts +214 -0
package/src/__tests__/computer-use-skill-manifest-regression.test.ts +5 -11
package/src/__tests__/computer-use-tools.test.ts +2 -4
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +197 -2
package/src/__tests__/conversation-agent-loop.test.ts +163 -122
package/src/__tests__/conversation-app-control-instantiation.test.ts +2 -5
package/src/__tests__/conversation-clear-safety.test.ts +25 -25
package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +1 -1
package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
package/src/__tests__/conversation-error.test.ts +31 -0
package/src/__tests__/conversation-fork-crud.test.ts +178 -15
package/src/__tests__/conversation-lifecycle.test.ts +52 -11
package/src/__tests__/{conversation-load-cleaned-at.test.ts → conversation-load-history-stripped.test.ts} +13 -13
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
package/src/__tests__/conversation-routes-disk-view.test.ts +109 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +35 -0
package/src/__tests__/conversation-skill-tools.test.ts +2 -5
package/src/__tests__/conversation-store.test.ts +1 -1
package/src/__tests__/conversation-sync-tags.test.ts +99 -32
package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -0
package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/credential-execution-feature-gates.test.ts +9 -7
package/src/__tests__/credential-execution-tools.test.ts +6 -6
package/src/__tests__/credential-security-invariants.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +2 -2
package/src/__tests__/dynamic-page-surface.test.ts +2 -2
package/src/__tests__/email-html-renderer.test.ts +12 -0
package/src/__tests__/gateway-flag-listener.test.ts +237 -0
package/src/__tests__/gemini-provider.test.ts +78 -0
package/src/__tests__/guardian-dispatch.test.ts +0 -1
package/src/__tests__/guardian-outbound-http.test.ts +7 -5
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +1 -1
package/src/__tests__/heartbeat-disk-pressure.test.ts +4 -0
package/src/__tests__/heartbeat-service.test.ts +4 -0
package/src/__tests__/host-shell-tool.test.ts +1 -1
package/src/__tests__/init-feature-flag-overrides.test.ts +5 -6
package/src/__tests__/list-messages-tool-merge.test.ts +70 -11
package/src/__tests__/llm-request-log-call-site.test.ts +136 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +26 -0
package/src/__tests__/llm-resolver.test.ts +77 -9
package/src/__tests__/llm-usage-store.test.ts +66 -0
package/src/__tests__/logger.test.ts +89 -0
package/src/__tests__/mcp-abort-signal.test.ts +2 -2
package/src/__tests__/media-generate-image.test.ts +31 -0
package/src/__tests__/memory-v2-static-injector.test.ts +7 -7
package/src/__tests__/model-intents.test.ts +2 -4
package/src/__tests__/notification-guardian-path.test.ts +0 -1
package/src/__tests__/onboarding-template-contract.test.ts +1 -1
package/src/__tests__/openai-provider.test.ts +46 -0
package/src/__tests__/openai-responses-provider.test.ts +114 -12
package/src/__tests__/pending-interactions-resolved-event.test.ts +0 -1
package/src/__tests__/platform-bash-auto-approve.test.ts +2 -2
package/src/__tests__/platform.test.ts +2 -2
package/src/__tests__/plugin-api-tool-definition.test.ts +92 -0
package/src/__tests__/plugin-bootstrap.test.ts +2 -2
package/src/__tests__/plugin-tool-contribution.test.ts +13 -6
package/src/__tests__/plugin-types.test.ts +3 -2
package/src/__tests__/prechat-onboarding-contract.test.ts +131 -98
package/src/__tests__/pricing.test.ts +12 -0
package/src/__tests__/prune-jobs-changes-parser.test.ts +61 -0
package/src/__tests__/registry.test.ts +2 -8
package/src/__tests__/require-fresh-approval.test.ts +2 -2
package/src/__tests__/runtime-events-sse-bilingual.test.ts +154 -0
package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -1
package/src/__tests__/skill-feature-flags.test.ts +2 -2
package/src/__tests__/skill-projection-feature-flag.test.ts +4 -7
package/src/__tests__/skill-projection.benchmark.test.ts +2 -6
package/src/__tests__/skill-tool-factory.test.ts +1 -1
package/src/__tests__/subagent-notify-parent.test.ts +1 -1
package/src/__tests__/suggestion-routes.test.ts +1 -0
package/src/__tests__/sync-message-contract.test.ts +59 -0
package/src/__tests__/system-prompt.test.ts +145 -131
package/src/__tests__/terminal-tools.test.ts +1 -1
package/src/__tests__/tool-approval-handler.test.ts +1 -5
package/src/__tests__/tool-execute-pipeline.test.ts +2 -2
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -5
package/src/__tests__/tool-executor-lifecycle-events.test.ts +15 -5
package/src/__tests__/tool-executor.test.ts +9 -62
package/src/__tests__/tool-grant-request-escalation.test.ts +1 -6
package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -6
package/src/__tests__/trusted-contact-multichannel.test.ts +0 -1
package/src/__tests__/ui-file-upload-surface.test.ts +2 -2
package/src/__tests__/usage-routes.test.ts +3 -0
package/src/__tests__/verification-control-plane-policy.test.ts +2 -2
package/src/__tests__/workspace-git-service.test.ts +6 -5
package/src/__tests__/workspace-migration-089-move-memory-tree-out-of-v3.test.ts +86 -0
package/src/acp/__tests__/prepare-agent-env.test.ts +146 -0
package/src/acp/prepare-agent-env.ts +78 -0
package/src/acp/session-manager.ts +1 -1
package/src/agent/loop.ts +8 -0
package/src/api/README.md +5 -0
package/src/api/index.ts +4 -0
package/src/api/package.json +10 -0
package/src/background-wake/background-wake-routes.test.ts +233 -0
package/src/background-wake/runtime-registry.ts +24 -0
package/src/cli/commands/__tests__/browser.test.ts +23 -5
package/src/cli/commands/__tests__/domain-register.test.ts +110 -0
package/src/cli/commands/__tests__/domain-status.test.ts +33 -33
package/src/cli/commands/__tests__/inference-send.test.ts +108 -5
package/src/cli/commands/__tests__/memory-v2-compare-render.test.ts +98 -0
package/src/cli/commands/__tests__/memory-v2.test.ts +1 -0
package/src/cli/commands/__tests__/memory-v3-render.test.ts +340 -0
package/src/cli/commands/browser.ts +247 -0
package/src/cli/commands/domain.ts +91 -41
package/src/cli/commands/inference.ts +93 -40
package/src/cli/commands/memory-v2-compare-render.ts +115 -0
package/src/cli/commands/memory-v2.ts +176 -1
package/src/cli/commands/memory-v3-render.ts +344 -0
package/src/cli/commands/memory-v3.ts +316 -0
package/src/cli/program.ts +2 -0
package/src/config/assistant-feature-flags.ts +21 -9
package/src/config/bundled-skills/document-editor/SKILL.md +11 -2
package/src/config/bundled-skills/document-editor/TOOLS.json +18 -0
package/src/config/bundled-skills/document-editor/tools/document-open.ts +12 -0
package/src/config/bundled-skills/image-studio/SKILL.md +4 -0
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -2
package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +13 -8
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +10 -3
package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +16 -14
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +7 -2
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +7 -2
package/src/config/bundled-tool-registry.ts +2 -0
package/src/config/call-site-defaults.ts +7 -6
package/src/config/feature-flag-registry.json +16 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +213 -1
package/src/config/schemas/call-site-catalog.ts +21 -7
package/src/config/schemas/llm.ts +12 -1
package/src/config/schemas/memory-v2.ts +246 -0
package/src/config/schemas/memory.ts +2 -1
package/src/context/compactor.ts +52 -0
package/src/conversations/__tests__/message-consolidation.test.ts +350 -0
package/src/conversations/message-consolidation.ts +404 -0
package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +1 -1
package/src/daemon/__tests__/meet-manifest-loader.test.ts +1 -1
package/src/daemon/conversation-agent-loop-handlers.ts +2 -13
package/src/daemon/conversation-agent-loop.ts +126 -76
package/src/daemon/conversation-error.ts +31 -1
package/src/daemon/conversation-lifecycle.ts +27 -22
package/src/daemon/conversation-runtime-assembly.ts +10 -9
package/src/daemon/conversation-tool-setup.ts +63 -3
package/src/daemon/conversation-usage.ts +2 -0
package/src/daemon/conversation.ts +14 -29
package/src/daemon/disk-pressure-guard.ts +14 -2
package/src/daemon/handlers/config-model.test.ts +1 -0
package/src/daemon/handlers/conversations.ts +11 -3
package/src/daemon/host-browser-proxy.ts +5 -5
package/src/daemon/host-cu-proxy.ts +4 -4
package/src/daemon/host-file-proxy.ts +4 -4
package/src/daemon/host-proxy-base.ts +4 -4
package/src/daemon/host-transfer-proxy.ts +10 -10
package/src/daemon/lifecycle.ts +23 -20
package/src/daemon/meet-manifest-loader.ts +1 -7
package/src/daemon/message-types/conversations.ts +6 -9
package/src/daemon/message-types/home.ts +1 -13
package/src/daemon/message-types/messages.ts +6 -14
package/src/daemon/message-types/sync.ts +14 -0
package/src/daemon/shutdown-handlers.ts +24 -5
package/src/daemon/switch-inference-profile-tool.ts +52 -0
package/src/daemon/tool-setup-types.ts +13 -0
package/src/events/relationship-state-updated.ts +25 -0
package/src/heartbeat/__tests__/heartbeat-service.test.ts +1 -1
package/src/home/home-greeting.ts +0 -9
package/src/home/suggested-prompts.ts +0 -9
package/src/ipc/gateway-flag-listener.ts +123 -0
package/src/ipc/skill-routes/registries.ts +8 -12
package/src/memory/__tests__/db-async-query.test.ts +165 -0
package/src/memory/__tests__/db-maintenance.test.ts +115 -0
package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +241 -0
package/src/memory/__tests__/jobs-store-job-classes.test.ts +28 -1
package/src/memory/__tests__/memory-retrospective-job.test.ts +7 -0
package/src/memory/auto-analysis-enqueue.ts +5 -1
package/src/memory/conversation-crud.ts +71 -70
package/src/memory/conversation-starters-cadence.ts +3 -1
package/src/memory/conversation-title-service.ts +19 -3
package/src/memory/db-async-query.ts +214 -0
package/src/memory/db-init.ts +10 -0
package/src/memory/db-maintenance.ts +30 -21
package/src/memory/graph/bootstrap.ts +8 -1
package/src/memory/graph/capability-seed.ts +7 -3
package/src/memory/graph/conversation-graph-memory.ts +100 -17
package/src/memory/graph/extraction.ts +1 -5
package/src/memory/graph/graph-search.ts +7 -1
package/src/memory/indexer.ts +28 -18
package/src/memory/job-handlers/cleanup.ts +76 -18
package/src/memory/job-handlers/conversation-starters.ts +1 -4
package/src/memory/jobs/embed-pkb-file.ts +6 -1
package/src/memory/jobs-store.ts +14 -0
package/src/memory/jobs-worker.ts +55 -22
package/src/memory/llm-request-log-source-clickhouse.ts +42 -2
package/src/memory/llm-request-log-source-local.ts +7 -0
package/src/memory/llm-request-log-source.ts +9 -2
package/src/memory/llm-request-log-store.ts +43 -1
package/src/memory/llm-usage-store.ts +24 -0
package/src/memory/memory-retrospective-enqueue.ts +8 -1
package/src/memory/memory-retrospective-job.ts +5 -0
package/src/memory/memory-v2-activation-log-store.ts +15 -6
package/src/memory/migrations/260-rename-cleaned-at.ts +44 -0
package/src/memory/migrations/261-llm-usage-add-raw-usage.ts +36 -0
package/src/memory/migrations/262-memory-v3-coactivation.ts +57 -0
package/src/memory/migrations/263-memory-v3-auto-edges.ts +50 -0
package/src/memory/migrations/264-llm-request-log-call-site.ts +29 -0
package/src/memory/migrations/index.ts +17 -0
package/src/memory/migrations/registry.ts +33 -0
package/src/memory/schema/conversations.ts +1 -1
package/src/memory/schema/infrastructure.ts +21 -0
package/src/memory/tool-usage-store.ts +36 -8
package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -0
package/src/memory/v2/__tests__/harness-compare.test.ts +186 -0
package/src/memory/v2/__tests__/harness-metrics.test.ts +74 -0
package/src/memory/v2/__tests__/harness-oracle.test.ts +257 -0
package/src/memory/v2/__tests__/harness-replay-input.test.ts +225 -0
package/src/memory/v2/__tests__/harness-runner.test.ts +109 -0
package/src/memory/v2/__tests__/injection.test.ts +127 -98
package/src/memory/v2/__tests__/qdrant.test.ts +36 -0
package/src/memory/v2/__tests__/router.test.ts +171 -3
package/src/memory/v2/harness/compare.ts +57 -0
package/src/memory/v2/harness/metrics.ts +124 -0
package/src/memory/v2/harness/oracle.ts +145 -0
package/src/memory/v2/harness/replay-input.ts +224 -0
package/src/memory/v2/harness/retriever.ts +74 -0
package/src/memory/v2/harness/router-retriever.ts +43 -0
package/src/memory/v2/harness/runner.ts +106 -0
package/src/memory/v2/harness/trace.ts +58 -0
package/src/memory/v2/injection.ts +21 -15
package/src/memory/v2/prompts/router.ts +26 -1
package/src/memory/v2/qdrant.ts +14 -2
package/src/memory/v2/router.ts +171 -18
package/src/memory/v3/__tests__/coactivation-store.test.ts +422 -0
package/src/memory/v3/__tests__/consolidation-job.test.ts +468 -0
package/src/memory/v3/__tests__/edge-learning-job.test.ts +324 -0
package/src/memory/v3/__tests__/edges.test.ts +563 -0
package/src/memory/v3/__tests__/filter.test.ts +512 -0
package/src/memory/v3/__tests__/gate.test.ts +574 -0
package/src/memory/v3/__tests__/index-composition.test.ts +233 -0
package/src/memory/v3/__tests__/loop.test.ts +530 -0
package/src/memory/v3/__tests__/retriever.test.ts +226 -0
package/src/memory/v3/__tests__/scouts.test.ts +440 -0
package/src/memory/v3/__tests__/shadow-middleware.test.ts +312 -0
package/src/memory/v3/__tests__/system-prompts.test.ts +154 -0
package/src/memory/v3/__tests__/traversal.test.ts +469 -0
package/src/memory/v3/__tests__/tree-index.test.ts +280 -0
package/src/memory/v3/__tests__/tree-store.test.ts +529 -0
package/src/memory/v3/__tests__/tree-walk.test.ts +707 -0
package/src/memory/v3/__tests__/validate.test.ts +245 -0
package/src/memory/v3/auto-edges.ts +223 -0
package/src/memory/v3/coactivation-store.ts +124 -0
package/src/memory/v3/consolidation-job.ts +323 -0
package/src/memory/v3/edge-learning-job.ts +160 -0
package/src/memory/v3/edges.ts +249 -0
package/src/memory/v3/filter.ts +281 -0
package/src/memory/v3/gate.ts +334 -0
package/src/memory/v3/index-composition.ts +113 -0
package/src/memory/v3/llm-capture.ts +46 -0
package/src/memory/v3/loop.ts +382 -0
package/src/memory/v3/maintenance.ts +144 -0
package/src/memory/v3/prompt-context.ts +33 -0
package/src/memory/v3/prompts/consolidation.ts +458 -0
package/src/memory/v3/prompts/system-prompts.ts +196 -0
package/src/memory/v3/retriever.ts +33 -0
package/src/memory/v3/scouts.ts +420 -0
package/src/memory/v3/shadow-middleware.ts +305 -0
package/src/memory/v3/traversal.ts +206 -0
package/src/memory/v3/tree-index.ts +237 -0
package/src/memory/v3/tree-store.ts +394 -0
package/src/memory/v3/tree-walk.ts +351 -0
package/src/memory/v3/types.ts +65 -0
package/src/memory/v3/validate.ts +300 -0
package/src/notifications/adapters/macos.ts +18 -1
package/src/notifications/adapters/platform.ts +1 -1
package/src/notifications/decision-engine.ts +1 -4
package/src/notifications/emit-signal.ts +29 -49
package/src/permissions/prompter.ts +3 -3
package/src/permissions/question-prompter.ts +5 -2
package/src/permissions/secret-prompter.ts +2 -2
package/src/plugin-api/index.ts +4 -0
package/src/plugin-api/types.ts +7 -33
package/src/plugins/defaults/index.ts +6 -0
package/src/plugins/defaults/injectors.ts +18 -11
package/src/plugins/external-plugin-loader.ts +5 -68
package/src/plugins/types.ts +11 -16
package/src/proactive-artifact/aux-message-injector.ts +17 -4
package/src/prompts/__tests__/task-progress-hint-section.test.ts +3 -9
package/src/prompts/persona-resolver.ts +36 -21
package/src/prompts/sections.ts +39 -7
package/src/prompts/system-prompt.ts +50 -185
package/src/prompts/templates/BOOTSTRAP.md +2 -2
package/src/prompts/templates/system-sections.ts +230 -8
package/src/providers/__tests__/connection-model-compat.test.ts +234 -0
package/src/providers/__tests__/retry-callsite.test.ts +85 -5
package/src/providers/anthropic/client.ts +32 -66
package/src/providers/call-site-routing.ts +14 -2
package/src/providers/connection-model-compat.ts +38 -0
package/src/providers/connection-resolution.ts +16 -2
package/src/providers/gemini/client.ts +49 -6
package/src/providers/inference/adapter-factory.ts +3 -0
package/src/providers/minimax/client.ts +106 -0
package/src/providers/model-catalog.ts +43 -0
package/src/providers/model-intents.ts +1 -1
package/src/providers/openai/chat-completions-provider.ts +6 -3
package/src/providers/openai/codex-models.ts +18 -0
package/src/providers/openai/responses-provider.ts +78 -21
package/src/providers/provider-send-message.ts +7 -1
package/src/providers/retry.ts +34 -3
package/src/providers/thinking-config.ts +26 -1
package/src/providers/usage-tracking.ts +2 -0
package/src/runtime/AGENTS.md +2 -2
package/src/runtime/agent-wake.ts +1 -0
package/src/runtime/assistant-event-hub.ts +76 -6
package/src/runtime/auth/route-policy.ts +36 -0
package/src/runtime/btw-sidechain.ts +0 -6
package/src/runtime/http-types.ts +0 -2
package/src/runtime/migrations/vbundle-builder.ts +10 -3
package/src/runtime/pending-interactions.ts +0 -1
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +106 -0
package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +25 -6
package/src/runtime/routes/__tests__/plugins-routes.test.ts +512 -0
package/src/runtime/routes/acp-routes.test.ts +255 -6
package/src/runtime/routes/acp-routes.ts +8 -1
package/src/runtime/routes/avatar-routes.ts +10 -10
package/src/runtime/routes/background-wake-routes.ts +188 -0
package/src/runtime/routes/browser-tabs-routes.ts +200 -0
package/src/runtime/routes/btw-routes.ts +0 -6
package/src/runtime/routes/conversation-cli-routes.ts +1 -1
package/src/runtime/routes/conversation-list-routes.ts +12 -4
package/src/runtime/routes/conversation-management-routes.ts +77 -20
package/src/runtime/routes/conversation-query-routes.ts +142 -36
package/src/runtime/routes/conversation-routes.ts +252 -410
package/src/runtime/routes/conversation-starter-routes.ts +6 -3
package/src/runtime/routes/disk-pressure-routes.ts +1 -1
package/src/runtime/routes/domain-routes.ts +60 -10
package/src/runtime/routes/email-routes.ts +5 -2
package/src/runtime/routes/events-routes.ts +54 -10
package/src/runtime/routes/group-routes.ts +24 -8
package/src/runtime/routes/host-browser-routes.ts +10 -2
package/src/runtime/routes/host-cu-routes.ts +2 -2
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +96 -3
package/src/runtime/routes/index.ts +8 -0
package/src/runtime/routes/inference-profile-session-handler.ts +22 -12
package/src/runtime/routes/inference-profile-session-routes.ts +7 -1
package/src/runtime/routes/llm-call-sites-routes.ts +32 -5
package/src/runtime/routes/memory-item-routes.ts +8 -3
package/src/runtime/routes/memory-v2-routes.ts +215 -5
package/src/runtime/routes/memory-v3-routes.ts +316 -0
package/src/runtime/routes/migration-routes.ts +21 -24
package/src/runtime/routes/plugins-routes.ts +337 -0
package/src/runtime/routes/rename-conversation-routes.ts +6 -2
package/src/runtime/routes/secret-routes.ts +25 -5
package/src/runtime/routes/settings-routes.ts +12 -11
package/src/runtime/routes/slack-channel-routes.ts +5 -4
package/src/runtime/routes/workspace-routes.ts +25 -10
package/src/runtime/sync/resource-sync-events.ts +106 -38
package/src/runtime/sync/sync-publisher.test.ts +49 -0
package/src/runtime/sync/sync-publisher.ts +2 -1
package/src/runtime/verification-outbound-actions.ts +73 -1
package/src/telemetry/types.ts +12 -0
package/src/telemetry/usage-telemetry-reporter.test.ts +48 -0
package/src/telemetry/usage-telemetry-reporter.ts +1 -0
package/src/tools/acp/spawn.test.ts +119 -0
package/src/tools/acp/spawn.ts +15 -2
package/src/tools/apps/definitions.ts +2 -8
package/src/tools/ask-question/ask-question-tool.test.ts +3 -3
package/src/tools/ask-question/ask-question-tool.ts +38 -45
package/src/tools/browser/__tests__/pinned-tabs.test.ts +70 -0
package/src/tools/browser/browser-execution.ts +16 -3
package/src/tools/browser/cdp-client/__tests__/browser-tabs-factory.test.ts +402 -0
package/src/tools/browser/cdp-client/__tests__/types.test.ts +3 -0
package/src/tools/browser/cdp-client/cdp-inspect-client.ts +12 -0
package/src/tools/browser/cdp-client/extension-cdp-client.ts +27 -1
package/src/tools/browser/cdp-client/factory.ts +100 -17
package/src/tools/browser/cdp-client/local-cdp-client.ts +12 -0
package/src/tools/browser/cdp-client/types.ts +65 -0
package/src/tools/browser/pinned-tabs.ts +96 -40
package/src/tools/computer-use/definitions.ts +22 -78
package/src/tools/credential-execution/make-authenticated-request.ts +3 -9
package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -9
package/src/tools/credential-execution/run-authenticated-command.ts +3 -9
package/src/tools/credentials/vault.ts +3 -9
package/src/tools/document/document-tool.ts +59 -0
package/src/tools/execution-target.ts +21 -23
package/src/tools/executor.ts +6 -1
package/src/tools/filesystem/edit.ts +3 -9
package/src/tools/filesystem/list.ts +3 -9
package/src/tools/filesystem/read.ts +3 -9
package/src/tools/filesystem/write.ts +3 -9
package/src/tools/host-filesystem/edit.ts +3 -9
package/src/tools/host-filesystem/read.ts +3 -9
package/src/tools/host-filesystem/transfer.ts +3 -9
package/src/tools/host-filesystem/write.ts +3 -9
package/src/tools/host-terminal/host-shell.ts +3 -9
package/src/tools/mcp/mcp-tool-factory.ts +1 -8
package/src/tools/memory/register.test.ts +1 -1
package/src/tools/memory/register.ts +4 -9
package/src/tools/network/web-fetch.ts +3 -9
package/src/tools/network/web-search.ts +25 -32
package/src/tools/registry.ts +7 -23
package/src/tools/schema-transforms.ts +1 -1
package/src/tools/skills/execute.ts +3 -9
package/src/tools/skills/load.ts +3 -9
package/src/tools/skills/skill-tool-factory.ts +1 -8
package/src/tools/subagent/notify-parent.ts +3 -9
package/src/tools/system/request-permission.ts +3 -9
package/src/tools/terminal/shell.ts +3 -9
package/src/tools/tool-defaults.ts +94 -0
package/src/tools/types.ts +27 -98
package/src/tools/ui-surface/definitions.ts +6 -22
package/src/usage/pricing.ts +23 -0
package/src/usage/types.ts +12 -0
package/src/util/logger.ts +16 -7
package/src/util/platform.ts +7 -2
package/src/util/sqlite3-runtime.ts +65 -0
package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +1 -0
package/src/workspace/migrations/089-move-memory-tree-out-of-v3.ts +86 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/compaction-strip-metadata-clear.test.ts +0 -206
package/src/__tests__/message-complete-display-id.test.ts +0 -175
package/src/daemon/query-complexity-router.ts +0 -75
package/src/prompts/cache-boundary.ts +0 -8

package/src/runtime/routes/conversation-routes.ts CHANGED

@@ -20,6 +20,10 @@ import {
 } from "../../channels/types.js";
 import { isHttpAuthDisabled } from "../../config/env.js";
 import { getConfig } from "../../config/loader.js";
+import {
+  mergeConsecutiveAssistantMessages,
+  mergeToolResultsIntoAssistantMessages,
+} from "../../conversations/message-consolidation.js";
 import { createApprovalConversationGenerator } from "../../daemon/approval-generators.js";
 import type { Conversation } from "../../daemon/conversation.js";
 import {
@@ -121,7 +125,12 @@ import {
   resolveTrustContext,
   withSourceChannel,
 } from "../trust-context-resolver.js";
-import { BadRequestError, InternalError, RouteError } from "./errors.js";
+import {
+  BadRequestError,
+  InternalError,
+  NotFoundError,
+  RouteError,
+} from "./errors.js";
 import type { RouteDefinition, RouteHandlerArgs } from "./types.js";
 import { RouteResponse } from "./types.js";
@@ -142,6 +151,34 @@ function isValidRiskThreshold(value: unknown): value is RiskThreshold {
   );
 }
+// ---------------------------------------------------------------------------
+// Temporary fix — remove when #31994 lands
+// ---------------------------------------------------------------------------
+//
+// The canned-response paths in this file (canned greeting, inline approval
+// reply, slash command, /compact, /clean) bypass the agent loop and so don't
+// pick up the per-turn anchor id allocated in conversation-agent-loop.ts.
+// Their `message_complete` events therefore went out without `messageId`,
+// and the macOS client filter at ChatActionHandler.swift:507 dropped those
+// events when they raced past the 50 ms streaming-buffer flush — leaving
+// `isSending` stuck for the full 60 s watchdog window.
+//
+// Centralized so the patch surface is one helper + N one-line callers rather
+// than N duplicated literals. When #31994 lands and stamps these sites with
+// `state.assistantTurnId` directly, grep for `emitCannedMessageComplete` to
+// find every call site and inline-then-delete.
+function emitCannedMessageComplete(
+  send: (msg: ServerMessage) => void,
+  conversationId: string,
+  persistedAssistantId: string,
+): void {
+  send({
+    type: "message_complete",
+    conversationId,
+    messageId: persistedAssistantId,
+  });
+}
 /**
  * True when a message's persisted metadata explicitly flags it as hidden.
  * Used to suppress internal scaffolding messages from UI history while
@@ -283,6 +320,8 @@ async function tryConsumeCanonicalGuardianReply(params: {
   verifiedActorExternalUserId?: string;
   /** Verified actor principal ID for principal-based authorization. */
   verifiedActorPrincipalId?: string;
+  /** Originating client identifier for sync_changed self-echo suppression. */
+  originClientId?: string;
 }): Promise<{ consumed: boolean; messageId?: string }> {
   const {
     conversationId,
@@ -295,6 +334,7 @@ async function tryConsumeCanonicalGuardianReply(params: {
     approvalConversationGenerator,
     verifiedActorExternalUserId,
     verifiedActorPrincipalId,
+    originClientId,
   } = params;
   const trimmedContent = content.trim();
@@ -392,7 +432,7 @@ async function tryConsumeCanonicalGuardianReply(params: {
         ? "Decision applied."
         : "Request already resolved.");
     const assistantMessage = createAssistantMessage(replyText);
-    await addMessage(
+    const persistedAssistant = await addMessage(
       conversationId,
       "assistant",
       JSON.stringify(assistantMessage.content),
@@ -407,9 +447,9 @@ async function tryConsumeCanonicalGuardianReply(params: {
         text: replyText,
         conversationId: conversationId,
       });
-      onEvent({ type: "message_complete", conversationId: conversationId });
+      emitCannedMessageComplete(onEvent, conversationId, persistedAssistant.id);
     }
-    publishConversationMessagesChanged(conversationId);
+    publishConversationMessagesChanged(conversationId, originClientId);
   } catch (err) {
     log.warn(
       { err, conversationId },
@@ -792,14 +832,8 @@ export function handleListMessages({
     // on createdAt. The mismatch is benign — it may return slightly extra
     // data on a page boundary but never loses messages.
     const displayTimestamp = m.sentAt ?? m.timestamp;
-    const mergedMessageIds = mergedIdMap.get(m.id) ?? [];
-    const daemonMessageId =
-      m.role === "assistant"
-        ? (mergedMessageIds[mergedMessageIds.length - 1] ?? m.id)
-        : undefined;
     return {
       id: m.id ?? "",
-      ...(daemonMessageId ? { daemonMessageId } : {}),
       role: m.role,
       content: m.text,
       timestamp: new Date(displayTimestamp).toISOString(),
@@ -849,305 +883,6 @@ export function handleListMessages({
   return { messages };
 }
-// ── Tool-result merging ─────────────────────────────────────────────
-function isToolResultType(type: string): boolean {
-  return type === "tool_result" || type === "web_search_tool_result";
-}
-function isSystemNoticeText(block: Record<string, unknown>): boolean {
-  if (block.type !== "text") return false;
-  const text = typeof block.text === "string" ? block.text : "";
-  return (
-    text.startsWith("<system_notice>") && text.endsWith("</system_notice>")
-  );
-}
-/**
- * Merge tool_result blocks from user messages into the preceding assistant
- * message's content array. This lets renderHistoryContent's pendingToolUses
- * map pair tool_use and tool_result blocks, preventing "unknown" tool names.
- *
- * User messages that consist entirely of tool_result blocks (and optional
- * system_notice text) are removed from the output. Mixed messages (tool_result
- * + real user text) keep only the non-tool-result blocks.
- */
-function mergeToolResultsIntoAssistantMessages(
-  messages: MessageRow[],
-): MessageRow[] {
-  // Index of the most recent assistant message in the output array.
-  let lastAssistantIdx = -1;
-  // Parsed content caches — lazily populated per assistant message.
-  const parsedAssistantContent = new Map<number, unknown[]>();
-  const result: MessageRow[] = [];
-  for (const msg of messages) {
-    if (msg.role === "assistant") {
-      lastAssistantIdx = result.length;
-      result.push(msg);
-      continue;
-    }
-    // Only process user messages — other roles pass through.
-    if (msg.role !== "user") {
-      result.push(msg);
-      continue;
-    }
-    let blocks: unknown[];
-    try {
-      const parsed = JSON.parse(msg.content);
-      if (!Array.isArray(parsed)) {
-        result.push(msg);
-        continue;
-      }
-      blocks = parsed;
-    } catch {
-      result.push(msg);
-      continue;
-    }
-    // Separate tool-result blocks from real user content.
-    const toolResultBlocks: unknown[] = [];
-    const otherBlocks: unknown[] = [];
-    for (const block of blocks) {
-      if (
-        typeof block === "object" &&
-        block !== null &&
-        typeof (block as Record<string, unknown>).type === "string"
-      ) {
-        const rec = block as Record<string, unknown>;
-        if (isToolResultType(rec.type as string)) {
-          toolResultBlocks.push(block);
-        } else if (isSystemNoticeText(rec)) {
-          // System notices don't count as user content — drop them when
-          // the message is otherwise tool-result-only.
-          otherBlocks.push(block);
-        } else {
-          otherBlocks.push(block);
-        }
-      } else {
-        otherBlocks.push(block);
-      }
-    }
-    // No tool results → pass through unchanged. System notices are only
-    // injected alongside tool results in the agent loop, so a pure user
-    // message (no tool_result blocks) should never be filtered — even if
-    // the user's text happens to look like a system_notice tag.
-    if (toolResultBlocks.length === 0) {
-      result.push(msg);
-      continue;
-    }
-    // Append tool_result blocks to the preceding assistant message's content.
-    if (lastAssistantIdx >= 0) {
-      const assistant = result[lastAssistantIdx];
-      let assistantContent = parsedAssistantContent.get(lastAssistantIdx);
-      if (!assistantContent) {
-        try {
-          const parsed = JSON.parse(assistant.content);
-          assistantContent = Array.isArray(parsed) ? parsed : [parsed];
-        } catch {
-          assistantContent = [];
-        }
-        parsedAssistantContent.set(lastAssistantIdx, assistantContent);
-      }
-      assistantContent.push(...toolResultBlocks);
-    } else {
-      // No preceding assistant message (pagination boundary) — keep the
-      // original message as-is to avoid permanent data loss. The preceding
-      // assistant tool_use lives in the previous page; dropping the result
-      // here would be unrecoverable.
-      // Still strip system notices so internal prompt text isn't exposed.
-      const filteredBlocks = blocks.filter(
-        (b) =>
-          !(
-            typeof b === "object" &&
-            b !== null &&
-            isSystemNoticeText(b as Record<string, unknown>)
-          ),
-      );
-      result.push({
-        ...msg,
-        content:
-          filteredBlocks.length === blocks.length
-            ? msg.content
-            : JSON.stringify(filteredBlocks),
-      });
-      continue;
-    }
-    // If the user message had only tool_result (+ system_notice) blocks,
-    // suppress it entirely. Otherwise keep the non-tool-result content.
-    const realUserContent = otherBlocks.filter(
-      (b) =>
-        !(
-          typeof b === "object" &&
-          b !== null &&
-          isSystemNoticeText(b as Record<string, unknown>)
-        ),
-    );
-    if (realUserContent.length > 0) {
-      result.push({ ...msg, content: JSON.stringify(otherBlocks) });
-    }
-    // else: tool-result-only → suppressed (results already merged above)
-  }
-  // Write back any modified assistant message content.
-  for (const [idx, content] of parsedAssistantContent) {
-    result[idx] = { ...result[idx], content: JSON.stringify(content) };
-  }
-  return result;
-}
-// ── Consecutive assistant message merging ────────────────────────────
-/** Parse a message's JSON content into an array of content blocks. */
-function parseContentBlocks(content: string): unknown[] {
-  try {
-    const parsed = JSON.parse(content);
-    return Array.isArray(parsed) ? parsed : [parsed];
-  } catch (err) {
-    log.warn(
-      { err },
-      "Failed to parse content blocks during assistant message merge",
-    );
-    return [];
-  }
-}
-/**
- * Append content blocks from a donor message onto a target block array.
- * Parses the donor's JSON content and pushes each block into `target`.
- */
-function appendContentBlocks(target: unknown[], donorContent: string): void {
-  try {
-    const parsed = JSON.parse(donorContent);
-    if (Array.isArray(parsed)) {
-      target.push(...parsed);
-    } else {
-      target.push(parsed);
-    }
-  } catch (err) {
-    log.warn(
-      { err },
-      "Failed to parse donor content blocks during assistant message merge",
-    );
-  }
-}
-/**
- * Promote metadata fields from a donor message to the surviving message
- * when the survivor lacks them. Currently promotes `subagentNotification`.
- * Returns a new MessageRow if promotion occurred, otherwise the original.
- */
-function promoteMetadata(survivor: MessageRow, donor: MessageRow): MessageRow {
-  if (donor.metadata && survivor.metadata) {
-    try {
-      const survivorMeta = JSON.parse(survivor.metadata);
-      const donorMeta = JSON.parse(donor.metadata);
-      if (
-        !survivorMeta.subagentNotification &&
-        donorMeta.subagentNotification
-      ) {
-        survivorMeta.subagentNotification = donorMeta.subagentNotification;
-        return { ...survivor, metadata: JSON.stringify(survivorMeta) };
-      }
-    } catch (err) {
-      log.warn(
-        { err },
-        "Failed to parse metadata during assistant message merge",
-      );
-    }
-  } else if (donor.metadata && !survivor.metadata) {
-    return { ...survivor, metadata: donor.metadata };
-  }
-  return survivor;
-}
-/**
- * Merge consecutive assistant messages into a single message at query time.
- *
- * During streaming, all assistant turns within one agent loop accumulate on
- * a single client-side ChatMessage. In the DB, each API turn is stored as a
- * separate assistant row (consolidation is deferred to compaction for
- * prefix-cache stability). This produces N separate assistant messages that
- * the client renders as N individual bubbles — each showing "Completed 1
- * step" instead of one grouped "Completed N steps" accordion.
- *
- * This function concatenates the content block arrays of consecutive
- * assistant messages (no intervening user messages after tool-result
- * merging) into the first message of each run. The merged messages are
- * removed from the output. This is query-time only — the DB is not
- * modified.
- *
- * The first message in each run keeps its id, createdAt, and metadata so
- * that attachment lookups, display timestamps, and subagent notifications
- * continue to work. Metadata from later messages in the run (e.g.
- * subagentNotification) is preserved by promoting it to the surviving
- * message when the surviving message has no metadata of its own for that
- * field.
- */
-function mergeConsecutiveAssistantMessages(messages: MessageRow[]): {
-  messages: MessageRow[];
-  /** Maps each surviving message ID → all original message IDs merged into it. */
-  mergedIdMap: Map<string, string[]>;
-} {
-  const result: MessageRow[] = [];
-  // Key = index in `result`, value = accumulated content blocks.
-  const pendingMerges = new Map<number, unknown[]>();
-  // Key = index in `result`, value = IDs of messages merged into the target.
-  const mergedIds = new Map<number, string[]>();
-  for (const msg of messages) {
-    const lastIdx = result.length - 1;
-    const isConsecutiveAssistant =
-      msg.role === "assistant" &&
-      lastIdx >= 0 &&
-      result[lastIdx].role === "assistant";
-    if (!isConsecutiveAssistant) {
-      result.push(msg);
-      continue;
-    }
-    // Track the donor message ID.
-    let ids = mergedIds.get(lastIdx);
-    if (!ids) {
-      ids = [];
-      mergedIds.set(lastIdx, ids);
-    }
-    ids.push(msg.id);
-    // Lazily parse the target's content on first merge.
-    let targetContent = pendingMerges.get(lastIdx);
-    if (!targetContent) {
-      targetContent = parseContentBlocks(result[lastIdx].content);
-      pendingMerges.set(lastIdx, targetContent);
-    }
-    appendContentBlocks(targetContent, msg.content);
-    result[lastIdx] = promoteMetadata(result[lastIdx], msg);
-  }
-  // Write back merged content for any messages that were targets.
-  for (const [idx, content] of pendingMerges) {
-    result[idx] = { ...result[idx], content: JSON.stringify(content) };
-  }
-  // Build the merged ID map keyed by surviving message ID.
-  const mergedIdMap = new Map<string, string[]>();
-  for (const [idx, ids] of mergedIds) {
-    mergedIdMap.set(result[idx].id, ids);
-  }
-  return { messages: result, mergedIdMap };
-}
-/**
 /**
  * Persist the pre-chat onboarding payload to disk.
  *
@@ -1240,6 +975,7 @@ export async function handleSendMessage(
 ): Promise<unknown> {
   const body = (rawBody ?? {}) as {
     conversationKey?: string;
+    conversationId?: string;
     content?: string;
     attachmentIds?: string[];
     sourceChannel?: string;
@@ -1271,8 +1007,14 @@ export async function handleSendMessage(
   const actorPrincipalId = headers?.["x-vellum-actor-principal-id"];
   const principalType = headers?.["x-vellum-principal-type"];
+  const originClientId =
+    headers?.["x-vellum-client-id"]?.trim() || undefined;
   const { conversationKey, content, attachmentIds } = body;
+  const inboundConversationId =
+    typeof body.conversationId === "string" && body.conversationId.length > 0
+      ? body.conversationId
+      : undefined;
   const clientMessageId =
     typeof body.clientMessageId === "string" ? body.clientMessageId : undefined;
   const requestedInferenceProfile =
@@ -1340,12 +1082,6 @@ export async function handleSendMessage(
       ? (canonicalizeTimeZone(body.clientTimezone) ?? undefined)
       : undefined;
-  // When conversationKey is omitted, derive a stable default from
-  // sourceChannel + sourceInterface so that repeated calls from the same
-  // channel/interface pair share a single conversation thread.
-  const resolvedConversationKey =
-    conversationKey ?? `default:${sourceChannel}:${sourceInterface}`;
   // Reject non-string content values (numbers, objects, etc.)
   if (content != null && typeof content !== "string") {
     throw new BadRequestError("content must be a string");
@@ -1409,9 +1145,40 @@ export async function handleSendMessage(
   // timer so the next heartbeat is a full interval after this interaction.
   HeartbeatService.getInstance()?.resetTimer();
-  const mapping = getOrCreateConversation(resolvedConversationKey, {
-    conversationType: "standard",
-  });
+  // Resolve the target conversation. Fetch by `conversationId` (the
+  // assistant-minted internal id) when the client supplies it — clients
+  // must obtain this id from a prior daemon response, so a missing row
+  // is a 404. Otherwise fall through to the external-key path: the
+  // client-supplied `conversationKey` (used by non-vellum channels and
+  // the web idempotency flow) or, when neither is provided, a stable
+  // default keyed on sourceChannel + sourceInterface so repeated calls
+  // from the same channel/interface share a single thread.
+  let mapping: {
+    conversationId: string;
+    conversationType: string;
+    created: boolean;
+  };
+  if (inboundConversationId !== undefined) {
+    const existing = getConversation(inboundConversationId);
+    if (!existing) {
+      throw new NotFoundError(
+        `Conversation ${inboundConversationId} not found`,
+      );
+    }
+    mapping = {
+      conversationId: existing.id,
+      conversationType: existing.conversationType,
+      created: false,
+    };
+  } else {
+    const resolvedConversationKey =
+      conversationKey && conversationKey.length > 0
+        ? conversationKey
+        : `default:${sourceChannel}:${sourceInterface}`;
+    mapping = getOrCreateConversation(resolvedConversationKey, {
+      conversationType: "standard",
+    });
+  }
   if (requestedRiskThreshold !== undefined) {
     const result = await ipcCall("set_conversation_threshold", {
@@ -1445,6 +1212,7 @@ export async function handleSendMessage(
       publishConversationListAndMetadataChanged(
         "created",
         mapping.conversationId,
+        originClientId,
       );
     }
   }
@@ -1664,7 +1432,7 @@ export async function handleSendMessage(
       const conversationId = mapping.conversationId;
       const assistantMsg = createAssistantMessage(cannedGreeting);
-      await addMessage(
+      const persistedAssistant = await addMessage(
         mapping.conversationId,
         "assistant",
         JSON.stringify(assistantMsg.content),
@@ -1708,8 +1476,12 @@ export async function handleSendMessage(
           text: cannedGreeting,
           conversationId,
         });
-        broadcastMessage({ type: "message_complete", conversationId });
-        publishConversationMessagesChanged(conversationId);
+        emitCannedMessageComplete(
+          broadcastMessage,
+          conversationId,
+          persistedAssistant.id,
+        );
+        publishConversationMessagesChanged(conversationId, originClientId);
         conversation.processing = false;
         silentlyWithLog(
           conversation.drainQueue(),
@@ -1787,6 +1559,7 @@ export async function handleSendMessage(
           : deps.approvalConversationGenerator,
       verifiedActorExternalUserId,
       verifiedActorPrincipalId,
+      originClientId,
     });
     if (inlineReplyResult.consumed) {
       return {
@@ -1975,7 +1748,7 @@ export async function handleSendMessage(
       conversation.getMessages().push(llmMsg);
       const assistantMsg = createAssistantMessage(slashResult.message);
-      await addMessage(
+      const persistedAssistant = await addMessage(
         mapping.conversationId,
         "assistant",
         JSON.stringify(assistantMsg.content),
@@ -2030,11 +1803,12 @@ export async function handleSendMessage(
           text: message,
           conversationId,
         });
-        broadcastMessage({
-          type: "message_complete",
-          conversationId: conversationId,
-        });
-        publishConversationMessagesChanged(conversationId);
+        emitCannedMessageComplete(
+          broadcastMessage,
+          conversationId,
+          persistedAssistant.id,
+        );
+        publishConversationMessagesChanged(conversationId, originClientId);
         conversation.processing = false;
         silentlyWithLog(conversation.drainQueue(), "slash-command queue drain");
       }, 0);
@@ -2062,12 +1836,22 @@ export async function handleSendMessage(
       assistantMessageInterface: sourceInterface,
     };
     const cleanMsg = createUserMessage(rawContent, attachments);
-    const persisted = await addMessage(
-      mapping.conversationId,
-      "user",
-      JSON.stringify(cleanMsg.content),
-      channelMeta,
-    );
+    let persisted: Awaited<ReturnType<typeof addMessage>>;
+    try {
+      persisted = await addMessage(
+        mapping.conversationId,
+        "user",
+        JSON.stringify(cleanMsg.content),
+        channelMeta,
+      );
+    } catch (err) {
+      // The fire-and-forget compaction below owns clearing `processing`, but a
+      // throw from this initial persist never reaches it — reset here so the
+      // conversation isn't stranded in queued mode.
+      conversation.processing = false;
+      silentlyWithLog(conversation.drainQueue(), "compact-command queue drain");
+      throw err;
+    }
     conversation.getMessages().push(cleanMsg);
     const conversationId = mapping.conversationId;
@@ -2085,7 +1869,7 @@ export async function handleSendMessage(
           messageId: persisted.id,
           clientMessageId,
         });
-        publishConversationMessagesChanged(conversationId);
+        publishConversationMessagesChanged(conversationId, originClientId);
         conversation.emitActivityState(
           "thinking",
           "context_compacting",
@@ -2097,7 +1881,7 @@ export async function handleSendMessage(
         const responseText = formatCompactResult(result);
         const assistantMsg = createAssistantMessage(responseText);
-        await addMessage(
+        const persistedAssistant = await addMessage(
           conversationId,
           "assistant",
           JSON.stringify(assistantMsg.content),
@@ -2111,11 +1895,15 @@ export async function handleSendMessage(
           text: responseText,
           conversationId,
         });
-        broadcastMessage({ type: "message_complete", conversationId });
-        publishConversationMessagesChanged(conversationId);
+        emitCannedMessageComplete(
+          broadcastMessage,
+          conversationId,
+          persistedAssistant.id,
+        );
+        publishConversationMessagesChanged(conversationId, originClientId);
       } catch (err) {
         if (assistantMessagePersisted) {
-          publishConversationMessagesChanged(conversationId);
+          publishConversationMessagesChanged(conversationId, originClientId);
         }
         log.error({ err, conversationId }, "Compact command failed");
         broadcastMessage({
@@ -2143,78 +1931,87 @@ export async function handleSendMessage(
   if (slashResult.kind === "clean") {
     conversation.processing = true;
-    const provenance = provenanceFromTrustContext(conversation.trustContext);
-    const channelMeta = {
-      ...provenance,
-      userMessageChannel: sourceChannel,
-      assistantMessageChannel: sourceChannel,
-      userMessageInterface: sourceInterface,
-      assistantMessageInterface: sourceInterface,
-    };
-    const cleanMsg = createUserMessage(rawContent, attachments);
-    const persisted = await addMessage(
-      mapping.conversationId,
-      "user",
-      JSON.stringify(cleanMsg.content),
-      channelMeta,
-    );
-    conversation.getMessages().push(cleanMsg);
     const conversationId = mapping.conversationId;
-    let assistantMessagePersisted = false;
+    // Outer try/finally guarantees the processing flag is cleared (and the
+    // queue drained) on every failure path — including a throw from the
+    // initial user-message persist below, which would otherwise leave the
+    // conversation stuck in queued mode indefinitely.
     try {
-      broadcastMessage({
-        type: "user_message_echo",
-        text: rawContent,
-        conversationId,
-        messageId: persisted.id,
-        clientMessageId,
-      });
-      publishConversationMessagesChanged(conversationId);
-      const result = await conversation.forceClean();
-      const responseText = formatCleanResult(result);
-      const assistantMsg = createAssistantMessage(responseText);
-      await addMessage(
-        conversationId,
-        "assistant",
-        JSON.stringify(assistantMsg.content),
+      const provenance = provenanceFromTrustContext(conversation.trustContext);
+      const channelMeta = {
+        ...provenance,
+        userMessageChannel: sourceChannel,
+        assistantMessageChannel: sourceChannel,
+        userMessageInterface: sourceInterface,
+        assistantMessageInterface: sourceInterface,
+      };
+      const cleanMsg = createUserMessage(rawContent, attachments);
+      const persisted = await addMessage(
+        mapping.conversationId,
+        "user",
+        JSON.stringify(cleanMsg.content),
         channelMeta,
       );
-      assistantMessagePersisted = true;
-      conversation.getMessages().push(assistantMsg);
+      conversation.getMessages().push(cleanMsg);
-      broadcastMessage({
-        type: "assistant_text_delta",
-        text: responseText,
-        conversationId,
-      });
-      broadcastMessage({ type: "message_complete", conversationId });
-      publishConversationMessagesChanged(conversationId);
-    } catch (err) {
-      if (assistantMessagePersisted) {
-        publishConversationMessagesChanged(conversationId);
+      let assistantMessagePersisted = false;
+      try {
+        broadcastMessage({
+          type: "user_message_echo",
+          text: rawContent,
+          conversationId,
+          messageId: persisted.id,
+          clientMessageId,
+        });
+        publishConversationMessagesChanged(conversationId, originClientId);
+        const result = await conversation.forceClean();
+        const responseText = formatCleanResult(result);
+        const assistantMsg = createAssistantMessage(responseText);
+        const persistedAssistant = await addMessage(
+          conversationId,
+          "assistant",
+          JSON.stringify(assistantMsg.content),
+          channelMeta,
+        );
+        assistantMessagePersisted = true;
+        conversation.getMessages().push(assistantMsg);
+        broadcastMessage({
+          type: "assistant_text_delta",
+          text: responseText,
+          conversationId,
+        });
+        emitCannedMessageComplete(
+          broadcastMessage,
+          conversationId,
+          persistedAssistant.id,
+        );
+        publishConversationMessagesChanged(conversationId, originClientId);
+      } catch (err) {
+        if (assistantMessagePersisted) {
+          publishConversationMessagesChanged(conversationId, originClientId);
+        }
+        log.error({ err, conversationId }, "Clean command failed");
+        broadcastMessage({
+          type: "conversation_error",
+          conversationId,
+          code: "UNKNOWN",
+          userMessage: `Clean failed: ${err instanceof Error ? err.message : String(err)}`,
+          retryable: true,
+        });
       }
-      log.error({ err, conversationId }, "Clean command failed");
-      broadcastMessage({
-        type: "conversation_error",
+      return {
+        accepted: true,
+        messageId: persisted.id,
         conversationId,
-        code: "UNKNOWN",
-        userMessage: `Clean failed: ${err instanceof Error ? err.message : String(err)}`,
-        retryable: true,
-      });
+      };
     } finally {
       conversation.processing = false;
       silentlyWithLog(conversation.drainQueue(), "clean-command queue drain");
     }
-    return {
-      accepted: true,
-      messageId: persisted.id,
-      conversationId,
-    };
   }
   const resolvedContent = slashResult.content;
@@ -2240,7 +2037,7 @@ export async function handleSendMessage(
     requestId,
     clientMessageId,
   });
-  publishConversationMessagesChanged(mapping.conversationId);
+  publishConversationMessagesChanged(mapping.conversationId, originClientId);
   // Fire-and-forget the agent loop; events flow to the hub via broadcastMessage.
   conversation
@@ -2285,14 +2082,25 @@ async function generateLlmSuggestion(
         ? escapeXmlContent(priorUserText)
         : priorUserText;
-  const systemPrompt =
-    "You generate short, casual reply suggestions a user might type next in a chat. Match the tone and register of the preceding conversation. Output only the reply text inside the requested tags — no preamble, no commentary.";
+  const systemPrompt = [
+    "You generate short, casual reply suggestions a user might type next in a chat.",
+    "Match the tone and register of the preceding conversation.",
+    "",
+    "CRITICAL — write from the USER'S perspective only, NEVER from the assistant's:",
+    "- The suggestion is what the USER will type into the chat input",
+    "- Use first-person \"I\" only if the user has used it in their prior messages",
+    "- NEVER start with phrases like \"I can help\", \"Here's what\", \"Let me\", \"I'd suggest\" — those are assistant-voice",
+    "- Think: if you were the user reading the assistant's reply, what question or follow-up would you ask next?",
+    "",
+    "Output only the reply text inside the requested tags — no preamble, no commentary.",
+  ].join("\n");
   const userPrompt =
     `Here is the end of a conversation:\n\n` +
     `<user_message>${truncatedUser ?? "(no prior user message)"}</user_message>\n` +
     `<assistant_message>${truncatedAssistant}</assistant_message>\n\n` +
-    `Write the user's next reply, focusing on the LAST question or call-to-action in the assistant message. Keep it short (under 15 words), casual, and in the user's voice. Respond in this exact format:\n\n` +
+    `Write the USER'S next reply — what the user would type. Focus on the LAST question or call-to-action in the assistant message. Keep it short (under 15 words), casual, and in the user's voice. ` +
+    `The reply must read as something typed BY the user, not something the assistant would say. Respond in this exact format:\n\n` +
     `<reply>YOUR_REPLY_HERE</reply>`;
   // Single user message only — no assistant-role prefill. Anthropic
@@ -2368,14 +2176,27 @@ export async function handleGetSuggestion(
   };
   const conversationKey = queryParams?.conversationKey;
-  if (!conversationKey) {
-    throw new BadRequestError("conversationKey query parameter is required");
+  const conversationId = queryParams?.conversationId;
+  if (!conversationKey && !conversationId) {
+    throw new BadRequestError(
+      "conversationKey or conversationId query parameter is required",
+    );
   }
-  const mapping = getConversationByKey(conversationKey);
-  if (!mapping) return noSuggestion;
+  let resolvedConversationId: string | undefined;
+  if (conversationId) {
+    resolvedConversationId = conversationId;
+  } else if (conversationKey) {
+    const mapping = getConversationByKey(conversationKey);
+    if (mapping) {
+      resolvedConversationId = mapping.conversationId;
+    } else if (getConversation(conversationKey)) {
+      resolvedConversationId = conversationKey;
+    }
+  }
+  if (!resolvedConversationId) return noSuggestion;
-  const rawMessages = getMessages(mapping.conversationId);
+  const rawMessages = getMessages(resolvedConversationId);
   if (rawMessages.length === 0) return noSuggestion;
   // Staleness check: compare requested messageId against the latest
@@ -2629,10 +2450,31 @@ export const ROUTES: RouteDefinition[] = [
     description:
       "Return an LLM-generated follow-up suggestion for the most recent assistant message.",
     tags: ["messages"],
+    queryParams: [
+      {
+        name: "conversationId",
+        type: "string",
+        description:
+          "Conversation ID to fetch a suggestion for. Either this or conversationKey is required.",
+      },
+      {
+        name: "conversationKey",
+        type: "string",
+        description:
+          "Legacy conversation key. Either this or conversationId is required.",
+      },
+      {
+        name: "messageId",
+        type: "string",
+        description:
+          "Optional. Latest assistant message ID the client has seen — used to detect staleness.",
+      },
+    ],
     responseBody: z.object({
-      suggestion: z.string(),
-      messageId: z.string(),
+      suggestion: z.string().nullable(),
+      messageId: z.string().nullable(),
       source: z.string(),
+      stale: z.boolean().optional(),
     }),
     handler: async (args) =>
       handleGetSuggestion(args, {