npm - @vellumai/assistant - Versions diffs - 0.8.4 → 0.8.5 - Mend

@vellumai/assistant 0.8.4 → 0.8.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (438)

package/ARCHITECTURE.md +2 -2
package/docs/browser-use-architecture-phase2.md +1 -1
package/knip.json +2 -1
package/openapi.yaml +809 -11
package/package.json +1 -1
package/src/__tests__/anthropic-provider.test.ts +34 -37
package/src/__tests__/assistant-event-hub-self-exclusion.test.ts +293 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -3
package/src/__tests__/audit-log-rotation.test.ts +70 -16
package/src/__tests__/background-workers-disk-pressure.test.ts +3 -3
package/src/__tests__/btw-routes.test.ts +2 -3
package/src/__tests__/call-controller.test.ts +0 -1
package/src/__tests__/cancel-resolves-conversation-key.test.ts +1 -1
package/src/__tests__/channel-guardian.test.ts +3 -3
package/src/__tests__/checker.test.ts +6 -15
package/src/__tests__/compaction-events.test.ts +1 -0
package/src/__tests__/compactor-call-site-logging.test.ts +214 -0
package/src/__tests__/computer-use-skill-manifest-regression.test.ts +5 -11
package/src/__tests__/computer-use-tools.test.ts +2 -4
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +197 -2
package/src/__tests__/conversation-agent-loop.test.ts +163 -122
package/src/__tests__/conversation-app-control-instantiation.test.ts +2 -5
package/src/__tests__/conversation-clear-safety.test.ts +25 -25
package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +1 -1
package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
package/src/__tests__/conversation-error.test.ts +31 -0
package/src/__tests__/conversation-fork-crud.test.ts +178 -15
package/src/__tests__/conversation-lifecycle.test.ts +52 -11
package/src/__tests__/{conversation-load-cleaned-at.test.ts → conversation-load-history-stripped.test.ts} +13 -13
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
package/src/__tests__/conversation-routes-disk-view.test.ts +109 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +35 -0
package/src/__tests__/conversation-skill-tools.test.ts +2 -5
package/src/__tests__/conversation-store.test.ts +1 -1
package/src/__tests__/conversation-sync-tags.test.ts +99 -32
package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -0
package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/credential-execution-feature-gates.test.ts +9 -7
package/src/__tests__/credential-execution-tools.test.ts +6 -6
package/src/__tests__/credential-security-invariants.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +2 -2
package/src/__tests__/dynamic-page-surface.test.ts +2 -2
package/src/__tests__/email-html-renderer.test.ts +12 -0
package/src/__tests__/gateway-flag-listener.test.ts +237 -0
package/src/__tests__/gemini-provider.test.ts +78 -0
package/src/__tests__/guardian-dispatch.test.ts +0 -1
package/src/__tests__/guardian-outbound-http.test.ts +7 -5
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +1 -1
package/src/__tests__/heartbeat-disk-pressure.test.ts +4 -0
package/src/__tests__/heartbeat-service.test.ts +4 -0
package/src/__tests__/host-shell-tool.test.ts +1 -1
package/src/__tests__/init-feature-flag-overrides.test.ts +5 -6
package/src/__tests__/list-messages-tool-merge.test.ts +70 -11
package/src/__tests__/llm-request-log-call-site.test.ts +136 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +26 -0
package/src/__tests__/llm-resolver.test.ts +77 -9
package/src/__tests__/llm-usage-store.test.ts +66 -0
package/src/__tests__/logger.test.ts +89 -0
package/src/__tests__/mcp-abort-signal.test.ts +2 -2
package/src/__tests__/media-generate-image.test.ts +31 -0
package/src/__tests__/memory-v2-static-injector.test.ts +7 -7
package/src/__tests__/model-intents.test.ts +2 -4
package/src/__tests__/notification-guardian-path.test.ts +0 -1
package/src/__tests__/onboarding-template-contract.test.ts +1 -1
package/src/__tests__/openai-provider.test.ts +46 -0
package/src/__tests__/openai-responses-provider.test.ts +114 -12
package/src/__tests__/pending-interactions-resolved-event.test.ts +0 -1
package/src/__tests__/platform-bash-auto-approve.test.ts +2 -2
package/src/__tests__/platform.test.ts +2 -2
package/src/__tests__/plugin-api-tool-definition.test.ts +92 -0
package/src/__tests__/plugin-bootstrap.test.ts +2 -2
package/src/__tests__/plugin-tool-contribution.test.ts +13 -6
package/src/__tests__/plugin-types.test.ts +3 -2
package/src/__tests__/prechat-onboarding-contract.test.ts +131 -98
package/src/__tests__/pricing.test.ts +12 -0
package/src/__tests__/prune-jobs-changes-parser.test.ts +61 -0
package/src/__tests__/registry.test.ts +2 -8
package/src/__tests__/require-fresh-approval.test.ts +2 -2
package/src/__tests__/runtime-events-sse-bilingual.test.ts +154 -0
package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -1
package/src/__tests__/skill-feature-flags.test.ts +2 -2
package/src/__tests__/skill-projection-feature-flag.test.ts +4 -7
package/src/__tests__/skill-projection.benchmark.test.ts +2 -6
package/src/__tests__/skill-tool-factory.test.ts +1 -1
package/src/__tests__/subagent-notify-parent.test.ts +1 -1
package/src/__tests__/suggestion-routes.test.ts +1 -0
package/src/__tests__/sync-message-contract.test.ts +59 -0
package/src/__tests__/system-prompt.test.ts +145 -131
package/src/__tests__/terminal-tools.test.ts +1 -1
package/src/__tests__/tool-approval-handler.test.ts +1 -5
package/src/__tests__/tool-execute-pipeline.test.ts +2 -2
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -5
package/src/__tests__/tool-executor-lifecycle-events.test.ts +15 -5
package/src/__tests__/tool-executor.test.ts +9 -62
package/src/__tests__/tool-grant-request-escalation.test.ts +1 -6
package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -6
package/src/__tests__/trusted-contact-multichannel.test.ts +0 -1
package/src/__tests__/ui-file-upload-surface.test.ts +2 -2
package/src/__tests__/usage-routes.test.ts +3 -0
package/src/__tests__/verification-control-plane-policy.test.ts +2 -2
package/src/__tests__/workspace-git-service.test.ts +6 -5
package/src/__tests__/workspace-migration-089-move-memory-tree-out-of-v3.test.ts +86 -0
package/src/acp/__tests__/prepare-agent-env.test.ts +146 -0
package/src/acp/prepare-agent-env.ts +78 -0
package/src/acp/session-manager.ts +1 -1
package/src/agent/loop.ts +8 -0
package/src/api/README.md +5 -0
package/src/api/index.ts +4 -0
package/src/api/package.json +10 -0
package/src/background-wake/background-wake-routes.test.ts +233 -0
package/src/background-wake/runtime-registry.ts +24 -0
package/src/cli/commands/__tests__/browser.test.ts +23 -5
package/src/cli/commands/__tests__/domain-register.test.ts +110 -0
package/src/cli/commands/__tests__/domain-status.test.ts +33 -33
package/src/cli/commands/__tests__/inference-send.test.ts +108 -5
package/src/cli/commands/__tests__/memory-v2-compare-render.test.ts +98 -0
package/src/cli/commands/__tests__/memory-v2.test.ts +1 -0
package/src/cli/commands/__tests__/memory-v3-render.test.ts +340 -0
package/src/cli/commands/browser.ts +247 -0
package/src/cli/commands/domain.ts +91 -41
package/src/cli/commands/inference.ts +93 -40
package/src/cli/commands/memory-v2-compare-render.ts +115 -0
package/src/cli/commands/memory-v2.ts +176 -1
package/src/cli/commands/memory-v3-render.ts +344 -0
package/src/cli/commands/memory-v3.ts +316 -0
package/src/cli/program.ts +2 -0
package/src/config/assistant-feature-flags.ts +21 -9
package/src/config/bundled-skills/document-editor/SKILL.md +11 -2
package/src/config/bundled-skills/document-editor/TOOLS.json +18 -0
package/src/config/bundled-skills/document-editor/tools/document-open.ts +12 -0
package/src/config/bundled-skills/image-studio/SKILL.md +4 -0
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -2
package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +13 -8
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +10 -3
package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +16 -14
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +7 -2
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +7 -2
package/src/config/bundled-tool-registry.ts +2 -0
package/src/config/call-site-defaults.ts +7 -6
package/src/config/feature-flag-registry.json +16 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +213 -1
package/src/config/schemas/call-site-catalog.ts +21 -7
package/src/config/schemas/llm.ts +12 -1
package/src/config/schemas/memory-v2.ts +246 -0
package/src/config/schemas/memory.ts +2 -1
package/src/context/compactor.ts +52 -0
package/src/conversations/__tests__/message-consolidation.test.ts +350 -0
package/src/conversations/message-consolidation.ts +404 -0
package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +1 -1
package/src/daemon/__tests__/meet-manifest-loader.test.ts +1 -1
package/src/daemon/conversation-agent-loop-handlers.ts +2 -13
package/src/daemon/conversation-agent-loop.ts +126 -76
package/src/daemon/conversation-error.ts +31 -1
package/src/daemon/conversation-lifecycle.ts +27 -22
package/src/daemon/conversation-runtime-assembly.ts +10 -9
package/src/daemon/conversation-tool-setup.ts +63 -3
package/src/daemon/conversation-usage.ts +2 -0
package/src/daemon/conversation.ts +14 -29
package/src/daemon/disk-pressure-guard.ts +14 -2
package/src/daemon/handlers/config-model.test.ts +1 -0
package/src/daemon/handlers/conversations.ts +11 -3
package/src/daemon/host-browser-proxy.ts +5 -5
package/src/daemon/host-cu-proxy.ts +4 -4
package/src/daemon/host-file-proxy.ts +4 -4
package/src/daemon/host-proxy-base.ts +4 -4
package/src/daemon/host-transfer-proxy.ts +10 -10
package/src/daemon/lifecycle.ts +23 -20
package/src/daemon/meet-manifest-loader.ts +1 -7
package/src/daemon/message-types/conversations.ts +6 -9
package/src/daemon/message-types/home.ts +1 -13
package/src/daemon/message-types/messages.ts +6 -14
package/src/daemon/message-types/sync.ts +14 -0
package/src/daemon/shutdown-handlers.ts +24 -5
package/src/daemon/switch-inference-profile-tool.ts +52 -0
package/src/daemon/tool-setup-types.ts +13 -0
package/src/events/relationship-state-updated.ts +25 -0
package/src/heartbeat/__tests__/heartbeat-service.test.ts +1 -1
package/src/home/home-greeting.ts +0 -9
package/src/home/suggested-prompts.ts +0 -9
package/src/ipc/gateway-flag-listener.ts +123 -0
package/src/ipc/skill-routes/registries.ts +8 -12
package/src/memory/__tests__/db-async-query.test.ts +165 -0
package/src/memory/__tests__/db-maintenance.test.ts +115 -0
package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +241 -0
package/src/memory/__tests__/jobs-store-job-classes.test.ts +28 -1
package/src/memory/__tests__/memory-retrospective-job.test.ts +7 -0
package/src/memory/auto-analysis-enqueue.ts +5 -1
package/src/memory/conversation-crud.ts +71 -70
package/src/memory/conversation-starters-cadence.ts +3 -1
package/src/memory/conversation-title-service.ts +19 -3
package/src/memory/db-async-query.ts +214 -0
package/src/memory/db-init.ts +10 -0
package/src/memory/db-maintenance.ts +30 -21
package/src/memory/graph/bootstrap.ts +8 -1
package/src/memory/graph/capability-seed.ts +7 -3
package/src/memory/graph/conversation-graph-memory.ts +100 -17
package/src/memory/graph/extraction.ts +1 -5
package/src/memory/graph/graph-search.ts +7 -1
package/src/memory/indexer.ts +28 -18
package/src/memory/job-handlers/cleanup.ts +76 -18
package/src/memory/job-handlers/conversation-starters.ts +1 -4
package/src/memory/jobs/embed-pkb-file.ts +6 -1
package/src/memory/jobs-store.ts +14 -0
package/src/memory/jobs-worker.ts +55 -22
package/src/memory/llm-request-log-source-clickhouse.ts +42 -2
package/src/memory/llm-request-log-source-local.ts +7 -0
package/src/memory/llm-request-log-source.ts +9 -2
package/src/memory/llm-request-log-store.ts +43 -1
package/src/memory/llm-usage-store.ts +24 -0
package/src/memory/memory-retrospective-enqueue.ts +8 -1
package/src/memory/memory-retrospective-job.ts +5 -0
package/src/memory/memory-v2-activation-log-store.ts +15 -6
package/src/memory/migrations/260-rename-cleaned-at.ts +44 -0
package/src/memory/migrations/261-llm-usage-add-raw-usage.ts +36 -0
package/src/memory/migrations/262-memory-v3-coactivation.ts +57 -0
package/src/memory/migrations/263-memory-v3-auto-edges.ts +50 -0
package/src/memory/migrations/264-llm-request-log-call-site.ts +29 -0
package/src/memory/migrations/index.ts +17 -0
package/src/memory/migrations/registry.ts +33 -0
package/src/memory/schema/conversations.ts +1 -1
package/src/memory/schema/infrastructure.ts +21 -0
package/src/memory/tool-usage-store.ts +36 -8
package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -0
package/src/memory/v2/__tests__/harness-compare.test.ts +186 -0
package/src/memory/v2/__tests__/harness-metrics.test.ts +74 -0
package/src/memory/v2/__tests__/harness-oracle.test.ts +257 -0
package/src/memory/v2/__tests__/harness-replay-input.test.ts +225 -0
package/src/memory/v2/__tests__/harness-runner.test.ts +109 -0
package/src/memory/v2/__tests__/injection.test.ts +127 -98
package/src/memory/v2/__tests__/qdrant.test.ts +36 -0
package/src/memory/v2/__tests__/router.test.ts +171 -3
package/src/memory/v2/harness/compare.ts +57 -0
package/src/memory/v2/harness/metrics.ts +124 -0
package/src/memory/v2/harness/oracle.ts +145 -0
package/src/memory/v2/harness/replay-input.ts +224 -0
package/src/memory/v2/harness/retriever.ts +74 -0
package/src/memory/v2/harness/router-retriever.ts +43 -0
package/src/memory/v2/harness/runner.ts +106 -0
package/src/memory/v2/harness/trace.ts +58 -0
package/src/memory/v2/injection.ts +21 -15
package/src/memory/v2/prompts/router.ts +26 -1
package/src/memory/v2/qdrant.ts +14 -2
package/src/memory/v2/router.ts +171 -18
package/src/memory/v3/__tests__/coactivation-store.test.ts +422 -0
package/src/memory/v3/__tests__/consolidation-job.test.ts +468 -0
package/src/memory/v3/__tests__/edge-learning-job.test.ts +324 -0
package/src/memory/v3/__tests__/edges.test.ts +563 -0
package/src/memory/v3/__tests__/filter.test.ts +512 -0
package/src/memory/v3/__tests__/gate.test.ts +574 -0
package/src/memory/v3/__tests__/index-composition.test.ts +233 -0
package/src/memory/v3/__tests__/loop.test.ts +530 -0
package/src/memory/v3/__tests__/retriever.test.ts +226 -0
package/src/memory/v3/__tests__/scouts.test.ts +440 -0
package/src/memory/v3/__tests__/shadow-middleware.test.ts +312 -0
package/src/memory/v3/__tests__/system-prompts.test.ts +154 -0
package/src/memory/v3/__tests__/traversal.test.ts +469 -0
package/src/memory/v3/__tests__/tree-index.test.ts +280 -0
package/src/memory/v3/__tests__/tree-store.test.ts +529 -0
package/src/memory/v3/__tests__/tree-walk.test.ts +707 -0
package/src/memory/v3/__tests__/validate.test.ts +245 -0
package/src/memory/v3/auto-edges.ts +223 -0
package/src/memory/v3/coactivation-store.ts +124 -0
package/src/memory/v3/consolidation-job.ts +323 -0
package/src/memory/v3/edge-learning-job.ts +160 -0
package/src/memory/v3/edges.ts +249 -0
package/src/memory/v3/filter.ts +281 -0
package/src/memory/v3/gate.ts +334 -0
package/src/memory/v3/index-composition.ts +113 -0
package/src/memory/v3/llm-capture.ts +46 -0
package/src/memory/v3/loop.ts +382 -0
package/src/memory/v3/maintenance.ts +144 -0
package/src/memory/v3/prompt-context.ts +33 -0
package/src/memory/v3/prompts/consolidation.ts +458 -0
package/src/memory/v3/prompts/system-prompts.ts +196 -0
package/src/memory/v3/retriever.ts +33 -0
package/src/memory/v3/scouts.ts +420 -0
package/src/memory/v3/shadow-middleware.ts +305 -0
package/src/memory/v3/traversal.ts +206 -0
package/src/memory/v3/tree-index.ts +237 -0
package/src/memory/v3/tree-store.ts +394 -0
package/src/memory/v3/tree-walk.ts +351 -0
package/src/memory/v3/types.ts +65 -0
package/src/memory/v3/validate.ts +300 -0
package/src/notifications/adapters/macos.ts +18 -1
package/src/notifications/adapters/platform.ts +1 -1
package/src/notifications/decision-engine.ts +1 -4
package/src/notifications/emit-signal.ts +29 -49
package/src/permissions/prompter.ts +3 -3
package/src/permissions/question-prompter.ts +5 -2
package/src/permissions/secret-prompter.ts +2 -2
package/src/plugin-api/index.ts +4 -0
package/src/plugin-api/types.ts +7 -33
package/src/plugins/defaults/index.ts +6 -0
package/src/plugins/defaults/injectors.ts +18 -11
package/src/plugins/external-plugin-loader.ts +5 -68
package/src/plugins/types.ts +11 -16
package/src/proactive-artifact/aux-message-injector.ts +17 -4
package/src/prompts/__tests__/task-progress-hint-section.test.ts +3 -9
package/src/prompts/persona-resolver.ts +36 -21
package/src/prompts/sections.ts +39 -7
package/src/prompts/system-prompt.ts +50 -185
package/src/prompts/templates/BOOTSTRAP.md +2 -2
package/src/prompts/templates/system-sections.ts +230 -8
package/src/providers/__tests__/connection-model-compat.test.ts +234 -0
package/src/providers/__tests__/retry-callsite.test.ts +85 -5
package/src/providers/anthropic/client.ts +32 -66
package/src/providers/call-site-routing.ts +14 -2
package/src/providers/connection-model-compat.ts +38 -0
package/src/providers/connection-resolution.ts +16 -2
package/src/providers/gemini/client.ts +49 -6
package/src/providers/inference/adapter-factory.ts +3 -0
package/src/providers/minimax/client.ts +106 -0
package/src/providers/model-catalog.ts +43 -0
package/src/providers/model-intents.ts +1 -1
package/src/providers/openai/chat-completions-provider.ts +6 -3
package/src/providers/openai/codex-models.ts +18 -0
package/src/providers/openai/responses-provider.ts +78 -21
package/src/providers/provider-send-message.ts +7 -1
package/src/providers/retry.ts +34 -3
package/src/providers/thinking-config.ts +26 -1
package/src/providers/usage-tracking.ts +2 -0
package/src/runtime/AGENTS.md +2 -2
package/src/runtime/agent-wake.ts +1 -0
package/src/runtime/assistant-event-hub.ts +76 -6
package/src/runtime/auth/route-policy.ts +36 -0
package/src/runtime/btw-sidechain.ts +0 -6
package/src/runtime/http-types.ts +0 -2
package/src/runtime/migrations/vbundle-builder.ts +10 -3
package/src/runtime/pending-interactions.ts +0 -1
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +106 -0
package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +25 -6
package/src/runtime/routes/__tests__/plugins-routes.test.ts +512 -0
package/src/runtime/routes/acp-routes.test.ts +255 -6
package/src/runtime/routes/acp-routes.ts +8 -1
package/src/runtime/routes/avatar-routes.ts +10 -10
package/src/runtime/routes/background-wake-routes.ts +188 -0
package/src/runtime/routes/browser-tabs-routes.ts +200 -0
package/src/runtime/routes/btw-routes.ts +0 -6
package/src/runtime/routes/conversation-cli-routes.ts +1 -1
package/src/runtime/routes/conversation-list-routes.ts +12 -4
package/src/runtime/routes/conversation-management-routes.ts +77 -20
package/src/runtime/routes/conversation-query-routes.ts +142 -36
package/src/runtime/routes/conversation-routes.ts +252 -410
package/src/runtime/routes/conversation-starter-routes.ts +6 -3
package/src/runtime/routes/disk-pressure-routes.ts +1 -1
package/src/runtime/routes/domain-routes.ts +60 -10
package/src/runtime/routes/email-routes.ts +5 -2
package/src/runtime/routes/events-routes.ts +54 -10
package/src/runtime/routes/group-routes.ts +24 -8
package/src/runtime/routes/host-browser-routes.ts +10 -2
package/src/runtime/routes/host-cu-routes.ts +2 -2
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +96 -3
package/src/runtime/routes/index.ts +8 -0
package/src/runtime/routes/inference-profile-session-handler.ts +22 -12
package/src/runtime/routes/inference-profile-session-routes.ts +7 -1
package/src/runtime/routes/llm-call-sites-routes.ts +32 -5
package/src/runtime/routes/memory-item-routes.ts +8 -3
package/src/runtime/routes/memory-v2-routes.ts +215 -5
package/src/runtime/routes/memory-v3-routes.ts +316 -0
package/src/runtime/routes/migration-routes.ts +21 -24
package/src/runtime/routes/plugins-routes.ts +337 -0
package/src/runtime/routes/rename-conversation-routes.ts +6 -2
package/src/runtime/routes/secret-routes.ts +25 -5
package/src/runtime/routes/settings-routes.ts +12 -11
package/src/runtime/routes/slack-channel-routes.ts +5 -4
package/src/runtime/routes/workspace-routes.ts +25 -10
package/src/runtime/sync/resource-sync-events.ts +106 -38
package/src/runtime/sync/sync-publisher.test.ts +49 -0
package/src/runtime/sync/sync-publisher.ts +2 -1
package/src/runtime/verification-outbound-actions.ts +73 -1
package/src/telemetry/types.ts +12 -0
package/src/telemetry/usage-telemetry-reporter.test.ts +48 -0
package/src/telemetry/usage-telemetry-reporter.ts +1 -0
package/src/tools/acp/spawn.test.ts +119 -0
package/src/tools/acp/spawn.ts +15 -2
package/src/tools/apps/definitions.ts +2 -8
package/src/tools/ask-question/ask-question-tool.test.ts +3 -3
package/src/tools/ask-question/ask-question-tool.ts +38 -45
package/src/tools/browser/__tests__/pinned-tabs.test.ts +70 -0
package/src/tools/browser/browser-execution.ts +16 -3
package/src/tools/browser/cdp-client/__tests__/browser-tabs-factory.test.ts +402 -0
package/src/tools/browser/cdp-client/__tests__/types.test.ts +3 -0
package/src/tools/browser/cdp-client/cdp-inspect-client.ts +12 -0
package/src/tools/browser/cdp-client/extension-cdp-client.ts +27 -1
package/src/tools/browser/cdp-client/factory.ts +100 -17
package/src/tools/browser/cdp-client/local-cdp-client.ts +12 -0
package/src/tools/browser/cdp-client/types.ts +65 -0
package/src/tools/browser/pinned-tabs.ts +96 -40
package/src/tools/computer-use/definitions.ts +22 -78
package/src/tools/credential-execution/make-authenticated-request.ts +3 -9
package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -9
package/src/tools/credential-execution/run-authenticated-command.ts +3 -9
package/src/tools/credentials/vault.ts +3 -9
package/src/tools/document/document-tool.ts +59 -0
package/src/tools/execution-target.ts +21 -23
package/src/tools/executor.ts +6 -1
package/src/tools/filesystem/edit.ts +3 -9
package/src/tools/filesystem/list.ts +3 -9
package/src/tools/filesystem/read.ts +3 -9
package/src/tools/filesystem/write.ts +3 -9
package/src/tools/host-filesystem/edit.ts +3 -9
package/src/tools/host-filesystem/read.ts +3 -9
package/src/tools/host-filesystem/transfer.ts +3 -9
package/src/tools/host-filesystem/write.ts +3 -9
package/src/tools/host-terminal/host-shell.ts +3 -9
package/src/tools/mcp/mcp-tool-factory.ts +1 -8
package/src/tools/memory/register.test.ts +1 -1
package/src/tools/memory/register.ts +4 -9
package/src/tools/network/web-fetch.ts +3 -9
package/src/tools/network/web-search.ts +25 -32
package/src/tools/registry.ts +7 -23
package/src/tools/schema-transforms.ts +1 -1
package/src/tools/skills/execute.ts +3 -9
package/src/tools/skills/load.ts +3 -9
package/src/tools/skills/skill-tool-factory.ts +1 -8
package/src/tools/subagent/notify-parent.ts +3 -9
package/src/tools/system/request-permission.ts +3 -9
package/src/tools/terminal/shell.ts +3 -9
package/src/tools/tool-defaults.ts +94 -0
package/src/tools/types.ts +27 -98
package/src/tools/ui-surface/definitions.ts +6 -22
package/src/usage/pricing.ts +23 -0
package/src/usage/types.ts +12 -0
package/src/util/logger.ts +16 -7
package/src/util/platform.ts +7 -2
package/src/util/sqlite3-runtime.ts +65 -0
package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +1 -0
package/src/workspace/migrations/089-move-memory-tree-out-of-v3.ts +86 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/compaction-strip-metadata-clear.test.ts +0 -206
package/src/__tests__/message-complete-display-id.test.ts +0 -175
package/src/daemon/query-complexity-router.ts +0 -75
package/src/prompts/cache-boundary.ts +0 -8

package/src/daemon/conversation-agent-loop.ts (changed)

@@ -26,7 +26,6 @@ import type {
   TurnChannelContext,
   TurnInterfaceContext,
 } from "../channels/types.js";
-import { isAssistantFeatureFlagEnabled } from "../config/assistant-feature-flags.js";
 import {
   contextWindowConfigFromEffective,
   type EffectiveContextWindow,
@@ -60,7 +59,6 @@ import { commitAppTurnChanges } from "../memory/app-git-service.js";
 import { getApp, listAppFiles, resolveAppDir } from "../memory/app-store.js";
 import { enqueueAutoAnalysisOnCompaction } from "../memory/auto-analysis-enqueue.js";
 import {
-  clearStrippedInjectionMetadataForConversation,
   getConversation,
   getConversationOriginChannel,
   getConversationOriginInterface,
@@ -68,6 +66,7 @@ import {
   getLastUserTimestampBefore,
   getMessageById,
   provenanceFromTrustContext,
+  setConversationHistoryStrippedAt,
   setLastNotifiedInferenceProfile,
   updateConversationContextWindow,
   updateConversationSlackContextWatermark,
@@ -163,13 +162,13 @@ import {
   createEventHandlerState,
   dispatchAgentEvent,
   type EventHandlerDeps,
-  getClientDisplayMessageId,
 } from "./conversation-agent-loop-handlers.js";
 import {
   approveHostAttachmentRead,
   resolveAssistantAttachments,
 } from "./conversation-attachments.js";
 import {
+  budgetYieldUnrecoveredClassification,
   buildConversationErrorMessage,
   classifyConversationError,
   isUserCancellation,
@@ -222,10 +221,6 @@ import {
   SYNC_TAGS,
 } from "./message-types/sync.js";
 import { parseActualTokensFromError } from "./parse-actual-tokens-from-error.js";
-import {
-  classifyQueryComplexity,
-  complexityTierToProfileKey,
-} from "./query-complexity-router.js";
 import type { TraceEmitter } from "./trace-emitter.js";
 import type { TrustContext } from "./trust-context.js";
 import { stripHistoricalWebSearchResults } from "./web-search-history.js";
@@ -539,6 +534,19 @@ export interface AgentLoopConversationContext {
    * is inherited by later tool executions and nested subagents.
    */
   currentTurnOverrideProfile?: string;
+  /**
+   * Set by the `switch_inference_profile` tool when the model self-selects a
+   * different profile mid-turn. Read by `readCurrentOverrideProfile` in the
+   * agent loop so the next LLM call uses the switched profile. Reset at
+   * turn start.
+   */
+  toolRoutedProfile?: string;
+  /**
+   * True when the user has explicitly selected an inference profile for this
+   * conversation (via the composer profile picker). When set, tool-based
+   * auto-routing is suppressed — the user's explicit choice takes precedence.
+   */
+  hasExplicitProfileOverride?: boolean;
   commandIntent?: { type: string; payload?: string; languageCode?: string };
   trustContext?: TrustContext;
   /** Task-run scope for the current turn. Cleared at turn end so queued/drained turns don't inherit it. */
@@ -681,6 +689,13 @@ export async function runAgentLoopImpl(
   let yieldedForHandoff = false;
   let yieldedForBudget = false;
   let pendingCheckpointYield: "budget" | "handoff" | null = null;
+  // Captured when the auto_compress_latest_turn rerun yields at the mid-loop
+  // budget checkpoint. SSE emission happens immediately at the detection site;
+  // assistant-row persistence is deferred until after the pendingToolResults
+  // flush so we don't orphan tool_use/tool_result pairs in the durable history.
+  let budgetYieldClassification: ReturnType<
+    typeof budgetYieldUnrecoveredClassification
+  > | null = null;
   let emitTerminalExit:
     | ((reason: AgentLoopExitReason) => Promise<void>)
     | null = null;
@@ -709,52 +724,23 @@ export async function runAgentLoopImpl(
     options?.overrideProfile ??
     getConversationOverrideProfileFromRow(turnStartConversation);
+  ctx.hasExplicitProfileOverride = !!userExplicitOverride;
   const config = getConfig();
-  // Query complexity routing: when no explicit user override is set and the
-  // feature flag is enabled, classify the query and route to the appropriate
-  // profile for this turn. The override is ephemeral (not persisted).
-  let turnOverrideProfile = userExplicitOverride;
-  if (
-    !userExplicitOverride &&
-    turnCallSite === "mainAgent" &&
-    isAssistantFeatureFlagEnabled("query-complexity-routing", config)
-  ) {
-    const tier = await classifyQueryComplexity(content);
-    if (tier && tier !== "balanced") {
-      const routedProfile = complexityTierToProfileKey(tier);
-      if (config.llm.profiles?.[routedProfile]) {
-        turnOverrideProfile = routedProfile;
-      }
-    }
-  }
+  // Tool-based auto-routing: the switch_inference_profile tool lets the model
+  // self-select a different profile mid-turn. Reset the per-turn slot so a
+  // stale selection from a previous turn doesn't leak forward.
+  ctx.toolRoutedProfile = undefined;
-  // Notify clients when the auto-router selected a non-default profile.
-  if (turnOverrideProfile && turnOverrideProfile !== userExplicitOverride) {
-    const profileEntry = config.llm.profiles?.[turnOverrideProfile];
-    const label = profileEntry?.label ?? turnOverrideProfile;
-    broadcastMessage({
-      type: "turn_profile_auto_routed",
-      conversationId: ctx.conversationId,
-      profile: turnOverrideProfile,
-      profileLabel: label,
-    });
-  }
+  const turnOverrideProfile = userExplicitOverride;
-  // Only use the complexity-routed profile as a fallback — not the initial
-  // explicit override. If a mid-turn session expiry clears the conversation
-  // override, the old behavior (return undefined → revert to workspace
-  // defaults) must be preserved for non-routed turns.
-  const complexityRoutedProfile =
-    turnOverrideProfile !== userExplicitOverride
-      ? turnOverrideProfile
-      : undefined;
   const readCurrentOverrideProfile = (): string | undefined =>
     options?.overrideProfile ??
     getConversationOverrideProfileFromRow(
       getConversation(ctx.conversationId),
     ) ??
-    complexityRoutedProfile;
+    ctx.toolRoutedProfile;
   const effectiveContextWindow = resolveEffectiveContextWindow({
     llm: config.llm,
@@ -776,6 +762,7 @@ export async function runAgentLoopImpl(
   contextWindowManager.updateConfig?.(currentContextWindowConfig);
   let appliedOverrideProfile = turnOverrideProfile;
+  let emittedToolRoutedProfile: string | undefined;
   const refreshCurrentProfileState = (): string | undefined => {
     const currentOverrideProfile = readCurrentOverrideProfile();
     if (currentOverrideProfile !== appliedOverrideProfile) {
@@ -797,6 +784,24 @@ export async function runAgentLoopImpl(
         "Turn inference profile changed mid-loop",
       );
     }
+    // Emit turn_profile_auto_routed when the tool-based router selects a
+    // new profile. Deduplicated so the event fires at most once per profile.
+    if (
+      ctx.toolRoutedProfile &&
+      ctx.toolRoutedProfile !== emittedToolRoutedProfile
+    ) {
+      emittedToolRoutedProfile = ctx.toolRoutedProfile;
+      const profileEntry = config.llm.profiles?.[ctx.toolRoutedProfile];
+      const label = profileEntry?.label ?? ctx.toolRoutedProfile;
+      broadcastMessage({
+        type: "turn_profile_auto_routed",
+        conversationId: ctx.conversationId,
+        profile: ctx.toolRoutedProfile,
+        profileLabel: label,
+      });
+    }
     ctx.currentTurnOverrideProfile = currentOverrideProfile;
     return currentOverrideProfile;
   };
@@ -1645,7 +1650,7 @@ export async function runAgentLoopImpl(
     // V2 static memory block (essentials/threads/recent/buffer).
     // `currentMemoryV2Static` is the trust-gated content reused by every
     // re-injection path — it stays non-null on non-full-mode turns so
-    // that mid-turn reducer compaction (which strips the prior `<memory>`
+    // that mid-turn reducer compaction (which strips the prior `<info>`
     // block) can restore the freshest content. `memoryV2Static` is the
     // first-turn / post-compaction cadence-gated value for initial
     // injection only. `readMemoryV2StaticContent` self-gates on the v2
@@ -2307,14 +2312,7 @@ export async function runAgentLoopImpl(
       // so we compact the "raw" persistent messages.
       const rawHistory = stripInjectionsForCompaction(updatedHistory);
       ctx.messages = rawHistory;
-      try {
-        clearStrippedInjectionMetadataForConversation(ctx.conversationId);
-      } catch (err) {
-        rlog.warn(
-          { err },
-          "Failed to clear stripped-injection metadata after compaction strip (non-fatal)",
-        );
-      }
+      setConversationHistoryStrippedAt(ctx.conversationId, Date.now());
       ctx.emitActivityState(
         "thinking",
@@ -2598,14 +2596,7 @@ export async function runAgentLoopImpl(
       if (updatedHistory.length > preRunHistoryLength) {
         ctx.messages = stripInjectionsForCompaction(updatedHistory);
-        try {
-          clearStrippedInjectionMetadataForConversation(ctx.conversationId);
-        } catch (err) {
-          rlog.warn(
-            { err },
-            "Failed to clear stripped-injection metadata after compaction strip (non-fatal)",
-          );
-        }
+        setConversationHistoryStrippedAt(ctx.conversationId, Date.now());
         convergenceStripped = true;
         preRepairMessages = updatedHistory;
         preRunHistoryLength = updatedHistory.length;
@@ -2850,14 +2841,7 @@ export async function runAgentLoopImpl(
           // pre-rerun messages.
           if (updatedHistory.length > preRunHistoryLength) {
             ctx.messages = stripInjectionsForCompaction(updatedHistory);
-            try {
-              clearStrippedInjectionMetadataForConversation(ctx.conversationId);
-            } catch (err) {
-              rlog.warn(
-                { err },
-                "Failed to clear stripped-injection metadata after compaction strip (non-fatal)",
-              );
-            }
+            setConversationHistoryStrippedAt(ctx.conversationId, Date.now());
             convergenceStripped = true;
             preRepairMessages = updatedHistory;
             preRunHistoryLength = updatedHistory.length;
@@ -3006,6 +2990,32 @@ export async function runAgentLoopImpl(
         await emitTerminalExit?.("context_too_large");
         pendingCheckpointYield = null;
         onEvent(buildConversationErrorMessage(ctx.conversationId, classified));
+      } else if (yieldedForBudget && !abortController.signal.aborted) {
+        // The auto_compress_latest_turn rerun (action === "auto_compress_latest_turn"
+        // above) reset `contextTooLargeDetected` to false before its final
+        // `agentLoop.run`, so the context-too-large branch above won't fire
+        // even when that rerun yields at the mid-loop budget checkpoint with
+        // no further recovery layer to re-enter. Without surfacing this here,
+        // the turn terminates silently — the inspector sees `agent_loop_exit_reason
+        // = NULL` and the user sees no message at all (just a "ghost" turn).
+        //
+        // Unlike the provider-error persistence path — which only fires when
+        // the loop produced NO assistant output — budget_yield_unrecovered
+        // typically yields AFTER one or more successful tool-use iterations,
+        // so `hasAssistantResponse` is true and that path would skip us. We
+        // capture the classification here so the live SSE event fires
+        // immediately, and persist a dedicated notice row below — after the
+        // pendingToolResults flush — so the transcript reads as: tool-use →
+        // tool results → "I couldn't fit the next step…" notice. Persisting
+        // earlier would orphan an assistant(tool_use) from its user(tool_result),
+        // breaking provider adjacency on replay.
+        budgetYieldClassification = budgetYieldUnrecoveredClassification();
+        onEvent(
+          buildConversationErrorMessage(
+            ctx.conversationId,
+            budgetYieldClassification,
+          ),
+        );
       }
     }
@@ -3081,6 +3091,52 @@ export async function runAgentLoopImpl(
       state.pendingToolResults.clear();
     }
+    // Persist the budget_yield_unrecovered notice now that any pending
+    // tool_results have flushed. The SSE event already fired upstream; this
+    // makes the row durable in the right position: tool-use → tool-results →
+    // notice. Doing it earlier (e.g. at the detection site) would land the
+    // assistant row between a tool_use and its tool_result and break provider
+    // adjacency on replay.
+    if (budgetYieldClassification && !abortController.signal.aborted) {
+      const yieldNoticeMessage = createAssistantMessage(
+        budgetYieldClassification.userMessage,
+      );
+      const yieldNoticeMetadata = {
+        ...provenanceFromTrustContext(ctx.trustContext),
+        userMessageChannel: capturedTurnChannelContext.userMessageChannel,
+        assistantMessageChannel:
+          capturedTurnChannelContext.assistantMessageChannel,
+        userMessageInterface: capturedTurnInterfaceContext.userMessageInterface,
+        assistantMessageInterface:
+          capturedTurnInterfaceContext.assistantMessageInterface,
+      };
+      try {
+        await runPipeline<PersistArgs, PersistResult>(
+          "persistence",
+          getMiddlewaresFor("persistence"),
+          defaultPersistenceTerminal,
+          {
+            op: "add",
+            conversationId: ctx.conversationId,
+            role: "assistant",
+            content: JSON.stringify(yieldNoticeMessage.content),
+            metadata: yieldNoticeMetadata,
+          },
+          buildPluginTurnContext(ctx, reqId),
+          DEFAULT_TIMEOUTS.persistence,
+        );
+      } catch (err) {
+        // Non-fatal — a DB hiccup must not escalate a budget-yield exit into
+        // a turn-level throw. The live SSE event was already emitted, so the
+        // user still sees the notice this turn even if the durable row missed.
+        rlog.warn(
+          { err },
+          "Failed to persist budget_yield_unrecovered notice (non-fatal)",
+        );
+      }
+      await emitTerminalExit?.("budget_yield_unrecovered");
+    }
     // Reconstruct history
     const newMessages = updatedHistory.slice(preRunHistoryLength).map((msg) => {
       if (msg.role !== "assistant") return msg;
@@ -3263,7 +3319,6 @@ export async function runAgentLoopImpl(
       ctx.lastAssistantAttachments = assistantAttachments;
       ctx.lastAttachmentWarnings = attachmentResult.directiveWarnings;
       syncLastAssistantMessageToDisk();
-      const clientDisplayMessageId = getClientDisplayMessageId(state);
       // Re-check: the user may have cancelled during attachment resolution
       if (abortController.signal.aborted) {
@@ -3309,9 +3364,6 @@ export async function runAgentLoopImpl(
           ...(state.lastAssistantMessageId
             ? { messageId: state.lastAssistantMessageId }
             : {}),
-          ...(clientDisplayMessageId
-            ? { displayMessageId: clientDisplayMessageId }
-            : {}),
         });
         publishLoopMessagesChanged();
       } else {
@@ -3336,9 +3388,6 @@ export async function runAgentLoopImpl(
           ...(state.lastAssistantMessageId
             ? { messageId: state.lastAssistantMessageId }
             : {}),
-          ...(clientDisplayMessageId
-            ? { displayMessageId: clientDisplayMessageId }
-            : {}),
         });
         publishLoopMessagesChanged();
@@ -3645,6 +3694,7 @@ export async function applyCompactionResult(
     result.summaryText,
     ctx.contextCompactedMessageCount,
   );
+  setConversationHistoryStrippedAt(ctx.conversationId, compactedAt);
   if (options.slackContextCompactionWatermarkTs) {
     updateConversationSlackContextWatermark(
       ctx.conversationId,

package/src/daemon/conversation-error.ts CHANGED Viewed

@@ -437,9 +437,15 @@ function classifyCore(
           errorCategory: "image_dimensions_too_large",
         };
       }
+      // Extract the provider detail after "API error (NNN): " prefix
+      const detailMatch = message.match(/API error \(\d+\):\s*(.+)/i);
+      const detail = detailMatch?.[1];
+      const suffix = detail
+        ? `: ${detail.length > 200 ? detail.slice(0, 200) + "…" : detail}`
+        : "";
       return {
         code: "PROVIDER_API",
-        userMessage: "The AI provider rejected the request.",
+        userMessage: `The AI provider rejected the request (HTTP ${error.statusCode})${suffix}`,
         retryable: true,
         errorCategory: "provider_api_error",
       };
@@ -760,6 +766,30 @@ function classifyByMessage(
   };
 }
+/**
+ * Classify a `budget_yield_unrecovered` terminal exit.
+ *
+ * Emitted when the agent loop's `auto_compress_latest_turn` rerun
+ * (the last layer of the overflow-recovery ladder) still yields at
+ * the mid-loop preflight budget checkpoint. The turn cannot proceed,
+ * but it is not a provider rejection — every compaction the loop ran
+ * has already been applied to the conversation, so the user's next
+ * message starts from the compacted history and typically succeeds.
+ *
+ * The returned `userMessage` is persisted as a `role="assistant"` row
+ * by a dedicated step in the agent loop, after pending tool results
+ * flush, so the notice is durable across reload (not just a transient banner).
+ */
+export function budgetYieldUnrecoveredClassification(): ClassifiedConversationError {
+  return {
+    code: "BUDGET_YIELD_UNRECOVERED",
+    userMessage:
+      "I tried to compact this conversation but couldn't fit the next step into the model's context window. Send another message to continue — the compaction I did run has been saved, so your next turn starts from a smaller history.",
+    retryable: true,
+    errorCategory: "budget_yield_unrecovered",
+  };
+}
 /**
  * Build a `conversation_error` server message from a classified error.
  */

package/src/daemon/conversation-lifecycle.ts CHANGED Viewed

@@ -16,7 +16,7 @@ import {
   getMessages,
   type MessageRow,
 } from "../memory/conversation-crud.js";
-import { enqueueMemoryJob } from "../memory/jobs-store.js";
+import { enqueueMemoryJob, isMemoryEnabled } from "../memory/jobs-store.js";
 import { enqueueMemoryRetrospectiveIfEnabled } from "../memory/memory-retrospective-enqueue.js";
 import { shouldExposePersonalMemory } from "../memory/v2/static-context.js";
 import type { PermissionPrompter } from "../permissions/prompter.js";
@@ -189,17 +189,18 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
     ctx.contextCompactedAt = conv?.contextCompactedAt ?? null;
   }
-  // `/clean` persists a timestamp; messages older than this should skip
-  // metadata rehydration and have any injection prefixes still embedded in
-  // their content stripped, so the cleaned state survives reload and forks.
-  const cleanedAt = conv?.cleanedAt ?? null;
+  // Every injection-strip event (`/clean` or compaction) updates
+  // `historyStrippedAt`. Messages older than this should skip metadata
+  // rehydration and have any injection prefixes still embedded in their
+  // content stripped, so the post-strip view survives reload and forks.
+  const historyStrippedAt = conv?.historyStrippedAt ?? null;
   const slicedDbMessages = dbMessages.slice(ctx.contextCompactedMessageCount);
-  let preCleanCount = 0;
-  if (cleanedAt != null) {
+  let preStrippedCount = 0;
+  if (historyStrippedAt != null) {
     const boundary = slicedDbMessages.findIndex(
-      (m) => m.createdAt >= cleanedAt,
+      (m) => m.createdAt >= historyStrippedAt,
     );
-    preCleanCount = boundary === -1 ? slicedDbMessages.length : boundary;
+    preStrippedCount = boundary === -1 ? slicedDbMessages.length : boundary;
   }
   // Mirror the injection-time gate (`shouldExposePersonalMemory` in
@@ -213,7 +214,7 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
     isTrustedActor: resolveTrustClass(ctx.trustContext) === "guardian",
   });
   const parsedMessages: Message[] = slicedDbMessages.map((m, index, arr) => {
-    const isPreClean = index < preCleanCount;
+    const isPreStripped = index < preStrippedCount;
     const role = m.role as "user" | "assistant";
     let content: ContentBlock[];
     try {
@@ -233,7 +234,7 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
     // Re-inject persisted injection blocks from metadata so it survives
     // conversation reloads (eviction, restart, fork).
-    if (role === "user" && m.metadata && !isPreClean) {
+    if (role === "user" && m.metadata && !isPreStripped) {
       try {
         const meta = JSON.parse(m.metadata);
         const isTail = index === arr.length - 1;
@@ -244,9 +245,12 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
         // (pkb-context 30, pkb-reminder 35, memory-v2-static 38,
         // now-md 40 — the v2 static block lands inside the memory
         // prefix, so now-md splices *after* it):
-        //   [<workspace>, <turn_context>, <memory __injected>,
-        //    <memory>\n…</memory>, <NOW.md>, <system_reminder>,
+        //   [<workspace>, <turn_context>, <memory>dynamic</memory>,
+        //    <info>v2static</info>, <NOW.md>, <system_reminder>,
         //    <knowledge_base>, ...original]
+        // The v2 static block is replayed verbatim from stored metadata,
+        // so rows may carry either `<info>…</info>` or `<memory>…</memory>`
+        // depending on when they were persisted.
         // Required so Anthropic's prefix cache keeps matching msg[0]
         // across daemon restart and conversation eviction. The tail
         // row only rehydrates `memoryInjectedBlock` — the next turn
@@ -273,11 +277,12 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
         }
         // The v2 static memory block (essentials/threads/recent/buffer
-        // wrapped in `<memory>…</memory>`) carries personal user memory.
-        // Trust-gated to mirror `shouldExposePersonalMemory` at injection
-        // time — untrusted-actor views must not read persisted personal
-        // memory back through metadata. Skipped on the tail row because
-        // the next turn re-injects fresh content on full-mode turns.
+        // wrapped in either `<info>…</info>` or `<memory>…</memory>`)
+        // carries personal user memory. Trust-gated to mirror
+        // `shouldExposePersonalMemory` at injection time — untrusted-actor
+        // views must not read persisted personal memory back through
+        // metadata. Skipped on the tail row because the next turn
+        // re-injects fresh content on full-mode turns.
         if (
           !isTail &&
           personalMemoryAllowed &&
@@ -336,13 +341,13 @@ export async function loadFromDb(ctx: LoadFromDbContext): Promise<void> {
   // Strip only messages older than `historyStrippedAt`; newer messages keep
   // the fresh injections they were generated with.
   const messagesBeforeRepair =
-    preCleanCount === 0
+    preStrippedCount === 0
       ? parsedMessages
       : [
           ...stripInjectionsForCompaction(
-            parsedMessages.slice(0, preCleanCount),
+            parsedMessages.slice(0, preStrippedCount),
           ),
-          ...parsedMessages.slice(preCleanCount),
+          ...parsedMessages.slice(preStrippedCount),
         ];
   const { messages: repairedMessages, stats } =
@@ -448,7 +453,7 @@ export function disposeConversation(ctx: DisposeContext): void {
       } catch {
         // Best-effort — fall through to legacy v1 enqueue
       }
-      if (!v2Enabled) {
+      if (!v2Enabled && isMemoryEnabled()) {
         try {
           enqueueMemoryJob("graph_extract", {
             conversationId: ctx.conversationId,

package/src/daemon/conversation-runtime-assembly.ts CHANGED Viewed

@@ -1734,15 +1734,16 @@ const RUNTIME_INJECTION_PREFIXES = [
   "<background_turn>",
   "<memory_context __injected>",
   "<memory_context>", // backward-compat: strip legacy blocks from pre-__injected history
-  // The static `memory-v2-static` block (opens `<memory>\n…`) IS stripped
-  // so each compaction re-injects the freshest essentials/threads/recent/
-  // buffer view, matching the `<knowledge_base>` cadence. The dynamic
-  // activation block (opens `<memory __injected>…`) is intentionally NOT
-  // stripped — `startsWith("<memory>\n")` does not match it — so per-turn
-  // memory activations persist in history. The activation pipeline dedupes
-  // via `everInjected`, and compaction handles aggregate growth, so
-  // accumulation does not cause unbounded context growth.
+  // The static `memory-v2-static` block (`<info>\n…</info>`) and the
+  // dynamic activation block (`<memory>\n…</memory>`, plus legacy
+  // `<memory __injected>…`) are both stripped so each compaction
+  // re-injects the freshest essentials/threads/recent/buffer view and
+  // re-runs the activation pipeline, matching the `<knowledge_base>`
+  // cadence. The activation pipeline dedupes via `everInjected`, and
+  // compaction handles aggregate growth, so accumulation does not cause
+  // unbounded context growth. Both wrappers may appear in persisted rows.
   "<memory>\n",
+  "<info>\n",
   "<voice_call_control>",
   "<workspace_top_level>", // backward-compat: strip legacy workspace blocks
   // NOTE: <workspace> is intentionally NOT stripped — workspace context
@@ -2037,7 +2038,7 @@ export interface RuntimeInjectionOptions {
   /**
    * Pre-rendered v2 static memory content (essentials/threads/recent/buffer
    * concatenated, header-wrapped). When non-null on full-mode turns the
-   * `memory-v2-static` injector wraps it in `<memory>` and splices it onto
+   * `memory-v2-static` injector wraps it in `<info>` and splices it onto
    * the user message; subsequent turns leave the prior block cached on its
    * original user message.
    */

package/src/daemon/conversation-tool-setup.ts CHANGED Viewed

@@ -74,6 +74,11 @@ export function resolveTrustClass(
   return trustContext?.trustClass ?? "unknown";
 }
+import { isAssistantFeatureFlagEnabled } from "../config/assistant-feature-flags.js";
+import {
+  buildSwitchInferenceProfileToolDef,
+  SWITCH_INFERENCE_PROFILE_TOOL_NAME,
+} from "./switch-inference-profile-tool.js";
 import type { ToolSetupContext } from "./tool-setup-types.js";
 export type { ToolSetupContext } from "./tool-setup-types.js";
@@ -86,8 +91,8 @@ export type { ToolSetupContext } from "./tool-setup-types.js";
 export function buildToolDefinitions(): ToolDefinition[] {
   return [
     ...getAllToolDefinitions(),
-    ...allUiSurfaceTools.map((t) => t.getDefinition()),
-    ...coreAppProxyTools.map((t) => t.getDefinition()),
+    ...allUiSurfaceTools,
+    ...coreAppProxyTools,
   ];
 }
@@ -209,6 +214,33 @@ export function createToolExecutor(
       },
     };
+    // Intercept switch_inference_profile: daemon-internal tool that lets the
+    // model self-select a different inference profile mid-turn. No permission
+    // checks — this is a control-flow signal, not a user-visible tool.
+    if (executionName === SWITCH_INFERENCE_PROFILE_TOOL_NAME) {
+      const profile = typeof input.profile === "string" ? input.profile : "";
+      const config = getConfig();
+      const profileEntry = config.llm.profiles?.[profile];
+      if (!profileEntry) {
+        return {
+          content: `Profile "${profile}" not found. Available profiles: ${Object.keys(config.llm.profiles ?? {}).join(", ")}`,
+          isError: true,
+        };
+      }
+      if (profileEntry.status === "disabled") {
+        return {
+          content: `Profile "${profile}" is disabled.`,
+          isError: true,
+        };
+      }
+      ctx.toolRoutedProfile = profile;
+      const label = profileEntry.label ?? profile;
+      return {
+        content: `Switched to ${label} profile. Continue with your response.`,
+        isError: false,
+      };
+    }
     // Intercept skill_execute: extract the real tool name and input, then
     // route through the full executor pipeline so the underlying tool's
     // risk level, permission checks, hooks, and lifecycle events all fire
@@ -326,6 +358,14 @@ export interface SkillProjectionContext {
    * host tools into the LLM tool definitions.
    */
   readonly transportInterface?: InterfaceId;
+  /** Per-turn override profile, read by the switch_inference_profile tool injection. */
+  currentTurnOverrideProfile?: string;
+  /**
+   * True when the user has explicitly selected an inference profile for this
+   * conversation (via the composer profile picker). When set, tool-based
+   * auto-routing is suppressed — the user's explicit choice takes precedence.
+   */
+  hasExplicitProfileOverride?: boolean;
 }
 // ── Conditional tool sets ────────────────────────────────────────────
@@ -613,6 +653,26 @@ export function createResolveToolsCallback(
     }
     ctx.allowedToolNames = turnAllowed;
-    return injectActivityField(allBaseDefs, ACTIVITY_SKIP_SET);
+    const baseDefs = injectActivityField(allBaseDefs, ACTIVITY_SKIP_SET);
+    const config = getConfig();
+    if (
+      isAssistantFeatureFlagEnabled("query-complexity-routing", config) &&
+      config.llm &&
+      !ctx.hasExplicitProfileOverride
+    ) {
+      const currentProfile =
+        ctx.currentTurnOverrideProfile ?? config.llm.activeProfile;
+      const toolDef = buildSwitchInferenceProfileToolDef(
+        config.llm.profiles ?? {},
+        currentProfile,
+      );
+      if (toolDef) {
+        turnAllowed.add(SWITCH_INFERENCE_PROFILE_TOOL_NAME);
+        return [...baseDefs, toolDef];
+      }
+    }
+    return baseDefs;
   };
 }

package/src/daemon/conversation-usage.ts CHANGED Viewed

@@ -3,6 +3,7 @@ import { updateConversationUsage } from "../memory/conversation-crud.js";
 import { recordUsageEvent } from "../memory/llm-usage-store.js";
 import type { UsageActor } from "../usage/actors.js";
 import { resolveUsageAttribution } from "../usage/attribution.js";
+import { extractRawUsage } from "../usage/pricing.js";
 import type {
   AnthropicCacheCreationTokenDetails,
   PricingResult,
@@ -235,6 +236,7 @@ export function recordUsage(
         outputTokens,
         cacheCreationInputTokens: normalizedCacheCreationInputTokens,
         cacheReadInputTokens: normalizedCacheReadInputTokens,
+        rawUsage: extractRawUsage(rawResponse),
         conversationId: ctx.conversationId,
         runId: null,
         requestId,