npm - @vellumai/assistant - Versions diffs - 0.8.4 → 0.8.5 - Mend

@vellumai/assistant 0.8.4 → 0.8.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (438) hide show

package/ARCHITECTURE.md +2 -2
package/docs/browser-use-architecture-phase2.md +1 -1
package/knip.json +2 -1
package/openapi.yaml +809 -11
package/package.json +1 -1
package/src/__tests__/anthropic-provider.test.ts +34 -37
package/src/__tests__/assistant-event-hub-self-exclusion.test.ts +293 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -3
package/src/__tests__/audit-log-rotation.test.ts +70 -16
package/src/__tests__/background-workers-disk-pressure.test.ts +3 -3
package/src/__tests__/btw-routes.test.ts +2 -3
package/src/__tests__/call-controller.test.ts +0 -1
package/src/__tests__/cancel-resolves-conversation-key.test.ts +1 -1
package/src/__tests__/channel-guardian.test.ts +3 -3
package/src/__tests__/checker.test.ts +6 -15
package/src/__tests__/compaction-events.test.ts +1 -0
package/src/__tests__/compactor-call-site-logging.test.ts +214 -0
package/src/__tests__/computer-use-skill-manifest-regression.test.ts +5 -11
package/src/__tests__/computer-use-tools.test.ts +2 -4
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +197 -2
package/src/__tests__/conversation-agent-loop.test.ts +163 -122
package/src/__tests__/conversation-app-control-instantiation.test.ts +2 -5
package/src/__tests__/conversation-clear-safety.test.ts +25 -25
package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +1 -1
package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
package/src/__tests__/conversation-error.test.ts +31 -0
package/src/__tests__/conversation-fork-crud.test.ts +178 -15
package/src/__tests__/conversation-lifecycle.test.ts +52 -11
package/src/__tests__/{conversation-load-cleaned-at.test.ts → conversation-load-history-stripped.test.ts} +13 -13
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
package/src/__tests__/conversation-routes-disk-view.test.ts +109 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +35 -0
package/src/__tests__/conversation-skill-tools.test.ts +2 -5
package/src/__tests__/conversation-store.test.ts +1 -1
package/src/__tests__/conversation-sync-tags.test.ts +99 -32
package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -0
package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/credential-execution-feature-gates.test.ts +9 -7
package/src/__tests__/credential-execution-tools.test.ts +6 -6
package/src/__tests__/credential-security-invariants.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +2 -2
package/src/__tests__/dynamic-page-surface.test.ts +2 -2
package/src/__tests__/email-html-renderer.test.ts +12 -0
package/src/__tests__/gateway-flag-listener.test.ts +237 -0
package/src/__tests__/gemini-provider.test.ts +78 -0
package/src/__tests__/guardian-dispatch.test.ts +0 -1
package/src/__tests__/guardian-outbound-http.test.ts +7 -5
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +1 -1
package/src/__tests__/heartbeat-disk-pressure.test.ts +4 -0
package/src/__tests__/heartbeat-service.test.ts +4 -0
package/src/__tests__/host-shell-tool.test.ts +1 -1
package/src/__tests__/init-feature-flag-overrides.test.ts +5 -6
package/src/__tests__/list-messages-tool-merge.test.ts +70 -11
package/src/__tests__/llm-request-log-call-site.test.ts +136 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +26 -0
package/src/__tests__/llm-resolver.test.ts +77 -9
package/src/__tests__/llm-usage-store.test.ts +66 -0
package/src/__tests__/logger.test.ts +89 -0
package/src/__tests__/mcp-abort-signal.test.ts +2 -2
package/src/__tests__/media-generate-image.test.ts +31 -0
package/src/__tests__/memory-v2-static-injector.test.ts +7 -7
package/src/__tests__/model-intents.test.ts +2 -4
package/src/__tests__/notification-guardian-path.test.ts +0 -1
package/src/__tests__/onboarding-template-contract.test.ts +1 -1
package/src/__tests__/openai-provider.test.ts +46 -0
package/src/__tests__/openai-responses-provider.test.ts +114 -12
package/src/__tests__/pending-interactions-resolved-event.test.ts +0 -1
package/src/__tests__/platform-bash-auto-approve.test.ts +2 -2
package/src/__tests__/platform.test.ts +2 -2
package/src/__tests__/plugin-api-tool-definition.test.ts +92 -0
package/src/__tests__/plugin-bootstrap.test.ts +2 -2
package/src/__tests__/plugin-tool-contribution.test.ts +13 -6
package/src/__tests__/plugin-types.test.ts +3 -2
package/src/__tests__/prechat-onboarding-contract.test.ts +131 -98
package/src/__tests__/pricing.test.ts +12 -0
package/src/__tests__/prune-jobs-changes-parser.test.ts +61 -0
package/src/__tests__/registry.test.ts +2 -8
package/src/__tests__/require-fresh-approval.test.ts +2 -2
package/src/__tests__/runtime-events-sse-bilingual.test.ts +154 -0
package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -1
package/src/__tests__/skill-feature-flags.test.ts +2 -2
package/src/__tests__/skill-projection-feature-flag.test.ts +4 -7
package/src/__tests__/skill-projection.benchmark.test.ts +2 -6
package/src/__tests__/skill-tool-factory.test.ts +1 -1
package/src/__tests__/subagent-notify-parent.test.ts +1 -1
package/src/__tests__/suggestion-routes.test.ts +1 -0
package/src/__tests__/sync-message-contract.test.ts +59 -0
package/src/__tests__/system-prompt.test.ts +145 -131
package/src/__tests__/terminal-tools.test.ts +1 -1
package/src/__tests__/tool-approval-handler.test.ts +1 -5
package/src/__tests__/tool-execute-pipeline.test.ts +2 -2
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -5
package/src/__tests__/tool-executor-lifecycle-events.test.ts +15 -5
package/src/__tests__/tool-executor.test.ts +9 -62
package/src/__tests__/tool-grant-request-escalation.test.ts +1 -6
package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -6
package/src/__tests__/trusted-contact-multichannel.test.ts +0 -1
package/src/__tests__/ui-file-upload-surface.test.ts +2 -2
package/src/__tests__/usage-routes.test.ts +3 -0
package/src/__tests__/verification-control-plane-policy.test.ts +2 -2
package/src/__tests__/workspace-git-service.test.ts +6 -5
package/src/__tests__/workspace-migration-089-move-memory-tree-out-of-v3.test.ts +86 -0
package/src/acp/__tests__/prepare-agent-env.test.ts +146 -0
package/src/acp/prepare-agent-env.ts +78 -0
package/src/acp/session-manager.ts +1 -1
package/src/agent/loop.ts +8 -0
package/src/api/README.md +5 -0
package/src/api/index.ts +4 -0
package/src/api/package.json +10 -0
package/src/background-wake/background-wake-routes.test.ts +233 -0
package/src/background-wake/runtime-registry.ts +24 -0
package/src/cli/commands/__tests__/browser.test.ts +23 -5
package/src/cli/commands/__tests__/domain-register.test.ts +110 -0
package/src/cli/commands/__tests__/domain-status.test.ts +33 -33
package/src/cli/commands/__tests__/inference-send.test.ts +108 -5
package/src/cli/commands/__tests__/memory-v2-compare-render.test.ts +98 -0
package/src/cli/commands/__tests__/memory-v2.test.ts +1 -0
package/src/cli/commands/__tests__/memory-v3-render.test.ts +340 -0
package/src/cli/commands/browser.ts +247 -0
package/src/cli/commands/domain.ts +91 -41
package/src/cli/commands/inference.ts +93 -40
package/src/cli/commands/memory-v2-compare-render.ts +115 -0
package/src/cli/commands/memory-v2.ts +176 -1
package/src/cli/commands/memory-v3-render.ts +344 -0
package/src/cli/commands/memory-v3.ts +316 -0
package/src/cli/program.ts +2 -0
package/src/config/assistant-feature-flags.ts +21 -9
package/src/config/bundled-skills/document-editor/SKILL.md +11 -2
package/src/config/bundled-skills/document-editor/TOOLS.json +18 -0
package/src/config/bundled-skills/document-editor/tools/document-open.ts +12 -0
package/src/config/bundled-skills/image-studio/SKILL.md +4 -0
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -2
package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +13 -8
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +10 -3
package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +16 -14
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +7 -2
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +7 -2
package/src/config/bundled-tool-registry.ts +2 -0
package/src/config/call-site-defaults.ts +7 -6
package/src/config/feature-flag-registry.json +16 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +213 -1
package/src/config/schemas/call-site-catalog.ts +21 -7
package/src/config/schemas/llm.ts +12 -1
package/src/config/schemas/memory-v2.ts +246 -0
package/src/config/schemas/memory.ts +2 -1
package/src/context/compactor.ts +52 -0
package/src/conversations/__tests__/message-consolidation.test.ts +350 -0
package/src/conversations/message-consolidation.ts +404 -0
package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +1 -1
package/src/daemon/__tests__/meet-manifest-loader.test.ts +1 -1
package/src/daemon/conversation-agent-loop-handlers.ts +2 -13
package/src/daemon/conversation-agent-loop.ts +126 -76
package/src/daemon/conversation-error.ts +31 -1
package/src/daemon/conversation-lifecycle.ts +27 -22
package/src/daemon/conversation-runtime-assembly.ts +10 -9
package/src/daemon/conversation-tool-setup.ts +63 -3
package/src/daemon/conversation-usage.ts +2 -0
package/src/daemon/conversation.ts +14 -29
package/src/daemon/disk-pressure-guard.ts +14 -2
package/src/daemon/handlers/config-model.test.ts +1 -0
package/src/daemon/handlers/conversations.ts +11 -3
package/src/daemon/host-browser-proxy.ts +5 -5
package/src/daemon/host-cu-proxy.ts +4 -4
package/src/daemon/host-file-proxy.ts +4 -4
package/src/daemon/host-proxy-base.ts +4 -4
package/src/daemon/host-transfer-proxy.ts +10 -10
package/src/daemon/lifecycle.ts +23 -20
package/src/daemon/meet-manifest-loader.ts +1 -7
package/src/daemon/message-types/conversations.ts +6 -9
package/src/daemon/message-types/home.ts +1 -13
package/src/daemon/message-types/messages.ts +6 -14
package/src/daemon/message-types/sync.ts +14 -0
package/src/daemon/shutdown-handlers.ts +24 -5
package/src/daemon/switch-inference-profile-tool.ts +52 -0
package/src/daemon/tool-setup-types.ts +13 -0
package/src/events/relationship-state-updated.ts +25 -0
package/src/heartbeat/__tests__/heartbeat-service.test.ts +1 -1
package/src/home/home-greeting.ts +0 -9
package/src/home/suggested-prompts.ts +0 -9
package/src/ipc/gateway-flag-listener.ts +123 -0
package/src/ipc/skill-routes/registries.ts +8 -12
package/src/memory/__tests__/db-async-query.test.ts +165 -0
package/src/memory/__tests__/db-maintenance.test.ts +115 -0
package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +241 -0
package/src/memory/__tests__/jobs-store-job-classes.test.ts +28 -1
package/src/memory/__tests__/memory-retrospective-job.test.ts +7 -0
package/src/memory/auto-analysis-enqueue.ts +5 -1
package/src/memory/conversation-crud.ts +71 -70
package/src/memory/conversation-starters-cadence.ts +3 -1
package/src/memory/conversation-title-service.ts +19 -3
package/src/memory/db-async-query.ts +214 -0
package/src/memory/db-init.ts +10 -0
package/src/memory/db-maintenance.ts +30 -21
package/src/memory/graph/bootstrap.ts +8 -1
package/src/memory/graph/capability-seed.ts +7 -3
package/src/memory/graph/conversation-graph-memory.ts +100 -17
package/src/memory/graph/extraction.ts +1 -5
package/src/memory/graph/graph-search.ts +7 -1
package/src/memory/indexer.ts +28 -18
package/src/memory/job-handlers/cleanup.ts +76 -18
package/src/memory/job-handlers/conversation-starters.ts +1 -4
package/src/memory/jobs/embed-pkb-file.ts +6 -1
package/src/memory/jobs-store.ts +14 -0
package/src/memory/jobs-worker.ts +55 -22
package/src/memory/llm-request-log-source-clickhouse.ts +42 -2
package/src/memory/llm-request-log-source-local.ts +7 -0
package/src/memory/llm-request-log-source.ts +9 -2
package/src/memory/llm-request-log-store.ts +43 -1
package/src/memory/llm-usage-store.ts +24 -0
package/src/memory/memory-retrospective-enqueue.ts +8 -1
package/src/memory/memory-retrospective-job.ts +5 -0
package/src/memory/memory-v2-activation-log-store.ts +15 -6
package/src/memory/migrations/260-rename-cleaned-at.ts +44 -0
package/src/memory/migrations/261-llm-usage-add-raw-usage.ts +36 -0
package/src/memory/migrations/262-memory-v3-coactivation.ts +57 -0
package/src/memory/migrations/263-memory-v3-auto-edges.ts +50 -0
package/src/memory/migrations/264-llm-request-log-call-site.ts +29 -0
package/src/memory/migrations/index.ts +17 -0
package/src/memory/migrations/registry.ts +33 -0
package/src/memory/schema/conversations.ts +1 -1
package/src/memory/schema/infrastructure.ts +21 -0
package/src/memory/tool-usage-store.ts +36 -8
package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -0
package/src/memory/v2/__tests__/harness-compare.test.ts +186 -0
package/src/memory/v2/__tests__/harness-metrics.test.ts +74 -0
package/src/memory/v2/__tests__/harness-oracle.test.ts +257 -0
package/src/memory/v2/__tests__/harness-replay-input.test.ts +225 -0
package/src/memory/v2/__tests__/harness-runner.test.ts +109 -0
package/src/memory/v2/__tests__/injection.test.ts +127 -98
package/src/memory/v2/__tests__/qdrant.test.ts +36 -0
package/src/memory/v2/__tests__/router.test.ts +171 -3
package/src/memory/v2/harness/compare.ts +57 -0
package/src/memory/v2/harness/metrics.ts +124 -0
package/src/memory/v2/harness/oracle.ts +145 -0
package/src/memory/v2/harness/replay-input.ts +224 -0
package/src/memory/v2/harness/retriever.ts +74 -0
package/src/memory/v2/harness/router-retriever.ts +43 -0
package/src/memory/v2/harness/runner.ts +106 -0
package/src/memory/v2/harness/trace.ts +58 -0
package/src/memory/v2/injection.ts +21 -15
package/src/memory/v2/prompts/router.ts +26 -1
package/src/memory/v2/qdrant.ts +14 -2
package/src/memory/v2/router.ts +171 -18
package/src/memory/v3/__tests__/coactivation-store.test.ts +422 -0
package/src/memory/v3/__tests__/consolidation-job.test.ts +468 -0
package/src/memory/v3/__tests__/edge-learning-job.test.ts +324 -0
package/src/memory/v3/__tests__/edges.test.ts +563 -0
package/src/memory/v3/__tests__/filter.test.ts +512 -0
package/src/memory/v3/__tests__/gate.test.ts +574 -0
package/src/memory/v3/__tests__/index-composition.test.ts +233 -0
package/src/memory/v3/__tests__/loop.test.ts +530 -0
package/src/memory/v3/__tests__/retriever.test.ts +226 -0
package/src/memory/v3/__tests__/scouts.test.ts +440 -0
package/src/memory/v3/__tests__/shadow-middleware.test.ts +312 -0
package/src/memory/v3/__tests__/system-prompts.test.ts +154 -0
package/src/memory/v3/__tests__/traversal.test.ts +469 -0
package/src/memory/v3/__tests__/tree-index.test.ts +280 -0
package/src/memory/v3/__tests__/tree-store.test.ts +529 -0
package/src/memory/v3/__tests__/tree-walk.test.ts +707 -0
package/src/memory/v3/__tests__/validate.test.ts +245 -0
package/src/memory/v3/auto-edges.ts +223 -0
package/src/memory/v3/coactivation-store.ts +124 -0
package/src/memory/v3/consolidation-job.ts +323 -0
package/src/memory/v3/edge-learning-job.ts +160 -0
package/src/memory/v3/edges.ts +249 -0
package/src/memory/v3/filter.ts +281 -0
package/src/memory/v3/gate.ts +334 -0
package/src/memory/v3/index-composition.ts +113 -0
package/src/memory/v3/llm-capture.ts +46 -0
package/src/memory/v3/loop.ts +382 -0
package/src/memory/v3/maintenance.ts +144 -0
package/src/memory/v3/prompt-context.ts +33 -0
package/src/memory/v3/prompts/consolidation.ts +458 -0
package/src/memory/v3/prompts/system-prompts.ts +196 -0
package/src/memory/v3/retriever.ts +33 -0
package/src/memory/v3/scouts.ts +420 -0
package/src/memory/v3/shadow-middleware.ts +305 -0
package/src/memory/v3/traversal.ts +206 -0
package/src/memory/v3/tree-index.ts +237 -0
package/src/memory/v3/tree-store.ts +394 -0
package/src/memory/v3/tree-walk.ts +351 -0
package/src/memory/v3/types.ts +65 -0
package/src/memory/v3/validate.ts +300 -0
package/src/notifications/adapters/macos.ts +18 -1
package/src/notifications/adapters/platform.ts +1 -1
package/src/notifications/decision-engine.ts +1 -4
package/src/notifications/emit-signal.ts +29 -49
package/src/permissions/prompter.ts +3 -3
package/src/permissions/question-prompter.ts +5 -2
package/src/permissions/secret-prompter.ts +2 -2
package/src/plugin-api/index.ts +4 -0
package/src/plugin-api/types.ts +7 -33
package/src/plugins/defaults/index.ts +6 -0
package/src/plugins/defaults/injectors.ts +18 -11
package/src/plugins/external-plugin-loader.ts +5 -68
package/src/plugins/types.ts +11 -16
package/src/proactive-artifact/aux-message-injector.ts +17 -4
package/src/prompts/__tests__/task-progress-hint-section.test.ts +3 -9
package/src/prompts/persona-resolver.ts +36 -21
package/src/prompts/sections.ts +39 -7
package/src/prompts/system-prompt.ts +50 -185
package/src/prompts/templates/BOOTSTRAP.md +2 -2
package/src/prompts/templates/system-sections.ts +230 -8
package/src/providers/__tests__/connection-model-compat.test.ts +234 -0
package/src/providers/__tests__/retry-callsite.test.ts +85 -5
package/src/providers/anthropic/client.ts +32 -66
package/src/providers/call-site-routing.ts +14 -2
package/src/providers/connection-model-compat.ts +38 -0
package/src/providers/connection-resolution.ts +16 -2
package/src/providers/gemini/client.ts +49 -6
package/src/providers/inference/adapter-factory.ts +3 -0
package/src/providers/minimax/client.ts +106 -0
package/src/providers/model-catalog.ts +43 -0
package/src/providers/model-intents.ts +1 -1
package/src/providers/openai/chat-completions-provider.ts +6 -3
package/src/providers/openai/codex-models.ts +18 -0
package/src/providers/openai/responses-provider.ts +78 -21
package/src/providers/provider-send-message.ts +7 -1
package/src/providers/retry.ts +34 -3
package/src/providers/thinking-config.ts +26 -1
package/src/providers/usage-tracking.ts +2 -0
package/src/runtime/AGENTS.md +2 -2
package/src/runtime/agent-wake.ts +1 -0
package/src/runtime/assistant-event-hub.ts +76 -6
package/src/runtime/auth/route-policy.ts +36 -0
package/src/runtime/btw-sidechain.ts +0 -6
package/src/runtime/http-types.ts +0 -2
package/src/runtime/migrations/vbundle-builder.ts +10 -3
package/src/runtime/pending-interactions.ts +0 -1
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +106 -0
package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +25 -6
package/src/runtime/routes/__tests__/plugins-routes.test.ts +512 -0
package/src/runtime/routes/acp-routes.test.ts +255 -6
package/src/runtime/routes/acp-routes.ts +8 -1
package/src/runtime/routes/avatar-routes.ts +10 -10
package/src/runtime/routes/background-wake-routes.ts +188 -0
package/src/runtime/routes/browser-tabs-routes.ts +200 -0
package/src/runtime/routes/btw-routes.ts +0 -6
package/src/runtime/routes/conversation-cli-routes.ts +1 -1
package/src/runtime/routes/conversation-list-routes.ts +12 -4
package/src/runtime/routes/conversation-management-routes.ts +77 -20
package/src/runtime/routes/conversation-query-routes.ts +142 -36
package/src/runtime/routes/conversation-routes.ts +252 -410
package/src/runtime/routes/conversation-starter-routes.ts +6 -3
package/src/runtime/routes/disk-pressure-routes.ts +1 -1
package/src/runtime/routes/domain-routes.ts +60 -10
package/src/runtime/routes/email-routes.ts +5 -2
package/src/runtime/routes/events-routes.ts +54 -10
package/src/runtime/routes/group-routes.ts +24 -8
package/src/runtime/routes/host-browser-routes.ts +10 -2
package/src/runtime/routes/host-cu-routes.ts +2 -2
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +96 -3
package/src/runtime/routes/index.ts +8 -0
package/src/runtime/routes/inference-profile-session-handler.ts +22 -12
package/src/runtime/routes/inference-profile-session-routes.ts +7 -1
package/src/runtime/routes/llm-call-sites-routes.ts +32 -5
package/src/runtime/routes/memory-item-routes.ts +8 -3
package/src/runtime/routes/memory-v2-routes.ts +215 -5
package/src/runtime/routes/memory-v3-routes.ts +316 -0
package/src/runtime/routes/migration-routes.ts +21 -24
package/src/runtime/routes/plugins-routes.ts +337 -0
package/src/runtime/routes/rename-conversation-routes.ts +6 -2
package/src/runtime/routes/secret-routes.ts +25 -5
package/src/runtime/routes/settings-routes.ts +12 -11
package/src/runtime/routes/slack-channel-routes.ts +5 -4
package/src/runtime/routes/workspace-routes.ts +25 -10
package/src/runtime/sync/resource-sync-events.ts +106 -38
package/src/runtime/sync/sync-publisher.test.ts +49 -0
package/src/runtime/sync/sync-publisher.ts +2 -1
package/src/runtime/verification-outbound-actions.ts +73 -1
package/src/telemetry/types.ts +12 -0
package/src/telemetry/usage-telemetry-reporter.test.ts +48 -0
package/src/telemetry/usage-telemetry-reporter.ts +1 -0
package/src/tools/acp/spawn.test.ts +119 -0
package/src/tools/acp/spawn.ts +15 -2
package/src/tools/apps/definitions.ts +2 -8
package/src/tools/ask-question/ask-question-tool.test.ts +3 -3
package/src/tools/ask-question/ask-question-tool.ts +38 -45
package/src/tools/browser/__tests__/pinned-tabs.test.ts +70 -0
package/src/tools/browser/browser-execution.ts +16 -3
package/src/tools/browser/cdp-client/__tests__/browser-tabs-factory.test.ts +402 -0
package/src/tools/browser/cdp-client/__tests__/types.test.ts +3 -0
package/src/tools/browser/cdp-client/cdp-inspect-client.ts +12 -0
package/src/tools/browser/cdp-client/extension-cdp-client.ts +27 -1
package/src/tools/browser/cdp-client/factory.ts +100 -17
package/src/tools/browser/cdp-client/local-cdp-client.ts +12 -0
package/src/tools/browser/cdp-client/types.ts +65 -0
package/src/tools/browser/pinned-tabs.ts +96 -40
package/src/tools/computer-use/definitions.ts +22 -78
package/src/tools/credential-execution/make-authenticated-request.ts +3 -9
package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -9
package/src/tools/credential-execution/run-authenticated-command.ts +3 -9
package/src/tools/credentials/vault.ts +3 -9
package/src/tools/document/document-tool.ts +59 -0
package/src/tools/execution-target.ts +21 -23
package/src/tools/executor.ts +6 -1
package/src/tools/filesystem/edit.ts +3 -9
package/src/tools/filesystem/list.ts +3 -9
package/src/tools/filesystem/read.ts +3 -9
package/src/tools/filesystem/write.ts +3 -9
package/src/tools/host-filesystem/edit.ts +3 -9
package/src/tools/host-filesystem/read.ts +3 -9
package/src/tools/host-filesystem/transfer.ts +3 -9
package/src/tools/host-filesystem/write.ts +3 -9
package/src/tools/host-terminal/host-shell.ts +3 -9
package/src/tools/mcp/mcp-tool-factory.ts +1 -8
package/src/tools/memory/register.test.ts +1 -1
package/src/tools/memory/register.ts +4 -9
package/src/tools/network/web-fetch.ts +3 -9
package/src/tools/network/web-search.ts +25 -32
package/src/tools/registry.ts +7 -23
package/src/tools/schema-transforms.ts +1 -1
package/src/tools/skills/execute.ts +3 -9
package/src/tools/skills/load.ts +3 -9
package/src/tools/skills/skill-tool-factory.ts +1 -8
package/src/tools/subagent/notify-parent.ts +3 -9
package/src/tools/system/request-permission.ts +3 -9
package/src/tools/terminal/shell.ts +3 -9
package/src/tools/tool-defaults.ts +94 -0
package/src/tools/types.ts +27 -98
package/src/tools/ui-surface/definitions.ts +6 -22
package/src/usage/pricing.ts +23 -0
package/src/usage/types.ts +12 -0
package/src/util/logger.ts +16 -7
package/src/util/platform.ts +7 -2
package/src/util/sqlite3-runtime.ts +65 -0
package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +1 -0
package/src/workspace/migrations/089-move-memory-tree-out-of-v3.ts +86 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/compaction-strip-metadata-clear.test.ts +0 -206
package/src/__tests__/message-complete-display-id.test.ts +0 -175
package/src/daemon/query-complexity-router.ts +0 -75
package/src/prompts/cache-boundary.ts +0 -8

package/src/providers/gemini/client.ts CHANGED Viewed

@@ -1,7 +1,6 @@
 import type * as genai from "@google/genai";
-import { ApiError, GoogleGenAI } from "@google/genai";
+import { ApiError, GoogleGenAI, ThinkingLevel } from "@google/genai";
-import { SYSTEM_PROMPT_CACHE_BOUNDARY } from "../../prompts/cache-boundary.js";
 import { isAbortReason } from "../../util/abort-reasons.js";
 import { ProviderError } from "../../util/errors.js";
 import { getLogger } from "../../util/logger.js";
@@ -34,6 +33,47 @@ function isGemini3Model(model: string): boolean {
   return model.startsWith("gemini-3") || model.startsWith("models/gemini-3");
 }
+/**
+ * Lookup table from the lowercase level names accepted in the wire-shape
+ * `thinking.level` field to the `ThinkingLevel` enum members exported by
+ * `@google/genai`. Names not listed here have no Gemini equivalent.
+ */
+const THINKING_LEVEL_BY_NAME: Record<string, ThinkingLevel> = {
+  minimal: ThinkingLevel.MINIMAL,
+  low: ThinkingLevel.LOW,
+  medium: ThinkingLevel.MEDIUM,
+  high: ThinkingLevel.HIGH,
+};
+/**
+ * Translate the resolved wire-shape `thinking` config into Gemini's
+ * `thinkingConfig`.
+ *
+ * - No config, or a `type` other than `"disabled"` / `"adaptive"`: returns
+ *   `undefined`, which lets Google's per-model default apply (e.g.
+ *   `gemini-3.5-flash` defaults to dynamic medium-level thinking).
+ * - `type: "disabled"`: maps to `thinkingLevel: MINIMAL` with
+ *   `includeThoughts: false`, because Gemini 3.x cannot fully disable
+ *   thinking — `"minimal"` is the floor.
+ * - `type: "adaptive"`: copies over a recognised `level` and a boolean
+ *   `streamThinking`. `includeThoughts` is gated on `streamThinking` so
+ *   callers that opted out of streaming thoughts don't pay for thought
+ *   tokens in the response. Returns `undefined` when neither field yields a
+ *   usable value.
+ *
+ * @param thinking Wire-shape thinking config, or `undefined` when absent.
+ * @returns The Gemini thinking config, or `undefined` to use model defaults.
+ */
+function buildThinkingConfig(
+  thinking: Record<string, unknown> | undefined,
+): genai.ThinkingConfig | undefined {
+  if (!thinking) return undefined;
+  if (thinking.type === "disabled") {
+    return {
+      thinkingLevel: ThinkingLevel.MINIMAL,
+      includeThoughts: false,
+    };
+  }
+  if (thinking.type !== "adaptive") return undefined;
+  const result: genai.ThinkingConfig = {};
+  const { level, streamThinking } = thinking;
+  // Own-property check: a bare `TABLE[level]` lookup would also resolve
+  // inherited keys such as "constructor" or "toString" to truthy
+  // Object.prototype members and leak them into the request config.
+  if (
+    typeof level === "string" &&
+    Object.prototype.hasOwnProperty.call(THINKING_LEVEL_BY_NAME, level)
+  ) {
+    result.thinkingLevel = THINKING_LEVEL_BY_NAME[level];
+  }
+  if (typeof streamThinking === "boolean") {
+    result.includeThoughts = streamThinking;
+  }
+  return Object.keys(result).length > 0 ? result : undefined;
+}
 function stripGeminiHttpOptions(
   config: genai.GenerateContentConfig,
 ): genai.GenerateContentConfig {
@@ -175,6 +215,9 @@ export class GeminiProvider implements Provider {
     const usageAttributionHeaders = configObj?.usageAttributionHeaders as
       | Record<string, string>
       | undefined;
+    const thinkingConfig = buildThinkingConfig(
+      configObj?.thinking as Record<string, unknown> | undefined,
+    );
     const activeModel = modelOverride ?? this.model;
     try {
@@ -183,14 +226,14 @@ export class GeminiProvider implements Provider {
       const geminiConfig: genai.GenerateContentConfig = {};
       if (systemPrompt) {
-        geminiConfig.systemInstruction = systemPrompt.replaceAll(
-          SYSTEM_PROMPT_CACHE_BOUNDARY,
-          "\n",
-        );
+        geminiConfig.systemInstruction = systemPrompt;
       }
       if (maxTokens) {
         geminiConfig.maxOutputTokens = maxTokens;
       }
+      if (thinkingConfig) {
+        geminiConfig.thinkingConfig = thinkingConfig;
+      }
       if (tools && tools.length > 0) {
         geminiConfig.tools = [
           {

package/src/providers/inference/adapter-factory.ts CHANGED Viewed

@@ -21,6 +21,7 @@
 import { AnthropicProvider } from "../anthropic/client.js";
 import { FireworksProvider } from "../fireworks/client.js";
 import { GeminiProvider } from "../gemini/client.js";
+import { MinimaxProvider } from "../minimax/client.js";
 import { PROVIDER_CATALOG } from "../model-catalog.js";
 import { OllamaProvider } from "../ollama/client.js";
 import { OpenAIChatCompletionsProvider } from "../openai/chat-completions-provider.js";
@@ -111,6 +112,8 @@ const ADAPTER_FACTORIES: Record<string, AdapterFactory> = {
       streamTimeoutMs,
       ...(baseURL ? { baseURL } : {}),
     }),
+  minimax: ({ apiKey, model, streamTimeoutMs }) =>
+    new MinimaxProvider(apiKey, model, { streamTimeoutMs }),
 };
 /**

package/src/providers/minimax/client.ts ADDED Viewed

@@ -0,0 +1,106 @@
+import OpenAI from "openai";
+import { getLogger } from "../../util/logger.js";
+import { OpenAIChatCompletionsProvider } from "../openai/chat-completions-provider.js";
+// Module-scoped logger; used below to record non-definitive validation failures.
+const log = getLogger("minimax-client");
+/** Validation-specific timeout (10s) so a stalled network doesn't block key submission. */
+const VALIDATION_TIMEOUT_MS = 10_000;
+/** Optional settings accepted by the `MinimaxProvider` constructor. */
+export interface MinimaxProviderOptions {
+  // NOTE(review): not read by the constructor in this file, which takes the
+  // key as its first positional argument — confirm whether any caller uses it.
+  apiKey?: string;
+  // Endpoint override; a missing or blank value falls back to
+  // DEFAULT_MINIMAX_BASE_URL in the constructor.
+  baseURL?: string;
+  // Forwarded unchanged to the OpenAI chat-completions base provider.
+  streamTimeoutMs?: number;
+}
+// Endpoint used by the provider by default and tried first during key validation.
+const DEFAULT_MINIMAX_BASE_URL = "https://api.minimax.io/v1";
+// Second endpoint tried during key validation when the default does not
+// return a definitive success.
+const FALLBACK_MINIMAX_BASE_URL = "https://api.minimaxi.com/v1";
+/**
+ * Validate a MiniMax API key by testing against the default URL first,
+ * then the fallback URL if the default does not definitively accept it.
+ *
+ * The key is rejected only when BOTH URLs fail with definitive errors
+ * (401/403). A transient outcome (429, 5xx, network) on either URL means the
+ * key could not be disproved, so it is allowed to be stored.
+ *
+ * @param apiKey The MiniMax API key to check.
+ * @returns `{ valid: true }` when the key is accepted or could not be
+ *   disproved; otherwise `{ valid: false, reason }` carrying the fallback
+ *   endpoint's rejection reason.
+ */
+export async function validateMinimaxApiKey(
+  apiKey: string,
+): Promise<{ valid: true } | { valid: false; reason: string }> {
+  // Try default URL first; a definitive success needs no second request.
+  const defaultResult = await tryValidate(apiKey, DEFAULT_MINIMAX_BASE_URL);
+  if (defaultResult.valid && !defaultResult.transient) {
+    return { valid: true };
+  }
+  // Default was rejected or inconclusive — try fallback URL
+  const fallbackResult = await tryValidate(apiKey, FALLBACK_MINIMAX_BASE_URL);
+  // Accept unless both endpoints definitively refused the key. Checking only
+  // the fallback here would reject a key whose default-URL probe merely hit a
+  // transient error while the other region's endpoint answered 401/403.
+  if (defaultResult.valid || fallbackResult.valid) {
+    return { valid: true };
+  }
+  // Both URLs failed definitively — reject the key
+  return { valid: false, reason: fallbackResult.reason };
+}
+/**
+ * Probe a single MiniMax endpoint with the given key by listing models.
+ *
+ * Outcomes:
+ * - request succeeds: `{ valid: true, transient: false }`
+ * - HTTP 401 or 403: `{ valid: false, reason }` (definitive rejection)
+ * - any other API error, or a non-API error: logged as a warning and
+ *   reported as `{ valid: true, transient: true }`
+ *
+ * @param apiKey Key to test.
+ * @param baseURL Endpoint to test against.
+ */
+async function tryValidate(
+  apiKey: string,
+  baseURL: string,
+): Promise<
+  | { valid: true; transient: false }
+  | { valid: true; transient: true }
+  | { valid: false; reason: string }
+> {
+  try {
+    // Single attempt with a short timeout: retries are disabled so a slow
+    // endpoint cannot stall the caller beyond VALIDATION_TIMEOUT_MS.
+    const probe = new OpenAI({
+      apiKey,
+      baseURL,
+      timeout: VALIDATION_TIMEOUT_MS,
+      maxRetries: 0,
+    });
+    await probe.models.list();
+    return { valid: true, transient: false };
+  } catch (err) {
+    // Anything that is not an API-level error is treated as a network failure.
+    if (!(err instanceof OpenAI.APIError)) {
+      const detail = err instanceof Error ? err.message : String(err);
+      log.warn(
+        { error: detail, baseURL },
+        "Network error during MiniMax key validation — trying fallback",
+      );
+      return { valid: true, transient: true };
+    }
+    switch (err.status) {
+      case 401:
+        return { valid: false, reason: "API key is invalid or expired." };
+      case 403:
+        return {
+          valid: false,
+          reason: `MiniMax API error (${err.status}): ${err.message}`,
+        };
+      default:
+        // Remaining statuses (429, 5xx, etc.) do not disprove the key.
+        log.warn(
+          { status: err.status, baseURL },
+          "MiniMax API returned a transient error during key validation — trying fallback",
+        );
+        return { valid: true, transient: true };
+    }
+  }
+}
+/**
+ * MiniMax provider built on the OpenAI chat-completions provider, registered
+ * under the provider name "minimax" with the label "MiniMax".
+ */
+export class MinimaxProvider extends OpenAIChatCompletionsProvider {
+  /**
+   * @param apiKey MiniMax API key, passed through to the base provider.
+   * @param model Model identifier, passed through to the base provider.
+   * @param options Optional endpoint override and stream timeout.
+   */
+  constructor(
+    apiKey: string,
+    model: string,
+    options: MinimaxProviderOptions = {},
+  ) {
+    const { baseURL: requestedBaseURL, streamTimeoutMs } = options;
+    super(apiKey, model, {
+      // `||` rather than `??`: an empty or whitespace-only override must also
+      // fall back to the default endpoint.
+      baseURL: requestedBaseURL?.trim() || DEFAULT_MINIMAX_BASE_URL,
+      providerName: "minimax",
+      providerLabel: "MiniMax",
+      streamTimeoutMs,
+    });
+  }
+}

package/src/providers/model-catalog.ts CHANGED Viewed

@@ -493,6 +493,21 @@ const RAW_PROVIDER_CATALOG: ProviderCatalogEntry[] = [
           cacheReadPer1mTokens: 0.025,
         },
       },
+      {
+        id: "gemini-3.1-flash-lite",
+        displayName: "Gemini 3.1 Flash-Lite",
+        contextWindowTokens: 1048576,
+        maxOutputTokens: 65536,
+        supportsThinking: true,
+        supportsCaching: true,
+        supportsVision: true,
+        supportsToolUse: true,
+        pricing: {
+          inputPer1mTokens: 0.25,
+          outputPer1mTokens: 1.5,
+          cacheReadPer1mTokens: 0.025,
+        },
+      },
       {
         id: "gemini-2.5-flash",
         displayName: "Gemini 2.5 Flash",
@@ -1122,6 +1137,34 @@ const RAW_PROVIDER_CATALOG: ProviderCatalogEntry[] = [
     models: [],
     defaultModel: "",
   },
+  {
+    id: "minimax",
+    displayName: "MiniMax",
+    subtitle: "MiniMax AI models. Requires a MiniMax API key.",
+    setupMode: "api-key",
+    setupHint: "Enter your MiniMax API key to enable MiniMax models.",
+    envVar: "MINIMAX_API_KEY",
+    credentialsGuide: {
+      description: "Sign in to the MiniMax dashboard and create an API key.",
+      url: "https://platform.minimax.io/",
+      linkLabel: "Open MiniMax Dashboard",
+    },
+    models: [
+      {
+        id: "MiniMax-M2.7",
+        displayName: "MiniMax M2.7",
+        contextWindowTokens: 200000,
+        maxOutputTokens: 16384,
+        supportsThinking: true,
+        supportsCaching: true,
+        supportsVision: false,
+        supportsToolUse: true,
+      },
+    ],
+    defaultModel: "MiniMax-M2.7",
+    apiKeyUrl: "https://platform.minimax.io/",
+    apiKeyPlaceholder: "sk-cp-...",
+  },
 ];
 export const PROVIDER_CATALOG: ProviderCatalogEntry[] =

package/src/providers/model-intents.ts CHANGED Viewed

@@ -24,7 +24,7 @@ const PROVIDER_MODEL_INTENTS: Record<string, Record<ModelIntent, string>> = {
   },
   gemini: {
     balanced: "gemini-3-flash-preview",
-    "latency-optimized": "gemini-3.1-flash-lite-preview",
+    "latency-optimized": "gemini-3.1-flash-lite",
     "quality-optimized": "gemini-3.1-pro-preview",
     "vision-optimized": "gemini-3-flash-preview",
   },

package/src/providers/openai/chat-completions-provider.ts CHANGED Viewed

@@ -1,6 +1,5 @@
 import OpenAI from "openai";
-import { SYSTEM_PROMPT_CACHE_BOUNDARY } from "../../prompts/cache-boundary.js";
 import { isAbortReason } from "../../util/abort-reasons.js";
 import { ProviderError } from "../../util/errors.js";
 import { extractRetryAfterMs } from "../../util/retry.js";
@@ -155,12 +154,16 @@ export class OpenAIChatCompletionsProvider implements Provider {
   ) {
     this.name = options.providerName ?? "openai";
     this.providerLabel = options.providerLabel ?? "OpenAI";
+    this.streamTimeoutMs = options.streamTimeoutMs ?? 1_800_000;
+    // Keep the SDK deadline behind our provider stream timeout so
+    // createStreamTimeout owns the user-facing timeout error.
+    const sdkTimeoutMs = this.streamTimeoutMs + 60_000;
     this.client = new OpenAI({
       apiKey,
       baseURL: options.baseURL,
+      timeout: sdkTimeoutMs,
     });
     this.model = model;
-    this.streamTimeoutMs = options.streamTimeoutMs ?? 1_800_000;
     this.extraCreateParams = options.extraCreateParams ?? {};
     this.maxReasoningEffort = options.maxReasoningEffort ?? "xhigh";
     this.requestHeaders = options.requestHeaders ?? {};
@@ -593,7 +596,7 @@ export class OpenAIChatCompletionsProvider implements Provider {
     if (systemPrompt) {
       result.push({
         role: "system",
-        content: systemPrompt.replaceAll(SYSTEM_PROMPT_CACHE_BOUNDARY, "\n"),
+        content: systemPrompt,
       });
     }

package/src/providers/openai/codex-models.ts ADDED Viewed

@@ -0,0 +1,18 @@
+/**
+ * Model IDs accepted by the ChatGPT Codex subscription endpoint
+ * (`https://chatgpt.com/backend-api/codex`).
+ *
+ * `oauth_subscription` OpenAI connections hard-route every request to that
+ * endpoint, which rejects any model outside this set with HTTP 400. The set
+ * gates whether such a connection may serve a given model during auto-
+ * resolution of an "Any active OpenAI connection" profile.
+ */
+export const CODEX_SUBSCRIPTION_MODEL_IDS: ReadonlySet<string> = new Set([
+  "gpt-5.4",
+  "gpt-5.3-codex",
+]);
+/**
+ * True when `model` is accepted by the Codex subscription endpoint.
+ *
+ * This is an exact membership test against `CODEX_SUBSCRIPTION_MODEL_IDS`;
+ * no normalization (case folding, trimming, prefix matching) is applied.
+ *
+ * @param model - Model ID to check.
+ * @returns `true` if `model` is in the allow-list, otherwise `false`.
+ */
+export function isCodexSubscriptionModel(model: string): boolean {
+  return CODEX_SUBSCRIPTION_MODEL_IDS.has(model);
+}

package/src/providers/openai/responses-provider.ts CHANGED Viewed

@@ -1,8 +1,8 @@
 import OpenAI from "openai";
-import { SYSTEM_PROMPT_CACHE_BOUNDARY } from "../../prompts/cache-boundary.js";
 import { isAbortReason } from "../../util/abort-reasons.js";
 import { ProviderError } from "../../util/errors.js";
+import { getLogger } from "../../util/logger.js";
 import { extractRetryAfterMs } from "../../util/retry.js";
 import { escapeXmlAttr } from "../../util/xml.js";
 import { createStreamTimeout } from "../stream-timeout.js";
@@ -17,6 +17,8 @@ import type {
 import { ContextOverflowError } from "../types.js";
 import { detectOpenAICompatibleContextOverflow } from "./chat-completions-provider.js";
+const log = getLogger("openai-responses");
 export interface OpenAIResponsesProviderOptions {
   baseURL?: string;
   providerName?: string;
@@ -24,7 +26,7 @@ export interface OpenAIResponsesProviderOptions {
   streamTimeoutMs?: number;
   useNativeWebSearch?: boolean;
   /** When true, target the Codex subscription endpoint and strip fields it
-   *  rejects (`max_output_tokens`, `metadata`). */
+   *  rejects (`max_output_tokens`, `reasoning`, `text`, `tools`). */
   codexSubscription?: boolean;
 }
@@ -107,6 +109,7 @@ export class OpenAIResponsesProvider implements Provider {
   private streamTimeoutMs: number;
   private useNativeWebSearch: boolean;
   private codexSubscription: boolean;
+  private lastCodexErrorBody: string | undefined;
   constructor(
     apiKey: string,
@@ -116,14 +119,39 @@ export class OpenAIResponsesProvider implements Provider {
     this.name = options.providerName ?? "openai";
     this.providerLabel = options.providerLabel ?? "OpenAI";
     this.codexSubscription = options.codexSubscription ?? false;
+    this.streamTimeoutMs = options.streamTimeoutMs ?? 1_800_000;
+    // Keep the SDK deadline behind our provider stream timeout so
+    // createStreamTimeout owns the user-facing timeout error.
+    const sdkTimeoutMs = this.streamTimeoutMs + 60_000;
     this.client = new OpenAI({
       apiKey,
       baseURL: this.codexSubscription
         ? "https://chatgpt.com/backend-api/codex"
         : options.baseURL,
+      timeout: sdkTimeoutMs,
+      ...(this.codexSubscription
+        ? {
+            fetch: async (url: RequestInfo | URL, init?: RequestInit) => {
+              const res = await globalThis.fetch(url, init);
+              if (!res.ok) {
+                const body = await res.text();
+                this.lastCodexErrorBody = body;
+                log.warn(
+                  { status: res.status, body, url: String(url) },
+                  "Codex endpoint raw error response",
+                );
+                return new Response(body, {
+                  status: res.status,
+                  statusText: res.statusText,
+                  headers: res.headers,
+                });
+              }
+              return res;
+            },
+          }
+        : {}),
     });
     this.model = model;
-    this.streamTimeoutMs = options.streamTimeoutMs ?? 1_800_000;
     this.useNativeWebSearch = options.useNativeWebSearch ?? false;
   }
@@ -149,35 +177,35 @@ export class OpenAIResponsesProvider implements Provider {
       const params: Record<string, unknown> = {
         model: modelOverride ?? this.model,
         input,
+        ...(this.codexSubscription ? { store: false } : {}),
       };
       if (systemPrompt) {
-        params.instructions = systemPrompt.replaceAll(
-          SYSTEM_PROMPT_CACHE_BOUNDARY,
-          "\n",
-        );
+        params.instructions = systemPrompt;
       }
       if (maxTokens && !this.codexSubscription) {
         params.max_output_tokens = maxTokens;
       }
-      const reasoningEffort = effort
-        ? EFFORT_TO_REASONING_EFFORT[effort]
-        : undefined;
-      if (reasoningEffort) {
-        params.reasoning = { effort: reasoningEffort };
-      }
+      if (!this.codexSubscription) {
+        const reasoningEffort = effort
+          ? EFFORT_TO_REASONING_EFFORT[effort]
+          : undefined;
+        if (reasoningEffort) {
+          params.reasoning = { effort: reasoningEffort };
+        }
-      if (
-        verbosity &&
-        VALID_VERBOSITIES.has(verbosity) &&
-        modelSupportsVerbosity(modelOverride ?? this.model)
-      ) {
-        params.text = { verbosity };
+        if (
+          verbosity &&
+          VALID_VERBOSITIES.has(verbosity) &&
+          modelSupportsVerbosity(modelOverride ?? this.model)
+        ) {
+          params.text = { verbosity };
+        }
       }
-      if (tools && tools.length > 0) {
+      if (tools && tools.length > 0 && !this.codexSubscription) {
         if (
           this.useNativeWebSearch &&
           tools.some((t) => t.name === "web_search")
@@ -410,6 +438,21 @@ export class OpenAIResponsesProvider implements Provider {
           ? signal.reason
           : undefined;
       if (error instanceof OpenAI.APIError) {
+        // Temporary diagnostic: log the raw error shape for Codex 400 debugging
+        if (this.codexSubscription) {
+          log.warn(
+            {
+              status: error.status,
+              message: error.message,
+              code: error.code,
+              type: error.type,
+              param: error.param,
+              errorBody: error.error,
+              headers: Object.fromEntries(error.headers?.entries?.() ?? []),
+            },
+            "Codex subscription API error — raw details",
+          );
+        }
         const overflow = detectOpenAICompatibleContextOverflow(error);
         if (overflow) {
           throw new ContextOverflowError(
@@ -431,8 +474,22 @@ export class OpenAIResponsesProvider implements Provider {
         if (retryAfterMs !== undefined)
           errorOptions.retryAfterMs = retryAfterMs;
         if (abortReason) errorOptions.abortReason = abortReason;
+        let errorDetail = error.message;
+        if (this.lastCodexErrorBody) {
+          try {
+            const parsed = JSON.parse(this.lastCodexErrorBody);
+            if (parsed.detail) errorDetail = parsed.detail;
+          } catch {
+            errorDetail = this.lastCodexErrorBody.slice(0, 200);
+          }
+          this.lastCodexErrorBody = undefined;
+        }
+        const extras = [error.code, error.type, error.param]
+          .filter(Boolean)
+          .join(", ");
+        const extraSuffix = extras ? ` [${extras}]` : "";
         throw new ProviderError(
-          `${this.providerLabel} API error (${error.status}): ${error.message}`,
+          `${this.providerLabel} API error (${error.status}): ${errorDetail}${extraSuffix}`,
           this.name,
           error.status,
           Object.keys(errorOptions).length > 0 ? errorOptions : undefined,

package/src/providers/provider-send-message.ts CHANGED Viewed

@@ -9,6 +9,7 @@ import { getConfig } from "../config/loader.js";
 import type { LLMCallSite } from "../config/schemas/llm.js";
 import { getDb } from "../memory/db-connection.js";
 import { getLogger } from "../util/logger.js";
+import { isConnectionCompatibleWithModel } from "./connection-model-compat.js";
 import { tryResolveProviderForConnectionName } from "./connection-resolution.js";
 import { listConnections } from "./inference/connections.js";
 import { initializeProviders, listProviders } from "./registry.js";
@@ -126,7 +127,11 @@ export async function resolveConfiguredProvider(
         const candidates = listConnections(getDb(), {
           provider: inferenceProvider,
         });
-        const active = candidates.find((c) => c.status === "active");
+        const active = candidates.find(
+          (c) =>
+            c.status === "active" &&
+            isConnectionCompatibleWithModel(c, resolved.model),
+        );
         if (active) {
           connectionName = active.name;
         }
@@ -147,6 +152,7 @@ export async function resolveConfiguredProvider(
     connectionName,
     config,
     inferenceProvider,
+    resolved.model,
   );
   if (!connectionProvider) {
     // Soft credential failure — the connection resolved to no usable

package/src/providers/retry.ts CHANGED Viewed

@@ -47,9 +47,18 @@ const EFFORT_SUPPORTED_PROVIDERS = new Set([
 /**
  * Providers that consume the `thinking` config. Anthropic uses it directly on
  * the wire; OpenRouter either forwards it to its Anthropic-compatible path or
- * translates it into the unified `reasoning` parameter on OpenAI-compat calls.
+ * translates it into the unified `reasoning` parameter on OpenAI-compat calls;
+ * Gemini reads `thinking.level` to populate `thinkingConfig.thinkingLevel`.
  */
-const THINKING_AWARE_PROVIDERS = new Set(["anthropic", "openrouter"]);
+const THINKING_AWARE_PROVIDERS = new Set(["anthropic", "openrouter", "gemini"]);
+/**
+ * Providers that consume Gemini-only thinking extras (`level`,
+ * `streamThinking`). For other thinking-aware providers, we scrub these from
+ * the normalized wire payload because Anthropic's SDK rejects unknown keys
+ * inside the `thinking` object with "Extra inputs are not permitted".
+ */
+const THINKING_EXTRA_FIELDS_AWARE_PROVIDERS = new Set(["gemini"]);
 /**
  * Providers that consume the `verbosity` config. Currently OpenAI (mapped to
@@ -289,7 +298,8 @@ function normalizeSendMessageOptions(
   }
   // thinking is Anthropic-specific on the wire; OpenRouter reads it as a
-  // signal for its unified reasoning parameter. Strip it for other providers.
+  // signal for its unified reasoning parameter; Gemini reads `level` from it.
+  // Strip it for other providers.
   if (
     !THINKING_AWARE_PROVIDERS.has(providerName) &&
     nextConfig.thinking !== undefined
@@ -297,6 +307,27 @@ function normalizeSendMessageOptions(
     delete nextConfig.thinking;
   }
+  // Strip Gemini-only extras (`level`, `streamThinking`) from the wire
+  // `thinking` object for providers that don't read them. Anthropic in
+  // particular rejects unknown keys inside `thinking` with "Extra inputs are
+  // not permitted"; the OpenRouter Anthropic-compat path hits the same SDK.
+  if (
+    nextConfig.thinking !== undefined &&
+    !THINKING_EXTRA_FIELDS_AWARE_PROVIDERS.has(providerName) &&
+    typeof nextConfig.thinking === "object" &&
+    nextConfig.thinking !== null
+  ) {
+    const wire = nextConfig.thinking as Record<string, unknown>;
+    if (wire.level !== undefined || wire.streamThinking !== undefined) {
+      const scrubbed: Record<string, unknown> = {};
+      for (const [key, value] of Object.entries(wire)) {
+        if (key === "level" || key === "streamThinking") continue;
+        scrubbed[key] = value;
+      }
+      nextConfig.thinking = scrubbed;
+    }
+  }
   // Anthropic (and OpenRouter fronting Anthropic) rejects requests that
   // combine extended thinking with forced tool use (`tool_choice.type` of
   // `"tool"` or `"any"`).  Strip thinking when both are present so the

package/src/providers/thinking-config.ts CHANGED Viewed

@@ -1,20 +1,45 @@
+import { THINKING_LEVELS, type ThinkingLevel } from "../config/schemas/llm.js";
 type ThinkingConfigRecord = Record<string, unknown>;
+const THINKING_LEVEL_SET: ReadonlySet<string> = new Set(THINKING_LEVELS);
 function isRecord(value: unknown): value is ThinkingConfigRecord {
   return typeof value === "object" && value !== null && !Array.isArray(value);
 }
+/**
+ * Extract the optional `level` and `streamThinking` fields from a thinking
+ * config record, keeping each one only when it has the expected type.
+ *
+ * @param thinking - Thinking config record to read from.
+ * @returns An object that contains `level` only when `thinking.level` is a
+ *   string present in `THINKING_LEVEL_SET`, and `streamThinking` only when
+ *   `thinking.streamThinking` is a boolean. Invalid or absent fields are
+ *   omitted, so the result may be empty.
+ */
+function pickGeminiExtras(thinking: ThinkingConfigRecord): {
+  level?: ThinkingLevel;
+  streamThinking?: boolean;
+} {
+  const extras: { level?: ThinkingLevel; streamThinking?: boolean } = {};
+  // Only accept a level that is one of the known THINKING_LEVELS values.
+  if (
+    typeof thinking.level === "string" &&
+    THINKING_LEVEL_SET.has(thinking.level)
+  ) {
+    extras.level = thinking.level as ThinkingLevel;
+  }
+  if (typeof thinking.streamThinking === "boolean") {
+    extras.streamThinking = thinking.streamThinking;
+  }
+  return extras;
+}
 export function normalizeThinkingConfigForWire(
   thinking: unknown,
 ): ThinkingConfigRecord | undefined {
   if (!isRecord(thinking)) return undefined;
+  // Already in wire shape — preserve as-is so re-normalization is idempotent
+  // and Gemini-only fields stay attached for the Gemini provider to read.
   if (typeof thinking.type === "string") {
     return thinking;
   }
+  const extras = pickGeminiExtras(thinking);
   if (thinking.enabled === true) {
-    return { type: "adaptive" };
+    return { type: "adaptive", ...extras };
   }
   if (thinking.enabled === false) {

package/src/providers/usage-tracking.ts CHANGED Viewed

@@ -2,6 +2,7 @@ import { recordUsageEvent } from "../memory/llm-usage-store.js";
 import { resolveUsageAttribution } from "../usage/attribution.js";
 import {
   buildPricingUsageFromResponse,
+  extractRawUsage,
   resolveStructuredPricing,
 } from "../usage/pricing.js";
 import { getLogger } from "../util/logger.js";
@@ -76,6 +77,7 @@ export class UsageTrackingProvider implements Provider {
           outputTokens: pricingUsage.outputTokens,
           cacheCreationInputTokens: pricingUsage.cacheCreationInputTokens,
           cacheReadInputTokens: pricingUsage.cacheReadInputTokens,
+          rawUsage: extractRawUsage(response.rawResponse),
           conversationId: null,
           runId: null,
           requestId: null,

package/src/runtime/AGENTS.md CHANGED Viewed

@@ -161,10 +161,10 @@ All `/v1/*` endpoints share a per-client-IP sliding-window rate limiter (`middle
 When the limit is exceeded, the limiter returns 429 and logs a structured warning (module: `rate-limiter`) with the denied endpoint and a breakdown of which endpoints consumed the budget in the current window. This makes it easy to identify whether the cause is rapid conversation switching, polling, or unexpected request volume.
-Logs are written to `~/.vellum/workspace/data/logs/vellum.log` by default. If `logFile.dir` is configured, logs rotate daily as `assistant-YYYY-MM-DD.log` in that directory. To watch rate limit events in real time:
+Logs rotate daily into `$VELLUM_WORKSPACE_DIR/data/logs/assistant-YYYY-MM-DD.log` (or into the directory configured via `logFile.dir`). To watch rate limit events in real time:
 ```bash
-tail -f ~/.vellum/workspace/data/logs/vellum.log | grep rate-limit
+tail -f "$VELLUM_WORKSPACE_DIR/data/logs/assistant-$(date -u +%Y-%m-%d).log" | grep rate-limit
 ```
 The provider-level rate limiter (`providers/ratelimit.ts`) also logs warnings (module: `rate-limit`) when request rate or token budget limits are enforced.

package/src/runtime/agent-wake.ts CHANGED Viewed

@@ -640,6 +640,7 @@ export async function wakeAgentForOpportunity(
           JSON.stringify(record.rawResponse),
           undefined,
           record.provider,
+          "mainAgent",
         );
       } catch (err) {
         log.warn(