npm - @vellumai/assistant - Versions diffs - 0.7.2 → 0.7.3 - Mend

@vellumai/assistant 0.7.2 → 0.7.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (347)

package/ARCHITECTURE.md +16 -1
package/docs/architecture/memory.md +5 -2
package/node_modules/@vellumai/gateway-client/src/ipc-client.ts +13 -4
package/node_modules/@vellumai/skill-host-contracts/src/assistant-event.ts +0 -9
package/node_modules/@vellumai/slack-text/src/index.test.ts +18 -35
package/node_modules/@vellumai/slack-text/src/index.ts +2 -48
package/openapi.yaml +449 -22
package/package.json +1 -1
package/src/__tests__/app-control-flow.test.ts +21 -11
package/src/__tests__/assistant-event-hub.test.ts +48 -0
package/src/__tests__/assistant-event.test.ts +0 -10
package/src/__tests__/assistant-events-sse-hardening.test.ts +2 -7
package/src/__tests__/assistant-feature-flags-integration.test.ts +18 -0
package/src/__tests__/auto-analysis-end-to-end.test.ts +62 -1
package/src/__tests__/background-workers-disk-pressure.test.ts +268 -0
package/src/__tests__/call-conversation-messages.test.ts +8 -2
package/src/__tests__/channel-inbound-disk-pressure.test.ts +537 -0
package/src/__tests__/channel-readiness-service.test.ts +4 -2
package/src/__tests__/config-loader-backfill.test.ts +379 -0
package/src/__tests__/config-schema.test.ts +1 -0
package/src/__tests__/config-watcher-cleanup-throttle.test.ts +18 -9
package/src/__tests__/config-watcher.test.ts +140 -69
package/src/__tests__/context-search-agent-runner.test.ts +61 -3
package/src/__tests__/context-search-conversations-source.test.ts +0 -24
package/src/__tests__/context-search-fanout.test.ts +0 -1
package/src/__tests__/context-search-memory-source.test.ts +3 -7
package/src/__tests__/context-search-memory-v2-source.test.ts +0 -2
package/src/__tests__/context-search-pkb-source.test.ts +0 -1
package/src/__tests__/context-search-workspace-source.test.ts +0 -1
package/src/__tests__/conversation-abort-tool-results.test.ts +6 -0
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +223 -0
package/src/__tests__/conversation-agent-loop.test.ts +454 -5
package/src/__tests__/conversation-error.test.ts +150 -3
package/src/__tests__/conversation-process-callsite.test.ts +43 -0
package/src/__tests__/conversation-provider-retry-repair.test.ts +6 -0
package/src/__tests__/conversation-runtime-assembly.test.ts +65 -0
package/src/__tests__/conversation-slash-unknown.test.ts +6 -0
package/src/__tests__/conversation-speed-override.test.ts +0 -3
package/src/__tests__/conversation-store.test.ts +0 -18
package/src/__tests__/conversation-surfaces-app-control.test.ts +15 -4
package/src/__tests__/conversation-surfaces-data-persist.test.ts +404 -0
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +2 -5
package/src/__tests__/conversation-workspace-injection.test.ts +6 -0
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +6 -0
package/src/__tests__/credentials-cli.test.ts +7 -0
package/src/__tests__/cu-unified-flow.test.ts +176 -10
package/src/__tests__/date-context.test.ts +164 -2
package/src/__tests__/disk-pressure-guard.test.ts +262 -0
package/src/__tests__/disk-pressure-lifecycle.test.ts +168 -0
package/src/__tests__/disk-pressure-policy.test.ts +241 -0
package/src/__tests__/disk-pressure-routes.test.ts +379 -0
package/src/__tests__/disk-pressure-tools.test.ts +277 -0
package/src/__tests__/disk-usage.test.ts +150 -0
package/src/__tests__/events-client-registration.test.ts +52 -0
package/src/__tests__/events-dev-bypass-actor.test.ts +162 -0
package/src/__tests__/file-write-tool.test.ts +4 -10
package/src/__tests__/filing-service.test.ts +3 -4
package/src/__tests__/heartbeat-disk-pressure.test.ts +183 -0
package/src/__tests__/heartbeat-service.test.ts +260 -11
package/src/__tests__/host-app-control-proxy.test.ts +195 -25
package/src/__tests__/host-bash-proxy.test.ts +227 -34
package/src/__tests__/host-bash-routes.test.ts +178 -13
package/src/__tests__/host-cu-proxy.test.ts +210 -3
package/src/__tests__/host-cu-routes-targeted.test.ts +141 -12
package/src/__tests__/host-file-proxy-targeted.test.ts +48 -9
package/src/__tests__/host-file-proxy.test.ts +268 -6
package/src/__tests__/host-file-routes-targeted.test.ts +175 -17
package/src/__tests__/host-transfer-proxy-targeted.test.ts +408 -59
package/src/__tests__/host-transfer-routes-targeted.test.ts +232 -17
package/src/__tests__/http-user-message-parity.test.ts +107 -1
package/src/__tests__/injector-chain.test.ts +18 -6
package/src/__tests__/injector-disk-pressure.test.ts +224 -0
package/src/__tests__/managed-profile-guard.test.ts +18 -0
package/src/__tests__/mcp-abort-signal.test.ts +130 -0
package/src/__tests__/memory-admin-recall.test.ts +3 -11
package/src/__tests__/memory-retrieval-pipeline.test.ts +22 -1
package/src/__tests__/normalize-onboarding.test.ts +180 -0
package/src/__tests__/oauth-connect-routes.test.ts +316 -0
package/src/__tests__/oauth-provider-seed-logos.test.ts +24 -2
package/src/__tests__/onboarding-persona-write.test.ts +308 -0
package/src/__tests__/openai-provider.test.ts +45 -8
package/src/__tests__/persist-onboarding-artifacts.test.ts +44 -64
package/src/__tests__/platform-callback-registration.test.ts +21 -4
package/src/__tests__/platform.test.ts +2 -1
package/src/__tests__/playbook-execution.test.ts +0 -43
package/src/__tests__/plugin-tool-contribution.test.ts +47 -0
package/src/__tests__/prechat-onboarding-contract.test.ts +214 -27
package/src/__tests__/provider-tool-name.test.ts +23 -0
package/src/__tests__/relay-server.test.ts +15 -4
package/src/__tests__/runtime-events-sse.test.ts +4 -8
package/src/__tests__/scheduler-disk-pressure.test.ts +148 -0
package/src/__tests__/secret-ingress-http.test.ts +0 -1
package/src/__tests__/suggestion-routes.test.ts +46 -0
package/src/__tests__/twilio-validation.test.ts +2 -2
package/src/__tests__/workspace-migration-065-bump-stale-heartbeat-interval.test.ts +122 -0
package/src/__tests__/workspace-migration-066-seed-heartbeat-callsite-cost-default.test.ts +285 -0
package/src/__tests__/workspace-migration-068-release-notes-local-timezone.test.ts +90 -0
package/src/__tests__/workspace-migration-safe-storage-limits-release.test.ts +90 -0
package/src/approvals/guardian-decision-primitive.ts +13 -0
package/src/approvals/guardian-request-resolvers.ts +16 -17
package/src/backup/snapshot-lock.ts +2 -27
package/src/bundler/compiler-tools.ts +3 -2
package/src/calls/call-conversation-messages.ts +46 -10
package/src/cli/commands/__tests__/webhooks.test.ts +0 -4
package/src/cli/commands/bash.ts +35 -108
package/src/cli/commands/contacts.ts +64 -25
package/src/cli/commands/credentials.ts +56 -0
package/src/cli/commands/memory-v2.ts +7 -6
package/src/cli/commands/oauth/__tests__/connect.test.ts +437 -1
package/src/cli/commands/oauth/connect.ts +127 -1
package/src/cli/commands/platform/__tests__/callback-routes-list.test.ts +0 -3
package/src/cli/commands/platform/__tests__/connect.test.ts +7 -1
package/src/cli/commands/platform/__tests__/disconnect.test.ts +7 -1
package/src/cli/commands/platform/__tests__/status.test.ts +103 -6
package/src/cli/commands/platform/index.ts +16 -7
package/src/cli/commands/status.ts +57 -0
package/src/cli/program.ts +4 -2
package/src/config/assistant-feature-flags.ts +13 -3
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +4 -3
package/src/config/bundled-skills/phone-calls/references/TROUBLESHOOTING.md +13 -7
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +2 -2
package/src/config/env.ts +0 -8
package/src/config/feature-flag-registry.json +27 -3
package/src/config/loader.ts +127 -8
package/src/config/schemas/__tests__/memory-v2.test.ts +10 -5
package/src/config/schemas/call-site-catalog.ts +14 -0
package/src/config/schemas/channels.ts +0 -5
package/src/config/schemas/heartbeat.ts +1 -1
package/src/config/schemas/llm.ts +2 -0
package/src/config/schemas/memory-lifecycle.ts +13 -0
package/src/config/schemas/memory-v2.ts +75 -11
package/src/config/schemas/platform.ts +43 -3
package/src/config/schemas/services.ts +28 -0
package/src/config/seed-inference-profiles.ts +230 -33
package/src/contacts/contact-store.ts +0 -25
package/src/daemon/__tests__/conversation-tool-setup.test.ts +86 -25
package/src/daemon/assistant-attachments.ts +4 -4
package/src/daemon/config-watcher.ts +85 -57
package/src/daemon/conversation-agent-loop-handlers.ts +6 -0
package/src/daemon/conversation-agent-loop.ts +170 -33
package/src/daemon/conversation-error.ts +87 -15
package/src/daemon/conversation-lifecycle.ts +1 -3
package/src/daemon/conversation-process.ts +8 -0
package/src/daemon/conversation-runtime-assembly.ts +26 -0
package/src/daemon/conversation-store.ts +2 -2
package/src/daemon/conversation-surfaces.ts +195 -15
package/src/daemon/conversation-tool-setup.ts +57 -14
package/src/daemon/conversation.ts +17 -22
package/src/daemon/date-context.ts +71 -22
package/src/daemon/disk-pressure-background-gate.ts +73 -0
package/src/daemon/disk-pressure-guard.ts +343 -0
package/src/daemon/disk-pressure-policy.ts +163 -0
package/src/daemon/handlers/shared.ts +0 -1
package/src/daemon/handlers/skills.ts +3 -4
package/src/daemon/host-app-control-proxy.ts +137 -41
package/src/daemon/host-bash-proxy.ts +46 -21
package/src/daemon/host-cu-proxy.ts +49 -3
package/src/daemon/host-file-proxy.ts +43 -7
package/src/daemon/host-transfer-proxy.ts +95 -4
package/src/daemon/lifecycle.ts +79 -28
package/src/daemon/meet-host-supervisor.ts +4 -4
package/src/daemon/meet-manifest-loader.ts +0 -1
package/src/daemon/memory-v2-startup.ts +14 -4
package/src/daemon/message-protocol.ts +3 -0
package/src/daemon/message-types/conversations.ts +4 -0
package/src/daemon/message-types/disk-pressure.ts +9 -0
package/src/daemon/message-types/messages.ts +3 -0
package/src/daemon/profiler-run-store.ts +5 -5
package/src/daemon/tool-setup-types.ts +2 -2
package/src/documents/document-store.ts +85 -0
package/src/filing/filing-service.ts +30 -5
package/src/heartbeat/__tests__/heartbeat-feed-event.test.ts +9 -16
package/src/heartbeat/__tests__/heartbeat-run-store.test.ts +36 -0
package/src/heartbeat/heartbeat-run-store.ts +13 -0
package/src/heartbeat/heartbeat-service.ts +205 -31
package/src/home/feed-scheduler.ts +18 -0
package/src/inbound/platform-callback-registration.ts +8 -15
package/src/ipc/__tests__/clients-list-ipc.test.ts +169 -0
package/src/ipc/assistant-server.ts +56 -2
package/src/ipc/gateway-client.ts +37 -3
package/src/live-voice/live-voice-archive.ts +4 -4
package/src/live-voice/protocol.ts +5 -7
package/src/media/image-service.ts +1 -7
package/src/memory/__tests__/fixtures/memory-v2-activation-fixtures.ts +21 -13
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +52 -22
package/src/memory/__tests__/memory-v2-activation-log-store.test.ts +0 -6
package/src/memory/__tests__/memory-v2-concept-frequency.test.ts +272 -0
package/src/memory/admin.ts +5 -9
package/src/memory/context-search/agent-runner.ts +19 -2
package/src/memory/context-search/sources/conversations.ts +2 -11
package/src/memory/context-search/sources/memory-v2.ts +5 -4
package/src/memory/context-search/sources/memory.ts +0 -1
package/src/memory/context-search/types.ts +0 -1
package/src/memory/conversation-crud.ts +4 -12
package/src/memory/db-init.ts +2 -0
package/src/memory/embedding-runtime-manager.ts +119 -5
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +32 -21
package/src/memory/graph/conversation-graph-memory.ts +42 -54
package/src/memory/graph/extraction.ts +1 -3
package/src/memory/graph/graph-search.test.ts +10 -67
package/src/memory/graph/graph-search.ts +1 -20
package/src/memory/graph/retriever.test.ts +6 -0
package/src/memory/graph/retriever.ts +6 -10
package/src/memory/indexer.ts +54 -45
package/src/memory/job-handlers/backfill.ts +2 -11
package/src/memory/job-handlers/cleanup.ts +43 -0
package/src/memory/job-handlers/embedding.ts +6 -8
package/src/memory/job-handlers/summarization.ts +2 -7
package/src/memory/jobs-store.ts +48 -0
package/src/memory/jobs-worker.ts +81 -43
package/src/memory/memory-v2-activation-log-store.ts +32 -14
package/src/memory/memory-v2-concept-frequency.ts +169 -0
package/src/memory/migrations/239-trace-events-created-at-index.ts +18 -0
package/src/memory/migrations/index.ts +1 -0
package/src/memory/pkb/pkb-search.test.ts +6 -0
package/src/memory/qdrant-client.ts +0 -13
package/src/memory/rerank-local.ts +374 -0
package/src/memory/search/semantic.ts +6 -67
package/src/memory/trace-event-store.ts +1 -17
package/src/memory/v2/__tests__/activation.test.ts +311 -250
package/src/memory/v2/__tests__/consolidation-job.test.ts +40 -8
package/src/memory/v2/__tests__/injection.test.ts +157 -167
package/src/memory/v2/__tests__/prompts-consolidation.test.ts +61 -2
package/src/memory/v2/__tests__/qdrant.test.ts +16 -0
package/src/memory/v2/__tests__/reranker.test.ts +338 -0
package/src/memory/v2/__tests__/sim.test.ts +5 -199
package/src/memory/v2/__tests__/skill-store.test.ts +71 -65
package/src/memory/v2/__tests__/static-context.test.ts +76 -1
package/src/memory/v2/activation.ts +149 -156
package/src/memory/v2/consolidation-job.ts +62 -12
package/src/memory/v2/injection.ts +47 -60
package/src/memory/v2/prompts/consolidation.ts +36 -1
package/src/memory/v2/qdrant.ts +99 -0
package/src/memory/v2/reranker.ts +177 -0
package/src/memory/v2/sim.ts +10 -84
package/src/memory/v2/skill-content.ts +4 -3
package/src/memory/v2/skill-store.ts +82 -59
package/src/memory/v2/static-context.ts +22 -0
package/src/memory/v2/types.ts +10 -10
package/src/notifications/copy-composer.ts +13 -0
package/src/notifications/signal.ts +4 -0
package/src/oauth/AGENTS.md +3 -1
package/src/oauth/__tests__/oauth-connect-state.test.ts +137 -0
package/src/oauth/connect-orchestrator.ts +2 -0
package/src/oauth/connection-resolver.test.ts +66 -1
package/src/oauth/connection-resolver.ts +55 -1
package/src/oauth/oauth-connect-state.ts +77 -0
package/src/oauth/seed-providers.ts +58 -1
package/src/plugins/defaults/injectors.ts +35 -2
package/src/plugins/defaults/memory-retrieval.ts +5 -6
package/src/plugins/types.ts +7 -0
package/src/proactive-artifact/aux-message-injector.ts +74 -0
package/src/proactive-artifact/decision.test.ts +226 -0
package/src/proactive-artifact/decision.ts +165 -0
package/src/proactive-artifact/index.ts +7 -0
package/src/proactive-artifact/job.test.ts +867 -0
package/src/proactive-artifact/job.ts +352 -0
package/src/proactive-artifact/message-copy.ts +41 -0
package/src/proactive-artifact/trigger-state.test.ts +277 -0
package/src/proactive-artifact/trigger-state.ts +119 -0
package/src/prompts/normalize-onboarding.ts +80 -0
package/src/prompts/persona-resolver.ts +101 -9
package/src/prompts/system-prompt.ts +21 -7
package/src/prompts/templates/BOOTSTRAP.md +13 -5
package/src/providers/__tests__/retry-callsite.test.ts +222 -1
package/src/providers/model-intents.ts +7 -0
package/src/providers/openrouter/client.ts +8 -0
package/src/providers/retry.ts +50 -0
package/src/providers/types.ts +1 -0
package/src/runtime/__tests__/agent-wake.test.ts +456 -3
package/src/runtime/agent-wake.ts +238 -100
package/src/runtime/assistant-event-hub.ts +36 -6
package/src/runtime/assistant-event.ts +0 -1
package/src/runtime/auth/__tests__/route-policy.test.ts +64 -0
package/src/runtime/auth/route-policy.ts +14 -1
package/src/runtime/auth/same-actor.ts +216 -0
package/src/runtime/channel-retry-sweep.ts +65 -1
package/src/runtime/guardian-reply-router.ts +10 -0
package/src/runtime/local-actor-identity.ts +52 -11
package/src/runtime/pending-interactions.ts +8 -0
package/src/runtime/routes/__tests__/client-routes.test.ts +155 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +0 -5
package/src/runtime/routes/__tests__/heartbeat-routes.test.ts +1 -1
package/src/runtime/routes/client-routes.ts +20 -2
package/src/runtime/routes/contact-routes.ts +0 -25
package/src/runtime/routes/conversation-routes.ts +35 -26
package/src/runtime/routes/debug-bash-routes.ts +163 -0
package/src/runtime/routes/disk-pressure-routes.ts +121 -0
package/src/runtime/routes/document-pdf-renderer.ts +6 -2
package/src/runtime/routes/documents-routes.ts +2 -75
package/src/runtime/routes/events-routes.ts +41 -9
package/src/runtime/routes/host-bash-routes.ts +23 -3
package/src/runtime/routes/host-cu-routes.ts +33 -6
package/src/runtime/routes/host-file-routes.ts +32 -6
package/src/runtime/routes/host-transfer-routes.ts +79 -16
package/src/runtime/routes/identity-routes.ts +7 -138
package/src/runtime/routes/inbound-message-handler.ts +77 -12
package/src/runtime/routes/inbound-stages/guardian-reply-intercept.ts +3 -0
package/src/runtime/routes/index.ts +6 -0
package/src/runtime/routes/memory-item-routes.test.ts +41 -15
package/src/runtime/routes/memory-v2-routes.ts +33 -0
package/src/runtime/routes/oauth-connect-routes.ts +153 -0
package/src/runtime/verification-outbound-actions.ts +4 -4
package/src/schedule/run-script.ts +37 -5
package/src/schedule/scheduler.ts +20 -1
package/src/security/encrypted-store.ts +2 -0
package/src/security/secure-keys.ts +55 -0
package/src/skills/remote-skill-policy.ts +4 -10
package/src/subagent/index.ts +1 -7
package/src/subagent/manager.ts +1 -15
package/src/tasks/task-runner.ts +0 -1
package/src/tasks/task-store.ts +0 -3
package/src/tools/background-tool-registry.ts +17 -3
package/src/tools/host-filesystem/edit.test.ts +151 -0
package/src/tools/host-filesystem/edit.ts +43 -1
package/src/tools/host-filesystem/read.test.ts +129 -0
package/src/tools/host-filesystem/read.ts +43 -1
package/src/tools/host-filesystem/transfer.test.ts +127 -2
package/src/tools/host-filesystem/transfer.ts +56 -11
package/src/tools/host-filesystem/write.test.ts +134 -0
package/src/tools/host-filesystem/write.ts +43 -1
package/src/tools/host-terminal/host-shell.ts +13 -6
package/src/tools/mcp/mcp-tool-factory.ts +2 -1
package/src/tools/memory/register.test.ts +12 -9
package/src/tools/memory/register.ts +1 -2
package/src/tools/provider-tool-name.ts +28 -0
package/src/tools/registry.ts +30 -9
package/src/tools/terminal/shell.ts +9 -1
package/src/tools/tool-approval-handler.ts +31 -6
package/src/tools/types.ts +24 -2
package/src/tts/provider-catalog.ts +3 -5
package/src/util/disk-usage.ts +138 -0
package/src/util/platform.ts +21 -11
package/src/util/process-liveness.ts +26 -0
package/src/workspace/heartbeat-service.ts +19 -0
package/src/workspace/migrations/065-bump-stale-heartbeat-interval.ts +60 -0
package/src/workspace/migrations/066-seed-heartbeat-callsite-cost-default.ts +146 -0
package/src/workspace/migrations/067-release-notes-safe-storage-limits.ts +72 -0
package/src/workspace/migrations/068-release-notes-local-timezone.ts +65 -0
package/src/workspace/migrations/registry.ts +8 -0
package/src/__tests__/conversation-tool-setup-memory-scope.test.ts +0 -167
package/src/memory/v2/__tests__/skill-qdrant.test.ts +0 -657
package/src/memory/v2/skill-qdrant.ts +0 -404
package/src/signals/bash.ts +0 -198

package/src/providers/model-intents.ts CHANGED Viewed

@@ -11,31 +11,37 @@ const PROVIDER_DEFAULT_MODELS: Record<string, string> = Object.fromEntries(
 const PROVIDER_MODEL_INTENTS: Record<string, Record<ModelIntent, string>> = {
   anthropic: {
+    balanced: "claude-sonnet-4-6",
     "latency-optimized": "claude-haiku-4-5-20251001",
     "quality-optimized": "claude-opus-4-7",
     "vision-optimized": "claude-opus-4-6",
   },
   openai: {
+    balanced: "gpt-5.4-mini",
     "latency-optimized": "gpt-5.4-nano",
     "quality-optimized": "gpt-5.4",
     "vision-optimized": "gpt-5.4",
   },
   gemini: {
+    balanced: "gemini-3-flash-preview",
     "latency-optimized": "gemini-3.1-flash-lite-preview",
     "quality-optimized": "gemini-3.1-pro-preview",
     "vision-optimized": "gemini-3-flash-preview",
   },
   ollama: {
+    balanced: "llama3.2",
     "latency-optimized": "llama3.2",
     "quality-optimized": "llama3.2",
     "vision-optimized": "llama3.2",
   },
   fireworks: {
+    balanced: "accounts/fireworks/models/kimi-k2p5",
     "latency-optimized": "accounts/fireworks/models/kimi-k2p5",
     "quality-optimized": "accounts/fireworks/models/kimi-k2p5",
     "vision-optimized": "accounts/fireworks/models/kimi-k2p5",
   },
   openrouter: {
+    balanced: "anthropic/claude-sonnet-4.6",
     "latency-optimized": "anthropic/claude-haiku-4.5",
     "quality-optimized": "anthropic/claude-opus-4.7",
     "vision-optimized": "anthropic/claude-opus-4.6",
@@ -45,6 +51,7 @@ const PROVIDER_MODEL_INTENTS: Record<string, Record<ModelIntent, string>> = {
 const FALLBACK_DEFAULT_MODEL = "claude-opus-4-7";
 const MODEL_INTENTS = new Set<ModelIntent>([
+  "balanced",
   "latency-optimized",
   "quality-optimized",
   "vision-optimized",

package/src/providers/openrouter/client.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import { ProviderError } from "../../util/errors.js";
 import { AnthropicProvider } from "../anthropic/client.js";
 import { OpenAIChatCompletionsProvider } from "../openai/chat-completions-provider.js";
 import { isThinkingConfigEnabled } from "../thinking-config.js";
@@ -139,6 +140,13 @@ export class OpenRouterProvider extends OpenAIChatCompletionsProvider {
           cause: error,
         });
       }
+      if (error instanceof ProviderError && error.provider !== this.name) {
+        throw new ProviderError(error.message, this.name, error.statusCode, {
+          cause: error.cause ?? error,
+          retryAfterMs: error.retryAfterMs,
+          abortReason: error.abortReason,
+        });
+      }
       throw error;
     }
   }

package/src/providers/retry.ts CHANGED Viewed

@@ -273,6 +273,56 @@ function normalizeSendMessageOptions(
     delete nextConfig.thinking;
   }
+  // Anthropic (and OpenRouter fronting Anthropic) rejects requests that
+  // combine extended thinking with `temperature` ≠ 1. From the API:
+  //   "`temperature` may only be set to 1 when thinking is enabled or in
+  //   adaptive mode."
+  //
+  // Defense-in-depth: callers that hardcode a non-default temperature in
+  // their per-call config are easy to miss when reviewing — we already had
+  // this bug ship in three places (reply suggestions, recall agent
+  // round, recall fallback finalize). Drop the offending temperature with
+  // a warn log so the request goes through with Anthropic's default
+  // (which is 1 in thinking mode anyway). We keep `thinking` rather than
+  // `temperature` because thinking is the more deliberate, profile-level
+  // choice — silently downgrading reasoning capacity for an unrelated
+  // per-call hint would be the worse failure mode.
+  //
+  // Scope:
+  // - Anthropic: always.
+  // - OpenRouter fronting `anthropic/*`: same wire constraint applies.
+  // - Other providers: not our problem here (e.g. OpenAI reasoning models
+  //   strip `temperature` upstream; non-Anthropic OpenRouter reasoning
+  //   models don't have this exact constraint).
+  const isThinkingTemperatureConflict = (() => {
+    if (nextConfig.thinking == null) return false;
+    if (isThinkingConfigDisabled(nextConfig.thinking)) return false;
+    const temp = nextConfig.temperature;
+    if (typeof temp !== "number") return false;
+    if (temp === 1) return false;
+    if (providerName === "anthropic") return true;
+    if (providerName === "openrouter") {
+      const model =
+        typeof nextConfig.model === "string" ? nextConfig.model : "";
+      return model.startsWith("anthropic/");
+    }
+    return false;
+  })();
+  if (isThinkingTemperatureConflict) {
+    log.warn(
+      {
+        providerName,
+        callSite: config.callSite,
+        droppedTemperature: nextConfig.temperature,
+      },
+      "Dropping `temperature` because thinking is enabled — Anthropic only " +
+        "accepts `temperature: 1` (or unset) when thinking/adaptive mode is " +
+        "on. Set `thinking: { type: 'disabled' }` on the call site if you " +
+        "need a specific temperature.",
+    );
+    delete nextConfig.temperature;
+  }
   // effort is supported by Anthropic, OpenAI, and OpenAI-compatible providers; strip for others
   if (
     !EFFORT_SUPPORTED_PROVIDERS.has(providerName) &&

package/src/providers/types.ts CHANGED Viewed

@@ -91,6 +91,7 @@ export interface Message {
 }
 export type ModelIntent =
+  | "balanced"
   | "latency-optimized"
   | "quality-optimized"
   | "vision-optimized";

package/src/runtime/__tests__/agent-wake.test.ts CHANGED Viewed

@@ -17,6 +17,8 @@
 import { beforeEach, describe, expect, mock, test } from "bun:test";
+import type { DiskPressureStatus } from "../../daemon/disk-pressure-guard.js";
 // Stub the DB-backed override-profile read so unit tests don't need a
 // real SQLite database. The wake helper calls this on every invocation
 // to honor the conversation's pinned inference profile.
@@ -24,6 +26,48 @@ mock.module("../../memory/conversation-crud.js", () => ({
   getConversationOverrideProfile: () => undefined,
 }));
+mock.module("../../config/loader.js", () => ({
+  getConfig: () => ({ llm: {} }),
+  loadConfig: () => ({ llm: {} }),
+  loadRawConfig: () => ({}),
+  saveRawConfig: () => {},
+  getConfigReadOnly: () => ({ llm: {} }),
+  applyNestedDefaults: (config: unknown) => config,
+  deepMergeOverwrite: (base: unknown) => base,
+  mergeDefaultWorkspaceConfig: () => {},
+  getNestedValue: () => undefined,
+  setNestedValue: () => {},
+  API_KEY_PROVIDERS: [],
+  _appendQuarantineBulletin: () => {},
+  invalidateConfigCache: () => {},
+}));
+mock.module("../../config/llm-context-resolution.js", () => ({
+  resolveEffectiveContextWindow: () => ({
+    maxInputTokens: 200_000,
+  }),
+}));
+let mockDiskPressureStatus: DiskPressureStatus = {
+  enabled: false,
+  state: "disabled",
+  locked: false,
+  acknowledged: false,
+  overrideActive: false,
+  effectivelyLocked: false,
+  lockId: null,
+  usagePercent: null,
+  thresholdPercent: 95,
+  path: null,
+  lastCheckedAt: null,
+  blockedCapabilities: [],
+  error: null,
+};
+mock.module("../../daemon/disk-pressure-guard.js", () => ({
+  getDiskPressureStatus: () => mockDiskPressureStatus,
+}));
 import type { AgentEvent } from "../../agent/loop.js";
 import type { Message } from "../../providers/types.js";
 import {
@@ -37,7 +81,11 @@ import {
 interface MockTarget extends WakeTarget {
   emittedEvents: AgentEvent[];
   pushedMessages: Message[];
-  runCalls: Array<{ input: Message[]; requestId?: string }>;
+  runCalls: Array<{
+    input: Message[];
+    requestId?: string;
+    turnContext?: unknown;
+  }>;
   processingToggles: boolean[];
   /** Tail messages handed to `persistTailMessage`, in call order. */
   persistedTailCalls: Message[];
@@ -70,7 +118,11 @@ function makeTarget(options: {
 }): MockTarget {
   const emittedEvents: AgentEvent[] = [];
   const pushedMessages: Message[] = [];
-  const runCalls: Array<{ input: Message[]; requestId?: string }> = [];
+  const runCalls: Array<{
+    input: Message[];
+    requestId?: string;
+    turnContext?: unknown;
+  }> = [];
   const processingToggles: boolean[] = [];
   const persistedTailCalls: Message[] = [];
   const callSequence: string[] = [];
@@ -97,8 +149,11 @@ function makeTarget(options: {
         onEvent: (event: AgentEvent) => void | Promise<void>,
         _signal?: AbortSignal,
         requestId?: string,
+        _onCheckpoint?: unknown,
+        _callSite?: unknown,
+        turnContext?: unknown,
       ) => {
-        runCalls.push({ input: [...input], requestId });
+        runCalls.push({ input: [...input], requestId, turnContext });
         // Emit any scripted events the test wanted us to produce.
         for (const ev of options.scriptedEvents ?? []) {
           await onEvent(ev);
@@ -165,11 +220,163 @@ function makeTarget(options: {
 beforeEach(() => {
   __resetWakeChainForTests();
+  mockDiskPressureStatus = {
+    enabled: false,
+    state: "disabled",
+    locked: false,
+    acknowledged: false,
+    overrideActive: false,
+    effectivelyLocked: false,
+    lockId: null,
+    usagePercent: null,
+    thresholdPercent: 95,
+    path: null,
+    lastCheckedAt: null,
+    blockedCapabilities: [],
+    error: null,
+  };
 });
 // ── Tests ────────────────────────────────────────────────────────────
 describe("wakeAgentForOpportunity", () => {
+  test("disabled disk pressure flag allows background wakes to pass through", async () => {
+    const target = makeTarget({
+      scriptedAssistant: null,
+    });
+    const result = await wakeAgentForOpportunity(
+      {
+        conversationId: target.conversationId,
+        hint: "background completion",
+        source: "background-tool",
+      },
+      { resolveTarget: async () => target },
+    );
+    expect(result).toEqual({ invoked: true, producedToolCalls: false });
+    expect(target.runCalls).toHaveLength(1);
+  });
+  test("blocks background wakes during disk pressure before marking processing", async () => {
+    mockDiskPressureStatus = {
+      enabled: true,
+      state: "critical",
+      locked: true,
+      acknowledged: true,
+      overrideActive: false,
+      effectivelyLocked: true,
+      lockId: "disk-pressure-test",
+      usagePercent: 98,
+      thresholdPercent: 95,
+      path: "/",
+      lastCheckedAt: "2026-05-05T00:00:00.000Z",
+      blockedCapabilities: ["agent-turns", "background-work", "remote-ingress"],
+      error: null,
+    };
+    const target = makeTarget({
+      isProcessing: true,
+      scriptedAssistant: {
+        role: "assistant",
+        content: [{ type: "text", text: "should not run" }],
+      },
+    });
+    const result = await wakeAgentForOpportunity(
+      {
+        conversationId: target.conversationId,
+        hint: "background shell completed",
+        source: "background-tool",
+        trustContext: { sourceChannel: "vellum", trustClass: "guardian" },
+      },
+      { resolveTarget: async () => target },
+    );
+    expect(result).toEqual({
+      invoked: false,
+      producedToolCalls: false,
+      reason: "disk_pressure",
+    });
+    expect(target.runCalls).toHaveLength(0);
+    expect(target.processingToggles).toEqual([]);
+    expect(target.drainQueueCalls).toBe(0);
+    expect(target.isProcessing()).toBe(true);
+  });
+  test("blocks trusted-contact direct wakes during disk pressure", async () => {
+    mockDiskPressureStatus = {
+      enabled: true,
+      state: "critical",
+      locked: true,
+      acknowledged: true,
+      overrideActive: false,
+      effectivelyLocked: true,
+      lockId: "disk-pressure-test",
+      usagePercent: 98,
+      thresholdPercent: 95,
+      path: "/",
+      lastCheckedAt: "2026-05-05T00:00:00.000Z",
+      blockedCapabilities: ["agent-turns", "background-work", "remote-ingress"],
+      error: null,
+    };
+    const target = makeTarget({ scriptedAssistant: null });
+    const result = await wakeAgentForOpportunity(
+      {
+        conversationId: target.conversationId,
+        hint: "notify the guardian",
+        source: "notification",
+        trustContext: {
+          sourceChannel: "slack",
+          trustClass: "trusted_contact",
+        },
+      },
+      { resolveTarget: async () => target },
+    );
+    expect(result.reason).toBe("disk_pressure");
+    expect(target.runCalls).toHaveLength(0);
+  });
+  test("threads cleanup-mode injection context for explicit local-owner wakes", async () => {
+    mockDiskPressureStatus = {
+      enabled: true,
+      state: "critical",
+      locked: true,
+      acknowledged: true,
+      overrideActive: false,
+      effectivelyLocked: true,
+      lockId: "disk-pressure-test",
+      usagePercent: 98,
+      thresholdPercent: 95,
+      path: "/",
+      lastCheckedAt: "2026-05-05T00:00:00.000Z",
+      blockedCapabilities: ["agent-turns", "background-work", "remote-ingress"],
+      error: null,
+    };
+    const target = makeTarget({ scriptedAssistant: null });
+    const result = await wakeAgentForOpportunity(
+      {
+        conversationId: target.conversationId,
+        hint: "clean storage",
+        source: "local-cleanup",
+        sourceChannel: "vellum",
+        sourceInterface: "macos",
+      },
+      { resolveTarget: async () => target },
+    );
+    expect(result).toEqual({ invoked: true, producedToolCalls: false });
+    expect(target.runCalls).toHaveLength(1);
+    expect(target.runCalls[0]!.turnContext).toMatchObject({
+      conversationId: target.conversationId,
+      injectionInputs: {
+        diskPressureContext: { cleanupModeActive: true },
+      },
+    });
+  });
   test("silent no-op when agent produces no tool calls and no text", async () => {
     const target = makeTarget({
       baseline: [
@@ -982,4 +1189,250 @@ describe("wakeAgentForOpportunity", () => {
       expect(target.processingDuringDrain).toEqual([false]);
     },
   );
+  test(
+    "checkpoint fires mid-run: events stream live and tail is persisted " +
+      "incrementally so a long-running wake is observable",
+    async () => {
+      // Locks in the streaming-during-run fix. A long-running wake (e.g.
+      // memory consolidation, often 5-30 minutes and 30+ turns) must
+      // emit events and persist tail messages as each turn finalizes —
+      // otherwise opening the conversation mid-flight returns 0 messages
+      // from fetchHistory and the client renders the empty welcome
+      // state instead of the in-progress turns.
+      const turn1Assistant: Message = { // fixtures: two tool-use turns (assistant + tool_result each) followed by a final text-only assistant message
+        role: "assistant",
+        content: [
+          { type: "tool_use", id: "tu-1", name: "file_write", input: {} },
+        ],
+      };
+      const turn1ToolResult: Message = {
+        role: "user",
+        content: [{ type: "tool_result", tool_use_id: "tu-1", content: "ok" }],
+      };
+      const turn2Assistant: Message = {
+        role: "assistant",
+        content: [
+          { type: "tool_use", id: "tu-2", name: "remember", input: {} },
+        ],
+      };
+      const turn2ToolResult: Message = {
+        role: "user",
+        content: [{ type: "tool_result", tool_use_id: "tu-2", content: "ok" }],
+      };
+      const finalAssistant: Message = {
+        role: "assistant",
+        content: [{ type: "text", text: "All done." }],
+      };
+      const emittedEvents: AgentEvent[] = []; // every event passed to target.emitAgentEvent, in arrival order
+      const pushedMessages: Message[] = []; // NOTE(review): filled by pushMessage below but never asserted in this test
+      const persistedTailCalls: Message[] = []; // every message passed to target.persistTailMessage, in call order
+      // Snapshot of how many tail messages had been persisted at each
+      // point a streaming event reached the target. This is the actual
+      // observability invariant: when a turn-2 streaming event arrives,
+      // turn-1's messages must already be persisted so a fetchHistory
+      // call from a client opening the conversation mid-stream returns
+      // turn-1's content.
+      const persistedAtEachEmit: number[] = []; // index-aligned with emittedEvents (both are pushed in emitAgentEvent)
+      const baseline: Message[] = [
+        { role: "user", content: [{ type: "text", text: "hi" }] },
+      ];
+      const history: Message[] = [...baseline]; // mutable copy returned by getMessages and appended to by pushMessage
+      let processing = false; // backing flag for isProcessing / markProcessing
+      const target: WakeTarget = {
+        conversationId: "conv-stream",
+        agentLoop: {
+          run: async (_input, onEvent, _signal, _requestId, onCheckpoint) => {
+            // Preamble + assistant hint + postamble (mirrors what the
+            // wake injects). The agent-wake helper expects these three
+            // hint messages in the input it hands to run().
+            const runHistory: Message[] = [..._input]; // copy so the input array itself is not mutated by the pushes below
+            // Turn 1: stream a text_delta + message_complete, then
+            // fire the checkpoint after the tool_result lands.
+            await onEvent({ type: "text_delta", text: "Working" });
+            runHistory.push(turn1Assistant);
+            await onEvent({
+              type: "message_complete",
+              message: turn1Assistant,
+            });
+            runHistory.push(turn1ToolResult);
+            const dec1 = await onCheckpoint!({ // non-null assertion: the test assumes the wake always supplies onCheckpoint
+              turnIndex: 0,
+              toolCount: 1,
+              hasToolUse: true,
+              history: runHistory,
+            });
+            expect(dec1).toBe("continue"); // the wake's checkpoint handler must not ask the loop to stop
+            // Turn 2: another tool turn — must already see the live
+            // streaming because mode flipped after turn 1.
+            await onEvent({ type: "text_delta", text: "Still going" }); // this exact text is looked up in emittedEvents by the final assertion
+            runHistory.push(turn2Assistant);
+            await onEvent({
+              type: "message_complete",
+              message: turn2Assistant,
+            });
+            runHistory.push(turn2ToolResult);
+            const dec2 = await onCheckpoint!({
+              turnIndex: 1,
+              toolCount: 1,
+              hasToolUse: true,
+              history: runHistory,
+            });
+            expect(dec2).toBe("continue");
+            // Final assistant message with no tool calls — loop would
+            // exit. onCheckpoint does NOT fire for the terminal turn,
+            // so the post-run flushPendingTail must catch this one.
+            await onEvent({ type: "text_delta", text: "All done." });
+            runHistory.push(finalAssistant);
+            await onEvent({
+              type: "message_complete",
+              message: finalAssistant,
+            });
+            return runHistory; // full history: copied input plus the five tail messages pushed above
+          },
+        },
+        getMessages: () => history,
+        pushMessage: (msg) => {
+          pushedMessages.push(msg);
+          history.push(msg);
+        },
+        emitAgentEvent: (event) => {
+          emittedEvents.push(event);
+          persistedAtEachEmit.push(persistedTailCalls.length); // snapshot the persisted count at the moment this event arrives
+        },
+        isProcessing: () => processing,
+        markProcessing: (on) => {
+          processing = on;
+        },
+        persistTailMessage: async (msg) => {
+          persistedTailCalls.push(msg); // record only; nothing is written to storage in this fake
+        },
+      };
+      const result = await wakeAgentForOpportunity(
+        {
+          conversationId: "conv-stream",
+          hint: "consolidate",
+          source: "memory_v2_consolidation",
+        },
+        { resolveTarget: async () => target }, // inject the fake target defined above
+      );
+      expect(result).toEqual({ invoked: true, producedToolCalls: true });
+      // All 5 tail messages persisted in order. The first two via
+      // turn-1 checkpoint, the next two via turn-2 checkpoint, and
+      // `finalAssistant` via the post-run flush.
+      expect(persistedTailCalls).toHaveLength(5);
+      expect(persistedTailCalls[0]).toBe(turn1Assistant); // toBe: the same object reference is expected, not just an equal copy
+      expect(persistedTailCalls[1]).toBe(turn1ToolResult);
+      expect(persistedTailCalls[2]).toBe(turn2Assistant);
+      expect(persistedTailCalls[3]).toBe(turn2ToolResult);
+      expect(persistedTailCalls[4]).toBe(finalAssistant);
+      // Critical observability invariant: by the time turn-2's
+      // streaming text_delta reached the client, turn-1's messages
+      // were already persisted. A client opening the conversation at
+      // that moment would fetchHistory and see turn-1, plus stream
+      // turn-2 live — instead of seeing an empty welcome view.
+      const turn2DeltaIdx = emittedEvents.findIndex(
+        (e) => e.type === "text_delta" && e.text === "Still going",
+      );
+      expect(turn2DeltaIdx).toBeGreaterThan(-1); // the turn-2 delta must have been emitted at all
+      expect(persistedAtEachEmit[turn2DeltaIdx]).toBeGreaterThanOrEqual(2); // 2 = turn-1 assistant + turn-1 tool_result
+    },
+  );
+  test(
+    "checkpoint-driven wake injects ui_surface card into the first " +
+      "assistant tail message",
+    async () => {
+      // The wake card ("Conversation Woke") is the visual entry point —
+      // it must land in the first assistant message regardless of
+      // whether the wake produced output via checkpoints or only via
+      // post-run (tool-free) detection. This test covers the
+      // checkpoint path; the existing post-run path is covered by the
+      // tool_use tests above.
+      const firstAssistant: Message = { // the assistant message whose persisted form is later inspected for a ui_surface block
+        role: "assistant",
+        content: [
+          { type: "tool_use", id: "tu-1", name: "some_tool", input: {} },
+        ],
+      };
+      const toolResult: Message = {
+        role: "user",
+        content: [{ type: "tool_result", tool_use_id: "tu-1", content: "ok" }],
+      };
+      const persistedTailCalls: Message[] = []; // every message passed to target.persistTailMessage, in call order
+      const baseline: Message[] = [
+        { role: "user", content: [{ type: "text", text: "hi" }] },
+      ];
+      const history: Message[] = [...baseline]; // mutable copy returned by getMessages and appended to by pushMessage
+      let processing = false; // backing flag for isProcessing / markProcessing
+      const wakeProducedOutputCalls: string[] = []; // surfaceId from each onWakeProducedOutput call
+      const target: WakeTarget = {
+        conversationId: "conv-card",
+        agentLoop: {
+          run: async (_input, _onEvent, _signal, _requestId, onCheckpoint) => { // emits no events: one tool turn, then a single checkpoint
+            const runHistory: Message[] = [..._input]; // copy so the input array itself is not mutated
+            runHistory.push(firstAssistant);
+            runHistory.push(toolResult);
+            await onCheckpoint!({ // non-null assertion: the test assumes the wake always supplies onCheckpoint
+              turnIndex: 0,
+              toolCount: 1,
+              hasToolUse: true,
+              history: runHistory,
+            });
+            return runHistory;
+          },
+        },
+        getMessages: () => history,
+        pushMessage: (msg) => {
+          history.push(msg);
+        },
+        emitAgentEvent: () => {}, // events are not under test here
+        isProcessing: () => processing,
+        markProcessing: (on) => {
+          processing = on;
+        },
+        persistTailMessage: async (msg) => {
+          persistedTailCalls.push(msg); // record only; nothing is written to storage in this fake
+        },
+        onWakeProducedOutput: (_source, _hint, surfaceId) => {
+          wakeProducedOutputCalls.push(surfaceId); // keep only the surfaceId; source and hint are ignored
+        },
+      };
+      await wakeAgentForOpportunity( // return value intentionally unused; assertions below inspect the recorded calls
+        {
+          conversationId: "conv-card",
+          hint: "do the thing",
+          source: "memory_v2_consolidation",
+        },
+        { resolveTarget: async () => target }, // inject the fake target defined above
+      );
+      // ui_surface fired exactly once (idempotent goLive), and the
+      // surfaceId matches the block prepended into the first
+      // assistant message.
+      expect(wakeProducedOutputCalls).toHaveLength(1);
+      const persistedFirst = persistedTailCalls[0];
+      expect(persistedFirst).toBeDefined(); // guards the non-null assertions on persistedFirst below
+      const blocks = Array.isArray(persistedFirst!.content)
+        ? persistedFirst!.content
+        : []; // non-array content falls back to empty, so the find below returns undefined and toBeDefined fails
+      const uiBlock = blocks.find(
+        (b: { type?: string }) => b.type === "ui_surface",
+      ) as { surfaceId?: string } | undefined; // cast only to read surfaceId for the final assertion
+      expect(uiBlock).toBeDefined();
+      expect(uiBlock!.surfaceId).toBe(wakeProducedOutputCalls[0]); // persisted block and callback must agree on the surface id
+    },
+  );
 });