npm - @vellumai/assistant - Versions diffs - 0.8.2 → 0.8.4 - Mend

@vellumai/assistant 0.8.2 → 0.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (503)

package/ARCHITECTURE.md +11 -12
package/docker-entrypoint.sh +13 -2
package/docker-init-apt-root.sh +79 -6
package/node_modules/@vellumai/gateway-client/src/types.ts +2 -0
package/openapi.yaml +945 -36
package/package.json +1 -1
package/src/__tests__/agent-loop-exit-reason.test.ts +271 -0
package/src/__tests__/agent-loop-override-profile.test.ts +1 -1
package/src/__tests__/agent-loop-provider-error-recording.test.ts +195 -0
package/src/__tests__/agent-loop.test.ts +88 -3
package/src/__tests__/anthropic-provider.test.ts +272 -0
package/src/__tests__/approval-cascade.test.ts +1 -1
package/src/__tests__/background-workers-disk-pressure.test.ts +2 -1
package/src/__tests__/channel-delivery-store.test.ts +193 -0
package/src/__tests__/channel-reply-delivery.test.ts +284 -5
package/src/__tests__/channel-retry-sweep.test.ts +274 -1
package/src/__tests__/compaction-events.test.ts +1 -1
package/src/__tests__/compactor-preserved-tail-count.test.ts +110 -0
package/src/__tests__/compactor-tail-resolution.test.ts +107 -1
package/src/__tests__/config-get-vision-flag.test.ts +136 -0
package/src/__tests__/config-loader-backfill.test.ts +115 -18
package/src/__tests__/config-watcher.test.ts +1 -1
package/src/__tests__/context-token-estimator.test.ts +112 -57
package/src/__tests__/conversation-abort-tool-results.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +54 -3
package/src/__tests__/conversation-agent-loop-overflow.test.ts +31 -6
package/src/__tests__/conversation-agent-loop.test.ts +77 -3
package/src/__tests__/conversation-app-control-lifecycle.test.ts +1 -1
package/src/__tests__/conversation-clean-command.test.ts +137 -0
package/src/__tests__/conversation-confirmation-signals.test.ts +1 -1
package/src/__tests__/conversation-fork-crud.test.ts +161 -0
package/src/__tests__/conversation-lifecycle.test.ts +1 -1
package/src/__tests__/conversation-load-cleaned-at.test.ts +279 -0
package/src/__tests__/conversation-load-history-repair.test.ts +1 -1
package/src/__tests__/conversation-media-retry.test.ts +19 -8
package/src/__tests__/conversation-pairing.test.ts +2 -2
package/src/__tests__/conversation-process-callsite.test.ts +1 -1
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -1
package/src/__tests__/conversation-queue.test.ts +1 -1
package/src/__tests__/conversation-runtime-assembly.test.ts +290 -85
package/src/__tests__/conversation-seed-composer.test.ts +66 -4
package/src/__tests__/conversation-slash-commands.test.ts +36 -8
package/src/__tests__/conversation-slash-queue.test.ts +1 -1
package/src/__tests__/conversation-slash-unknown.test.ts +1 -1
package/src/__tests__/conversation-speed-override.test.ts +1 -1
package/src/__tests__/conversation-surfaces-task-progress.test.ts +220 -0
package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -1
package/src/__tests__/conversation-workspace-injection.test.ts +5 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +5 -1
package/src/__tests__/credential-security-invariants.test.ts +6 -0
package/src/__tests__/cu-unified-flow.test.ts +10 -1
package/src/__tests__/date-context.test.ts +45 -0
package/src/__tests__/dm-backfill.test.ts +64 -0
package/src/__tests__/dm-persistence.test.ts +33 -0
package/src/__tests__/document-find-replace.test.ts +501 -0
package/src/__tests__/external-plugin-loader.test.ts +91 -19
package/src/__tests__/first-greeting.test.ts +23 -2
package/src/__tests__/guardian-action-no-hardcoded-copy.test.ts +0 -1
package/src/__tests__/guardian-dispatch.test.ts +1 -0
package/src/__tests__/headless-browser-navigate.test.ts +172 -0
package/src/__tests__/heartbeat-service.test.ts +24 -164
package/src/__tests__/helpers/channel-test-adapter.ts +0 -2
package/src/__tests__/host-app-control-proxy.test.ts +241 -0
package/src/__tests__/host-bash-proxy.test.ts +6 -0
package/src/__tests__/host-browser-proxy.test.ts +10 -0
package/src/__tests__/host-cu-proxy.test.ts +8 -1
package/src/__tests__/host-file-proxy.test.ts +8 -1
package/src/__tests__/host-proxy-preactivation.test.ts +200 -13
package/src/__tests__/host-transfer-proxy.test.ts +8 -1
package/src/__tests__/identity-routes.test.ts +57 -0
package/src/__tests__/inbound-slack-persistence.test.ts +3 -0
package/src/__tests__/injector-background-turn.test.ts +153 -0
package/src/__tests__/injector-chain.test.ts +7 -0
package/src/__tests__/injector-document-comments.test.ts +378 -0
package/src/__tests__/injector-pkb-v2-silenced.test.ts +4 -25
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +9 -2
package/src/__tests__/list-messages-attachments.test.ts +21 -17
package/src/__tests__/list-messages-hidden-metadata.test.ts +217 -0
package/src/__tests__/list-messages-page-latest.test.ts +130 -14
package/src/__tests__/list-messages-tool-merge.test.ts +17 -16
package/src/__tests__/llm-callsite-catalog.test.ts +25 -0
package/src/__tests__/llm-catalog-parity.test.ts +3 -0
package/src/__tests__/llm-context-normalization.test.ts +0 -2
package/src/__tests__/llm-request-log-agent-loop-exit-reason.test.ts +116 -0
package/src/__tests__/llm-request-log-error-payload.test.ts +138 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +2 -0
package/src/__tests__/llm-resolver.test.ts +340 -3
package/src/__tests__/log-export-routes.test.ts +99 -2
package/src/__tests__/managed-profile-guard.test.ts +10 -0
package/src/__tests__/message-queue-steer.test.ts +114 -0
package/src/__tests__/notification-decision-fallback.test.ts +0 -91
package/src/__tests__/notification-decision-strategy.test.ts +14 -31
package/src/__tests__/notification-deep-link.test.ts +15 -0
package/src/__tests__/notification-guardian-path.test.ts +1 -2
package/src/__tests__/notification-platform-adapter.test.ts +5 -4
package/src/__tests__/notification-telegram-adapter.test.ts +1 -0
package/src/__tests__/notification-vellum-adapter.test.ts +113 -0
package/src/__tests__/openai-provider.test.ts +323 -3
package/src/__tests__/openai-responses-cutover-guard.test.ts +3 -3
package/src/__tests__/openai-responses-provider.test.ts +4 -4
package/src/__tests__/openrouter-provider-only.test.ts +51 -3
package/src/__tests__/openrouter-token-estimation.test.ts +34 -25
package/src/__tests__/outbound-slack-persistence.test.ts +187 -20
package/src/__tests__/pending-interactions-resolved-event.test.ts +190 -0
package/src/__tests__/platform-proxy-context.test.ts +6 -1
package/src/__tests__/platform.test.ts +0 -3
package/src/__tests__/plugin-source-watcher.test.ts +302 -0
package/src/__tests__/plugin-tool-contribution.test.ts +3 -3
package/src/__tests__/plugin-types.test.ts +2 -2
package/src/__tests__/process-message-background-slack.test.ts +1 -51
package/src/__tests__/process-message-display-content.test.ts +21 -16
package/src/__tests__/provider-catalog-visibility.test.ts +16 -0
package/src/__tests__/provider-platform-proxy-integration.test.ts +27 -25
package/src/__tests__/secret-routes-platform-proxy.test.ts +1 -1
package/src/__tests__/server-history-render.test.ts +83 -4
package/src/__tests__/steer-tool-repair.test.ts +249 -0
package/src/__tests__/system-prompt.test.ts +57 -101
package/src/__tests__/terminal-tools.test.ts +11 -1
package/src/__tests__/thinking-block-replay.test.ts +113 -0
package/src/__tests__/thread-backfill.test.ts +370 -22
package/src/__tests__/tool-executor.test.ts +90 -1
package/src/__tests__/tool-result-metadata-plumbing.test.ts +167 -0
package/src/__tests__/twilio-routes.test.ts +1 -1
package/src/__tests__/web-fetch.test.ts +2 -2
package/src/__tests__/workspace-git-service.test.ts +88 -5
package/src/__tests__/workspace-migration-087-memory-router-balanced-profile.test.ts +228 -0
package/src/__tests__/workspace-migration-088-deprecate-background-conversation-override.test.ts +158 -0
package/src/a2a/__tests__/agent-card.test.ts +98 -0
package/src/a2a/__tests__/e2e-a2a-channel.test.ts +597 -0
package/src/a2a/__tests__/protocol-helpers.test.ts +113 -0
package/src/a2a/__tests__/task-store.test.ts +246 -0
package/src/a2a/agent-card.ts +58 -0
package/src/a2a/feature-gate.ts +8 -0
package/src/a2a/protocol-constants.ts +21 -0
package/src/a2a/protocol-errors.ts +50 -0
package/src/a2a/protocol-types.ts +162 -0
package/src/a2a/task-store.ts +168 -0
package/src/agent/attachments.ts +1 -0
package/src/agent/loop.ts +208 -22
package/src/background-wake/next-wake.test.ts +289 -0
package/src/background-wake/next-wake.ts +172 -0
package/src/browser/operations.ts +15 -0
package/src/channels/config.ts +9 -0
package/src/channels/types.ts +14 -0
package/src/cli/commands/__tests__/conversations-slack.test.ts +572 -0
package/src/cli/commands/__tests__/memory-v2.test.ts +9 -12
package/src/cli/{__tests__ → commands/__tests__}/notifications.test.ts +201 -28
package/src/cli/commands/__tests__/schedules.test.ts +469 -0
package/src/cli/commands/conversations.ts +128 -1
package/src/cli/commands/inference-providers.ts +147 -1
package/src/cli/commands/memory-v2.ts +308 -0
package/src/cli/commands/notifications.ts +89 -37
package/src/cli/commands/plugins.ts +67 -0
package/src/cli/commands/schedules.ts +297 -5
package/src/cli/lib/__tests__/search-plugins.test.ts +261 -0
package/src/cli/lib/install-from-github.ts +8 -9
package/src/cli/lib/search-plugins.ts +163 -0
package/src/cli/program.ts +14 -0
package/src/cli/utils/conversation-id.ts +17 -5
package/src/config/assistant-feature-flags.ts +24 -54
package/src/config/bundled-skills/app-builder/SKILL.md +117 -1
package/src/config/bundled-skills/document-editor/SKILL.md +115 -0
package/src/config/bundled-skills/document-editor/TOOLS.json +240 -0
package/src/config/bundled-skills/document-editor/tools/comment-list.ts +12 -0
package/src/config/bundled-skills/document-editor/tools/comment-reply.ts +12 -0
package/src/config/bundled-skills/document-editor/tools/comment-resolve.ts +12 -0
package/src/config/bundled-skills/document-editor/tools/document-find.ts +12 -0
package/src/config/bundled-skills/document-editor/tools/document-replace-text.ts +12 -0
package/src/config/bundled-skills/media-processing/SKILL.md +8 -0
package/src/config/bundled-skills/phone-calls/SKILL.md +1 -1
package/src/config/bundled-skills/schedule/SKILL.md +8 -0
package/src/config/bundled-tool-registry.ts +22 -12
package/src/config/call-site-defaults.ts +124 -0
package/src/config/feature-flag-registry.json +111 -23
package/src/config/llm-resolver.ts +66 -1
package/src/config/schema.ts +2 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +7 -3
package/src/config/schemas/call-site-catalog.ts +21 -0
package/src/config/schemas/channels.ts +9 -0
package/src/config/schemas/conversations.ts +10 -0
package/src/config/schemas/heartbeat.ts +14 -0
package/src/config/schemas/llm.ts +4 -3
package/src/config/schemas/memory-retrospective.ts +1 -1
package/src/config/schemas/memory-v2.ts +51 -4
package/src/config/schemas/memory.ts +3 -1
package/src/config/seed-inference-profiles.ts +99 -29
package/src/context/compactor.ts +80 -13
package/src/context/token-estimator.ts +72 -31
package/src/context/window-manager.ts +25 -0
package/src/credential-health/credential-health-service.ts +34 -19
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -22
package/src/daemon/__tests__/conversation-tool-setup.test.ts +66 -6
package/src/daemon/__tests__/native-web-search-metadata.test.ts +357 -0
package/src/daemon/__tests__/web-search-status-text.test.ts +287 -0
package/src/daemon/conversation-agent-loop-handlers.ts +231 -23
package/src/daemon/conversation-agent-loop.ts +252 -56
package/src/daemon/conversation-lifecycle.ts +142 -116
package/src/daemon/conversation-messaging.ts +3 -0
package/src/daemon/conversation-process.ts +273 -0
package/src/daemon/conversation-queue-manager.ts +14 -0
package/src/daemon/conversation-runtime-assembly.ts +144 -75
package/src/daemon/conversation-slash.ts +37 -5
package/src/daemon/conversation-surfaces.ts +45 -2
package/src/daemon/conversation-tool-setup.ts +7 -0
package/src/daemon/conversation.ts +42 -12
package/src/daemon/date-context.ts +40 -0
package/src/daemon/first-greeting.ts +10 -0
package/src/daemon/guardian-action-generators.ts +1 -125
package/src/daemon/handlers/__tests__/config-a2a-accept.test.ts +498 -0
package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +248 -0
package/src/daemon/handlers/__tests__/config-a2a-invite.test.ts +154 -0
package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +133 -0
package/src/daemon/handlers/__tests__/config-a2a.test.ts +95 -0
package/src/daemon/handlers/config-a2a.ts +449 -0
package/src/daemon/handlers/config-model.test.ts +1 -0
package/src/daemon/handlers/conversations.ts +80 -0
package/src/daemon/handlers/shared.ts +92 -29
package/src/daemon/host-app-control-proxy.ts +69 -18
package/src/daemon/host-bash-proxy.ts +1 -1
package/src/daemon/host-cu-proxy.ts +1 -1
package/src/daemon/host-file-proxy.ts +1 -1
package/src/daemon/host-proxy-preactivation.ts +85 -18
package/src/daemon/host-transfer-proxy.ts +1 -1
package/src/daemon/lifecycle.ts +67 -65
package/src/daemon/memory-v2-startup.ts +49 -13
package/src/daemon/message-protocol.ts +4 -0
package/src/daemon/message-types/conversations.ts +8 -0
package/src/daemon/message-types/document-comments.ts +50 -0
package/src/daemon/message-types/messages.ts +68 -1
package/src/daemon/message-types/notifications.ts +21 -0
package/src/daemon/message-types/surfaces.ts +3 -1
package/src/daemon/message-types/web-activity.ts +57 -0
package/src/daemon/pkb-reminder-builder.test.ts +10 -53
package/src/daemon/pkb-reminder-builder.ts +4 -19
package/src/daemon/plugin-source-watcher.ts +135 -3
package/src/daemon/process-message.ts +72 -12
package/src/daemon/query-complexity-router.ts +75 -0
package/src/daemon/skill-memory-refresh.ts +5 -1
package/src/daemon/trust-context.ts +6 -0
package/src/daemon/wake-target-adapter.ts +2 -0
package/src/documents/document-comments-store.test.ts +338 -0
package/src/documents/document-comments-store.ts +237 -0
package/src/documents/document-store.ts +202 -0
package/src/export/__tests__/transcript-formatter.test.ts +121 -0
package/src/export/transcript-formatter.ts +54 -20
package/src/heartbeat/__tests__/heartbeat-service.test.ts +44 -1
package/src/heartbeat/heartbeat-service.ts +35 -191
package/src/home/__tests__/feed-types.test.ts +40 -0
package/src/home/__tests__/suggested-prompts.test.ts +33 -2
package/src/home/feed-types.ts +20 -3
package/src/home/home-content-refresh.ts +52 -0
package/src/home/home-greeting-cache.ts +69 -0
package/src/home/home-greeting.ts +94 -0
package/src/home/suggested-prompts.ts +177 -9
package/src/ipc/cli-client.ts +147 -45
package/src/memory/__tests__/conversation-queries.test.ts +220 -0
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +135 -2
package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +2 -50
package/src/memory/__tests__/memory-retrospective-job.test.ts +407 -10
package/src/memory/conversation-crud.ts +133 -43
package/src/memory/conversation-queries.ts +87 -1
package/src/memory/conversation-title-service.ts +26 -4
package/src/memory/db-init.ts +22 -0
package/src/memory/delivery-crud.ts +41 -0
package/src/memory/delivery-status.ts +141 -15
package/src/memory/external-conversation-store.ts +32 -1
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +84 -3
package/src/memory/graph/conversation-graph-memory.ts +18 -6
package/src/memory/graph/tools.ts +6 -37
package/src/memory/invite-store.ts +53 -0
package/src/memory/jobs-worker.ts +21 -1
package/src/memory/llm-request-log-source-clickhouse.ts +7 -2
package/src/memory/llm-request-log-store.ts +92 -1
package/src/memory/memory-retrospective-constants.ts +28 -0
package/src/memory/memory-retrospective-enqueue.ts +4 -22
package/src/memory/memory-retrospective-job.ts +438 -21
package/src/memory/memory-retrospective-startup-cleanup.ts +3 -3
package/src/memory/memory-v2-activation-log-store.ts +26 -8
package/src/memory/migrations/100-core-tables.ts +1 -0
package/src/memory/migrations/109-external-conversation-bindings.ts +1 -0
package/src/memory/migrations/250-provider-connection-base-url-and-models.ts +28 -0
package/src/memory/migrations/251-a2a-tasks.ts +49 -0
package/src/memory/migrations/252-llm-request-log-agent-loop-exit-reason.ts +32 -0
package/src/memory/migrations/253-conversation-last-notified-profile.ts +15 -0
package/src/memory/migrations/253-document-comments.ts +47 -0
package/src/memory/migrations/254-external-conversation-binding-chat-name.ts +43 -0
package/src/memory/migrations/255-channel-inbound-delivery-attempts.ts +24 -0
package/src/memory/migrations/256-memory-v2-injection-events.ts +113 -0
package/src/memory/migrations/257-strip-base-url-non-openai-compatible.ts +22 -0
package/src/memory/migrations/258-onboarding-events-prior-assistants.ts +13 -0
package/src/memory/migrations/259-conversation-cleaned-at.ts +33 -0
package/src/memory/migrations/index.ts +20 -0
package/src/memory/migrations/registry.ts +33 -0
package/src/memory/onboarding-events-store.ts +7 -0
package/src/memory/schema/a2a.ts +15 -0
package/src/memory/schema/calls.ts +1 -0
package/src/memory/schema/conversations.ts +3 -0
package/src/memory/schema/index.ts +1 -0
package/src/memory/schema/inference.ts +2 -0
package/src/memory/schema/infrastructure.ts +2 -0
package/src/memory/v2/__tests__/activation-store.test.ts +25 -23
package/src/memory/v2/__tests__/cli-command-store.test.ts +404 -0
package/src/memory/v2/__tests__/frontmatter-sweep.test.ts +25 -4
package/src/memory/v2/__tests__/injection-events.test.ts +318 -0
package/src/memory/v2/__tests__/injection.test.ts +221 -17
package/src/memory/v2/__tests__/page-index.test.ts +365 -1
package/src/memory/v2/__tests__/router.test.ts +489 -1
package/src/memory/v2/__tests__/static-context.test.ts +12 -1
package/src/memory/v2/activation-store.ts +14 -16
package/src/memory/v2/cli-command-content.ts +19 -0
package/src/memory/v2/cli-command-store.ts +304 -0
package/src/memory/v2/consolidation-job.ts +14 -0
package/src/memory/v2/frontmatter-sweep.ts +7 -1
package/src/memory/v2/injection-events.ts +101 -0
package/src/memory/v2/injection.ts +69 -29
package/src/memory/v2/page-index.ts +246 -19
package/src/memory/v2/page-store.ts +18 -0
package/src/memory/v2/router.ts +209 -55
package/src/memory/v2/static-context.ts +4 -4
package/src/memory/v2/types.ts +23 -0
package/src/messaging/providers/a2a/__tests__/deliver.test.ts +274 -0
package/src/messaging/providers/a2a/deliver.ts +156 -0
package/src/messaging/providers/gmail/client.ts +9 -2
package/src/messaging/providers/index.ts +18 -3
package/src/messaging/providers/slack/__tests__/adapter-mention-rendering.test.ts +329 -3
package/src/messaging/providers/slack/__tests__/adapter-token-routing.test.ts +34 -1
package/src/messaging/providers/slack/adapter.ts +178 -25
package/src/messaging/providers/slack/api.test.ts +54 -0
package/src/messaging/providers/slack/api.ts +119 -3
package/src/messaging/providers/slack/client.ts +12 -0
package/src/messaging/providers/slack/deep-link.ts +20 -1
package/src/messaging/providers/slack/message-metadata.test.ts +48 -0
package/src/messaging/providers/slack/message-metadata.ts +156 -0
package/src/messaging/providers/slack/render-transcript.test.ts +107 -75
package/src/messaging/providers/slack/render-transcript.ts +176 -49
package/src/messaging/providers/slack/send.test.ts +77 -0
package/src/messaging/providers/slack/send.ts +8 -2
package/src/messaging/providers/slack/types.ts +14 -0
package/src/notifications/__tests__/broadcaster.test.ts +203 -0
package/src/notifications/__tests__/decision-engine.test.ts +283 -0
package/src/notifications/__tests__/deterministic-checks.test.ts +286 -0
package/src/notifications/__tests__/emit-signal-home-feed.test.ts +5 -1
package/src/notifications/__tests__/home-feed-side-effect.test.ts +521 -36
package/src/notifications/adapters/macos.ts +12 -2
package/src/notifications/broadcaster.ts +29 -4
package/src/notifications/conversation-seed-composer.ts +14 -2
package/src/notifications/copy-composer.ts +17 -64
package/src/notifications/decision-engine.ts +111 -44
package/src/notifications/deferred-emit.ts +135 -0
package/src/notifications/deterministic-checks.ts +96 -0
package/src/notifications/emit-signal.ts +10 -1
package/src/notifications/home-feed-side-effect.ts +136 -27
package/src/notifications/signal.ts +0 -4
package/src/notifications/types.ts +8 -0
package/src/oauth/connect-orchestrator.ts +3 -0
package/src/oauth/credential-token-resolver.ts +2 -0
package/src/oauth/manual-token-connection.ts +19 -0
package/src/oauth/oauth-store.ts +12 -0
package/src/oauth/platform-connection.test.ts +43 -3
package/src/oauth/platform-connection.ts +13 -4
package/src/oauth/seed-providers.ts +22 -0
package/src/permissions/prompter.ts +5 -2
package/src/permissions/secret-prompter.ts +4 -1
package/src/plugins/defaults/injectors.ts +118 -26
package/src/plugins/external-plugin-loader.ts +82 -10
package/src/plugins/types.ts +16 -7
package/src/prompts/__tests__/system-prompt.test.ts +44 -45
package/src/prompts/__tests__/task-progress-hint-section.test.ts +4 -8
package/src/prompts/normalize-onboarding.ts +40 -0
package/src/prompts/sections.ts +32 -14
package/src/prompts/system-prompt.ts +105 -76
package/src/prompts/template-detection.ts +37 -0
package/src/prompts/templates/BOOTSTRAP-CONTENT-AUTOMATION.md +141 -0
package/src/prompts/templates/BOOTSTRAP.md +13 -5
package/src/prompts/templates/VOICE.md +3 -0
package/src/prompts/templates/system-sections.ts +51 -10
package/src/providers/__tests__/inference.test.ts +2 -0
package/src/providers/anthropic/client.ts +132 -5
package/src/providers/call-site-routing.ts +24 -6
package/src/providers/connection-resolution.ts +63 -13
package/src/providers/fireworks/client.ts +20 -2
package/src/providers/inference/__tests__/adapter-factory-openai-compatible.test.ts +74 -0
package/src/providers/inference/__tests__/base-url-route-validation.test.ts +342 -0
package/src/providers/inference/__tests__/base-url-security.test.ts +189 -0
package/src/providers/inference/__tests__/codex-token-refresh.test.ts +254 -0
package/src/providers/inference/__tests__/connections-openai-compatible.test.ts +175 -0
package/src/providers/inference/__tests__/connections-status-label.test.ts +15 -0
package/src/providers/inference/adapter-factory.ts +24 -21
package/src/providers/inference/auth.ts +15 -3
package/src/providers/inference/backfill.ts +14 -1
package/src/providers/inference/codex-token-refresh.ts +128 -0
package/src/providers/inference/connections.ts +85 -5
package/src/providers/inference/resolve-auth.ts +50 -5
package/src/providers/model-catalog.ts +244 -242
package/src/providers/model-intents.ts +3 -3
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +235 -0
package/src/providers/openai/chat-completions-provider.ts +215 -25
package/src/providers/openai/responses-provider.ts +9 -3
package/src/providers/openrouter/client.ts +46 -4
package/src/providers/platform-proxy/constants.ts +3 -4
package/src/providers/provider-catalog-visibility.ts +3 -1
package/src/providers/provider-send-message.ts +27 -12
package/src/providers/registry.ts +30 -1
package/src/providers/types.ts +25 -0
package/src/runtime/__tests__/agent-wake.test.ts +214 -0
package/src/runtime/__tests__/background-job-runner.test.ts +128 -0
package/src/runtime/agent-wake.ts +212 -57
package/src/runtime/auth/route-policy.ts +20 -3
package/src/runtime/background-job-runner.ts +26 -0
package/src/runtime/channel-reply-delivery.ts +182 -47
package/src/runtime/channel-retry-sweep.ts +141 -16
package/src/runtime/http-server.ts +7 -16
package/src/runtime/http-types.ts +7 -51
package/src/runtime/pending-interactions.ts +51 -8
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +258 -0
package/src/runtime/routes/__tests__/content-source-routes.test.ts +162 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +121 -5
package/src/runtime/routes/__tests__/inference-provider-connection-routes.test.ts +275 -44
package/src/runtime/routes/__tests__/llm-call-sites-routes.test.ts +12 -0
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +14 -0
package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +271 -0
package/src/runtime/routes/__tests__/sanity-routes.test.ts +280 -0
package/src/runtime/routes/__tests__/slack-channel-routes.test.ts +266 -0
package/src/runtime/routes/approval-routes.ts +4 -1
package/src/runtime/routes/channel-availability-routes.ts +5 -0
package/src/runtime/routes/chatgpt-subscription-auth-routes.ts +246 -0
package/src/runtime/routes/consolidation-routes.ts +100 -0
package/src/runtime/routes/content-source-routes.ts +78 -0
package/src/runtime/routes/conversation-cli-routes.ts +146 -1
package/src/runtime/routes/conversation-query-routes.ts +130 -12
package/src/runtime/routes/conversation-routes.ts +288 -76
package/src/runtime/routes/document-comments-routes.ts +287 -0
package/src/runtime/routes/documents-routes.ts +33 -0
package/src/runtime/routes/home-feed-routes.ts +6 -3
package/src/runtime/routes/host-app-control-routes.ts +1 -1
package/src/runtime/routes/host-browser-routes.ts +8 -1
package/src/runtime/routes/identity-routes.ts +21 -0
package/src/runtime/routes/inbound-message-handler.ts +288 -58
package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +365 -6
package/src/runtime/routes/inbound-stages/background-dispatch.ts +283 -82
package/src/runtime/routes/index.ts +14 -4
package/src/runtime/routes/inference-provider-connection-routes.ts +192 -3
package/src/runtime/routes/integrations/a2a.ts +294 -0
package/src/runtime/routes/llm-call-sites-routes.ts +11 -1
package/src/runtime/routes/log-export-routes.ts +39 -0
package/src/runtime/routes/memory-v2-routes.ts +217 -0
package/src/runtime/routes/notification-routes.ts +19 -2
package/src/runtime/routes/question-routes.ts +4 -1
package/src/runtime/routes/sanity-routes.ts +159 -0
package/src/runtime/routes/slack-channel-routes.ts +187 -0
package/src/runtime/routes/subagents-routes.ts +41 -0
package/src/runtime/services/conversation-serializer.ts +30 -4
package/src/schedule/integration-status.ts +3 -1
package/src/security/__tests__/oauth2-device-code.test.ts +479 -0
package/src/security/oauth2-device-code.ts +307 -0
package/src/security/oauth2.ts +26 -9
package/src/security/secure-keys.ts +5 -0
package/src/skills/catalog-install.ts +6 -2
package/src/subagent/manager.ts +2 -0
package/src/tools/browser/__tests__/pinned-tabs.test.ts +80 -0
package/src/tools/browser/browser-execution.ts +93 -0
package/src/tools/browser/cdp-client/__tests__/factory.test.ts +28 -0
package/src/tools/browser/cdp-client/__tests__/types.test.ts +1 -0
package/src/tools/browser/cdp-client/cdp-inspect-client.ts +10 -0
package/src/tools/browser/cdp-client/extension-cdp-client.ts +15 -1
package/src/tools/browser/cdp-client/factory.ts +87 -3
package/src/tools/browser/cdp-client/local-cdp-client.ts +9 -0
package/src/tools/browser/cdp-client/types.ts +36 -0
package/src/tools/browser/pinned-tabs.ts +90 -0
package/src/tools/document/document-comment-tool.test.ts +379 -0
package/src/tools/document/document-comment-tool.ts +156 -0
package/src/tools/document/document-tool.ts +128 -2
package/src/tools/memory/register.ts +1 -9
package/src/tools/network/__tests__/web-fetch-metadata.test.ts +229 -0
package/src/tools/network/__tests__/web-search-metadata.test.ts +346 -0
package/src/tools/network/domain-normalize.ts +17 -0
package/src/tools/network/web-fetch.ts +213 -64
package/src/tools/network/web-search.ts +191 -66
package/src/tools/registry.ts +2 -2
package/src/tools/terminal/safe-env.ts +3 -2
package/src/tools/tool-approval-handler.ts +19 -12
package/src/tools/types.ts +41 -2
package/src/tools/ui-surface/definitions.ts +3 -1
package/src/types/onboarding-context.ts +4 -0
package/src/util/__tests__/favicon.test.ts +84 -0
package/src/util/favicon.ts +40 -0
package/src/util/platform.ts +0 -5
package/src/workspace/git-service.ts +75 -4
package/src/workspace/migrations/087-memory-router-balanced-profile.ts +91 -0
package/src/workspace/migrations/088-deprecate-background-conversation-override.ts +103 -0
package/src/workspace/migrations/registry.ts +4 -0
package/src/__tests__/guardian-action-conversation-turn.test.ts +0 -441
package/src/config/bundled-skills/document/SKILL.md +0 -54
package/src/config/bundled-skills/document/TOOLS.json +0 -106
package/src/daemon/seed-files.ts +0 -18
package/src/memory/graph/__tests__/remember-description.test.ts +0 -55
package/src/runtime/guardian-action-conversation-turn.ts +0 -99
package/src/runtime/routes/interface-routes.ts +0 -43
/package/src/config/bundled-skills/{document → document-editor}/tools/document-create.ts +0 -0
/package/src/config/bundled-skills/{document → document-editor}/tools/document-delete.ts +0 -0
/package/src/config/bundled-skills/{document → document-editor}/tools/document-list.ts +0 -0
/package/src/config/bundled-skills/{document → document-editor}/tools/document-read.ts +0 -0
/package/src/config/bundled-skills/{document → document-editor}/tools/document-update.ts +0 -0

package/src/config/schemas/memory-v2.ts CHANGED Viewed

@@ -194,6 +194,19 @@ export const MemoryV2ConfigSchema = z
       .describe(
         "Hours between scheduled consolidation runs that synthesize buffered memories into concept pages",
       ),
+    consolidation_max_buffer_lines: z
+      .number({
+        error: "memory.v2.consolidation_max_buffer_lines must be a number",
+      })
+      .int("memory.v2.consolidation_max_buffer_lines must be an integer")
+      .positive(
+        "memory.v2.consolidation_max_buffer_lines must be a positive integer",
+      )
+      .nullable()
+      .default(100)
+      .describe(
+        "Size-based trigger for consolidation. When `memory/buffer.md` reaches this many non-empty lines, consolidation runs even if the time-based interval hasn't elapsed. Defaults to 100. Set to `null` to disable the size trigger and rely solely on `consolidation_interval_hours`.",
+      ),
     max_page_chars: z
       .number({ error: "memory.v2.max_page_chars must be a number" })
       .int("memory.v2.max_page_chars must be an integer")
@@ -260,9 +273,9 @@ export const MemoryV2ConfigSchema = z
       .object({
         enabled: z
           .boolean()
-          .default(false)
+          .default(true)
           .describe(
-            "Whether to use the LLM router as the per-turn page-selection mechanism in place of spreading activation. Disabled by default — opt in once the router orchestration and dispatcher land.",
+            "Whether to use the LLM router as the per-turn page-selection mechanism in place of spreading activation. Enabled by default.",
           ),
         max_page_ids: z
           .number()
@@ -282,10 +295,44 @@ export const MemoryV2ConfigSchema = z
           .describe(
             "Optional path to a file whose contents replace the bundled router prompt. Absolute paths are used as-is, a leading `~/` is expanded to the home directory, otherwise the path is resolved under the workspace root. The loaded contents may include `{{ASSISTANT_NAME}}`, `{{USER_NAME}}`, and `{{PAGE_INDEX}}`, which are substituted at runtime. If the file is missing, unreadable, or empty, the bundled prompt is used and a warning is logged.",
           ),
+        batch_size: z
+          .number()
+          .int()
+          .min(1)
+          .nullable()
+          .default(null)
+          .describe(
+            "Target batch size for parallel page-index routing. `null` (default) sends the entire page index in one call — identical to v3 behavior. When set, pages are split into `ceil(N / batch_size)` batches by stable FNV-1a hash on slug (so adding/removing a single page only invalidates one batch's KV cache), routed in parallel, and the selected slugs are unioned. A failure in one batch does not abort the turn as long as at least one batch succeeds.",
+          ),
+        tier1_size: z
+          .number()
+          .int()
+          .min(1)
+          .nullable()
+          .default(null)
+          .describe(
+            "Pool size for the tier-1 'recently modified' batch. `null` (default) disables tier 1 entirely — all pages flow through tier 3 batching. When set, the top-N concept pages by file mtime become their own dedicated parallel batch with mtime-desc ordering; everything else is partitioned into tier 3 batches by `batch_size`. Synthetic entries (skills, CLI commands) have mtime=0 and naturally rank below real concept pages so they don't crowd tier 1.",
+          ),
+        tier2_size: z
+          .number()
+          .int()
+          .min(1)
+          .nullable()
+          .default(null)
+          .describe(
+            "Pool size for the tier-2 'useful' batch. `null` (default) disables tier 2 — pages skip straight from tier 1 to tier 3. When set, the top-M pages by injection-frequency EMA (excluding tier 1) become their own parallel batch ordered by score desc. Pages with score 0 (never selected since EMA tracking began) are ineligible for tier 2 and stay in tier 3 regardless of `tier2_size`. Score is the time-decayed sum `Σ exp(-λ(now - tᵢ))` with 3-day half-life, computed on read from `memory_v2_injection_events`.",
+          ),
+      })
+      .default({
+        enabled: true,
+        max_page_ids: 25,
+        router_prompt_path: null,
+        batch_size: null,
+        tier1_size: null,
+        tier2_size: null,
       })
-      .default({ enabled: false, max_page_ids: 25, router_prompt_path: null })
       .describe(
-        "LLM router configuration. When enabled, a single Sonnet router call replaces spreading activation for per-turn page selection.",
+        "LLM router configuration. When enabled, a single router LLM call replaces spreading activation for per-turn page selection.",
       ),
   })
   .describe(

package/src/config/schemas/memory.ts CHANGED Viewed

@@ -23,7 +23,9 @@ export const MemoryConfigSchema = z
     enabled: z
       .boolean({ error: "memory.enabled must be a boolean" })
       .default(true)
-      .describe("Whether the long-term memory system is enabled"),
+      .describe(
+        "Whether the long-term memory system is enabled — gates background memory jobs, embedding generation, and `<memory>` block injection into user messages",
+      ),
     embeddings: MemoryEmbeddingsConfigSchema.default(
       MemoryEmbeddingsConfigSchema.parse({}),
     ),

package/src/config/seed-inference-profiles.ts CHANGED Viewed

@@ -3,6 +3,8 @@ import {
   createConnection,
   disableManagedConnectionsForByokHatch,
   getConnection,
+  MANAGED_CONNECTION_NAMES,
+  PROVIDERS_REQUIRING_BASE_URL_AND_MODELS,
 } from "../providers/inference/connections.js";
 import { PROVIDER_CATALOG } from "../providers/model-catalog.js";
 import { resolveModelIntent } from "../providers/model-intents.js";
@@ -17,10 +19,6 @@ import {
 const log = getLogger("seed-inference-profiles");
-const MANAGED_CONNECTION_NAME = "anthropic-managed";
-const MANAGED_PROFILE_PROVIDER: NonNullable<ProfileEntry["provider"]> =
-  "anthropic";
 /**
  * Template for a daemon-managed inference profile. The profile's model is
  * resolved at seed time from `PROVIDER_MODEL_INTENTS` so the catalog stays the
@@ -31,16 +29,20 @@ type ManagedProfileTemplate = Omit<
   "provider" | "model" | "provider_connection"
 > & {
   intent: ModelIntent;
+  provider: NonNullable<ProfileEntry["provider"]>;
+  connectionName: string;
 };
 /**
- * Managed Anthropic profiles. Overwritten on every daemon boot so Vellum can
- * push model/config updates to customers in new releases. Platform overlays
+ * Managed profiles. Overwritten on every daemon boot so Vellum can push
+ * model/config updates to customers in new releases. Platform overlays
  * (`preserveProfileNames`) take precedence when present.
  */
 const MANAGED_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   balanced: {
     intent: "balanced",
+    provider: "anthropic",
+    connectionName: "anthropic-managed",
     source: "managed",
     label: "Balanced",
     description: "Good balance of quality, cost, and speed",
@@ -51,6 +53,8 @@ const MANAGED_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   },
   "quality-optimized": {
     intent: "quality-optimized",
+    provider: "anthropic",
+    connectionName: "anthropic-managed",
     source: "managed",
     label: "Quality",
     description: "Best results with the most capable model",
@@ -61,6 +65,8 @@ const MANAGED_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   },
   "cost-optimized": {
     intent: "latency-optimized",
+    provider: "anthropic",
+    connectionName: "anthropic-managed",
     source: "managed",
     label: "Speed",
     description: "Fastest responses at lower cost",
@@ -74,11 +80,15 @@ const MANAGED_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
 /**
  * User profile templates. Materialized at hatch time for off-platform
  * installations. Each points at the user's personal provider connection
- * (backed by their API key in CES).
+ * (backed by their API key in CES). The `provider` and `connectionName`
+ * fields are placeholders — they are overridden at hatch time with the
+ * user's chosen provider and personal connection name.
  */
 const USER_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   "custom-balanced": {
     intent: "balanced",
+    provider: "anthropic",
+    connectionName: "",
     source: "user",
     label: "Balanced",
     description: "Good balance of quality, cost, and speed",
@@ -89,6 +99,8 @@ const USER_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   },
   "custom-quality-optimized": {
     intent: "quality-optimized",
+    provider: "anthropic",
+    connectionName: "",
     source: "user",
     label: "Quality",
     description: "Best results with the most capable model",
@@ -99,6 +111,8 @@ const USER_PROFILE_TEMPLATES: Record<string, ManagedProfileTemplate> = {
   },
   "custom-cost-optimized": {
     intent: "latency-optimized",
+    provider: "anthropic",
+    connectionName: "",
     source: "user",
     label: "Speed",
     description: "Fastest responses at lower cost",
@@ -164,11 +178,12 @@ export function seedInferenceProfiles(
   // BYOK mode = off-platform installs. The user is bringing their own provider
   // API key; managed profile labels get a " (Managed)" suffix to disambiguate
   // from the personal "custom-*" profiles that share base labels. Managed
-  // profile + connection status is initially "disabled" so the picker doesn't
-  // offer an unusable platform-auth option on day one — but ONLY at hatch
-  // time, and ONLY when the entry isn't already in the user's config (i.e.
-  // first materialization). Post-hatch user toggles survive every subsequent
-  // boot.
+  // profile + connection status is initially "disabled" for true BYOK hatches
+  // so the picker doesn't offer an unusable platform-auth option on day one.
+  // When the hatch overlay explicitly selects a managed profile, the matching
+  // managed connection stays active so the first post-onboarding message can
+  // use the user's chosen managed route. Post-hatch user toggles survive every
+  // subsequent boot.
   const isByokMode = !isPlatform;
   // 1. Managed profiles. Off-platform: overwrite on every boot so Vellum can
@@ -198,10 +213,18 @@ export function seedInferenceProfiles(
   //        rewritten to the suffixed form. Any other previous label value
   //        (user-set custom string, explicit null, already-suffixed) is
   //        preserved as-is.
-  //      • status: "disabled" on fresh materialization at hatch only —
-  //        gated on (isHatch && !previous) so post-hatch boots and existing
-  //        installs are never auto-disabled. A user re-enable persists
-  //        across boots via the key-presence preservation below.
+  //      • status: "disabled" on fresh materialization at BYOK hatch only —
+  //        gated on (isHatch && !previous) and skipped for any managed
+  //        connection explicitly selected by the hatch overlay. Post-hatch
+  //        boots and existing installs are never auto-disabled. A user
+  //        re-enable persists across boots via the key-presence preservation
+  //        below.
+  const hatchSelectedManagedConnection = getHatchSelectedManagedConnection(
+    llm,
+    profiles,
+    options,
+  );
   for (const [name, template] of Object.entries(MANAGED_PROFILE_TEMPLATES)) {
     if (preservedProfileNames.has(name)) continue;
     if (isPlatform && readObject(profiles[name]) !== null) continue;
@@ -212,10 +235,15 @@ export function seedInferenceProfiles(
       : template;
     const next = materializeProfile(
       effectiveTemplate,
-      MANAGED_PROFILE_PROVIDER,
-      MANAGED_CONNECTION_NAME,
+      template.provider,
+      template.connectionName,
     ) as Record<string, unknown>;
-    if (isByokMode && options.isHatch && !previous) {
+    if (
+      isByokMode &&
+      options.isHatch &&
+      !previous &&
+      template.connectionName !== hatchSelectedManagedConnection
+    ) {
       next.status = "disabled";
     }
     if (previous) {
@@ -238,17 +266,24 @@ export function seedInferenceProfiles(
   // 2. User profiles — only at hatch time for off-platform installations.
   let userConnectionName: string | undefined;
   if (options.isHatch && !isPlatform) {
-    // BYOK hatch: disable the three canonical managed connections so the
-    // picker doesn't surface unusable platform-auth options on day one.
-    // Runs only here, only at hatch — `seedCanonicalConnections` leaves
-    // `status` alone on subsequent boots so a post-hatch user re-enable
-    // persists.
+    // BYOK hatch: disable canonical managed connections so the picker doesn't
+    // surface unusable platform-auth options on day one. If the hatch overlay
+    // selected a managed profile, leave that connection active; the user has
+    // already chosen managed inference. Runs only here, only at hatch —
+    // `seedCanonicalConnections` leaves `status` alone on subsequent boots so
+    // a post-hatch user re-enable persists.
     if (options.db) {
-      disableManagedConnectionsForByokHatch(options.db);
+      disableManagedConnectionsForByokHatch(options.db, {
+        excludeConnection: hatchSelectedManagedConnection,
+      });
     }
     const hatchProvider = readString(readObject(llm.default)?.provider);
-    if (hatchProvider && hatchProvider !== "ollama") {
+    if (
+      hatchProvider &&
+      hatchProvider !== "ollama" &&
+      !PROVIDERS_REQUIRING_BASE_URL_AND_MODELS.has(hatchProvider)
+    ) {
       userConnectionName = `${hatchProvider}-personal`;
       if (options.db) {
@@ -269,8 +304,7 @@ export function seedInferenceProfiles(
         }
       }
-      const provider =
-        hatchProvider as NonNullable<ProfileEntry["provider"]>;
+      const provider = hatchProvider as NonNullable<ProfileEntry["provider"]>;
       for (const [name, template] of Object.entries(USER_PROFILE_TEMPLATES)) {
         if (preservedProfileNames.has(name)) continue;
         profiles[name] = materializeProfile(
@@ -342,7 +376,7 @@ function materializeProfile(
   provider: NonNullable<ProfileEntry["provider"]>,
   connectionName: string,
 ): ProfileEntry {
-  const { intent, ...rest } = template;
+  const { intent, provider: _p, connectionName: _c, ...rest } = template;
   return {
     ...rest,
     provider,
@@ -361,6 +395,42 @@ function readString(value: unknown): string | undefined {
   return typeof value === "string" && value.length > 0 ? value : undefined;
 }
+function getHatchSelectedManagedConnection(
+  llm: Record<string, unknown>,
+  profiles: Record<string, Record<string, unknown>>,
+  options: SeedInferenceProfilesOptions,
+): string | undefined {
+  if (!options.isHatch || options.preserveActiveProfile !== true) {
+    return undefined;
+  }
+  const activeProfile = readString(llm.activeProfile);
+  if (!activeProfile) return undefined;
+  const activeProfileEntry = readObject(profiles[activeProfile]);
+  if (
+    activeProfileEntry &&
+    Object.prototype.hasOwnProperty.call(
+      activeProfileEntry,
+      "provider_connection",
+    )
+  ) {
+    const explicitConnection = readString(
+      activeProfileEntry.provider_connection,
+    );
+    return explicitConnection &&
+      MANAGED_CONNECTION_NAMES.has(explicitConnection)
+      ? explicitConnection
+      : undefined;
+  }
+  const templateConnection =
+    MANAGED_PROFILE_TEMPLATES[activeProfile]?.connectionName;
+  return templateConnection && MANAGED_CONNECTION_NAMES.has(templateConnection)
+    ? templateConnection
+    : undefined;
+}
 /**
  * Format the human-readable label seeded onto a personal provider connection
  * at hatch time, e.g. `"Anthropic (Personal)"`. The display name is sourced

package/src/context/compactor.ts CHANGED Viewed

@@ -155,6 +155,11 @@ export interface CompactionRunResult {
   thresholdTokens: number;
   compactedMessages: number;
   compactedPersistedMessages: number;
+  /**
+   * Number of recent ("tail") messages preserved verbatim alongside the
+   * summary. Omitted on no-op / skipped results — defaults to 0 at render.
+   */
+  preservedTailMessages?: number;
   summaryCalls: number;
   summaryInputTokens: number;
   summaryOutputTokens: number;
@@ -327,7 +332,7 @@ export function renderImageManifest(entries: ManifestEntry[]): string {
  * runtime emitted — typically
  * `2026-04-02 (Thursday) 01:52:33 -05:00 (America/Chicago)`).
  */
-function extractTurnContextTimestamp(message: Message): string | null {
+export function extractTurnContextTimestamp(message: Message): string | null {
   if (message.role !== "user") return null;
   for (const block of message.content) {
     if (block.type !== "text") continue;
@@ -439,6 +444,44 @@ function resolveTailStartIndex(
   return null;
 }
+/**
+ * Walk a model-chosen tail index backward until it lands on a user message
+ * that does not contain client-side `tool_result` blocks. Prevents the
+ * orphan-`tool_result` failure where the matching assistant `tool_use` sits
+ * in the discarded prefix and Anthropic rejects the next call with
+ * `unexpected tool_use_id found in tool_result blocks`.
+ *
+ * Walking back (rather than forward) preserves the recent context the model
+ * deliberately chose to keep; the tail just expands by the few messages
+ * needed to re-anchor the orphaned `tool_result` against its `tool_use`.
+ *
+ * Returns 0 when the walk falls off the front — the caller treats this as
+ * "nothing to compact" via the existing `tailIndex === 0` branch.
+ *
+ * Only `type === "tool_result"` blocks count. Server-side tools
+ * (`server_tool_use` / `web_search_tool_result`) are self-paired inside an
+ * assistant message and never trigger an adjustment.
+ */
+export function adjustTailIndexForToolPairing(
+  messages: Message[],
+  tailIndex: number,
+): number {
+  let k = tailIndex;
+  while (k > 0) {
+    const m = messages[k];
+    if (
+      m.role === "user" &&
+      // guard:allow-tool-result-only — server-side web_search_tool_result is
+      // self-paired inside its assistant message and never spans user turns.
+      !m.content.some((block) => block.type === "tool_result")
+    ) {
+      return k;
+    }
+    k--;
+  }
+  return 0;
+}
 // ---------------------------------------------------------------------------
 // Retained-image hydration
 // ---------------------------------------------------------------------------
@@ -655,8 +698,12 @@ export async function runAssistantDrivenCompaction(
   }
   const timestamps = buildTimestampIndex(args.messages);
-  const tailIndex = resolveTailStartIndex(args.messages, timestamps, parsed);
-  if (tailIndex == null) {
+  const resolvedTailIndex = resolveTailStartIndex(
+    args.messages,
+    timestamps,
+    parsed,
+  );
+  if (resolvedTailIndex == null) {
     log.warn(
       {
         timestamp: parsed.tailStartTimestamp,
@@ -680,6 +727,22 @@ export async function runAssistantDrivenCompaction(
     };
   }
+  const tailIndex = adjustTailIndexForToolPairing(
+    args.messages,
+    resolvedTailIndex,
+  );
+  if (tailIndex !== resolvedTailIndex) {
+    log.info(
+      {
+        conversationId: args.conversationId,
+        originalTailIndex: resolvedTailIndex,
+        tailIndex,
+        walkedBy: resolvedTailIndex - tailIndex,
+      },
+      "Adjusted compaction tail backward to preserve tool_use/tool_result pairing",
+    );
+  }
   if (tailIndex === 0) {
     return {
       ...emptyResult(
@@ -762,6 +825,9 @@ export async function runAssistantDrivenCompaction(
       compactedMessages: compactableMessages.length,
       compactedPersistedMessages,
       tailIndex,
+      ...(tailIndex !== resolvedTailIndex
+        ? { originalTailIndex: resolvedTailIndex }
+        : {}),
       retainedImages: resolved.length,
       summaryChars: summaryText.length,
     },
@@ -780,6 +846,7 @@ export async function runAssistantDrivenCompaction(
     thresholdTokens,
     compactedMessages: compactableMessages.length,
     compactedPersistedMessages,
+    preservedTailMessages: args.messages.length - tailIndex,
     summaryCalls: 1,
     summaryInputTokens: response.usage.inputTokens,
     summaryOutputTokens: response.usage.outputTokens,
@@ -885,10 +952,12 @@ export async function runEmergencyCompaction(
   const splitIndex = findLastToolPairStart(args.messages);
   if (splitIndex == null || splitIndex === 0) {
-    log.info(
-      "Emergency compaction: no tool pair found — falling through",
+    log.info("Emergency compaction: no tool pair found — falling through");
+    return emptyResult(
+      args,
+      thresholdTokens,
+      "no tool pair for emergency split",
     );
-    return emptyResult(args, thresholdTokens, "no tool pair for emergency split");
   }
   const keptTail = stripInjectionsForCompaction(
@@ -904,8 +973,7 @@ export async function runEmergencyCompaction(
   const prefixBudget = args.maxInputTokens - instructionBudget - outputBudget;
   let prefixEstimate = estimatePromptTokens(prefix, args.systemPrompt, {
-    providerName:
-      args.provider.tokenEstimationProvider ?? args.provider.name,
+    providerName: args.provider.tokenEstimationProvider ?? args.provider.name,
   });
   if (prefixEstimate > prefixBudget && prefix.length > 1) {
@@ -920,10 +988,7 @@ export async function runEmergencyCompaction(
     // Drop messages from the front until we fit. Keep at least the first
     // message (may be an existing summary) and try to preserve recent context.
     let dropCount = 0;
-    while (
-      prefixEstimate > prefixBudget &&
-      dropCount < prefix.length - 1
-    ) {
+    while (prefixEstimate > prefixBudget && dropCount < prefix.length - 1) {
       dropCount++;
       const truncated = prefix.slice(dropCount);
       prefixEstimate = estimatePromptTokens(truncated, args.systemPrompt, {
@@ -1015,7 +1080,8 @@ export async function runEmergencyCompaction(
       compactedMessages: compactedCount,
       keptTailMessages: keptTail.length,
       summaryChars: summaryText.length,
-      prefixTruncated: prefix[0]?.content?.[0]?.type === "text" &&
+      prefixTruncated:
+        prefix[0]?.content?.[0]?.type === "text" &&
         (prefix[0].content[0] as { text: string }).text.includes("truncated"),
     },
     "Applied emergency mid-turn compaction",
@@ -1030,6 +1096,7 @@ export async function runEmergencyCompaction(
     thresholdTokens,
     compactedMessages: compactedCount,
     compactedPersistedMessages: Math.max(0, compactedCount - nonPersistedAway),
+    preservedTailMessages: keptTail.length,
     summaryCalls: 1,
     summaryInputTokens: response.usage.inputTokens,
     summaryOutputTokens: response.usage.outputTokens,

package/src/context/token-estimator.ts CHANGED Viewed

@@ -33,18 +33,42 @@ const OTHER_BLOCK_TOKENS = 16;
 const SYSTEM_PROMPT_OVERHEAD_TOKENS = 8;
 const GEMINI_INLINE_FILE_MIME_TYPES = new Set(["application/pdf"]);
-// Anthropic scales images to fit within 1568x1568 maintaining aspect ratio,
-// then charges ~(width * height) / 750 tokens.
-const ANTHROPIC_IMAGE_MAX_DIMENSION = 1568;
-// Anthropic caps images at ~1.2 megapixels in addition to the 1568px dimension limit.
-// Images exceeding this are further scaled down. The docs state images above ~1,600 tokens
-// are resized. 1,200,000 / 750 = 1,600 tokens, matching the documented threshold.
-// Reference table (max sizes that won't be resized):
+// Dimension-based image token estimate, used as a universal default for every
+// provider. The formula and constants below come from Anthropic's published
+// vision spec — scale to a 1568x1568 bounding box, then charge
+// ~(width * height) / 750 tokens, with a ~1.2-megapixel cap that lands at
+// ~1,600 tokens per image. Reference table (max sizes that won't be resized):
 //   1:1 → 1092x1092 (~1,590 tokens)   1:2 → 784x1568 (~1,639 tokens)
 // See: https://platform.claude.com/docs/en/build-with-claude/vision#evaluate-image-size
-const ANTHROPIC_IMAGE_MAX_PIXELS = 1_200_000;
-const ANTHROPIC_IMAGE_TOKENS_PER_PIXEL = 1 / 750;
-const ANTHROPIC_IMAGE_MAX_TOKENS = 1_600;
+//
+// Other multimodal providers (OpenAI/GPT-4V tile pricing, Moonshot/Kimi,
+// Gemini fixed-cost, OpenRouter pass-through) price differently in detail,
+// but every published rate lands in the same hundreds-to-low-thousands range
+// per image. Using this formula as the default gets compaction within ~2-3x
+// of reality instead of the ~30-100x over-counting produced by treating the
+// raw base64 payload as if it were text.
+const IMAGE_MAX_DIMENSION = 1568;
+const IMAGE_MAX_PIXELS = 1_200_000;
+const IMAGE_TOKENS_PER_PIXEL = 1 / 750;
+const IMAGE_MAX_TOKENS = 1_600;
+// Gemini prices images differently: an image whose width and height are both
+// ≤384px counts as a single 258-token tile; anything larger is resized so the
+// longest side is ≤3072px and then split into 768x768 tiles at 258 tokens
+// each. A 4000x4000 image clamps to 3072x3072 → ceil(3072/768)^2 = 16 tiles =
+// 4,128 tokens. Without the clamp
+// we'd over-count it as 36 tiles (~9,288 tokens) and trigger spurious
+// compaction. The clamped 16-tile, 4,128-token figure is also the per-image
+// ceiling we fall back to when dimensions are unparseable (e.g. HEIC/HEIF
+// from iOS attachments) — the generic 1,600 cap can under-count Gemini
+// images by ~2.5x.
+// See: https://ai.google.dev/gemini-api/docs/tokens#multimodal-tokens
+const GEMINI_IMAGE_SMALL_THRESHOLD = 384;
+const GEMINI_IMAGE_TILE_SIZE = 768;
+const GEMINI_IMAGE_TOKENS_PER_TILE = 258;
+const GEMINI_IMAGE_MAX_DIMENSION = 3072;
+const GEMINI_IMAGE_MAX_TOKENS =
+  Math.ceil(GEMINI_IMAGE_MAX_DIMENSION / GEMINI_IMAGE_TILE_SIZE) ** 2 *
+  GEMINI_IMAGE_TOKENS_PER_TILE;
 // Anthropic renders each PDF page as an image (~1,568 tokens at standard
 // resolution) plus any extracted text. Typical PDF pages are 50-150 KB.
@@ -103,45 +127,62 @@ function estimateFileDataTokens(
   return 0;
 }
-function estimateAnthropicImageTokens(width: number, height: number): number {
+function estimateImageTokensByDimensions(
+  width: number,
+  height: number,
+): number {
   // Step 1: Scale to fit within 1568px bounding box
-  const dimScale = Math.min(
-    1,
-    ANTHROPIC_IMAGE_MAX_DIMENSION / Math.max(width, height),
-  );
+  const dimScale = Math.min(1, IMAGE_MAX_DIMENSION / Math.max(width, height));
   let scaledWidth = Math.round(width * dimScale);
   let scaledHeight = Math.round(height * dimScale);
   // Step 2: Scale further if exceeds megapixel budget
   const pixels = scaledWidth * scaledHeight;
-  if (pixels > ANTHROPIC_IMAGE_MAX_PIXELS) {
-    const mpScale = Math.sqrt(ANTHROPIC_IMAGE_MAX_PIXELS / pixels);
+  if (pixels > IMAGE_MAX_PIXELS) {
+    const mpScale = Math.sqrt(IMAGE_MAX_PIXELS / pixels);
     scaledWidth = Math.round(scaledWidth * mpScale);
     scaledHeight = Math.round(scaledHeight * mpScale);
   }
-  return Math.ceil(
-    scaledWidth * scaledHeight * ANTHROPIC_IMAGE_TOKENS_PER_PIXEL,
-  );
+  return Math.ceil(scaledWidth * scaledHeight * IMAGE_TOKENS_PER_PIXEL);
+}
+function estimateGeminiImageTokens(width: number, height: number): number {
+  if (
+    width <= GEMINI_IMAGE_SMALL_THRESHOLD &&
+    height <= GEMINI_IMAGE_SMALL_THRESHOLD
+  ) {
+    return GEMINI_IMAGE_TOKENS_PER_TILE;
+  }
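+  // Gemini resizes images so the longest side is ≤3072px before tiling.
+  // NOTE(review): each side is clamped independently below rather than scaled
+  // together, so an oversized non-square image (e.g. 6144x3072) is counted as
+  // 3072x3072 — an upper bound if the real resize preserves aspect ratio.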
+  const clampedWidth = Math.min(width, GEMINI_IMAGE_MAX_DIMENSION);
+  const clampedHeight = Math.min(height, GEMINI_IMAGE_MAX_DIMENSION);
+  const tilesWide = Math.ceil(clampedWidth / GEMINI_IMAGE_TILE_SIZE);
+  const tilesHigh = Math.ceil(clampedHeight / GEMINI_IMAGE_TILE_SIZE);
+  return tilesWide * tilesHigh * GEMINI_IMAGE_TOKENS_PER_TILE;
 }
 function estimateImageTokens(
   block: Extract<ContentBlock, { type: "image" }>,
   options?: TokenEstimatorOptions,
 ): number {
-  if (options?.providerName === "anthropic") {
-    const dims = parseImageDimensions(
-      block.source.data,
-      block.source.media_type,
-    );
-    if (dims) {
-      return estimateAnthropicImageTokens(dims.width, dims.height);
+  const dims = parseImageDimensions(block.source.data, block.source.media_type);
+  if (dims) {
+    if (options?.providerName === "gemini") {
+      return estimateGeminiImageTokens(dims.width, dims.height);
     }
-    // Fallback: if dimensions can't be parsed, use Anthropic's max
-    return ANTHROPIC_IMAGE_MAX_TOKENS;
+    return estimateImageTokensByDimensions(dims.width, dims.height);
+  }
+  // Dimensions unparseable (corrupt header, or formats parseImageDimensions
+  // doesn't recognize like HEIC/HEIF coming from iOS attachments). Fall back
+  // to the per-provider per-image ceiling rather than the raw base64 length,
+  // which over-counts by 30-100x. Gemini's tile pricing tops out well above
+  // the universal 1,600-token cap, so use its max-tile budget instead to
+  // avoid under-counting large iPhone screenshots.
+  if (options?.providerName === "gemini") {
+    return GEMINI_IMAGE_MAX_TOKENS;
   }
-  // Non-Anthropic: keep existing base64-size heuristic
-  return estimateTextTokens(block.source.data);
+  return IMAGE_MAX_TOKENS;
 }
 export function estimateContentBlockTokens(