npm - @vellumai/assistant - Versions diffs - 0.8.7 → 0.8.8 - Mend

@vellumai/assistant 0.8.7 → 0.8.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (387)

package/Dockerfile +20 -4
package/docker-entrypoint.sh +4 -2
package/docker-init-apt-root.sh +3 -1
package/docker-kata-apt-env.sh +3 -1
package/docker-kata-runtime-family.sh +12 -0
package/docs/architecture/memory.md +1 -1
package/docs/plugins.md +75 -79
package/examples/plugins/echo/README.md +6 -12
package/examples/plugins/echo/register.ts +0 -41
package/node_modules/@vellumai/skill-host-contracts/src/server-message.ts +3 -3
package/openapi.yaml +3381 -348
package/package.json +1 -1
package/scripts/generate-openapi.ts +68 -41
package/src/__tests__/agent-loop-exit-reason.test.ts +34 -39
package/src/__tests__/agent-loop-provider-error-recording.test.ts +1 -1
package/src/__tests__/agent-loop.test.ts +37 -87
package/src/__tests__/agent-wake-disk-pressure-callsite.test.ts +2 -0
package/src/__tests__/annotate-activity-metadata.test.ts +262 -0
package/src/__tests__/annotate-risk-options.test.ts +2 -3
package/src/__tests__/anthropic-provider.test.ts +95 -2
package/src/__tests__/assistant-event-hub.test.ts +25 -0
package/src/__tests__/assistant-events-sse-shed.test.ts +8 -0
package/src/__tests__/{conversation-stream-state.test.ts → assistant-stream-state.test.ts} +252 -91
package/src/__tests__/auth-fallback-events-store.test.ts +116 -0
package/src/__tests__/background-workers-disk-pressure.test.ts +6 -0
package/src/__tests__/btw-routes.test.ts +62 -3
package/src/__tests__/build-persisted-content.test.ts +184 -0
package/src/__tests__/catalog-files.test.ts +1 -1
package/src/__tests__/clawhub-files.test.ts +1 -1
package/src/__tests__/compaction-pipeline.test.ts +1 -1
package/src/__tests__/compaction.benchmark.test.ts +0 -30
package/src/__tests__/config-watcher.test.ts +1 -1
package/src/__tests__/conversation-abort-tool-results.test.ts +57 -19
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +6 -2
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +10 -4
package/src/__tests__/conversation-agent-loop-overflow.test.ts +313 -1136
package/src/__tests__/conversation-agent-loop.test.ts +596 -1616
package/src/__tests__/conversation-analysis-routes.test.ts +6 -0
package/src/__tests__/conversation-history-web-search.test.ts +11 -1
package/src/__tests__/conversation-pairing.test.ts +4 -31
package/src/__tests__/conversation-process-app-control-preactivation.test.ts +6 -0
package/src/__tests__/conversation-provider-retry-repair.test.ts +26 -5
package/src/__tests__/conversation-queue.test.ts +2 -0
package/src/__tests__/conversation-routes-disk-view.test.ts +3 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +6 -5
package/src/__tests__/conversation-runtime-assembly.test.ts +170 -229
package/src/__tests__/conversation-runtime-workspace.test.ts +3 -24
package/src/__tests__/conversation-slash-commands.test.ts +8 -42
package/src/__tests__/conversation-slash-queue.test.ts +6 -1
package/src/__tests__/conversation-surfaces-action-delivery.test.ts +84 -0
package/src/__tests__/conversation-sync-tags.test.ts +27 -15
package/src/__tests__/conversation-title-service.test.ts +135 -2
package/src/__tests__/conversation-workspace-injection.test.ts +6 -1
package/src/__tests__/cross-provider-web-search.test.ts +214 -1
package/src/__tests__/db-schedule-syntax-migration.test.ts +5 -0
package/src/__tests__/dm-persistence.test.ts +5 -1
package/src/__tests__/empty-response-hook.test.ts +304 -0
package/src/__tests__/feature-flag-test-helpers.ts +2 -2
package/src/__tests__/gemini-image-service.test.ts +13 -0
package/src/__tests__/helpers/mock-provider.ts +110 -0
package/src/__tests__/helpers/native-web-search-harness.ts +129 -0
package/src/__tests__/history-repair-hook.test.ts +1 -0
package/src/__tests__/identity-intro-cache.test.ts +12 -100
package/src/__tests__/identity-routes.test.ts +248 -7
package/src/__tests__/inbound-slack-persistence.test.ts +5 -1
package/src/__tests__/injector-background-turn.test.ts +2 -8
package/src/__tests__/injector-chain.test.ts +106 -270
package/src/__tests__/injector-disk-pressure.test.ts +3 -12
package/src/__tests__/injector-document-comments.test.ts +2 -2
package/src/__tests__/injector-pkb-v2-silenced.test.ts +30 -22
package/src/__tests__/injector-v3-suppression.test.ts +31 -37
package/src/__tests__/internal-telemetry-routes.test.ts +109 -0
package/src/__tests__/list-messages-page-latest.test.ts +60 -0
package/src/__tests__/list-messages-tool-merge.test.ts +20 -0
package/src/__tests__/llm-usage-store.test.ts +223 -1
package/src/__tests__/memory-retrieval-hook.test.ts +297 -0
package/src/__tests__/memory-v2-static-injector.test.ts +103 -35
package/src/__tests__/native-web-search.test.ts +191 -0
package/src/__tests__/onboarding-template-contract.test.ts +2 -0
package/src/__tests__/openai-image-service.test.ts +17 -0
package/src/__tests__/openai-provider.test.ts +31 -1
package/src/__tests__/persist-unsendable-image.test.ts +215 -0
package/src/__tests__/persistence-secret-redaction.test.ts +1 -0
package/src/__tests__/pipeline-runner.test.ts +29 -39
package/src/__tests__/pkb-autoinject.test.ts +2 -5
package/src/__tests__/plugin-bootstrap.test.ts +13 -28
package/src/__tests__/plugin-registry.test.ts +0 -27
package/src/__tests__/plugin-types.test.ts +2 -125
package/src/__tests__/process-message-display-content.test.ts +6 -2
package/src/__tests__/regenerate-fire-and-forget-trace.test.ts +5 -1
package/src/__tests__/resolve-trust-class.test.ts +4 -4
package/src/__tests__/runtime-events-sse-reconnect.test.ts +60 -23
package/src/__tests__/schedule-routes.test.ts +603 -2
package/src/__tests__/schedule-store.test.ts +41 -0
package/src/__tests__/schedule-tools.test.ts +35 -0
package/src/__tests__/server-history-render.test.ts +314 -1
package/src/__tests__/skillssh-files.test.ts +1 -1
package/src/__tests__/system-prompt.test.ts +20 -0
package/src/__tests__/task-scheduler.test.ts +162 -1
package/src/__tests__/terminal-tools.test.ts +6 -1
package/src/__tests__/title-generate-hook.test.ts +319 -0
package/src/__tests__/tool-error-hook.test.ts +278 -0
package/src/__tests__/tool-preview-lifecycle.test.ts +468 -5
package/src/__tests__/tool-result-metadata-plumbing.test.ts +1 -0
package/src/__tests__/tool-result-truncate-hook.test.ts +127 -0
package/src/__tests__/tool-result-truncation.test.ts +0 -2
package/src/__tests__/ui-choice-copy-surfaces.test.ts +254 -0
package/src/__tests__/ui-work-result-surface.test.ts +159 -0
package/src/__tests__/usage-routes.test.ts +285 -1
package/src/__tests__/user-plugin-loader.test.ts +2 -2
package/src/__tests__/voice-session-bridge.test.ts +6 -3
package/src/__tests__/web-search-backend-failure.test.ts +166 -0
package/src/agent/loop.ts +346 -442
package/src/api/events/assistant-thinking-delta.ts +33 -0
package/src/api/events/tool-output-chunk.ts +45 -0
package/src/api/events/tool-use-preview-start.ts +32 -0
package/src/api/events/trace-event.ts +69 -0
package/src/api/index.ts +48 -13
package/src/api/responses/conversation-message.ts +368 -0
package/src/avatar/__tests__/avatar-store.test.ts +34 -29
package/src/cli/commands/__tests__/notifications.test.ts +58 -14
package/src/cli/commands/notifications.ts +112 -60
package/src/config/assistant-feature-flags.ts +22 -11
package/src/config/bundled-skills/app-builder/SKILL.md +3 -20
package/src/config/bundled-skills/app-builder/references/examples/README.md +17 -0
package/src/config/bundled-skills/app-builder/references/examples/expense-tracker.md +515 -0
package/src/config/bundled-skills/app-builder/references/examples/focus-timer.md +342 -0
package/src/config/bundled-skills/app-builder/references/examples/habit-tracker.md +490 -0
package/src/config/bundled-skills/document-editor/SKILL.md +1 -1
package/src/config/bundled-skills/messaging/SKILL.md +0 -7
package/src/config/feature-flag-cache.ts +3 -3
package/src/config/feature-flag-registry.json +35 -3
package/src/config/schemas/__tests__/memory-v2.test.ts +1 -0
package/src/config/schemas/__tests__/memory-v3.test.ts +25 -0
package/src/config/schemas/llm.ts +1 -0
package/src/config/schemas/memory-v2.ts +8 -0
package/src/config/schemas/memory-v3.ts +8 -0
package/src/config/schemas/platform.ts +8 -0
package/src/config/seed-inference-profiles.ts +2 -2
package/src/config/skills.ts +13 -0
package/src/context/compactor.ts +1 -1
package/src/context/strip-injections.ts +122 -0
package/src/context/token-estimator.ts +23 -0
package/src/context/tool-result-truncation.ts +0 -23
package/src/context/window-manager.ts +3 -6
package/src/credential-execution/executable-discovery.ts +16 -0
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +6 -0
package/src/daemon/__tests__/inference-profile-notification.test.ts +153 -0
package/src/daemon/__tests__/native-web-search-metadata.test.ts +10 -8
package/src/daemon/assistant-attachments.ts +1 -1
package/src/daemon/config-watcher.ts +2 -2
package/src/daemon/context-overflow-reducer.ts +0 -1
package/src/daemon/conversation-agent-loop-handlers.ts +605 -153
package/src/daemon/conversation-agent-loop.ts +281 -760
package/src/daemon/conversation-history.ts +5 -4
package/src/daemon/conversation-lifecycle.ts +3 -4
package/src/daemon/conversation-messaging.ts +7 -6
package/src/daemon/conversation-process.ts +11 -16
package/src/daemon/conversation-runtime-assembly.ts +130 -347
package/src/daemon/conversation-slash.ts +6 -25
package/src/daemon/conversation-surfaces.ts +222 -4
package/src/daemon/conversation-tool-setup.ts +2 -29
package/src/daemon/conversation.ts +32 -14
package/src/daemon/external-plugins-bootstrap.ts +9 -10
package/src/daemon/handlers/config-a2a.ts +51 -36
package/src/daemon/handlers/config-slack-channel.ts +20 -14
package/src/daemon/handlers/config-telegram.ts +16 -2
package/src/daemon/handlers/shared.ts +156 -84
package/src/daemon/handlers/skills.ts +39 -10
package/src/daemon/lifecycle.ts +4 -0
package/src/daemon/message-types/apps.ts +1 -29
package/src/daemon/message-types/messages.ts +9 -57
package/src/daemon/message-types/skills.ts +2 -0
package/src/daemon/message-types/surfaces.ts +136 -3
package/src/daemon/now-scratchpad.ts +21 -0
package/src/daemon/orphan-reaper.test.ts +210 -0
package/src/daemon/orphan-reaper.ts +240 -0
package/src/daemon/persist-unsendable-image.ts +117 -0
package/src/daemon/process-message.ts +1 -3
package/src/daemon/trace-emitter.ts +6 -4
package/src/daemon/trust-context.ts +19 -0
package/src/daemon/wake-target-adapter.ts +3 -1
package/src/home/home-greeting-cache.ts +24 -1
package/src/ipc/gateway-client.test.ts +2 -2
package/src/ipc/gateway-client.ts +3 -3
package/src/media/gemini-image-service.ts +15 -0
package/src/media/openai-image-service.ts +14 -0
package/src/media/types.ts +34 -0
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +56 -0
package/src/memory/auth-fallback-events-store.ts +94 -0
package/src/memory/conversation-title-service.ts +65 -41
package/src/memory/db-init.ts +4 -0
package/src/memory/graph/__tests__/conversation-graph-memory-registry.test.ts +119 -0
package/src/memory/graph/conversation-graph-memory.ts +65 -0
package/src/memory/jobs-store.ts +33 -0
package/src/memory/jobs-worker.ts +31 -4
package/src/memory/llm-usage-store.ts +224 -50
package/src/memory/migrations/222-strip-placeholder-sentinels-from-messages.ts +6 -5
package/src/memory/migrations/270-schedule-source-conversation.ts +13 -0
package/src/memory/migrations/271-create-auth-fallback-events.ts +21 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/pkb/autoinject.ts +61 -0
package/src/memory/pkb/context.ts +50 -0
package/src/memory/pkb/types.ts +14 -0
package/src/memory/schedule-attribution-sql.ts +104 -0
package/src/memory/schema/infrastructure.ts +16 -0
package/src/memory/usage-grouped-buckets.ts +6 -1
package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -1
package/src/memory/v2/consolidation-job.ts +1 -1
package/src/memory/v3/__tests__/health.test.ts +16 -0
package/src/memory/v3/__tests__/orchestrate.test.ts +45 -9
package/src/memory/v3/__tests__/provider-blocks.test.ts +13 -0
package/src/memory/v3/__tests__/router.test.ts +101 -29
package/src/memory/v3/__tests__/selector.test.ts +93 -27
package/src/memory/v3/__tests__/shadow-plugin.test.ts +23 -5
package/src/memory/v3/health.ts +0 -0
package/src/memory/v3/llm-retry.ts +32 -0
package/src/memory/v3/orchestrate.ts +26 -14
package/src/memory/v3/provider-blocks.ts +15 -5
package/src/memory/v3/router.ts +48 -42
package/src/memory/v3/selector.ts +57 -42
package/src/memory/v3/shadow-plugin.ts +47 -15
package/src/memory/v3/types.ts +8 -0
package/src/notifications/conversation-pairing.ts +8 -15
package/src/notifications/decision-engine.ts +6 -3
package/src/notifications/home-feed-side-effect.ts +12 -1
package/src/permissions/prompter.ts +4 -0
package/src/plugin-api/constants.ts +4 -0
package/src/plugin-api/index.ts +8 -1
package/src/plugin-api/types.ts +151 -1
package/src/plugins/defaults/empty-response/hooks/stop.ts +126 -0
package/src/plugins/defaults/empty-response/register.ts +8 -13
package/src/plugins/defaults/index.ts +1 -15
package/src/plugins/defaults/injectors/register.ts +243 -74
package/src/plugins/defaults/memory-retrieval/hooks/post-compact.ts +91 -0
package/src/plugins/defaults/memory-retrieval/hooks/user-prompt-submit-temp.ts +216 -0
package/src/plugins/defaults/memory-retrieval/injector-chain.ts +35 -0
package/src/plugins/defaults/title-generate/hooks/stop.ts +75 -0
package/src/plugins/defaults/title-generate/hooks/user-prompt-submit.ts +35 -0
package/src/plugins/defaults/title-generate/package.json +1 -1
package/src/plugins/defaults/title-generate/register.ts +18 -18
package/src/plugins/defaults/tool-error/hooks/post-tool-use.ts +118 -0
package/src/plugins/defaults/tool-error/package.json +1 -1
package/src/plugins/defaults/tool-error/register.ts +9 -21
package/src/plugins/defaults/tool-result-truncate/hooks/post-tool-use.ts +32 -0
package/src/plugins/defaults/tool-result-truncate/register.ts +10 -21
package/src/plugins/defaults/tool-result-truncate/terminal.ts +37 -18
package/src/plugins/pipeline.ts +6 -18
package/src/plugins/registry.ts +8 -25
package/src/plugins/types.ts +43 -474
package/src/proactive-artifact/aux-message-injector.ts +3 -3
package/src/proactive-artifact/job.test.ts +7 -12
package/src/prompts/__tests__/system-prompt.test.ts +36 -0
package/src/prompts/templates/BOOTSTRAP-ACTIVATION-RAIL.md +62 -0
package/src/prompts/templates/BOOTSTRAP.md +2 -2
package/src/prompts/templates/system-sections.ts +15 -0
package/src/providers/anthropic/client.ts +37 -29
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +112 -0
package/src/providers/openai/chat-completions-provider.ts +44 -0
package/src/providers/openrouter/client.ts +1 -0
package/src/providers/placeholder-sentinels.ts +35 -0
package/src/runtime/__tests__/agent-wake.test.ts +5 -1
package/src/runtime/agent-wake.ts +2 -2
package/src/runtime/assistant-event-hub.ts +36 -6
package/src/runtime/{conversation-stream-state.ts → assistant-stream-state.ts} +132 -58
package/src/runtime/http-router.ts +16 -21
package/src/runtime/http-types.ts +16 -70
package/src/runtime/pending-interactions.ts +1 -0
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +265 -2
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +31 -1
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +6 -2
package/src/runtime/routes/__tests__/tts-routes.test.ts +6 -2
package/src/runtime/routes/app-management-routes.ts +6 -117
package/src/runtime/routes/app-routes.ts +13 -15
package/src/runtime/routes/attachment-routes.ts +26 -15
package/src/runtime/routes/avatar-routes.ts +26 -0
package/src/runtime/routes/btw-routes.ts +29 -23
package/src/runtime/routes/consolidation-routes.ts +120 -20
package/src/runtime/routes/conversation-query-routes.ts +2 -0
package/src/runtime/routes/conversation-routes.ts +358 -184
package/src/runtime/routes/documents-routes.ts +4 -0
package/src/runtime/routes/domain-routes.ts +51 -37
package/src/runtime/routes/epoch-millis-range.ts +34 -0
package/src/runtime/routes/events-routes.ts +28 -34
package/src/runtime/routes/gateway-log-routes.ts +26 -4
package/src/runtime/routes/heartbeat-routes.ts +32 -12
package/src/runtime/routes/identity-intro-cache.ts +11 -34
package/src/runtime/routes/identity-routes.ts +208 -17
package/src/runtime/routes/image-generation-routes.ts +40 -2
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/integrations/a2a.ts +12 -10
package/src/runtime/routes/integrations/slack/__tests__/channel.test.ts +16 -0
package/src/runtime/routes/integrations/slack/channel.ts +4 -0
package/src/runtime/routes/integrations/slack/share.ts +27 -6
package/src/runtime/routes/integrations/telegram.ts +6 -0
package/src/runtime/routes/integrations/twilio.ts +42 -0
package/src/runtime/routes/internal-telemetry-routes.ts +88 -0
package/src/runtime/routes/log-export-routes.ts +8 -0
package/src/runtime/routes/memory-v2-routes.ts +15 -8
package/src/runtime/routes/memory-v3-routes.ts +50 -28
package/src/runtime/routes/oauth-apps.ts +66 -12
package/src/runtime/routes/oauth-providers.ts +44 -5
package/src/runtime/routes/platform-routes.ts +81 -5
package/src/runtime/routes/playground/__tests__/force-compact.test.ts +6 -4
package/src/runtime/routes/playground/force-compact.ts +1 -1
package/src/runtime/routes/rename-conversation-routes.ts +5 -0
package/src/runtime/routes/schedule-routes.ts +152 -42
package/src/runtime/routes/secret-routes.ts +14 -2
package/src/runtime/routes/skills-routes.ts +43 -14
package/src/runtime/routes/tool-call-confirmation-enrichment.test.ts +161 -0
package/src/runtime/routes/tool-call-confirmation-enrichment.ts +107 -0
package/src/runtime/routes/trust-rules-routes.ts +26 -2
package/src/runtime/routes/tts-routes.ts +35 -0
package/src/runtime/routes/types.ts +66 -8
package/src/runtime/routes/usage-routes.ts +47 -39
package/src/runtime/routes/webhook-routes.ts +41 -2
package/src/runtime/routes/workspace-routes.ts +4 -0
package/src/runtime/services/__tests__/analyze-conversation.test.ts +6 -0
package/src/runtime/services/analyze-conversation.ts +2 -2
package/src/schedule/schedule-store.ts +20 -1
package/src/schedule/schedule-usage-store.ts +83 -0
package/src/schedule/scheduler.ts +12 -5
package/src/skills/catalog-files.ts +2 -2
package/src/skills/catalog-install.ts +3 -0
package/src/skills/categories-cache.ts +118 -0
package/src/skills/clawhub-files.ts +1 -2
package/src/skills/skillssh-files.ts +1 -2
package/src/telemetry/types.ts +29 -1
package/src/telemetry/usage-telemetry-reporter.test.ts +112 -3
package/src/telemetry/usage-telemetry-reporter.ts +57 -2
package/src/tools/executor.ts +1 -53
package/src/tools/network/__tests__/web-search-metadata.test.ts +7 -1
package/src/tools/network/__tests__/web-search.test.ts +11 -3
package/src/tools/network/web-search-error.test.ts +248 -0
package/src/tools/network/web-search-error.ts +267 -0
package/src/tools/network/web-search.ts +207 -48
package/src/tools/schedule/create.ts +2 -0
package/src/tools/terminal/safe-env.ts +10 -1
package/src/tools/ui-surface/definitions.ts +9 -1
package/src/tts/__tests__/provider-catalog-consistency.test.ts +85 -1
package/src/tts/provider-catalog.ts +76 -1
package/src/util/mutex.ts +47 -0
package/src/workspace/git-service.ts +1 -42
package/src/workspace/migrations/095-bump-heartbeat-interval-30m-to-60m.ts +51 -0
package/src/workspace/migrations/096-reduce-quality-profile-effort.ts +72 -0
package/src/workspace/migrations/097-enable-adaptive-thinking-managed-profiles.ts +93 -0
package/src/workspace/migrations/registry.ts +6 -0
package/src/__tests__/bootstrap-turn-cleanup.test.ts +0 -44
package/src/__tests__/empty-response-pipeline.test.ts +0 -423
package/src/__tests__/llm-call-pipeline.test.ts +0 -287
package/src/__tests__/memory-retrieval-pipeline.test.ts +0 -418
package/src/__tests__/persistence-pipeline.test.ts +0 -503
package/src/__tests__/title-generate-pipeline.test.ts +0 -211
package/src/__tests__/token-estimate-pipeline.test.ts +0 -479
package/src/__tests__/tool-error-pipeline.test.ts +0 -241
package/src/__tests__/tool-execute-pipeline.test.ts +0 -417
package/src/__tests__/tool-result-truncate-pipeline.test.ts +0 -341
package/src/daemon/bootstrap-turn-cleanup.ts +0 -45
package/src/gallery/default-gallery.ts +0 -1359
package/src/gallery/gallery-manifest.ts +0 -28
package/src/home/feature-gate.ts +0 -22
package/src/plugins/defaults/empty-response/middlewares/emptyResponse.ts +0 -22
package/src/plugins/defaults/empty-response/terminal.ts +0 -106
package/src/plugins/defaults/injectors/package.json +0 -15
package/src/plugins/defaults/llm-call/middlewares/llmCall.ts +0 -17
package/src/plugins/defaults/llm-call/package.json +0 -15
package/src/plugins/defaults/llm-call/register.ts +0 -45
package/src/plugins/defaults/memory-retrieval/middlewares/memoryRetrieval.ts +0 -17
package/src/plugins/defaults/memory-retrieval/package.json +0 -15
package/src/plugins/defaults/memory-retrieval/register.ts +0 -181
package/src/plugins/defaults/persistence/middlewares/persistence.ts +0 -19
package/src/plugins/defaults/persistence/package.json +0 -15
package/src/plugins/defaults/persistence/register.ts +0 -38
package/src/plugins/defaults/persistence/terminal.ts +0 -83
package/src/plugins/defaults/title-generate/terminal.ts +0 -31
package/src/plugins/defaults/token-estimate/middlewares/tokenEstimate.ts +0 -23
package/src/plugins/defaults/token-estimate/package.json +0 -15
package/src/plugins/defaults/token-estimate/register.ts +0 -34
package/src/plugins/defaults/token-estimate/terminal.ts +0 -40
package/src/plugins/defaults/tool-error/middlewares/toolError.ts +0 -21
package/src/plugins/defaults/tool-error/terminal.ts +0 -47
package/src/plugins/defaults/tool-execute/middlewares/toolExecute.ts +0 -23
package/src/plugins/defaults/tool-execute/package.json +0 -15
package/src/plugins/defaults/tool-execute/register.ts +0 -49
package/src/plugins/defaults/tool-result-truncate/middlewares/toolResultTruncate.ts +0 -23
package/src/plugins/defaults/tool-result-truncate/types.ts +0 -22
package/src/skills/category-inference.ts +0 -111

package/src/daemon/conversation-agent-loop-handlers.ts CHANGED

@@ -17,6 +17,7 @@ import type {
 import { getConfig } from "../config/loader.js";
 import { recordEstimate } from "../context/estimator-calibration.js";
 import { getCalibrationProviderKey } from "../context/token-estimator.js";
+import type { ContextWindowResult } from "../context/window-manager.js";
 import { projectAssistantMessage } from "../memory/conversation-attention-store.js";
 import {
   deleteMessageById,
@@ -24,8 +25,12 @@ import {
   getMessageById,
   messageMetadataSchema,
   provenanceFromTrustContext,
+  reserveMessage,
+  setConversationHistoryStrippedAt,
+  setLastNotifiedInferenceProfile,
   updateMessageContent,
 } from "../memory/conversation-crud.js";
+import { syncMessageToDisk } from "../memory/conversation-disk-view.js";
 import { indexMessageNow } from "../memory/indexer.js";
 import {
   backfillMessageIdOnLogs,
@@ -41,20 +46,24 @@ import {
   type SlackMessageMetadata,
   writeSlackMetadata,
 } from "../messaging/providers/slack/message-metadata.js";
-import { defaultPersistenceTerminal } from "../plugins/defaults/persistence/terminal.js";
-import { DEFAULT_TIMEOUTS, runPipeline } from "../plugins/pipeline.js";
-import { getMiddlewaresFor } from "../plugins/registry.js";
 import type {
-  PersistArgs,
-  PersistReserveResult,
-  PersistResult,
-  TurnContext,
-} from "../plugins/types.js";
-import type { ContentBlock, ImageContent } from "../providers/types.js";
+  ContentBlock,
+  ImageContent,
+  Message,
+} from "../providers/types.js";
 import { isContextOverflowError } from "../providers/types.js";
+import {
+  getCurrentSeq,
+  recordPersistedSeq,
+} from "../runtime/assistant-stream-state.js";
 import { publishSyncInvalidation } from "../runtime/sync/sync-publisher.js";
 import { redactSecrets } from "../security/secret-scanner.js";
 import { extractDomain } from "../tools/network/domain-normalize.js";
+import {
+  classifyWebSearchFailure,
+  logWebSearchBackendFailure,
+  WEB_SEARCH_BACKEND_FAILURE_MESSAGE,
+} from "../tools/network/web-search-error.js";
 import {
   buildPricingUsage,
   resolveStructuredPricing,
@@ -87,45 +96,36 @@ import type {
 } from "./message-protocol.js";
 import { conversationMetadataSyncTag } from "./message-types/sync.js";
 import type {
+  ToolActivityMetadata,
   WebSearchMetadata,
   WebSearchResultItem,
 } from "./message-types/web-activity.js";
-import { FALLBACK_TURN_TRUST } from "./trust-context.js";
 const log = getLogger("agent-loop-handlers");
+/**
+ * Persist the history-stripped marker after the loop strips runtime injections
+ * for compaction / overflow recovery. The marker is a durability hint, not
+ * turn-critical state — a transient SQLite write failure (SQLITE_BUSY,
+ * disk-full, read-only FS) must not abort the turn, so failures log a warning
+ * and continue.
+ */
+export function markHistoryStrippedBestEffort(conversationId: string): void {
+  try {
+    setConversationHistoryStrippedAt(conversationId, Date.now());
+  } catch (err) {
+    log.warn(
+      { err, conversationId },
+      "Failed to persist history-stripped marker after compaction strip (non-fatal)",
+    );
+  }
+}
 // ── Partial-persistence tunables ─────────────────────────────────────
 // Debounce for mid-turn `updateContent` writes from text deltas.
 // Indexer + projector still fire ONLY at `handleMessageComplete`.
 const PARTIAL_PERSIST_DEBOUNCE_MS = 1000;
-/**
- * Build a {@link TurnContext} from the handler's deps for pipeline logging
- * and plugin attribution.
- *
- * Reads `turnIndex` from `deps.ctx.turnCount` — the orchestrator-owned
- * per-turn counter that is stable for the entire duration of a single
- * `runAgentLoopImpl` invocation. The handlers fire after the orchestrator
- * has completed its in-turn pipeline work but before `ctx.turnCount++` runs
- * in the outer `finally` block, so this value always reflects the turn the
- * handler's event belongs to. Trust pulls from the per-turn snapshot first,
- * then the conversation-level context, then the canonical `unknown`
- * fallback so the required field stays populated for edge cases (fresh
- * conversations before the trust resolver runs, heartbeat turns that never
- * bind an actor).
- */
-function buildHandlerTurnContext(deps: EventHandlerDeps): TurnContext {
-  return {
-    requestId: deps.reqId,
-    conversationId: deps.ctx.conversationId,
-    turnIndex: deps.ctx.turnCount,
-    trust:
-      deps.ctx.currentTurnTrustContext ??
-      deps.ctx.trustContext ??
-      FALLBACK_TURN_TRUST,
-  };
-}
 // ── Types ────────────────────────────────────────────────────────────
 export interface PendingToolResult {
@@ -137,6 +137,16 @@ export interface PendingToolResult {
 /** Mutable state shared across event handlers within a single agent loop run. */
 export interface EventHandlerState {
   llmCallStartedEmitted: boolean;
+  /**
+   * Profile key whose `model_profile` notice has been assembled into the turn
+   * context but not yet marked notified. Set when the turn injects the notice,
+   * and consumed the first time the model actually receives that context — i.e.
+   * on the first `message_complete`. Persisting on delivery (rather than inline
+   * before the provider call) means a cancelled or failed turn re-sends the
+   * notice next turn instead of silently marking the profile notified without
+   * the model ever having seen it.
+   */
+  pendingNotifiedInferenceProfile: string | null;
   pendingDirectiveDisplayBuffer: string;
   firstAssistantText: string;
   /** Most recent resolved provider for the current exchange's usage accounting. */
@@ -186,6 +196,15 @@ export interface EventHandlerState {
    */
   assistantRowAwaitingFinalization: boolean;
   readonly pendingToolResults: Map<string, PendingToolResult>;
+  /**
+   * Reservation of the grouped `user` tool-result row for the current batch,
+   * resolving to the row id. Shared across the concurrent `handleToolResult`
+   * calls of one parallel-tool batch so they reserve exactly one row and write
+   * into it as sibling results land. `undefined` until the first result of a
+   * batch triggers a reservation (reset on a failed reservation so the next
+   * arrival can retry) and again after the batch is finalized.
+   */
+  pendingToolResultRowReservation: Promise<string> | undefined;
   readonly persistedToolUseIds: Set<string>;
   readonly accumulatedDirectives: DirectiveRequest[];
   readonly accumulatedToolContentBlocks: ContentBlock[];
@@ -238,6 +257,13 @@ export interface EventHandlerState {
       riskDirectoryScopeOptions?: Array<{ scope: string; label: string }>;
     }
   >;
+  /**
+   * Structured tool activity (web_search / web_fetch) keyed by tool_use_id,
+   * captured when a result lands so it can be persisted on the tool's content
+   * block and survive a history reopen. Populated for both external provider
+   * tools (in handleToolResult) and native server tools (server_tool_complete).
+   */
+  readonly toolActivityMetadata: Map<string, ToolActivityMetadata>;
   /** tool_use_ids emitted in the current turn (populated in handleToolUse, cleared after annotation). */
   currentTurnToolUseIds: string[];
   /** Wall-clock time (ms since epoch) when the agent loop turn started, used as the display timestamp for assistant messages. */
@@ -246,12 +272,47 @@ export interface EventHandlerState {
   readonly serverToolStartedAt: Map<string, number>;
   /** Original input from server_tool_start, keyed by tool_use_id, so the complete handler can read the query. */
   readonly serverToolInputs: Map<string, Record<string, unknown>>;
+  /** Request ids for which a user-facing web_search backend-failure notice was already surfaced this turn (dedup noisy repeats). Keyed by request id; each turn has a fresh request id, so this grows at most one entry per turn. */
+  readonly webSearchBackendFailureNotified: Set<string>;
   /** Active debounce timer for partial persistence; `undefined` when idle. */
   pendingPartialFlushTimer: ReturnType<typeof setTimeout> | undefined;
   /** In-flight partial flush write awaited at finalize to avoid overwrite races. */
   pendingPartialFlushPromise: Promise<void> | undefined;
-  /** Running mirror of the in-flight assistant message's content. */
+  /**
+   * Running mirror of the in-flight assistant message's streamed content
+   * (text and thinking), flushed to the assistant row on the partial-persist
+   * debounce so a mid-turn snapshot reflects what the user is watching live.
+   */
   currentMessageContent: ContentBlock[];
+  /**
+   * `seq` of the most recent streamed content delta mirrored into
+   * `currentMessageContent`. Recorded as the conversation's persisted `seq`
+   * after each flush commits (the debounced partial flushes and the
+   * `message_complete` finalize), so the snapshot's advertised `seq` tracks
+   * exactly the streamed content the durable row holds. `undefined` until the
+   * first content delta of the in-flight message. Because every streamed
+   * content type rides the same mirror-and-flush path, this single field
+   * never claims content a flush has not yet written.
+   */
+  lastPersistedContentSeq: number | undefined;
+  /**
+   * Whether the workspace top-level block should be (re)injected on this
+   * turn. Compaction's prepare phase strips the workspace / NOW.md / PKB
+   * blocks off the tail, so it is set after any successful compaction to
+   * force the workspace overview back in. On an ordinary turn the block is
+   * already present in history, so it defaults `false` to avoid burning
+   * tokens re-injecting it redundantly.
+   */
+  shouldInjectWorkspace: boolean;
+  /**
+   * Whether the reducer has compacted `ctx.messages`, gating the Slack
+   * chronological-transcript override on re-injection. The captured
+   * transcript is the full persisted history; blindly replaying it after
+   * compaction would overwrite the reduced messages and undo compaction, so
+   * once this is `true` the override falls back to the reduced
+   * `ctx.messages`.
+   */
+  reducerCompacted: boolean;
 }
 /** Immutable context shared across event handlers within a single agent loop run. */
@@ -265,6 +326,18 @@ export interface EventHandlerDeps {
   readonly rlog: pino.Logger;
   readonly turnChannelContext: TurnChannelContext;
   readonly turnInterfaceContext: TurnInterfaceContext;
+  /**
+   * Commit a successful inline compaction to durable state. Invoked from the
+   * `compaction_completed` dispatch case (when `result.compacted`) with the
+   * loop's compaction result and the stripped pre-compaction `basis`. Supplied
+   * by the orchestrator because the body writes Conversation DB-record fields,
+   * projects Slack provenance, and emits transport (SSE) events the loop is
+   * intentionally blind to.
+   */
+  readonly applyCompaction: (
+    result: ContextWindowResult,
+    basis: Message[],
+  ) => Promise<void>;
 }
 // ── Factory ──────────────────────────────────────────────────────────
@@ -272,6 +345,7 @@ export interface EventHandlerDeps {
 export function createEventHandlerState(): EventHandlerState {
   return {
     llmCallStartedEmitted: false,
+    pendingNotifiedInferenceProfile: null,
     pendingDirectiveDisplayBuffer: "",
     firstAssistantText: "",
     exchangeProviderName: undefined,
@@ -292,6 +366,7 @@ export function createEventHandlerState(): EventHandlerState {
     lastAssistantMessageId: undefined,
     assistantRowAwaitingFinalization: false,
     pendingToolResults: new Map(),
+    pendingToolResultRowReservation: undefined,
     persistedToolUseIds: new Set(),
     accumulatedDirectives: [],
     accumulatedToolContentBlocks: [],
@@ -307,22 +382,28 @@ export function createEventHandlerState(): EventHandlerState {
     requestIdToToolUseId: new Map(),
     toolConfirmationOutcomes: new Map(),
     toolRiskOutcomes: new Map(),
+    toolActivityMetadata: new Map(),
     currentTurnToolUseIds: [],
     turnStartedAt: Date.now(),
     serverToolStartedAt: new Map(),
     serverToolInputs: new Map(),
+    webSearchBackendFailureNotified: new Set(),
     pendingPartialFlushTimer: undefined,
     pendingPartialFlushPromise: undefined,
     currentMessageContent: [],
+    lastPersistedContentSeq: undefined,
+    shouldInjectWorkspace: false,
+    reducerCompacted: false,
   };
 }
 // ── Partial-persistence helpers ──────────────────────────────────────
 /** Canonical persisted-content build: clean → append surfaces → redact. */
-function buildPersistedAssistantContent(
+export function buildPersistedAssistantContent(
   rawBlocks: readonly ContentBlock[],
   surfaces: readonly AssistantSurface[],
+  activityByToolUseId?: ReadonlyMap<string, ToolActivityMetadata>,
 ): ContentBlock[] {
   const { cleanedContent } = cleanAssistantContent(rawBlocks);
   const cleaned = cleanedContent as ContentBlock[];
@@ -345,6 +426,18 @@ function buildPersistedAssistantContent(
       const tb = block as Extract<ContentBlock, { type: "text" }>;
       return { ...tb, text: redactSecrets(tb.text) };
     }
+    // Native server tools (Anthropic web_search) resolve mid-stream — their
+    // `server_tool_complete` fires before `message_complete` — so the captured
+    // activity is available at persist time. Stamp it on the server_tool_use
+    // block here so the web-search card survives a history reopen. External
+    // tool_use activity arrives only with the later tool_result, so it is
+    // stamped in `annotatePersistedAssistantMessage` instead.
+    if (block.type === "server_tool_use" && activityByToolUseId) {
+      const activity = activityByToolUseId.get(block.id);
+      if (activity) {
+        return { ...block, _activityMetadata: activity } as ContentBlock;
+      }
+    }
     return block;
   });
 }
@@ -363,6 +456,30 @@ function appendTextToCurrentMessage(
   }
 }
+/**
+ * Append a streamed thinking chunk to `state.currentMessageContent`, fusing
+ * into the tail thinking block. The streamed delta carries no provider
+ * `signature` (that arrives only when the block closes), so the mirrored block
+ * holds an empty one; `message_complete` overwrites the row with the
+ * authoritative signed content before it is ever sent back to a provider.
+ */
+function appendThinkingToCurrentMessage(
+  state: EventHandlerState,
+  thinking: string,
+): void {
+  if (thinking.length === 0) return;
+  const tail = state.currentMessageContent.at(-1);
+  if (tail && tail.type === "thinking") {
+    tail.thinking = tail.thinking + thinking;
+  } else {
+    state.currentMessageContent.push({
+      type: "thinking",
+      thinking,
+      signature: "",
+    });
+  }
+}
 /** Reset partial-persist accumulator and any pending flush state. Idempotent. */
 function resetPartialPersistAccumulator(state: EventHandlerState): void {
   if (state.pendingPartialFlushTimer !== undefined) {
@@ -370,10 +487,11 @@ function resetPartialPersistAccumulator(state: EventHandlerState): void {
     state.pendingPartialFlushTimer = undefined;
   }
   state.currentMessageContent = [];
+  state.lastPersistedContentSeq = undefined;
   state.pendingPartialFlushPromise = undefined;
 }
-/** Flush `state.currentMessageContent` to the row via the persistence pipeline. */
+/** Flush `state.currentMessageContent` to the persisted assistant row. */
 async function flushAccumulatedContent(
   state: EventHandlerState,
   deps: EventHandlerDeps,
@@ -382,22 +500,24 @@ async function flushAccumulatedContent(
   if (messageId === undefined) return;
   if (state.currentMessageContent.length === 0) return;
-  const built = buildPersistedAssistantContent(state.currentMessageContent, []);
+  const built = buildPersistedAssistantContent(
+    state.currentMessageContent,
+    [],
+    state.toolActivityMetadata,
+  );
   const contentJson = JSON.stringify(built);
+  // Pair the seq with the exact content snapshot taken above: deltas that
+  // arrive while the write is in flight bump `lastPersistedContentSeq`
+  // again, but they are not part of this write.
+  const flushedSeq = state.lastPersistedContentSeq;
   try {
-    await runPipeline<PersistArgs, PersistResult>(
-      "persistence",
-      getMiddlewaresFor("persistence"),
-      defaultPersistenceTerminal,
-      {
-        op: "updateContent",
-        messageId,
-        content: contentJson,
-      },
-      buildHandlerTurnContext(deps),
-      DEFAULT_TIMEOUTS.persistence,
-    );
+    updateMessageContent(messageId, contentJson);
+    // Record only after the write commits, so the snapshot seq never
+    // claims content that is not yet durable.
+    if (flushedSeq != null) {
+      recordPersistedSeq(deps.ctx.conversationId, flushedSeq);
+    }
   } catch (err) {
     deps.rlog.warn(
       { err, messageId },
@@ -633,12 +753,6 @@ export async function handleLlmCallStarted(
   // the `assistantRowAwaitingFinalization` flag — `handleMessageComplete`
   // clears it after the successful `updateMessageContent`, so the previous
   // call's committed row is never touched here.
-  //
-  // Direct `deleteMessageById` (not via the `persistence` pipeline) is
-  // intentional: a never-finalized reservation has no segments, no
-  // attachments, and no observable history — undoing it isn't a real
-  // persistence event for plugins to react to, so routing through the
-  // pipeline would only widen the mock surface for no observability win.
   if (state.assistantRowAwaitingFinalization && state.lastAssistantMessageId) {
     try {
       deleteMessageById(state.lastAssistantMessageId);
@@ -652,20 +766,12 @@ export async function handleLlmCallStarted(
   }
   const metadata = buildAssistantChannelMetadata(state, deps);
-  const reserveResult = (await runPipeline<PersistArgs, PersistResult>(
-    "persistence",
-    getMiddlewaresFor("persistence"),
-    defaultPersistenceTerminal,
-    {
-      op: "reserve",
-      conversationId: deps.ctx.conversationId,
-      role: "assistant",
-      metadata,
-    },
-    buildHandlerTurnContext(deps),
-    DEFAULT_TIMEOUTS.persistence,
-  )) as PersistReserveResult;
-  state.lastAssistantMessageId = reserveResult.message.id;
+  const reservedRow = await reserveMessage(
+    deps.ctx.conversationId,
+    "assistant",
+    metadata,
+  );
+  state.lastAssistantMessageId = reservedRow.id;
   state.assistantRowAwaitingFinalization = true;
   // Fresh row → fresh accumulator. If an earlier (failed) LLM call
   // within the same run left partial state behind, the
@@ -675,7 +781,7 @@ export async function handleLlmCallStarted(
   resetPartialPersistAccumulator(state);
   deps.onEvent({
     type: "assistant_turn_start",
-    messageId: reserveResult.message.id,
+    messageId: reservedRow.id,
     conversationId: deps.ctx.conversationId,
   });
 }
@@ -711,6 +817,11 @@ function handleTextDelta(
     // Mirror the drained delta into state.currentMessageContent so partial
     // flushes mid-turn see the same content the user is watching live.
     appendTextToCurrentMessage(state, drained.emitText);
+    // The hub stamps `seq` synchronously on the delta emitted above, so
+    // `getCurrentSeq()` here is that delta's seq -- the position the
+    // mirrored content now reflects. A partial flush snapshots this to
+    // record how far the durable rows track the live stream.
+    state.lastPersistedContentSeq = getCurrentSeq();
     schedulePartialFlush(state, deps);
   }
 }
@@ -746,6 +857,14 @@ function handleThinkingDelta(
     conversationId: deps.ctx.conversationId,
     messageId: state.lastAssistantMessageId,
   });
+  // Mirror thinking into the same running view as text so the debounced
+  // partial flush persists it mid-turn -- long reasoning streams survive a
+  // refresh that outlives the SSE replay window, exactly as long answers do.
+  appendThinkingToCurrentMessage(state, event.thinking);
+  // The hub stamps `seq` synchronously on the delta emitted above, so
+  // `getCurrentSeq()` is that delta's position in the mirrored content.
+  state.lastPersistedContentSeq = getCurrentSeq();
+  schedulePartialFlush(state, deps);
 }
 export function handleToolUse(
@@ -773,6 +892,14 @@ export function handleToolUse(
     toolUseId: event.id,
     messageId: state.lastAssistantMessageId,
   });
+  // `message_complete` always precedes tool events (see handleMessageComplete),
+  // so this tool_use block is already durable in the assistant row. The
+  // `tool_use_start` emitted just above is therefore the newest stamped event
+  // whose content the `/messages` snapshot already reflects -- advance the
+  // persisted seq to it. Without this the snapshot would advertise a seq below
+  // an event it already incorporates, and a client applying `seq > snapshot.seq`
+  // would replay this tool start.
+  recordPersistedSeq(deps.ctx.conversationId, getCurrentSeq());
 }
 export function handleToolUsePreviewStart(
@@ -890,11 +1017,244 @@ export function handleInputJsonDelta(
   });
 }
-export function handleToolResult(
+/**
+ * Build the persisted `tool_result` content blocks for the buffered results,
+ * redacting secrets from both the flat content and any structured blocks. All
+ * results of one assistant turn share a single `user` row (the shape providers
+ * expect for tool_result-in-user-turn).
+ */
+function buildToolResultBlocks(
+  pending: ReadonlyMap<string, PendingToolResult>,
+) {
+  return Array.from(pending.entries()).map(([toolUseId, result]) => ({
+    type: "tool_result",
+    tool_use_id: toolUseId,
+    content: redactSecrets(result.content),
+    is_error: result.isError,
+    ...(result.contentBlocks
+      ? {
+          contentBlocks: result.contentBlocks.map((block) =>
+            block.type === "text"
+              ? { ...block, text: redactSecrets(block.text) }
+              : block,
+          ),
+        }
+      : {}),
+  }));
+}
+/**
+ * Channel/interface provenance metadata for the grouped tool-result row,
+ * stamped from the turn context so the row carries the same provenance the
+ * snapshot reflects from the moment it lands in SQLite.
+ */
+function buildToolResultMetadata(
+  deps: EventHandlerDeps,
+): Record<string, unknown> {
+  return {
+    ...provenanceFromTrustContext(deps.ctx.trustContext),
+    userMessageChannel: deps.turnChannelContext.userMessageChannel,
+    assistantMessageChannel: deps.turnChannelContext.assistantMessageChannel,
+    userMessageInterface: deps.turnInterfaceContext.userMessageInterface,
+    assistantMessageInterface:
+      deps.turnInterfaceContext.assistantMessageInterface,
+  };
+}
+/**
+ * Reserve the grouped `user` tool-result row for the current batch exactly
+ * once. Parallel tool results are dispatched without awaiting (`agent/loop.ts`
+ * emits each `tool_result` synchronously), so concurrent `handleToolResult`
+ * calls can reach this before the first reservation resolves; sharing one
+ * in-flight reservation promise keeps the whole batch in a single row. A
+ * failed reservation resets the promise so the next caller can retry rather
+ * than inheriting a settled rejection.
+ */
+function ensureToolResultRowReserved(
+  state: EventHandlerState,
+  conversationId: string,
+  metadata: Record<string, unknown>,
+): Promise<string> {
+  if (state.pendingToolResultRowReservation === undefined) {
+    state.pendingToolResultRowReservation = reserveMessage(
+      conversationId,
+      "user",
+      metadata,
+    )
+      .then((reserved) => reserved.id)
+      .catch((err) => {
+        state.pendingToolResultRowReservation = undefined;
+        throw err;
+      });
+  }
+  return state.pendingToolResultRowReservation;
+}
+/**
+ * Persist the buffered tool results into their grouped `user` row as each
+ * result arrives, so a long-running tool's output survives a refresh that
+ * outlives the SSE replay window. The row is reserved once per batch and
+ * rewritten in place as sibling parallel results land, keeping all
+ * `tool_result` blocks of one turn in a single message. `seq` is the position
+ * stamped on the triggering `tool_result` event, captured by the caller before
+ * any await so it reflects exactly the content now durable in the row.
+ * Indexing and the buffer drain are deferred to `finalizePendingToolResultRow`.
+ */
+async function persistPendingToolResultRow(
+  state: EventHandlerState,
+  deps: EventHandlerDeps,
+  seq: number,
+): Promise<void> {
+  if (state.pendingToolResults.size === 0) return;
+  const rowId = await ensureToolResultRowReserved(
+    state,
+    deps.ctx.conversationId,
+    buildToolResultMetadata(deps),
+  );
+  // Serialize the content after the reservation resolves so the last of the
+  // concurrent writers reflects the fullest batch.
+  updateMessageContent(
+    rowId,
+    JSON.stringify(buildToolResultBlocks(state.pendingToolResults)),
+  );
+  recordPersistedSeq(deps.ctx.conversationId, seq);
+  const conv = getConversation(deps.ctx.conversationId);
+  if (conv != null) {
+    syncMessageToDisk(deps.ctx.conversationId, rowId, conv.createdAt);
+  }
+}
+/**
+ * Finalize the grouped tool-result row at a turn/loop boundary: ensure the row
+ * is reserved (a fallback for the case where every on-arrival write failed),
+ * rewrite it to the full batch, sync it to disk, index it for memory recall,
+ * and clear the batch state. Shared by `message_complete` and the orchestrator
+ * loop-exit flush so an aborted or yielded turn finalizes the same reserved row
+ * instead of writing a duplicate.
+ */
+export async function finalizePendingToolResultRow(
+  state: EventHandlerState,
+  conversationId: string,
+  metadata: Record<string, unknown>,
+  rlog: pino.Logger,
+): Promise<void> {
+  if (state.pendingToolResults.size === 0) return;
+  const rowId = await ensureToolResultRowReserved(
+    state,
+    conversationId,
+    metadata,
+  );
+  const contentJson = JSON.stringify(
+    buildToolResultBlocks(state.pendingToolResults),
+  );
+  updateMessageContent(rowId, contentJson);
+  // Sync the row to the JSONL disk view so it stays in lockstep with the DB.
+  // `getConversation` returns `ConversationRow | null`, so `!= null` gates on a
+  // real row (skipping the sync when the conversation was not found rather than
+  // asking the disk-view to resolve a missing id).
+  const conv = getConversation(conversationId);
+  if (conv != null) {
+    syncMessageToDisk(conversationId, rowId, conv.createdAt);
+  }
+  // `reserveMessage` + `updateMessageContent` are CRUD-only, so index the
+  // finalized tool-result content explicitly here (mirroring the assistant-row
+  // finalize) once it is durable. Non-fatal: a memory hiccup must not escalate
+  // a successful turn into a throw.
+  const row = getMessageById(rowId, conversationId);
+  if (row) {
+    let provenanceTrustClass:
+      | "guardian"
+      | "trusted_contact"
+      | "unknown"
+      | undefined;
+    let automated: boolean | undefined;
+    if (row.metadata) {
+      try {
+        const parsedMeta = messageMetadataSchema.safeParse(
+          JSON.parse(row.metadata),
+        );
+        if (parsedMeta.success) {
+          provenanceTrustClass = parsedMeta.data.provenanceTrustClass;
+          automated = parsedMeta.data.automated;
+        }
+      } catch {
+        // Malformed metadata JSON — index with undefined provenance fields.
+      }
+    }
+    try {
+      await indexMessageNow(
+        {
+          messageId: rowId,
+          conversationId,
+          role: "user",
+          content: contentJson,
+          createdAt: row.createdAt,
+          scopeId: "default",
+          provenanceTrustClass,
+          automated,
+        },
+        getConfig().memory,
+      );
+    } catch (err) {
+      rlog.warn(
+        { err, conversationId, messageId: rowId },
+        "Failed to index tool-result message for memory (non-fatal)",
+      );
+    }
+  }
+  for (const id of state.pendingToolResults.keys()) {
+    state.persistedToolUseIds.add(id);
+  }
+  state.pendingToolResults.clear();
+  state.pendingToolResultRowReservation = undefined;
+}
+export async function handleToolResult(
   state: EventHandlerState,
   deps: EventHandlerDeps,
   event: Extract<AgentEvent, { type: "tool_result" }>,
-): void {
+): Promise<void> {
+  // A synthesized cancellation (the tool never executed) is captured for
+  // persistence and forwarded to the client like any result, but skips every
+  // side effect that assumes the tool ran. A real result already captured or
+  // persisted for the same tool wins, so only fill genuine gaps.
+  if (event.cancelled) {
+    if (
+      state.pendingToolResults.has(event.toolUseId) ||
+      state.persistedToolUseIds.has(event.toolUseId)
+    ) {
+      return;
+    }
+    state.pendingToolResults.set(event.toolUseId, {
+      content: event.content,
+      isError: event.isError,
+    });
+    state.currentToolUseId = undefined;
+    deps.onEvent({
+      type: "tool_result",
+      toolName: "",
+      result: event.content,
+      isError: event.isError,
+      conversationId: deps.ctx.conversationId,
+      messageId: state.lastAssistantMessageId,
+      toolUseId: event.toolUseId,
+    });
+    // Capture the seq synchronously (before the persist await) so it reflects
+    // the just-stamped tool_result event, then persist on arrival. A failure
+    // here is non-fatal: the buffered result is still drained at
+    // `message_complete`.
+    const cancelledSeq = getCurrentSeq();
+    try {
+      await persistPendingToolResultRow(state, deps, cancelledSeq);
+    } catch (err) {
+      log.warn(
+        { err, conversationId: deps.ctx.conversationId },
+        "Failed to persist cancelled tool result on arrival (non-fatal; retried at message_complete)",
+      );
+    }
+    return;
+  }
   const imageBlocks = event.contentBlocks?.filter(
     (b): b is ImageContent => b.type === "image",
   );
@@ -945,6 +1305,13 @@ export function handleToolResult(
     });
   }
+  // Capture tool activity (web_search / web_fetch) so it can be persisted on
+  // the tool_use block and the activity card survives a history reopen,
+  // matching the live tool_result event's activityMetadata.
+  if (event.activityMetadata) {
+    state.toolActivityMetadata.set(event.toolUseId, event.activityMetadata);
+  }
   const toolName = state.toolUseIdToName.get(event.toolUseId);
   if (toolName === "file_write" || toolName === "bash") {
     deps.ctx.markWorkspaceTopLevelDirty();
@@ -1026,6 +1393,20 @@ export function handleToolResult(
     riskThreshold: event.riskThreshold,
     activityMetadata: event.activityMetadata,
   });
+  // Capture the seq synchronously (before the persist await) so it reflects the
+  // just-stamped tool_result event, then persist the grouped row on arrival. A
+  // failure here is non-fatal: the buffered result is still drained at
+  // `message_complete`.
+  const resultSeq = getCurrentSeq();
+  try {
+    await persistPendingToolResultRow(state, deps, resultSeq);
+  } catch (err) {
+    log.warn(
+      { err, conversationId: deps.ctx.conversationId },
+      "Failed to persist tool result on arrival (non-fatal; retried at message_complete)",
+    );
+  }
 }
 /**
@@ -1097,6 +1478,16 @@ function annotatePersistedAssistantMessage(
           rec._riskDirectoryScopeOptions = risk.riskDirectoryScopeOptions;
         modified = true;
       }
+      // External provider tools (brave/perplexity/tavily) + web_fetch produce
+      // their activity only when the tool_result lands, after message_complete
+      // has already persisted this block — so it is stamped here. Native
+      // server_tool_use activity is stamped earlier, at persist time, in
+      // `buildPersistedAssistantContent`.
+      const activity = state.toolActivityMetadata.get(id);
+      if (activity) {
+        rec._activityMetadata = activity;
+        modified = true;
+      }
     }
   }
@@ -1259,6 +1650,18 @@ export async function handleMessageComplete(
   deps: EventHandlerDeps,
   event: Extract<AgentEvent, { type: "message_complete" }>,
 ): Promise<void> {
+  // The model has now received the turn context, so persist any pending
+  // inference-profile-change notification. Guarded by the pending slot so it
+  // fires once per turn; a turn that fails before reaching delivery leaves the
+  // slot unconsumed and re-sends the notice next turn.
+  if (state.pendingNotifiedInferenceProfile != null) {
+    setLastNotifiedInferenceProfile(
+      deps.ctx.conversationId,
+      state.pendingNotifiedInferenceProfile,
+    );
+    state.pendingNotifiedInferenceProfile = null;
+  }
   // Reset per-turn tool tracking for the new turn.
   state.currentTurnToolUseIds = [];
@@ -1298,62 +1701,16 @@ export async function handleMessageComplete(
     state.pendingDirectiveDisplayBuffer = "";
   }
-  // Persist pending tool results
-  if (state.pendingToolResults.size > 0) {
-    const toolResultBlocks = Array.from(state.pendingToolResults.entries()).map(
-      ([toolUseId, result]) => ({
-        type: "tool_result",
-        tool_use_id: toolUseId,
-        content: redactSecrets(result.content),
-        is_error: result.isError,
-        ...(result.contentBlocks
-          ? {
-              contentBlocks: result.contentBlocks.map((block) =>
-                block.type === "text"
-                  ? { ...block, text: redactSecrets(block.text) }
-                  : block,
-              ),
-            }
-          : {}),
-      }),
-    );
-    const toolResultMetadata = {
-      ...provenanceFromTrustContext(deps.ctx.trustContext),
-      userMessageChannel: deps.turnChannelContext.userMessageChannel,
-      assistantMessageChannel: deps.turnChannelContext.assistantMessageChannel,
-      userMessageInterface: deps.turnInterfaceContext.userMessageInterface,
-      assistantMessageInterface:
-        deps.turnInterfaceContext.assistantMessageInterface,
-    };
-    // Route the add + disk-view sync through the `persistence` pipeline so
-    // plugins can observe or override both operations together. The default
-    // plugin's terminal performs the add and, when `syncToDisk` is true,
-    // immediately calls `syncMessageToDisk` against the just-persisted row.
-    // `getConversation` returns `ConversationRow | null`, so `!= null`
-    // gates on a real row (skipping the sync when the conversation was
-    // not found rather than asking the disk-view to resolve a missing id).
-    const convForToolResult = getConversation(deps.ctx.conversationId);
-    await runPipeline<PersistArgs, PersistResult>(
-      "persistence",
-      getMiddlewaresFor("persistence"),
-      defaultPersistenceTerminal,
-      {
-        op: "add",
-        conversationId: deps.ctx.conversationId,
-        role: "user",
-        content: JSON.stringify(toolResultBlocks),
-        metadata: toolResultMetadata,
-        syncToDisk: convForToolResult != null,
-        createdAtMs: convForToolResult?.createdAt,
-      },
-      buildHandlerTurnContext(deps),
-      DEFAULT_TIMEOUTS.persistence,
-    );
-    for (const id of state.pendingToolResults.keys()) {
-      state.persistedToolUseIds.add(id);
-    }
-    state.pendingToolResults.clear();
-  }
+  // Finalize the grouped tool-result row. Each result was persisted into this
+  // row as it arrived (`persistPendingToolResultRow`); this rewrites it to the
+  // full batch (covering the case where a mid-arrival write failed), indexes it
+  // for memory recall, and clears the batch state.
+  await finalizePendingToolResultRow(
+    state,
+    deps.ctx.conversationId,
+    buildToolResultMetadata(deps),
+    deps.rlog,
+  );
   // Accumulate directives + warnings from the assistant content for
   // downstream attachment processing. `cleanAssistantContent` is also
@@ -1391,6 +1748,7 @@ export async function handleMessageComplete(
   const contentForPersistence = buildPersistedAssistantContent(
     event.message.content as ContentBlock[],
     deps.ctx.currentTurnSurfaces,
+    state.toolActivityMetadata,
   );
   // The row was reserved at `llm_call_started` (with channel metadata
@@ -1407,28 +1765,30 @@ export async function handleMessageComplete(
     );
   }
   const contentJson = JSON.stringify(contentForPersistence);
-  await runPipeline<PersistArgs, PersistResult>(
-    "persistence",
-    getMiddlewaresFor("persistence"),
-    defaultPersistenceTerminal,
-    {
-      op: "updateContent",
-      messageId: assistantMessageId,
-      content: contentJson,
-    },
-    buildHandlerTurnContext(deps),
-    DEFAULT_TIMEOUTS.persistence,
-  );
+  updateMessageContent(assistantMessageId, contentJson);
   state.assistantRowAwaitingFinalization = false;
+  // The assistant row now holds the authoritative content (text + thinking +
+  // tool_use blocks from `event.message`), and any drained tool-result rows
+  // are durable. `lastPersistedContentSeq` is the last streamed text/thinking
+  // delta's seq -- the highest stamped content event this row reflects -- so
+  // recording it is honest. A drained tool result was stamped earlier in the
+  // turn, so this seq already covers it; a call that streams no content (a
+  // pure tool call) advances instead via `tool_use_start`. `recordPersistedSeq`
+  // clamps monotonically, so a lower value here never regresses the seq.
+  if (state.lastPersistedContentSeq != null) {
+    recordPersistedSeq(deps.ctx.conversationId, state.lastPersistedContentSeq);
+  }
   // Reset the partial-persist mirror so subsequent calls in this turn
   // start with an empty running view.
   state.currentMessageContent = [];
+  state.lastPersistedContentSeq = undefined;
-  // ── Indexing + attention projection (restored from the pre-B3 `add` path) ──
+  // ── Indexing + attention projection ──
   // `reserveMessage` + `updateMessageContent` are CRUD-only: they don't run
-  // the memory indexer or the attention-cursor projector. The pre-B3 path
-  // wrote the row via `addMessage`, which ran both as side-effects of the
-  // insert. Calling them here keeps the assistant row's external state
+  // the memory indexer or the attention-cursor projector (unlike `addMessage`,
+  // which runs both as side-effects of the insert). Because the assistant row
+  // is reserved empty and finalized via `updateMessageContent`, both must be
+  // invoked explicitly here to keep the assistant row's external state
   // (Qdrant segments, conversation attention cursor) in lockstep with the
   // finalized content. Both are non-fatal — a memory hiccup must not
   // escalate a successful generation into a turn-level throw. Indexing
@@ -1759,7 +2119,7 @@ export async function dispatchAgentEvent(
         handleInputJsonDelta(state, deps, event);
         break;
       case "tool_result":
-        handleToolResult(state, deps, event);
+        await handleToolResult(state, deps, event);
         break;
       case "server_tool_start": {
         const query =
@@ -1828,9 +2188,65 @@ export async function dispatchAgentEvent(
         // for them would mis-label the provider and ship empty results.
         const isAnthropicNative = deps.ctx.provider.name === "anthropic";
-        const errorMessage = event.isError
-          ? (event.errorMessage ?? event.errorCode ?? "Search failed")
-          : undefined;
+        // Classify provider failures through the shared normalizer so the same
+        // friendly copy propagates to every client via WebSearchMetadata, while
+        // the raw provider detail stays in telemetry only (ATL-727).
+        const classification = classifyWebSearchFailure({
+          errorCode: event.errorCode,
+          error: event.errorMessage,
+          isError: event.isError,
+          hasResults: results.length > 0,
+        });
+        let errorMessage: string | undefined;
+        let fallbackShown = false;
+        if (event.isError) {
+          // A genuine backend failure OR an unclassifiable, message-less native
+          // failure (e.g. `isError:true` with no `error_code`) both surface the
+          // friendly backend copy: a terse "Search failed" placeholder is the
+          // confusing copy this normalization exists to eliminate (ATL-727).
+          // Recoverable categories that carry a real user message
+          // (query_too_long, max_uses_exceeded) keep their own copy.
+          const useBackendCopy =
+            classification.isBackendFailure || !classification.userMessage;
+          if (useBackendCopy) {
+            // Dedup the user-facing friendly notice per turn (request id) so a
+            // burst of failures surfaces at most one full notice. The raw
+            // provider error is preserved on every failure via telemetry below.
+            const alreadyNotified = state.webSearchBackendFailureNotified.has(
+              deps.reqId,
+            );
+            if (alreadyNotified) {
+              errorMessage = "Search is still having trouble.";
+            } else {
+              state.webSearchBackendFailureNotified.add(deps.reqId);
+              errorMessage = WEB_SEARCH_BACKEND_FAILURE_MESSAGE;
+              fallbackShown = true;
+            }
+            // Backend-failure telemetry (provider outages / rate limits) must
+            // fire only for genuine backend classifications so it does not
+            // count recoverable input/quota errors — or a message-less unknown
+            // failure that merely borrows the friendly copy — as provider
+            // outages.
+            if (classification.isBackendFailure) {
+              logWebSearchBackendFailure(deps.rlog, {
+                provider: isAnthropicNative
+                  ? "anthropic-native"
+                  : deps.ctx.provider.name,
+                requestId: deps.reqId,
+                errorCategory: classification.category,
+                rawDetail: classification.rawDetail,
+                fallbackShown,
+                queryLength: query.length,
+              });
+            }
+          } else {
+            // Recoverable, non-backend categories with their own user-facing
+            // copy (query_too_long, max_uses_exceeded) keep that message.
+            errorMessage = classification.userMessage;
+          }
+        }
         const metadata: WebSearchMetadata | undefined = isAnthropicNative
           ? {
@@ -1847,6 +2263,14 @@ export async function dispatchAgentEvent(
           .map((r) => `${r.title}\n${r.url}`)
           .join("\n\n");
+        // Capture activity so it persists on the server_tool_use block and the
+        // web-search card survives a history reopen, matching the live event.
+        if (metadata) {
+          state.toolActivityMetadata.set(event.toolUseId, {
+            webSearch: metadata,
+          });
+        }
         deps.onEvent({
           type: "tool_result",
           toolName: "web_search",
@@ -1873,6 +2297,31 @@ export async function dispatchAgentEvent(
         // banner.
         deps.onEvent(event);
         break;
+      case "compaction_completed":
+        // Always commit the loop-stripped `basis` as the durable message base
+        // so re-injection re-applies onto the stripped history even when the
+        // pipeline ran but did not compact. When it did compact, commit the
+        // durable result (DB-record fields, Slack provenance, SSE) — which
+        // overwrites `ctx.messages` with the compacted history — and flip the
+        // per-turn re-injection guards the orchestrator reads. This runs
+        // before the loop's `reinject` hook (the loop awaits this dispatch),
+        // so the guards are set in time. A failed durable commit re-throws
+        // below to abort the turn rather than re-injecting against
+        // half-applied state.
+        deps.ctx.messages = event.basis;
+        if (event.result.compacted) {
+          await deps.applyCompaction(event.result, event.basis);
+          state.reducerCompacted = true;
+          state.shouldInjectWorkspace = true;
+        }
+        break;
+      case "history_stripped":
+        // Record the history-stripped DB marker right after the loop strips
+        // injections (before the pipeline). Best-effort: a transient marker
+        // write must not abort the turn, so unlike `compaction_completed` this
+        // is not on the re-throw allowlist below.
+        markHistoryStrippedBestEffort(deps.ctx.conversationId);
+        break;
       case "error":
         handleError(state, deps, event);
         break;
@@ -1925,10 +2374,13 @@ export async function dispatchAgentEvent(
     // - message_complete: persists assistant message to DB, sets state flags
     // - error: sets recovery flags (contextTooLargeDetected, orderingErrorDetected)
     // - usage: records token accounting
+    // - compaction_completed: durable compaction commit; aborting the turn is
+    //   safer than re-injecting against a half-applied compaction
     if (
       event.type === "message_complete" ||
       event.type === "error" ||
-      event.type === "usage"
+      event.type === "usage" ||
+      event.type === "compaction_completed"
     ) {
       throw err;
     }