npm - @vellumai/assistant - Versions diffs - 0.8.6 → 0.8.7-dev.202606052118.34cd356 - Mend

@vellumai/assistant 0.8.6 → 0.8.7-dev.202606052118.34cd356

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (1078) hide show

package/AGENTS.md +4 -4
package/Dockerfile +21 -4
package/bun.lock +13 -4
package/docker-entrypoint.sh +12 -8
package/docker-init-apt-root.sh +3 -1
package/docker-kata-apt-env.sh +3 -1
package/docker-kata-runtime-family.sh +12 -0
package/docs/architecture/memory.md +1 -1
package/docs/plugins.md +110 -83
package/examples/plugins/echo/README.md +13 -12
package/examples/plugins/echo/register.ts +0 -54
package/knip.json +1 -0
package/node_modules/@vellumai/environments/bun.lock +24 -0
package/node_modules/@vellumai/environments/package.json +18 -0
package/node_modules/@vellumai/environments/src/__tests__/package-boundary.test.ts +95 -0
package/node_modules/@vellumai/environments/src/index.ts +11 -0
package/node_modules/@vellumai/environments/src/seeds.ts +73 -0
package/node_modules/@vellumai/environments/src/types.ts +70 -0
package/node_modules/@vellumai/environments/tsconfig.json +20 -0
package/node_modules/@vellumai/skill-host-contracts/src/assistant-event.ts +11 -0
package/node_modules/@vellumai/skill-host-contracts/src/client.ts +3 -4
package/node_modules/@vellumai/skill-host-contracts/src/server-message.ts +3 -3
package/node_modules/@vellumai/skill-host-contracts/src/skill-host.ts +13 -8
package/openapi.yaml +6964 -539
package/package.json +8 -4
package/scripts/generate-openapi.ts +88 -54
package/src/__tests__/agent-loop-callsite-precedence.test.ts +42 -80
package/src/__tests__/agent-loop-exit-reason.test.ts +188 -45
package/src/__tests__/agent-loop-mutable-latest-user-message.test.ts +141 -0
package/src/__tests__/agent-loop-override-profile.test.ts +19 -32
package/src/__tests__/agent-loop-provider-error-recording.test.ts +7 -5
package/src/__tests__/agent-loop-thinking.test.ts +17 -12
package/src/__tests__/agent-loop.test.ts +238 -422
package/src/__tests__/agent-wake-disk-pressure-callsite.test.ts +6 -2
package/src/__tests__/agent-wake-override-profile.test.ts +22 -40
package/src/__tests__/annotate-activity-metadata.test.ts +262 -0
package/src/__tests__/annotate-risk-options.test.ts +2 -3
package/src/__tests__/anthropic-provider.test.ts +296 -57
package/src/__tests__/app-builder-skill-instructions.test.ts +22 -0
package/src/__tests__/app-control-flow.test.ts +6 -1
package/src/__tests__/app-dir-path-guard.test.ts +1 -0
package/src/__tests__/approval-cascade.test.ts +4 -11
package/src/__tests__/approval-routes-http.test.ts +8 -3
package/src/__tests__/assistant-event-hub.test.ts +25 -0
package/src/__tests__/assistant-event.test.ts +15 -0
package/src/__tests__/assistant-events-sse-shed.test.ts +8 -0
package/src/__tests__/assistant-feature-flags-integration.test.ts +2 -2
package/src/__tests__/assistant-stream-state.test.ts +645 -0
package/src/__tests__/auth-fallback-events-store.test.ts +116 -0
package/src/__tests__/avatar-e2e.test.ts +7 -37
package/src/__tests__/avatar-generator.test.ts +12 -42
package/src/__tests__/avatar-identity-sync.test.ts +28 -3
package/src/__tests__/background-shell-bash.test.ts +3 -7
package/src/__tests__/background-workers-disk-pressure.test.ts +6 -0
package/src/__tests__/btw-routes.test.ts +69 -15
package/src/__tests__/build-persisted-content.test.ts +184 -0
package/src/__tests__/call-pointer-messages.test.ts +5 -3
package/src/__tests__/call-site-routing-provider.test.ts +22 -40
package/src/__tests__/catalog-files.test.ts +1 -0
package/src/__tests__/channel-approval-routes.test.ts +49 -21
package/src/__tests__/channel-approvals.test.ts +4 -2
package/src/__tests__/channel-invite-transport.test.ts +1 -5
package/src/__tests__/channel-readiness-routes.test.ts +0 -4
package/src/__tests__/channel-readiness-slack-remote.test.ts +2 -7
package/src/__tests__/channel-retry-sweep.test.ts +71 -79
package/src/__tests__/clawhub-files.test.ts +1 -0
package/src/__tests__/compaction-circuit.test.ts +258 -0
package/src/__tests__/compaction-direct.test.ts +132 -0
package/src/__tests__/compaction-events.test.ts +5 -17
package/src/__tests__/compaction-trail-store.test.ts +1 -79
package/src/__tests__/compaction.benchmark.test.ts +0 -30
package/src/__tests__/compactor-image-manifest-trust.test.ts +112 -0
package/src/__tests__/computer-use-tools.test.ts +2 -2
package/src/__tests__/config-watcher.test.ts +28 -0
package/src/__tests__/context-search-agent-runner.test.ts +6 -3
package/src/__tests__/context-token-estimator.test.ts +34 -0
package/src/__tests__/context-window-manager-compact-retry.test.ts +291 -0
package/src/__tests__/conversation-abort-tool-results.test.ts +70 -25
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +9 -7
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +22 -34
package/src/__tests__/conversation-agent-loop-overflow.test.ts +476 -963
package/src/__tests__/conversation-agent-loop.test.ts +823 -1321
package/src/__tests__/conversation-analysis-routes.test.ts +7 -3
package/src/__tests__/conversation-app-control-lifecycle.test.ts +1 -1
package/src/__tests__/conversation-clean-command.test.ts +5 -2
package/src/__tests__/conversation-clear-safety.test.ts +20 -10
package/src/__tests__/conversation-confirmation-signals.test.ts +15 -45
package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
package/src/__tests__/conversation-disk-view.test.ts +10 -17
package/src/__tests__/conversation-fork-crud.test.ts +86 -172
package/src/__tests__/conversation-fork-route.test.ts +16 -14
package/src/__tests__/conversation-history-web-search.test.ts +11 -1
package/src/__tests__/conversation-init.benchmark.test.ts +6 -6
package/src/__tests__/conversation-lifecycle.test.ts +3 -2
package/src/__tests__/conversation-load-history-repair.test.ts +3 -2
package/src/__tests__/conversation-load-history-stripped.test.ts +1 -1
package/src/__tests__/conversation-message-sync-tags.test.ts +3 -4
package/src/__tests__/conversation-pairing.test.ts +10 -7
package/src/__tests__/conversation-pre-run-repair.test.ts +1 -1
package/src/__tests__/conversation-process-app-control-preactivation.test.ts +10 -0
package/src/__tests__/conversation-process-callsite.test.ts +27 -30
package/src/__tests__/conversation-provider-retry-repair.test.ts +80 -51
package/src/__tests__/conversation-queue.test.ts +272 -164
package/src/__tests__/conversation-routes-disk-view.test.ts +6 -2
package/src/__tests__/conversation-routes-guardian-reply.test.ts +2 -2
package/src/__tests__/conversation-routes-slash-commands.test.ts +8 -7
package/src/__tests__/conversation-runtime-assembly.test.ts +317 -313
package/src/__tests__/conversation-runtime-workspace.test.ts +114 -36
package/src/__tests__/conversation-slash-commands.test.ts +8 -42
package/src/__tests__/conversation-slash-queue.test.ts +42 -31
package/src/__tests__/conversation-slash-unknown.test.ts +13 -15
package/src/__tests__/conversation-speed-override.test.ts +8 -22
package/src/__tests__/conversation-starter-routes.test.ts +14 -6
package/src/__tests__/conversation-surfaces-action-delivery.test.ts +90 -15
package/src/__tests__/conversation-surfaces-app-control.test.ts +32 -4
package/src/__tests__/conversation-surfaces-state-update.test.ts +5 -2
package/src/__tests__/conversation-surfaces-table-action.test.ts +6 -15
package/src/__tests__/conversation-sync-tags.test.ts +27 -15
package/src/__tests__/conversation-title-service.test.ts +135 -2
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +23 -11
package/src/__tests__/conversation-unread-route.test.ts +14 -2
package/src/__tests__/conversation-usage.test.ts +0 -2
package/src/__tests__/conversation-wipe.test.ts +1 -1
package/src/__tests__/conversation-workspace-cache-state.test.ts +20 -17
package/src/__tests__/conversation-workspace-injection.test.ts +114 -23
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +34 -13
package/src/__tests__/conversations-import-system-filter.test.ts +101 -0
package/src/__tests__/credential-execution-tools.test.ts +1 -2
package/src/__tests__/credential-security-invariants.test.ts +0 -1
package/src/__tests__/cross-provider-web-search.test.ts +220 -3
package/src/__tests__/cu-unified-flow.test.ts +26 -1
package/src/__tests__/db-acp-history.test.ts +101 -0
package/src/__tests__/db-schedule-syntax-migration.test.ts +16 -0
package/src/__tests__/disk-pressure-guard.test.ts +66 -0
package/src/__tests__/disk-pressure-routes.test.ts +9 -2
package/src/__tests__/dm-persistence.test.ts +12 -3
package/src/__tests__/dynamic-page-surface.test.ts +99 -0
package/src/__tests__/edit-propagation.test.ts +1 -2
package/src/__tests__/empty-response-hook.test.ts +304 -0
package/src/__tests__/feature-flag-test-helpers.ts +2 -2
package/src/__tests__/file-write-tool.test.ts +63 -0
package/src/__tests__/filing-service.test.ts +2 -2
package/src/__tests__/first-greeting.test.ts +55 -14
package/src/__tests__/gemini-image-service.test.ts +13 -0
package/src/__tests__/gemini-inline-media.test.ts +78 -0
package/src/__tests__/gemini-provider.test.ts +351 -28
package/src/__tests__/guardian-grant-minting.test.ts +1 -1
package/src/__tests__/guardian-routing-invariants.test.ts +2 -4
package/src/__tests__/guardian-routing-state.test.ts +60 -71
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +10 -8
package/src/__tests__/heartbeat-disk-pressure.test.ts +2 -0
package/src/__tests__/heartbeat-service.test.ts +3 -1
package/src/__tests__/helpers/mock-provider.ts +110 -0
package/src/__tests__/helpers/native-web-search-harness.ts +129 -0
package/src/__tests__/history-repair-hook.test.ts +162 -0
package/src/__tests__/history-repair-observability.test.ts +1 -1
package/src/__tests__/history-repair.test.ts +2 -1
package/src/__tests__/host-app-control-proxy.test.ts +2 -0
package/src/__tests__/host-app-control-routes.test.ts +1 -1
package/src/__tests__/host-cu-proxy.test.ts +2 -0
package/src/__tests__/host-cu-routes-targeted.test.ts +3 -3
package/src/__tests__/host-file-edit-tool.test.ts +4 -2
package/src/__tests__/host-file-proxy.test.ts +31 -0
package/src/__tests__/host-file-read-tool.test.ts +4 -2
package/src/__tests__/host-file-write-tool.test.ts +9 -3
package/src/__tests__/host-proxy-preactivation.test.ts +53 -14
package/src/__tests__/host-shell-tool.test.ts +9 -4
package/src/__tests__/http-user-message-parity.test.ts +2 -2
package/src/__tests__/identity-intro-cache.test.ts +47 -114
package/src/__tests__/identity-routes.test.ts +248 -7
package/src/__tests__/inbound-slack-persistence.test.ts +12 -3
package/src/__tests__/injector-background-turn.test.ts +3 -9
package/src/__tests__/injector-chain.test.ts +139 -275
package/src/__tests__/injector-disk-pressure.test.ts +75 -41
package/src/__tests__/injector-document-comments.test.ts +3 -3
package/src/__tests__/injector-pkb-v2-silenced.test.ts +30 -22
package/src/__tests__/injector-v3-suppression.test.ts +214 -0
package/src/__tests__/internal-telemetry-routes.test.ts +109 -0
package/src/__tests__/list-messages-attachments.test.ts +7 -8
package/src/__tests__/list-messages-hidden-metadata.test.ts +55 -15
package/src/__tests__/list-messages-page-latest.test.ts +60 -1
package/src/__tests__/list-messages-tool-merge.test.ts +56 -6
package/src/__tests__/llm-request-log-turn-query.test.ts +42 -86
package/src/__tests__/llm-resolver.test.ts +23 -47
package/src/__tests__/llm-usage-store.test.ts +268 -1
package/src/__tests__/log-export-routes.test.ts +59 -0
package/src/__tests__/managed-skill-lifecycle.test.ts +1 -8
package/src/__tests__/mcp-auth-routes.test.ts +15 -10
package/src/__tests__/mcp-health-check.test.ts +18 -13
package/src/__tests__/memory-retrieval-hook.test.ts +297 -0
package/src/__tests__/memory-v2-static-injector.test.ts +103 -35
package/src/__tests__/messaging-send-tool.test.ts +8 -4
package/src/__tests__/migration-export-http.test.ts +12 -12
package/src/__tests__/migration-import-commit-http.test.ts +8 -8
package/src/__tests__/migration-import-preflight-http.test.ts +7 -7
package/src/__tests__/migration-validate-http.test.ts +3 -3
package/src/__tests__/native-web-search.test.ts +205 -20
package/src/__tests__/notification-decision-identity.test.ts +9 -18
package/src/__tests__/notification-decision-recipient-context.test.ts +3 -6
package/src/__tests__/oauth-commands-routes.test.ts +1 -1
package/src/__tests__/onboarding-template-contract.test.ts +12 -0
package/src/__tests__/openai-image-service.test.ts +17 -0
package/src/__tests__/openai-provider.test.ts +97 -71
package/src/__tests__/openai-responses-provider.test.ts +21 -77
package/src/__tests__/outbound-slack-persistence.test.ts +2 -1
package/src/__tests__/{overflow-reduce-pipeline.test.ts → overflow-reduction-loop.test.ts} +64 -286
package/src/__tests__/parallel-tool.benchmark.test.ts +24 -36
package/src/__tests__/persist-unsendable-image.test.ts +215 -0
package/src/__tests__/persistence-secret-redaction.test.ts +3 -1
package/src/__tests__/pipeline-runner.test.ts +31 -43
package/src/__tests__/pkb-autoinject.test.ts +2 -5
package/src/__tests__/plugin-bootstrap.test.ts +62 -51
package/src/__tests__/plugin-registry.test.ts +0 -27
package/src/__tests__/plugin-route-contribution.test.ts +6 -16
package/src/__tests__/plugin-skill-contribution.test.ts +7 -17
package/src/__tests__/plugin-tool-contribution.test.ts +10 -26
package/src/__tests__/plugin-types.test.ts +8 -173
package/src/__tests__/prechat-onboarding-contract.test.ts +23 -0
package/src/__tests__/process-message-background-slack.test.ts +17 -16
package/src/__tests__/process-message-display-content.test.ts +36 -44
package/src/__tests__/provider-commit-message-generator.test.ts +19 -14
package/src/__tests__/provider-error-scenarios.test.ts +7 -6
package/src/__tests__/provider-platform-proxy-integration.test.ts +3 -8
package/src/__tests__/provider-send-message-override-profile.test.ts +9 -25
package/src/__tests__/provider-streaming.benchmark.test.ts +12 -22
package/src/__tests__/provider-usage-tracking.test.ts +0 -6
package/src/__tests__/ratelimit.test.ts +9 -4
package/src/__tests__/reaction-persistence.test.ts +1 -1
package/src/__tests__/regenerate-fire-and-forget-trace.test.ts +5 -1
package/src/__tests__/relay-server.test.ts +20 -13
package/src/__tests__/resolve-trust-class.test.ts +4 -4
package/src/__tests__/retry-openrouter-only-normalization.test.ts +5 -8
package/src/__tests__/retry-thinking-tool-choice.test.ts +10 -13
package/src/__tests__/retry-verbosity-normalization.test.ts +5 -8
package/src/__tests__/runtime-events-sse-reconnect.test.ts +390 -0
package/src/__tests__/schedule-routes.test.ts +683 -12
package/src/__tests__/schedule-store.test.ts +108 -0
package/src/__tests__/schedule-tools.test.ts +160 -0
package/src/__tests__/secret-ingress-http.test.ts +2 -2
package/src/__tests__/secret-prompt-log-hygiene.test.ts +11 -7
package/src/__tests__/secret-prompter-channel-fallback.test.ts +11 -9
package/src/__tests__/secret-response-routing.test.ts +13 -11
package/src/__tests__/send-endpoint-busy.test.ts +6 -2
package/src/__tests__/server-history-render.test.ts +314 -1
package/src/__tests__/shell-observability.test.ts +249 -0
package/src/__tests__/skill-feature-flags-integration.test.ts +44 -11
package/src/__tests__/skill-feature-flags.test.ts +6 -6
package/src/__tests__/skill-load-feature-flag.test.ts +10 -10
package/src/__tests__/skills-files-catalog-fallback.test.ts +10 -0
package/src/__tests__/skillssh-files.test.ts +1 -0
package/src/__tests__/starter-task-flow.test.ts +6 -6
package/src/__tests__/strip-memory-injections.test.ts +102 -14
package/src/__tests__/subagent-call-site-routing.test.ts +3 -3
package/src/__tests__/subagent-fork-notifications.test.ts +1 -3
package/src/__tests__/subagent-fork-spawn.test.ts +1 -1
package/src/__tests__/subagent-manager-notify.test.ts +1 -3
package/src/__tests__/subagent-notify-parent.test.ts +1 -3
package/src/__tests__/subagent-spawn-tool-fork.test.ts +1 -1
package/src/__tests__/suggestion-routes.test.ts +3 -3
package/src/__tests__/sync-message-contract.test.ts +19 -16
package/src/__tests__/system-prompt.test.ts +74 -0
package/src/__tests__/task-scheduler.test.ts +162 -1
package/src/__tests__/terminal-tools.test.ts +9 -25
package/src/__tests__/thread-backfill.test.ts +4 -9
package/src/__tests__/title-generate-hook.test.ts +319 -0
package/src/__tests__/tool-error-hook.test.ts +278 -0
package/src/__tests__/tool-preview-lifecycle.test.ts +481 -16
package/src/__tests__/tool-result-metadata-plumbing.test.ts +1 -0
package/src/__tests__/tool-result-truncate-hook.test.ts +127 -0
package/src/__tests__/tool-result-truncation.test.ts +1 -1
package/src/__tests__/tools-audio-read.test.ts +113 -0
package/src/__tests__/turn-boundary-resolution.test.ts +44 -84
package/src/__tests__/turn-events-store.test.ts +11 -7
package/src/__tests__/ui-choice-copy-surfaces.test.ts +254 -0
package/src/__tests__/ui-work-result-surface.test.ts +159 -0
package/src/__tests__/usage-routes.test.ts +285 -1
package/src/__tests__/user-plugin-loader.test.ts +2 -2
package/src/__tests__/voice-scoped-grant-consumer.test.ts +8 -6
package/src/__tests__/voice-session-bridge.test.ts +19 -10
package/src/__tests__/web-search-backend-failure.test.ts +166 -0
package/src/acp/__tests__/agent-process.test.ts +161 -0
package/src/acp/__tests__/client-handler.test.ts +40 -0
package/src/acp/__tests__/helpers/acp-history-db.ts +82 -0
package/src/acp/__tests__/helpers/exec-file-stub.ts +101 -0
package/src/acp/__tests__/prepare-agent-env.test.ts +143 -31
package/src/acp/__tests__/session-manager-persistence.test.ts +95 -28
package/src/acp/__tests__/session-manager-resume.test.ts +695 -0
package/src/acp/agent-process.ts +61 -1
package/src/acp/auto-install.test.ts +125 -0
package/src/acp/auto-install.ts +174 -0
package/src/acp/client-handler.ts +31 -0
package/src/acp/feature-gate.test.ts +48 -0
package/src/acp/feature-gate.ts +34 -0
package/src/acp/prepare-agent-env.ts +52 -11
package/src/acp/resolve-agent.test.ts +147 -6
package/src/acp/resolve-agent.ts +81 -7
package/src/acp/resume-hint.ts +22 -0
package/src/acp/session-manager.ts +487 -71
package/src/agent/compaction-circuit.ts +98 -0
package/src/agent/loop.ts +651 -450
package/src/api/README.md +19 -17
package/src/api/constants/tool-execution.ts +21 -0
package/src/api/events/assistant-activity-state.ts +75 -0
package/src/api/events/assistant-outbound-attachment.ts +25 -27
package/src/api/events/assistant-text-delta.ts +6 -8
package/src/api/events/assistant-thinking-delta.ts +33 -0
package/src/api/events/assistant-turn-start.ts +5 -7
package/src/api/events/avatar-updated.ts +24 -0
package/src/api/events/compaction-circuit-closed.ts +26 -0
package/src/api/events/compaction-circuit-open.ts +28 -0
package/src/api/events/confirmation-request.ts +114 -0
package/src/api/events/contact-request.ts +33 -0
package/src/api/events/conversation-error.ts +77 -0
package/src/api/events/conversation-list-invalidated.ts +38 -0
package/src/api/events/conversation-title-updated.ts +24 -0
package/src/api/events/disk-pressure-status-changed.ts +61 -0
package/src/api/events/document-comment-created.ts +24 -28
package/src/api/events/document-comment-deleted.ts +6 -8
package/src/api/events/document-comment-reopened.ts +6 -8
package/src/api/events/document-comment-resolved.ts +8 -10
package/src/api/events/document-editor-update.ts +27 -0
package/src/api/events/error.ts +32 -0
package/src/api/events/generation-cancelled.ts +4 -6
package/src/api/events/generation-handoff.ts +13 -15
package/src/api/events/home-feed-updated.ts +26 -0
package/src/api/events/identity-changed.ts +32 -0
package/src/api/events/interaction-resolved.ts +50 -0
package/src/api/events/message-complete.ts +10 -12
package/src/api/events/message-dequeued.ts +21 -0
package/src/api/events/message-queued-deleted.ts +23 -0
package/src/api/events/message-queued.ts +22 -0
package/src/api/events/message-request-complete.ts +29 -0
package/src/api/events/navigate-settings.ts +20 -0
package/src/api/events/notification-intent.ts +33 -0
package/src/api/events/open-url.ts +6 -8
package/src/api/events/question-request.ts +67 -0
package/src/api/events/relationship-state-updated.ts +4 -6
package/src/api/events/secret-request.ts +42 -0
package/src/api/events/subagent-event.ts +79 -0
package/src/api/events/subagent-spawned.ts +40 -0
package/src/api/events/subagent-status-changed.ts +65 -0
package/src/api/events/sync-changed.ts +29 -0
package/src/api/events/tool-output-chunk.ts +45 -0
package/src/api/events/tool-result.ts +129 -0
package/src/api/events/tool-use-preview-start.ts +32 -0
package/src/api/events/tool-use-start.ts +8 -10
package/src/api/events/trace-event.ts +69 -0
package/src/api/events/turn-profile-auto-routed.ts +28 -0
package/src/api/events/ui-surface-complete.ts +30 -0
package/src/api/events/ui-surface-dismiss.ts +22 -0
package/src/api/events/ui-surface-show.ts +67 -0
package/src/api/events/ui-surface-update.ts +26 -0
package/src/api/events/usage-update.ts +34 -0
package/src/api/events/user-message-echo.ts +35 -0
package/src/api/index.ts +389 -0
package/src/api/requests/dictation.ts +45 -0
package/src/api/responses/conversation-message.ts +374 -0
package/src/api/responses/disk-pressure-status.ts +26 -0
package/src/api/responses/home.ts +217 -0
package/src/api/responses/llm-context-response.ts +2 -0
package/src/api/responses/memory-v3-selection-log.ts +50 -0
package/src/api/responses/subagent-detail.ts +48 -0
package/src/approvals/guardian-decision-primitive.ts +7 -15
package/src/approvals/guardian-request-resolvers.ts +7 -10
package/src/avatar/__tests__/avatar-manifest.test.ts +236 -0
package/src/avatar/__tests__/avatar-store.test.ts +198 -0
package/src/avatar/avatar-manifest.ts +195 -0
package/src/avatar/avatar-store.ts +113 -0
package/src/avatar/traits-png-sync.ts +8 -2
package/src/background-wake/next-wake.test.ts +31 -1
package/src/background-wake/next-wake.ts +5 -1
package/src/calls/call-conversation-messages.ts +6 -4
package/src/calls/guardian-action-sweep.ts +6 -4
package/src/calls/relay-server.ts +12 -8
package/src/calls/voice-session-bridge.ts +13 -27
package/src/cli/commands/__tests__/memory-v3.test.ts +245 -0
package/src/cli/commands/__tests__/notifications.test.ts +58 -14
package/src/cli/commands/avatar.ts +17 -11
package/src/cli/commands/conversations.ts +15 -1
package/src/cli/commands/db/__tests__/repair.test.ts +540 -0
package/src/cli/commands/db/__tests__/status.test.ts +253 -0
package/src/cli/commands/db/format.ts +48 -0
package/src/cli/commands/db/index.ts +29 -0
package/src/cli/commands/db/repair-step-conversation-backfill.ts +345 -0
package/src/cli/commands/db/repair-step-integrity.ts +146 -0
package/src/cli/commands/db/repair-steps.ts +164 -0
package/src/cli/commands/db/repair.ts +141 -0
package/src/cli/commands/db/status.ts +366 -0
package/src/cli/commands/memory-v3.ts +159 -445
package/src/cli/commands/notifications.ts +112 -60
package/src/cli/lib/cli-colors.ts +24 -6
package/src/cli/program.ts +4 -5
package/src/config/__tests__/feature-flag-registry-guard.test.ts +4 -4
package/src/config/acp-defaults.test.ts +10 -0
package/src/config/acp-defaults.ts +6 -0
package/src/config/assistant-feature-flags.ts +24 -13
package/src/config/bundled-skills/acp/SKILL.md +64 -30
package/src/config/bundled-skills/acp/TOOLS.json +4 -4
package/src/config/bundled-skills/app-builder/SKILL.md +224 -387
package/src/config/bundled-skills/app-builder/TOOLS.json +29 -0
package/src/config/bundled-skills/app-builder/references/DESIGN_SYSTEM.md +48 -0
package/src/config/bundled-skills/app-builder/references/RESPONSIVE.md +57 -0
package/src/config/bundled-skills/app-builder/references/SLIDES.md +38 -0
package/src/config/bundled-skills/app-builder/references/examples/README.md +17 -0
package/src/config/bundled-skills/app-builder/references/examples/expense-tracker.md +515 -0
package/src/config/bundled-skills/app-builder/references/examples/focus-timer.md +342 -0
package/src/config/bundled-skills/app-builder/references/examples/habit-tracker.md +490 -0
package/src/config/bundled-skills/app-builder/tools/app-list.ts +62 -0
package/src/config/bundled-skills/document-editor/SKILL.md +28 -23
package/src/config/bundled-skills/document-editor/TOOLS.json +1 -1
package/src/config/bundled-skills/media-processing/services/reduce.ts +6 -9
package/src/config/bundled-skills/messaging/SKILL.md +0 -7
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +7 -2
package/src/config/bundled-skills/schedule/SKILL.md +1 -1
package/src/config/bundled-skills/schedule/TOOLS.json +8 -0
package/src/config/bundled-tool-registry.ts +2 -0
package/src/config/call-site-defaults.ts +2 -7
package/src/config/feature-flag-cache.ts +3 -3
package/src/config/feature-flag-registry.json +68 -12
package/src/config/schemas/__tests__/memory-v2.test.ts +2 -226
package/src/config/schemas/__tests__/memory-v3.test.ts +25 -0
package/src/config/schemas/call-site-catalog.ts +8 -15
package/src/config/schemas/heartbeat.ts +9 -0
package/src/config/schemas/llm.ts +3 -3
package/src/config/schemas/memory-lifecycle.ts +24 -0
package/src/config/schemas/memory-v2.ts +8 -253
package/src/config/schemas/memory-v3.ts +47 -0
package/src/config/schemas/memory.ts +6 -1
package/src/config/schemas/platform.ts +8 -0
package/src/config/schemas/timeouts.ts +3 -1
package/src/config/seed-inference-profiles.ts +2 -2
package/src/config/skills.ts +13 -0
package/src/context/compactor.ts +55 -32
package/src/context/strip-injections.ts +128 -0
package/src/context/token-estimator.ts +42 -0
package/src/context/tool-result-truncation.ts +1 -66
package/src/context/window-manager.ts +141 -26
package/src/credential-execution/executable-discovery.ts +16 -0
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +6 -0
package/src/daemon/__tests__/conversation-surfaces-launch.test.ts +2 -2
package/src/daemon/__tests__/inference-profile-notification.test.ts +153 -0
package/src/daemon/__tests__/native-web-search-metadata.test.ts +10 -8
package/src/daemon/__tests__/web-search-status-text.test.ts +10 -6
package/src/daemon/approval-generators.ts +4 -4
package/src/daemon/assistant-attachments.ts +1 -1
package/src/daemon/config-watcher.ts +7 -1
package/src/daemon/context-overflow-reducer.ts +0 -1
package/src/daemon/conversation-agent-loop-handlers.ts +793 -215
package/src/daemon/conversation-agent-loop.ts +487 -1478
package/src/daemon/conversation-error.ts +7 -7
package/src/daemon/conversation-history.ts +27 -10
package/src/daemon/conversation-launch.ts +4 -8
package/src/daemon/conversation-lifecycle.ts +13 -42
package/src/daemon/conversation-messaging.ts +8 -9
package/src/daemon/conversation-notifiers.ts +7 -5
package/src/daemon/conversation-process.ts +109 -93
package/src/daemon/conversation-registry.ts +159 -0
package/src/daemon/conversation-runtime-assembly.ts +209 -382
package/src/daemon/conversation-slash.ts +6 -25
package/src/daemon/conversation-store.ts +15 -95
package/src/daemon/conversation-surfaces.ts +277 -73
package/src/daemon/conversation-tool-setup.ts +5 -29
package/src/daemon/conversation-workspace.ts +17 -0
package/src/daemon/conversation.ts +123 -146
package/src/daemon/daemon-skill-host.ts +2 -6
package/src/daemon/disk-pressure-guard.ts +35 -29
package/src/daemon/external-plugins-bootstrap.ts +53 -32
package/src/daemon/first-greeting.ts +26 -4
package/src/daemon/guardian-action-generators.ts +2 -2
package/src/daemon/handlers/config-a2a.ts +51 -36
package/src/daemon/handlers/config-slack-channel.ts +20 -14
package/src/daemon/handlers/config-telegram.ts +16 -2
package/src/daemon/handlers/conversations.ts +9 -23
package/src/daemon/handlers/shared.ts +158 -82
package/src/daemon/handlers/skills.ts +53 -20
package/src/daemon/host-app-control-proxy.ts +54 -1
package/src/daemon/host-cu-proxy.ts +46 -22
package/src/daemon/host-file-proxy.ts +25 -1
package/src/daemon/host-proxy-preactivation.ts +25 -6
package/src/daemon/lifecycle.ts +53 -55
package/src/daemon/message-protocol.ts +2 -3
package/src/daemon/message-provenance.ts +49 -0
package/src/daemon/message-types/apps.ts +1 -29
package/src/daemon/message-types/contacts.ts +3 -20
package/src/daemon/message-types/conversations.ts +13 -111
package/src/daemon/message-types/documents.ts +3 -9
package/src/daemon/message-types/home.ts +4 -17
package/src/daemon/message-types/integrations.ts +2 -6
package/src/daemon/message-types/messages.ts +37 -400
package/src/daemon/message-types/notifications.ts +2 -32
package/src/daemon/message-types/settings.ts +3 -8
package/src/daemon/message-types/skills.ts +4 -0
package/src/daemon/message-types/surfaces.ts +138 -3
package/src/daemon/message-types/sync.ts +12 -25
package/src/daemon/message-types/workspace.ts +3 -11
package/src/daemon/now-scratchpad.ts +21 -0
package/src/daemon/orphan-reaper.test.ts +210 -0
package/src/daemon/orphan-reaper.ts +240 -0
package/src/daemon/overflow-reduction-loop.ts +230 -0
package/src/daemon/persist-unsendable-image.ts +117 -0
package/src/daemon/process-message.ts +50 -49
package/src/daemon/server.ts +14 -0
package/src/daemon/tool-side-effects.ts +10 -7
package/src/daemon/trace-emitter.ts +6 -4
package/src/daemon/trust-context.ts +32 -0
package/src/daemon/wake-target-adapter.ts +14 -2
package/src/heartbeat/__tests__/heartbeat-service.test.ts +6 -1
package/src/heartbeat/heartbeat-run-store.ts +54 -1
package/src/heartbeat/heartbeat-service.ts +42 -0
package/src/home/feed-types.ts +36 -221
package/src/home/home-greeting-cache.ts +24 -1
package/src/ipc/__tests__/browser-ipc.test.ts +1 -1
package/src/ipc/__tests__/email-ipc.test.ts +0 -9
package/src/ipc/__tests__/ui-request-route.test.ts +3 -3
package/src/ipc/gateway-client.test.ts +2 -2
package/src/ipc/gateway-client.ts +3 -3
package/src/ipc/routes/__tests__/route-adapter.test.ts +244 -0
package/src/ipc/routes/route-adapter.ts +45 -6
package/src/ipc/skill-routes/__tests__/memory.test.ts +33 -9
package/src/ipc/skill-routes/__tests__/providers.test.ts +10 -10
package/src/ipc/skill-routes/__tests__/registries.test.ts +28 -18
package/src/ipc/skill-routes/memory.ts +29 -14
package/src/ipc/skill-routes/providers.ts +5 -6
package/src/ipc/skill-routes/registries.ts +13 -61
package/src/live-voice/__tests__/live-voice-archive.test.ts +24 -11
package/src/media/gemini-image-service.ts +15 -0
package/src/media/openai-image-service.ts +14 -0
package/src/media/types.ts +34 -0
package/src/memory/__tests__/conversation-queries.test.ts +192 -8
package/src/memory/__tests__/db-maintenance.test.ts +128 -0
package/src/memory/__tests__/jobs-store-job-classes.test.ts +5 -4
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +56 -0
package/src/memory/__tests__/memory-retrospective-job.test.ts +10 -6
package/src/memory/__tests__/memory-v3-selections-migration.test.ts +103 -0
package/src/memory/auth-fallback-events-store.ts +94 -0
package/src/memory/context-search/agent-runner.ts +2 -4
package/src/memory/conversation-crud.ts +39 -8
package/src/memory/conversation-queries.ts +78 -22
package/src/memory/conversation-starter-checkpoints.ts +1 -0
package/src/memory/conversation-title-service.ts +65 -41
package/src/memory/db-init.ts +14 -0
package/src/memory/db-maintenance.ts +18 -2
package/src/memory/graph/__tests__/conversation-graph-memory-registry.test.ts +119 -0
package/src/memory/graph/consolidation.ts +8 -11
package/src/memory/graph/conversation-graph-memory.ts +106 -8
package/src/memory/graph/extraction.ts +6 -9
package/src/memory/graph/narrative.ts +2 -2
package/src/memory/graph/pattern-scan.ts +2 -2
package/src/memory/graph/retriever.ts +20 -26
package/src/memory/graph/tools.ts +4 -4
package/src/memory/job-handlers/conversation-starters.ts +45 -34
package/src/memory/job-handlers/summarization.ts +1 -2
package/src/memory/jobs-store.ts +36 -1
package/src/memory/jobs-worker.ts +82 -43
package/src/memory/llm-request-log-source-clickhouse.ts +5 -31
package/src/memory/llm-request-log-source-local.ts +0 -11
package/src/memory/llm-request-log-source.ts +9 -25
package/src/memory/llm-request-log-store.ts +0 -41
package/src/memory/llm-usage-store.ts +234 -50
package/src/memory/memory-marker.ts +17 -0
package/src/memory/memory-retrospective-job.ts +6 -2
package/src/memory/memory-v2-activation-log-store.ts +1 -83
package/src/memory/migrations/222-strip-placeholder-sentinels-from-messages.ts +6 -5
package/src/memory/migrations/267-llm-usage-events-add-assistant-version.ts +46 -0
package/src/memory/migrations/268-add-memory-v3-selections.ts +28 -0
package/src/memory/migrations/269-schedule-script-timeout.ts +11 -0
package/src/memory/migrations/270-messages-role-created-at-index.ts +18 -0
package/src/memory/migrations/270-schedule-source-conversation.ts +13 -0
package/src/memory/migrations/271-create-auth-fallback-events.ts +21 -0
package/src/memory/migrations/272-acp-session-history-cwd.ts +36 -0
package/src/memory/migrations/__tests__/267-llm-usage-events-add-assistant-version.test.ts +117 -0
package/src/memory/migrations/index.ts +7 -0
package/src/memory/pkb/autoinject.ts +61 -0
package/src/memory/pkb/context.ts +50 -0
package/src/memory/pkb/types.ts +14 -0
package/src/memory/schedule-attribution-sql.ts +104 -0
package/src/memory/schema/acp.ts +4 -0
package/src/memory/schema/infrastructure.ts +27 -0
package/src/memory/usage-grouped-buckets.ts +6 -1
package/src/memory/v2/__tests__/consolidation-job.test.ts +125 -1
package/src/memory/v2/__tests__/migration.test.ts +11 -3
package/src/memory/v2/__tests__/page-index.test.ts +37 -1
package/src/memory/v2/__tests__/router.test.ts +14 -4
package/src/memory/v2/__tests__/sweep-job.test.ts +6 -5
package/src/memory/v2/backfill-jobs.ts +6 -0
package/src/memory/v2/consolidation-job.ts +99 -10
package/src/memory/v2/migration.ts +5 -3
package/src/memory/v2/page-index.ts +11 -0
package/src/memory/v2/router.ts +8 -11
package/src/memory/v2/sweep-job.ts +8 -11
package/src/memory/v2/types.ts +1 -0
package/src/messaging/providers/slack/render-transcript.test.ts +1 -1
package/src/messaging/providers/slack/render-transcript.ts +2 -2
package/src/messaging/style-analyzer.ts +8 -11
package/src/notifications/conversation-pairing.ts +8 -13
package/src/notifications/decision-engine.ts +16 -16
package/src/notifications/home-feed-side-effect.ts +12 -1
package/src/notifications/preference-extractor.ts +11 -14
package/src/permissions/prompter.ts +46 -36
package/src/permissions/question-prompter.test.ts +35 -26
package/src/permissions/question-prompter.ts +6 -10
package/src/plugin-api/constants.ts +4 -0
package/src/plugin-api/index.ts +10 -1
package/src/plugin-api/types.ts +176 -4
package/src/plugins/defaults/compaction/compact.ts +59 -0
package/src/plugins/defaults/compaction/package.json +15 -0
package/src/plugins/defaults/compaction/register.ts +24 -0
package/src/plugins/defaults/empty-response/hooks/stop.ts +126 -0
package/src/plugins/defaults/empty-response/package.json +15 -0
package/src/plugins/defaults/empty-response/register.ts +23 -0
package/src/plugins/defaults/history-repair/hooks/user-prompt-submit.ts +35 -0
package/src/plugins/defaults/history-repair/package.json +15 -0
package/src/plugins/defaults/history-repair/register.ts +24 -0
package/src/{daemon/history-repair.ts → plugins/defaults/history-repair/terminal.ts} +48 -35
package/src/plugins/defaults/index.ts +22 -49
package/src/plugins/defaults/memory-retrieval/hooks/post-compact.ts +95 -0
package/src/plugins/defaults/memory-retrieval/hooks/user-prompt-submit-temp.ts +216 -0
package/src/plugins/defaults/memory-retrieval/injector-chain.ts +35 -0
package/src/plugins/defaults/{injectors.ts → memory-retrieval/injectors.ts} +295 -112
package/src/plugins/defaults/memory-v3-shadow/__tests__/assign.test.ts +242 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/capabilities.test.ts +118 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/core.test.ts +39 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/fixtures/eval-turns.json +36 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/fixtures/live-turns.json +37 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/health.test.ts +219 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/live-integration.test.ts +330 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/maintain-job.test.ts +288 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/needle.test.ts +107 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/orchestrate.test.ts +436 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/provider-blocks.test.ts +13 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/reconcile.test.ts +274 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/render-injection.test.ts +61 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/router.test.ts +332 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/selection-log-store.test.ts +179 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/selector.test.ts +470 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/shadow-plugin.test.ts +432 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/snapshot.test.ts +168 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/tree.test.ts +192 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/types.test.ts +54 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/working-set-eviction.test.ts +106 -0
package/src/plugins/defaults/memory-v3-shadow/__tests__/working-set-skeleton.test.ts +44 -0
package/src/plugins/defaults/memory-v3-shadow/assign.ts +268 -0
package/src/plugins/defaults/memory-v3-shadow/capabilities.ts +124 -0
package/src/plugins/defaults/memory-v3-shadow/core.ts +26 -0
package/src/plugins/defaults/memory-v3-shadow/data/README.md +84 -0
package/src/plugins/defaults/memory-v3-shadow/data/assignments.json +5 -0
package/src/plugins/defaults/memory-v3-shadow/data/core.json +1 -0
package/src/plugins/defaults/memory-v3-shadow/data/leaves/domain-a/topic-x.md +9 -0
package/src/plugins/defaults/memory-v3-shadow/data/leaves/domain-a/topic-y.md +9 -0
package/src/plugins/defaults/memory-v3-shadow/data/leaves/domain-b/topic-z.md +9 -0
package/src/plugins/defaults/memory-v3-shadow/health.ts +0 -0
package/src/plugins/defaults/memory-v3-shadow/hooks/post-compact.ts +14 -0
package/src/plugins/defaults/memory-v3-shadow/hooks/user-prompt-submit.ts +19 -0
package/src/plugins/defaults/memory-v3-shadow/injector.ts +75 -0
package/src/plugins/defaults/memory-v3-shadow/llm-retry.ts +32 -0
package/src/plugins/defaults/memory-v3-shadow/maintain-job.ts +314 -0
package/src/plugins/defaults/memory-v3-shadow/needle.ts +115 -0
package/src/plugins/defaults/memory-v3-shadow/orchestrate.ts +126 -0
package/src/plugins/defaults/memory-v3-shadow/package.json +15 -0
package/src/plugins/defaults/memory-v3-shadow/page-content.ts +34 -0
package/src/plugins/defaults/memory-v3-shadow/provider-blocks.ts +26 -0
package/src/plugins/defaults/memory-v3-shadow/reconcile.ts +523 -0
package/src/plugins/defaults/memory-v3-shadow/register.ts +26 -0
package/src/plugins/defaults/memory-v3-shadow/render-injection.ts +32 -0
package/src/plugins/defaults/memory-v3-shadow/router.ts +190 -0
package/src/plugins/defaults/memory-v3-shadow/selection-log-store.ts +84 -0
package/src/plugins/defaults/memory-v3-shadow/selector.ts +226 -0
package/src/plugins/defaults/memory-v3-shadow/shadow-plugin.ts +349 -0
package/src/plugins/defaults/memory-v3-shadow/snapshot.ts +209 -0
package/src/plugins/defaults/memory-v3-shadow/tree.ts +174 -0
package/src/plugins/defaults/memory-v3-shadow/types.ts +59 -0
package/src/plugins/defaults/memory-v3-shadow/working-set.ts +88 -0
package/src/plugins/defaults/title-generate/hooks/stop.ts +75 -0
package/src/plugins/defaults/title-generate/hooks/user-prompt-submit.ts +35 -0
package/src/plugins/defaults/title-generate/package.json +15 -0
package/src/plugins/defaults/title-generate/register.ts +35 -0
package/src/plugins/defaults/tool-error/hooks/post-tool-use.ts +118 -0
package/src/plugins/defaults/tool-error/package.json +15 -0
package/src/plugins/defaults/tool-error/register.ts +23 -0
package/src/plugins/defaults/tool-result-truncate/hooks/post-tool-use.ts +32 -0
package/src/plugins/defaults/tool-result-truncate/package.json +15 -0
package/src/plugins/defaults/tool-result-truncate/register.ts +24 -0
package/src/plugins/defaults/tool-result-truncate/terminal.ts +132 -0
package/src/plugins/external-plugin-loader.ts +2 -2
package/src/plugins/pipeline.ts +8 -35
package/src/plugins/registry.ts +8 -25
package/src/plugins/types.ts +62 -721
package/src/plugins/user-loader.ts +4 -3
package/src/proactive-artifact/aux-message-injector.ts +4 -5
package/src/proactive-artifact/job.test.ts +28 -21
package/src/proactive-artifact/job.ts +3 -1
package/src/prompts/__tests__/system-prompt.test.ts +42 -0
package/src/prompts/sections.ts +20 -7
package/src/prompts/templates/BOOTSTRAP-ACTIVATION-RAIL.md +64 -0
package/src/prompts/templates/BOOTSTRAP-CONTENT-AUTOMATION.md +2 -2
package/src/prompts/templates/BOOTSTRAP.md +7 -3
package/src/prompts/templates/system-sections.ts +21 -0
package/src/providers/__tests__/retry-callsite.test.ts +25 -25
package/src/providers/__tests__/satellite-connection-routing.test.ts +7 -21
package/src/providers/anthropic/client.ts +61 -34
package/src/providers/call-site-routing.ts +1 -9
package/src/providers/gemini/client.ts +152 -34
package/src/providers/gemini/inline-media.ts +74 -0
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +112 -2
package/src/providers/openai/chat-completions-provider.ts +45 -4
package/src/providers/openai/responses-provider.ts +1 -4
package/src/providers/openrouter/client.ts +2 -6
package/src/providers/placeholder-sentinels.ts +35 -0
package/src/providers/provider-send-message.ts +6 -6
package/src/providers/ratelimit.ts +1 -9
package/src/providers/retry.ts +0 -5
package/src/providers/types.ts +11 -2
package/src/providers/usage-tracking.ts +1 -9
package/src/runtime/__tests__/agent-wake.test.ts +141 -32
package/src/runtime/__tests__/background-job-runner.test.ts +1 -3
package/src/runtime/__tests__/interactive-ui.test.ts +1 -1
package/src/runtime/agent-wake.ts +95 -23
package/src/runtime/assistant-event-hub.ts +38 -8
package/src/runtime/assistant-stream-state.ts +368 -0
package/src/runtime/auth/__tests__/guard-tests.test.ts +75 -109
package/src/runtime/auth/__tests__/route-policy.test.ts +153 -170
package/src/runtime/auth/route-policy.ts +42 -1079
package/src/runtime/background-job-runner.ts +1 -4
package/src/runtime/btw-sidechain.ts +3 -1
package/src/runtime/channel-approvals.ts +4 -15
package/src/runtime/channel-invite-transport.ts +5 -6
package/src/runtime/channel-readiness-service.ts +2 -5
package/src/runtime/channel-retry-sweep.ts +12 -16
package/src/runtime/http-router.ts +35 -43
package/src/runtime/http-types.ts +23 -71
package/src/runtime/interactive-ui.ts +1 -1
package/src/runtime/invite-instruction-generator.ts +3 -3
package/src/runtime/pending-interactions.ts +3 -2
package/src/runtime/routes/__tests__/acp-routes.test.ts +253 -55
package/src/runtime/routes/__tests__/avatar-state-routes.test.ts +565 -0
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +265 -2
package/src/runtime/routes/__tests__/content-source-routes.test.ts +4 -4
package/src/runtime/routes/__tests__/conversation-compaction-routes.test.ts +62 -32
package/src/runtime/routes/__tests__/conversation-list-routes.test.ts +237 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +31 -1
package/src/runtime/routes/__tests__/inference-provider-connection-routes.test.ts +13 -22
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +6 -2
package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +7 -2
package/src/runtime/routes/__tests__/sanity-routes.test.ts +6 -6
package/src/runtime/routes/__tests__/stt-routes.test.ts +3 -3
package/src/runtime/routes/__tests__/suggest-trust-rule-routes.test.ts +5 -2
package/src/runtime/routes/__tests__/surface-action-routes.test.ts +5 -4
package/src/runtime/routes/__tests__/surface-content-routes.test.ts +4 -1
package/src/runtime/routes/__tests__/tts-routes.test.ts +9 -5
package/src/runtime/routes/acp-routes.test.ts +186 -100
package/src/runtime/routes/acp-routes.ts +110 -35
package/src/runtime/routes/app-management-routes.ts +93 -131
package/src/runtime/routes/app-routes.ts +38 -20
package/src/runtime/routes/approval-routes.ts +17 -5
package/src/runtime/routes/attachment-routes.ts +51 -16
package/src/runtime/routes/audio-routes.ts +1 -0
package/src/runtime/routes/audit-routes.ts +5 -0
package/src/runtime/routes/auth-routes.ts +5 -0
package/src/runtime/routes/avatar-routes.ts +264 -59
package/src/runtime/routes/background-tool-routes.ts +9 -0
package/src/runtime/routes/background-wake-routes.ts +13 -3
package/src/runtime/routes/backup-routes.ts +45 -0
package/src/runtime/routes/bookmark-routes.ts +13 -0
package/src/runtime/routes/brain-graph-routes.ts +9 -0
package/src/runtime/routes/browser-routes.ts +6 -1
package/src/runtime/routes/browser-tabs-routes.ts +11 -10
package/src/runtime/routes/btw-routes.ts +34 -24
package/src/runtime/routes/cache-routes.ts +13 -0
package/src/runtime/routes/call-routes.ts +21 -10
package/src/runtime/routes/channel-availability-routes.ts +5 -1
package/src/runtime/routes/channel-readiness-routes.ts +37 -4
package/src/runtime/routes/channel-route-definitions.ts +21 -0
package/src/runtime/routes/channel-verification-routes.ts +21 -0
package/src/runtime/routes/chatgpt-subscription-auth-routes.ts +9 -2
package/src/runtime/routes/client-routes.ts +9 -0
package/src/runtime/routes/consolidation-routes.ts +133 -25
package/src/runtime/routes/contact-prompt-routes.ts +9 -0
package/src/runtime/routes/contact-routes.ts +90 -23
package/src/runtime/routes/content-source-routes.ts +5 -1
package/src/runtime/routes/conversation-analysis-routes.ts +5 -1
package/src/runtime/routes/conversation-attention-routes.ts +5 -0
package/src/runtime/routes/conversation-cli-routes.ts +54 -7
package/src/runtime/routes/conversation-compaction-routes.ts +54 -25
package/src/runtime/routes/conversation-list-routes.ts +81 -12
package/src/runtime/routes/conversation-management-routes.ts +57 -14
package/src/runtime/routes/conversation-query-routes.ts +90 -41
package/src/runtime/routes/conversation-routes.ts +446 -204
package/src/runtime/routes/conversation-starter-routes.ts +35 -20
package/src/runtime/routes/conversations-import-routes.ts +30 -8
package/src/runtime/routes/credential-prompt-routes.ts +5 -0
package/src/runtime/routes/credential-routes.ts +25 -6
package/src/runtime/routes/debug-bash-routes.ts +5 -0
package/src/runtime/routes/debug-routes.ts +11 -2
package/src/runtime/routes/defer-routes.ts +13 -0
package/src/runtime/routes/diagnostics-routes.ts +37 -46
package/src/runtime/routes/disk-pressure-routes.ts +17 -31
package/src/runtime/routes/document-comments-routes.ts +46 -27
package/src/runtime/routes/documents-routes.ts +25 -10
package/src/runtime/routes/domain-routes.ts +98 -51
package/src/runtime/routes/email-routes.ts +33 -0
package/src/runtime/routes/epoch-millis-range.ts +34 -0
package/src/runtime/routes/events-routes.ts +107 -8
package/src/runtime/routes/filing-routes.ts +9 -4
package/src/runtime/routes/gateway-log-routes.ts +31 -4
package/src/runtime/routes/global-search-routes.ts +53 -50
package/src/runtime/routes/group-routes.ts +21 -5
package/src/runtime/routes/guardian-action-routes.ts +9 -0
package/src/runtime/routes/guardian-approval-interception.ts +0 -31
package/src/runtime/routes/heartbeat-routes.ts +57 -21
package/src/runtime/routes/home-feed-routes.ts +23 -19
package/src/runtime/routes/home-state-routes.ts +8 -40
package/src/runtime/routes/host-app-control-routes.ts +6 -1
package/src/runtime/routes/host-bash-routes.ts +5 -0
package/src/runtime/routes/host-browser-routes.ts +13 -0
package/src/runtime/routes/host-cu-routes.ts +6 -1
package/src/runtime/routes/host-file-routes.ts +26 -6
package/src/runtime/routes/host-transfer-routes.ts +13 -2
package/src/runtime/routes/http-adapter.ts +1 -2
package/src/runtime/routes/identity-intro-cache.ts +28 -40
package/src/runtime/routes/identity-routes.ts +236 -20
package/src/runtime/routes/image-generation-routes.ts +45 -2
package/src/runtime/routes/inbound-message-handler.ts +16 -12
package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +0 -12
package/src/runtime/routes/inbound-stages/background-dispatch.ts +15 -19
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/inference-profile-session-routes.ts +13 -3
package/src/runtime/routes/inference-provider-connection-routes.ts +21 -5
package/src/runtime/routes/inference-send-routes.ts +11 -11
package/src/runtime/routes/integrations/a2a.ts +32 -7
package/src/runtime/routes/integrations/slack/__tests__/channel.test.ts +16 -0
package/src/runtime/routes/integrations/slack/channel.ts +23 -3
package/src/runtime/routes/integrations/slack/share.ts +36 -8
package/src/runtime/routes/integrations/telegram.ts +34 -9
package/src/runtime/routes/integrations/twilio.ts +77 -7
package/src/runtime/routes/integrations/vercel.ts +3 -3
package/src/runtime/routes/internal-oauth-routes.ts +5 -0
package/src/runtime/routes/internal-telemetry-routes.ts +88 -0
package/src/runtime/routes/internal-twilio-routes.ts +13 -0
package/src/runtime/routes/llm-call-sites-routes.ts +39 -4
package/src/runtime/routes/log-export-routes.ts +36 -10
package/src/runtime/routes/mcp-auth-routes.ts +25 -0
package/src/runtime/routes/memory-item-routes.ts +21 -10
package/src/runtime/routes/memory-v2-routes.ts +105 -44
package/src/runtime/routes/memory-v3-routes.ts +306 -408
package/src/runtime/routes/migration-rollback-routes.ts +5 -1
package/src/runtime/routes/migration-routes.ts +29 -0
package/src/runtime/routes/notification-routes.ts +17 -1
package/src/runtime/routes/oauth-apps.ts +99 -23
package/src/runtime/routes/oauth-commands-routes.ts +37 -14
package/src/runtime/routes/oauth-connect-routes.ts +9 -0
package/src/runtime/routes/oauth-lifecycle-routes.ts +5 -1
package/src/runtime/routes/oauth-providers.ts +79 -15
package/src/runtime/routes/platform-routes.ts +102 -5
package/src/runtime/routes/playground/__tests__/force-compact.test.ts +9 -6
package/src/runtime/routes/playground/__tests__/inject-failures.test.ts +37 -16
package/src/runtime/routes/playground/__tests__/reset-circuit.test.ts +7 -3
package/src/runtime/routes/playground/__tests__/state.test.ts +10 -3
package/src/runtime/routes/playground/force-compact.ts +2 -2
package/src/runtime/routes/playground/helpers.ts +1 -2
package/src/runtime/routes/playground/inject-failures.ts +13 -8
package/src/runtime/routes/playground/reset-circuit.ts +14 -9
package/src/runtime/routes/playground/seed-conversation.ts +1 -1
package/src/runtime/routes/playground/seeded-conversations.ts +3 -3
package/src/runtime/routes/playground/state.ts +4 -3
package/src/runtime/routes/plugins-routes.ts +22 -19
package/src/runtime/routes/profiler-routes.ts +17 -4
package/src/runtime/routes/ps-routes.ts +5 -0
package/src/runtime/routes/publish-routes.ts +13 -3
package/src/runtime/routes/question-routes.ts +5 -0
package/src/runtime/routes/recording-routes.ts +25 -12
package/src/runtime/routes/rename-conversation-routes.ts +10 -0
package/src/runtime/routes/sanity-routes.ts +9 -2
package/src/runtime/routes/schedule-routes.ts +288 -88
package/src/runtime/routes/secret-routes.ts +31 -6
package/src/runtime/routes/sequence-routes.ts +33 -0
package/src/runtime/routes/settings-routes.ts +65 -19
package/src/runtime/routes/skills-routes.ts +166 -73
package/src/runtime/routes/slack-channel-routes.ts +5 -0
package/src/runtime/routes/stt-routes.ts +13 -6
package/src/runtime/routes/subagents-routes.ts +24 -18
package/src/runtime/routes/suggest-trust-rule-routes.ts +7 -2
package/src/runtime/routes/surface-action-routes.ts +9 -0
package/src/runtime/routes/surface-content-routes.ts +10 -2
package/src/runtime/routes/surface-conversation-resolver.ts +4 -3
package/src/runtime/routes/task-routes.ts +37 -0
package/src/runtime/routes/telemetry-routes.ts +9 -0
package/src/runtime/routes/tool-call-confirmation-enrichment.test.ts +161 -0
package/src/runtime/routes/tool-call-confirmation-enrichment.ts +107 -0
package/src/runtime/routes/trace-event-routes.ts +42 -1
package/src/runtime/routes/trust-rules-routes.ts +31 -2
package/src/runtime/routes/tts-routes.ts +48 -6
package/src/runtime/routes/types.ts +83 -16
package/src/runtime/routes/ui-request-routes.ts +5 -0
package/src/runtime/routes/upgrade-broadcast-routes.ts +5 -0
package/src/runtime/routes/usage-routes.ts +118 -42
package/src/runtime/routes/user-routes-cli.ts +9 -0
package/src/runtime/routes/user-routes.ts +5 -1
package/src/runtime/routes/wake-conversation-routes.ts +5 -0
package/src/runtime/routes/watcher-routes.ts +21 -0
package/src/runtime/routes/webhook-routes.ts +50 -2
package/src/runtime/routes/wipe-conversation-routes.ts +5 -0
package/src/runtime/routes/work-items-routes.ts +49 -23
package/src/runtime/routes/workspace-commit-routes.ts +5 -0
package/src/runtime/routes/workspace-routes.test.ts +42 -0
package/src/runtime/routes/workspace-routes.ts +124 -9
package/src/runtime/services/__tests__/analyze-conversation.test.ts +8 -4
package/src/runtime/services/analyze-conversation.ts +5 -8
package/src/runtime/services/conversation-serializer.ts +24 -2
package/src/runtime/sync/resource-sync-events.ts +16 -2
package/src/runtime/sync/sync-publisher.ts +2 -2
package/src/schedule/run-script.ts +28 -3
package/src/schedule/schedule-store.ts +28 -1
package/src/schedule/schedule-usage-store.ts +83 -0
package/src/schedule/scheduler.ts +15 -6
package/src/signals/cancel.ts +2 -4
package/src/signals/user-message.ts +5 -8
package/src/skills/catalog-files.ts +4 -1
package/src/skills/catalog-install.ts +3 -0
package/src/skills/categories-cache.ts +118 -0
package/src/skills/clawhub-files.ts +1 -0
package/src/skills/skillssh-files.ts +1 -0
package/src/subagent/manager.ts +20 -11
package/src/telemetry/types.ts +55 -1
package/src/telemetry/usage-telemetry-reporter.test.ts +250 -4
package/src/telemetry/usage-telemetry-reporter.ts +88 -2
package/src/tools/acp/context.ts +20 -0
package/src/tools/acp/list-agents.test.ts +7 -1
package/src/tools/acp/spawn.test.ts +198 -93
package/src/tools/acp/spawn.ts +32 -70
package/src/tools/acp/steer.test.ts +105 -8
package/src/tools/acp/steer.ts +48 -17
package/src/tools/apps/definitions.ts +8 -4
package/src/tools/apps/executors.ts +13 -8
package/src/tools/ask-question/ask-question-tool.test.ts +120 -105
package/src/tools/ask-question/ask-question-tool.ts +85 -90
package/src/tools/computer-use/definitions.ts +28 -24
package/src/tools/credential-execution/make-authenticated-request.ts +56 -51
package/src/tools/credential-execution/manage-secure-command-tool.ts +2 -2
package/src/tools/credential-execution/run-authenticated-command.ts +82 -77
package/src/tools/credentials/vault.ts +112 -111
package/src/tools/execution-target.ts +1 -1
package/src/tools/execution-timeout.ts +3 -4
package/src/tools/executor.ts +1 -53
package/src/tools/filesystem/edit.ts +45 -42
package/src/tools/filesystem/list.ts +33 -30
package/src/tools/filesystem/read.ts +54 -35
package/src/tools/filesystem/write.ts +69 -32
package/src/tools/host-filesystem/edit.ts +44 -42
package/src/tools/host-filesystem/read.ts +49 -35
package/src/tools/host-filesystem/transfer.ts +121 -108
package/src/tools/host-filesystem/write.ts +33 -31
package/src/tools/host-terminal/host-shell.ts +50 -48
package/src/tools/memory/register.ts +23 -24
package/src/tools/network/__tests__/web-search-metadata.test.ts +7 -1
package/src/tools/network/__tests__/web-search.test.ts +11 -3
package/src/tools/network/web-fetch.ts +49 -46
package/src/tools/network/web-search-error.test.ts +248 -0
package/src/tools/network/web-search-error.ts +267 -0
package/src/tools/network/web-search.ts +223 -61
package/src/tools/registry.ts +39 -16
package/src/tools/schedule/create.ts +13 -0
package/src/tools/schedule/update.ts +16 -0
package/src/tools/shared/filesystem/audio-read.ts +122 -0
package/src/tools/shared/filesystem/image-read.ts +1 -1
package/src/tools/skills/execute.ts +34 -31
package/src/tools/skills/load.ts +29 -23
package/src/tools/subagent/notify-parent.ts +35 -32
package/src/tools/subagent/spawn.ts +2 -4
package/src/tools/system/avatar-generator.ts +13 -22
package/src/tools/system/request-permission.ts +30 -27
package/src/tools/terminal/safe-env.ts +10 -1
package/src/tools/terminal/shell.ts +190 -61
package/src/tools/tool-defaults.ts +20 -9
package/src/tools/tool-manifest.ts +4 -4
package/src/tools/types.ts +74 -23
package/src/tools/ui-surface/definitions.ts +99 -10
package/src/tts/__tests__/provider-catalog-consistency.test.ts +85 -1
package/src/tts/provider-catalog.ts +76 -1
package/src/usage/types.ts +10 -0
package/src/util/errors.ts +2 -2
package/src/util/map-limit.ts +27 -0
package/src/util/mutex.ts +47 -0
package/src/util/platform.ts +15 -12
package/src/work-items/work-item-runner.ts +7 -2
package/src/workspace/git-service.ts +1 -42
package/src/workspace/migrations/028-recover-conversations-from-disk-view.ts +7 -20
package/src/workspace/migrations/092-backfill-v3-leaves.ts +169 -0
package/src/workspace/migrations/093-backfill-leaf-ids.ts +144 -0
package/src/workspace/migrations/094-seed-avatar-manifest.ts +155 -0
package/src/workspace/migrations/095-bump-heartbeat-interval-30m-to-60m.ts +51 -0
package/src/workspace/migrations/096-reduce-quality-profile-effort.ts +72 -0
package/src/workspace/migrations/097-enable-adaptive-thinking-managed-profiles.ts +117 -0
package/src/workspace/migrations/__tests__/094-seed-avatar-manifest.test.ts +136 -0
package/src/workspace/migrations/__tests__/backfill-leaf-ids.test.ts +175 -0
package/src/workspace/migrations/__tests__/backfill-v3-leaves.test.ts +124 -0
package/src/workspace/migrations/registry.ts +12 -0
package/src/workspace/provider-commit-message-generator.ts +15 -17
package/tsconfig.json +4 -1
package/src/__tests__/bootstrap-turn-cleanup.test.ts +0 -44
package/src/__tests__/circuit-breaker-pipeline.test.ts +0 -405
package/src/__tests__/compaction-pipeline.test.ts +0 -210
package/src/__tests__/compaction-timeout-recovery.test.ts +0 -262
package/src/__tests__/empty-response-pipeline.test.ts +0 -301
package/src/__tests__/history-repair-pipeline.test.ts +0 -396
package/src/__tests__/llm-call-pipeline.test.ts +0 -281
package/src/__tests__/memory-retrieval-pipeline.test.ts +0 -418
package/src/__tests__/persistence-pipeline.test.ts +0 -514
package/src/__tests__/title-generate-pipeline.test.ts +0 -211
package/src/__tests__/token-estimate-pipeline.test.ts +0 -481
package/src/__tests__/tool-error-pipeline.test.ts +0 -241
package/src/__tests__/tool-execute-pipeline.test.ts +0 -417
package/src/__tests__/tool-result-truncate-pipeline.test.ts +0 -344
package/src/cli/commands/__tests__/memory-v3-render.test.ts +0 -340
package/src/cli/commands/memory-v3-render.ts +0 -491
package/src/daemon/bootstrap-turn-cleanup.ts +0 -45
package/src/daemon/message-types/disk-pressure.ts +0 -9
package/src/email/feature-gate.ts +0 -23
package/src/gallery/default-gallery.ts +0 -1359
package/src/gallery/gallery-manifest.ts +0 -28
package/src/memory/v3/__tests__/coactivation-store.test.ts +0 -422
package/src/memory/v3/__tests__/consolidation-job.test.ts +0 -466
package/src/memory/v3/__tests__/coretrieval-seed.test.ts +0 -270
package/src/memory/v3/__tests__/edge-learning-job.test.ts +0 -324
package/src/memory/v3/__tests__/edges.test.ts +0 -706
package/src/memory/v3/__tests__/filter.test.ts +0 -560
package/src/memory/v3/__tests__/gate.test.ts +0 -637
package/src/memory/v3/__tests__/index-composition.test.ts +0 -291
package/src/memory/v3/__tests__/loop.test.ts +0 -775
package/src/memory/v3/__tests__/retriever.test.ts +0 -226
package/src/memory/v3/__tests__/scouts.test.ts +0 -489
package/src/memory/v3/__tests__/shadow-diff.test.ts +0 -225
package/src/memory/v3/__tests__/shadow-middleware.test.ts +0 -398
package/src/memory/v3/__tests__/system-prompts.test.ts +0 -154
package/src/memory/v3/__tests__/traversal.test.ts +0 -508
package/src/memory/v3/__tests__/tree-index.test.ts +0 -280
package/src/memory/v3/__tests__/tree-store.test.ts +0 -529
package/src/memory/v3/__tests__/tree-walk.test.ts +0 -784
package/src/memory/v3/__tests__/validate.test.ts +0 -277
package/src/memory/v3/auto-edges.ts +0 -223
package/src/memory/v3/coactivation-store.ts +0 -124
package/src/memory/v3/consolidation-job.ts +0 -323
package/src/memory/v3/coretrieval-seed.ts +0 -240
package/src/memory/v3/edge-learning-job.ts +0 -160
package/src/memory/v3/edges.ts +0 -286
package/src/memory/v3/filter.ts +0 -286
package/src/memory/v3/gate.ts +0 -349
package/src/memory/v3/index-composition.ts +0 -126
package/src/memory/v3/llm-capture.ts +0 -46
package/src/memory/v3/loop.ts +0 -430
package/src/memory/v3/maintenance.ts +0 -144
package/src/memory/v3/prompt-context.ts +0 -33
package/src/memory/v3/prompts/consolidation.ts +0 -458
package/src/memory/v3/prompts/system-prompts.ts +0 -196
package/src/memory/v3/retriever.ts +0 -33
package/src/memory/v3/scouts.ts +0 -431
package/src/memory/v3/shadow-diff.ts +0 -287
package/src/memory/v3/shadow-middleware.ts +0 -347
package/src/memory/v3/traversal.ts +0 -211
package/src/memory/v3/tree-index.ts +0 -237
package/src/memory/v3/tree-store.ts +0 -394
package/src/memory/v3/tree-walk.ts +0 -356
package/src/memory/v3/types.ts +0 -65
package/src/memory/v3/validate.ts +0 -323
package/src/plugins/defaults/circuit-breaker.ts +0 -141
package/src/plugins/defaults/compaction.ts +0 -141
package/src/plugins/defaults/empty-response.ts +0 -124
package/src/plugins/defaults/history-repair.ts +0 -83
package/src/plugins/defaults/llm-call.ts +0 -77
package/src/plugins/defaults/memory-retrieval.ts +0 -219
package/src/plugins/defaults/overflow-reduce.ts +0 -185
package/src/plugins/defaults/persistence.ts +0 -146
package/src/plugins/defaults/title-generate.ts +0 -90
package/src/plugins/defaults/token-estimate.ts +0 -101
package/src/plugins/defaults/tool-error.ts +0 -119
package/src/plugins/defaults/tool-execute.ts +0 -87
package/src/plugins/defaults/tool-result-truncate.ts +0 -84
package/src/runtime/routes/__tests__/memory-v3-simulate-params.test.ts +0 -35
package/src/skills/category-inference.ts +0 -111

package/src/daemon/conversation-agent-loop.ts CHANGED Viewed

@@ -7,8 +7,6 @@
  * runAgentLoop method here via the AgentLoopConversationContext interface.
  */
-import { join } from "node:path";
 import { v4 as uuid } from "uuid";
 import { optimizeImageForTransport } from "../agent/image-optimize.js";
@@ -17,7 +15,7 @@ import type {
   AgentLoop,
   AgentLoopExitReason,
   CheckpointDecision,
-  CheckpointInfo,
+  MidLoopCompaction,
 } from "../agent/loop.js";
 import { createAssistantMessage } from "../agent/message-types.js";
 import type {
@@ -26,6 +24,7 @@ import type {
   TurnChannelContext,
   TurnInterfaceContext,
 } from "../channels/types.js";
+import { isAssistantFeatureFlagEnabled } from "../config/assistant-feature-flags.js";
 import {
   contextWindowConfigFromEffective,
   type EffectiveContextWindow,
@@ -45,10 +44,13 @@ import {
 } from "../context/post-turn-tool-result-truncation.js";
 import {
   estimatePromptTokens,
+  estimatePromptTokensWithTools,
   getCalibrationProviderKey,
 } from "../context/token-estimator.js";
-import type { ContextWindowManager } from "../context/window-manager.js";
-import { getDocumentsForConversation } from "../documents/document-store.js";
+import type {
+  ContextWindowCompactOptions,
+  ContextWindowManager,
+} from "../context/window-manager.js";
 import type { ToolProfiler } from "../events/tool-profiling-listener.js";
 import { writeRelationshipState } from "../home/relationship-state-writer.js";
 import {
@@ -56,9 +58,9 @@ import {
   setSentryConversationContext,
 } from "../instrument.js";
 import { commitAppTurnChanges } from "../memory/app-git-service.js";
-import { getApp, listAppFiles, resolveAppDir } from "../memory/app-store.js";
 import { enqueueAutoAnalysisOnCompaction } from "../memory/auto-analysis-enqueue.js";
 import {
+  addMessage,
   deleteMessageById,
   getConversation,
   getConversationOriginChannel,
@@ -67,86 +69,40 @@ import {
   getLastUserTimestampBefore,
   getMessageById,
   provenanceFromTrustContext,
-  setConversationHistoryStrippedAt,
-  setLastNotifiedInferenceProfile,
   updateConversationContextWindow,
   updateConversationSlackContextWatermark,
+  updateMessageMetadata,
 } from "../memory/conversation-crud.js";
 import { getResolvedConversationDirPath } from "../memory/conversation-directories.js";
 import { syncMessageToDisk } from "../memory/conversation-disk-view.js";
-import {
-  isReplaceableTitle,
-  queueRegenerateConversationTitle,
-} from "../memory/conversation-title-service.js";
+import { isReplaceableTitle } from "../memory/conversation-title-service.js";
 import { isBackgroundConversationType } from "../memory/conversation-types.js";
 import type { ConversationGraphMemory } from "../memory/graph/conversation-graph-memory.js";
 import {
   backfillMessageIdOnLogs,
   recordSyntheticAgentErrorMessageLog,
 } from "../memory/llm-request-log-store.js";
-import { recordMemoryRecallLog } from "../memory/memory-recall-log-store.js";
 import { enqueueMemoryRetrospectiveOnCompaction } from "../memory/memory-retrospective-enqueue.js";
-import { PKB_WORKSPACE_SCOPE } from "../memory/pkb/types.js";
-import type { QdrantSparseVector } from "../memory/qdrant-client.js";
-import {
-  readMemoryV2StaticContent,
-  shouldExposePersonalMemory,
-} from "../memory/v2/static-context.js";
 import type { PermissionPrompter } from "../permissions/prompter.js";
 import { HOOKS } from "../plugin-api/constants.js";
 import type { UserPromptSubmitContext } from "../plugin-api/types.js";
-import { defaultCompactionTerminal } from "../plugins/defaults/compaction.js";
-import { defaultHistoryRepairTerminal } from "../plugins/defaults/history-repair.js";
-import {
-  asDefaultGraphPayload,
-  type DefaultMemoryRetrievalDeps,
-  type GraphMemoryPayload,
-  runDefaultMemoryRetrieval,
-} from "../plugins/defaults/memory-retrieval.js";
-import { defaultPersistenceTerminal } from "../plugins/defaults/persistence.js";
-import { defaultTitleGenerateTerminal } from "../plugins/defaults/title-generate.js";
-import { defaultTokenEstimateTerminal } from "../plugins/defaults/token-estimate.js";
-import { DEFAULT_TIMEOUTS, runHook, runPipeline } from "../plugins/pipeline.js";
-import { getMiddlewaresFor } from "../plugins/registry.js";
-import type {
-  CircuitBreakerArgs,
-  CircuitBreakerResult,
-  CompactionArgs,
-  CompactionResult,
-  EstimateArgs,
-  EstimateResult,
-  HistoryRepairArgs,
-  HistoryRepairResult,
-  MemoryArgs,
-  MemoryResult,
-  OverflowReduceArgs,
-  OverflowReduceResult,
-  PersistAddResult,
-  PersistArgs,
-  PersistResult,
-  TurnContext as PluginTurnContext,
-} from "../plugins/types.js";
-import { PluginExecutionError, PluginTimeoutError } from "../plugins/types.js";
-import {
-  hasProactiveArtifactCompleted,
-  runProactiveArtifactJob,
-  tryClaimProactiveArtifactTrigger,
-} from "../proactive-artifact/index.js";
-import type {
-  ContentBlock,
-  Message,
-  ToolDefinition,
-} from "../providers/types.js";
+import { defaultCompact } from "../plugins/defaults/compaction/compact.js";
+import { deepRepairHistory } from "../plugins/defaults/history-repair/terminal.js";
+import postCompactReinject from "../plugins/defaults/memory-retrieval/hooks/post-compact.js";
+import userPromptSubmitMemoryRetrieval, {
+  type MemoryRetrievalHookContext,
+} from "../plugins/defaults/memory-retrieval/hooks/user-prompt-submit-temp.js";
+import { runHook } from "../plugins/pipeline.js";
+import type { TurnContext as PluginTurnContext } from "../plugins/types.js";
+import type { ContentBlock, Message } from "../providers/types.js";
 import type { Provider } from "../providers/types.js";
 import { resolveActorTrust } from "../runtime/actor-trust-resolver.js";
 import { broadcastMessage } from "../runtime/assistant-event-hub.js";
 import { DAEMON_INTERNAL_ASSISTANT_ID } from "../runtime/assistant-scope.js";
 import { publishConversationMessagesChanged } from "../runtime/sync/resource-sync-events.js";
-import { redactSecrets } from "../security/secret-scanner.js";
 import { getSubagentManager } from "../subagent/index.js";
 import type { UsageActor } from "../usage/actors.js";
 import { getLogger } from "../util/logger.js";
-import { getWorkspaceDir } from "../util/platform.js";
 import { timeAgo } from "../util/time.js";
 import { truncate } from "../util/truncate.js";
 import { getWorkspaceGitService } from "../workspace/git-service.js";
@@ -155,7 +111,6 @@ import {
   type AssistantAttachmentDraft,
   cleanAssistantContent,
 } from "./assistant-attachments.js";
-import { cleanupBootstrapAfterTurnThreshold } from "./bootstrap-turn-cleanup.js";
 import { resolveOverflowAction } from "./context-overflow-policy.js";
 import {
   createInitialReducerState,
@@ -166,6 +121,8 @@ import {
   createEventHandlerState,
   dispatchAgentEvent,
   type EventHandlerDeps,
+  finalizePendingToolResultRow,
+  markHistoryStrippedBestEffort,
 } from "./conversation-agent-loop-handlers.js";
 import {
   approveHostAttachmentRead,
@@ -181,7 +138,6 @@ import { raceWithTimeout } from "./conversation-media-retry.js";
 import type { MessageQueue } from "./conversation-queue-manager.js";
 import type { QueueDrainReason } from "./conversation-queue-manager.js";
 import type {
-  ActiveSurfaceContext,
   ChannelCapabilities,
   InboundActorContext,
   InjectionMode,
@@ -190,8 +146,6 @@ import {
   applyRuntimeInjections,
   buildSubagentStatusBlock,
   buildUnifiedTurnContextBlock,
-  findLastInjectedNowContent,
-  getPkbAutoInjectList,
   getSlackCompactionWatermarkForPrefix,
   inboundActorContextFromTrust,
   inboundActorContextFromTrustContext,
@@ -202,7 +156,6 @@ import {
 } from "./conversation-runtime-assembly.js";
 import type { SkillProjectionCache } from "./conversation-skill-tools.js";
 import { markSurfaceCompleted } from "./conversation-surfaces.js";
-import { resolveTrustClass } from "./conversation-tool-setup.js";
 import { recordUsage } from "./conversation-usage.js";
 import {
   formatTurnTimestamp,
@@ -210,47 +163,28 @@ import {
 } from "./date-context.js";
 import { getDiskPressureStatus } from "./disk-pressure-guard.js";
 import { classifyDiskPressureTurnPolicy } from "./disk-pressure-policy.js";
-import { deepRepairHistory } from "./history-repair.js";
 import type {
-  DynamicPageSurfaceData,
   ServerMessage,
   SurfaceData,
   SurfaceType,
   UsageStats,
 } from "./message-protocol.js";
-import type { MemoryRecalled } from "./message-types/memory.js";
 import type { ConfirmationStateChanged } from "./message-types/messages.js";
-import { conversationMetadataSyncTag } from "./message-types/sync.js";
+import {
+  type OverflowReduceArgs,
+  runOverflowReductionLoop,
+} from "./overflow-reduction-loop.js";
 import { parseActualTokensFromError } from "./parse-actual-tokens-from-error.js";
+import {
+  persistUnsendableImageDowngrades,
+  UNSENDABLE_IMAGE_NOTE,
+} from "./persist-unsendable-image.js";
 import type { TraceEmitter } from "./trace-emitter.js";
-import type { TrustContext } from "./trust-context.js";
+import { resolveTrustClass, type TrustContext } from "./trust-context.js";
 import { stripHistoricalWebSearchResults } from "./web-search-history.js";
 const log = getLogger("conversation-agent-loop");
-/**
- * Best-effort persistence of the history-stripped marker after an
- * injection-strip event (compaction / overflow recovery). The marker is a
- * durability hint, not turn-critical state — a transient SQLite write failure
- * (SQLITE_BUSY, disk-full, read-only FS) must not abort the turn. Logs a
- * warning and continues on failure, preserving the long-standing non-fatal
- * contract for this metadata write.
- */
-function markHistoryStrippedBestEffort(
-  conversationId: string,
-  strippedAt: number,
-  logger: ReturnType<typeof getLogger>,
-): void {
-  try {
-    setConversationHistoryStrippedAt(conversationId, strippedAt);
-  } catch (err) {
-    logger.warn(
-      { err },
-      "Failed to persist history-stripped marker after compaction strip (non-fatal)",
-    );
-  }
-}
 const DISK_PRESSURE_ERROR_CODE = "DISK_SPACE_CRITICAL" as const;
 const DISK_PRESSURE_ERROR_CATEGORY = "disk_pressure";
@@ -276,163 +210,15 @@ function formatDiskPressureBlockedMessage(): string {
   return "Storage is critically low, so background processes are paused and remote messages are ignored until the guardian frees enough space. Remote senders should try again later.";
 }
-// ── Compaction circuit-breaker pipeline helpers ─────────────────────
-//
-// The circuit-breaker behavior (3 consecutive summary-LLM failures trips a
-// 1-hour cooldown) is now implemented by the `circuitBreaker` plugin
-// pipeline. The default plugin (`plugins/defaults/circuit-breaker.ts`)
-// replicates the legacy threshold/cooldown constants and event-emission
-// semantics exactly — it operates on the `consecutiveCompactionFailures` /
-// `compactionCircuitOpenUntil` fields the conversation still owns so the
-// dev-only playground routes (`POST /playground/reset-compaction-circuit`,
-// `POST /playground/inject-compaction-failures`) continue to read and
-// mutate those fields directly.
-//
-// The helpers below build the pipeline inputs and invoke the runner. They
-// are the sole entry points the rest of the daemon uses to query or update
-// the compaction circuit.
-/** Circuit-breaker key for a specific conversation's compaction pipeline. */
-function compactionCircuitKey(conversationId: string): string {
-  return `compaction:${conversationId}`;
-}
-/**
- * Build the minimal {@link TurnContext} the pipeline runner requires. Called
- * both from inside the agent loop (where turn identifiers are available) and
- * from non-turn invocations like `Conversation.forceCompact` (which falls
- * back to stable placeholders so the runner's log records still carry the
- * conversation identifier).
- */
-function buildCircuitTurnContext(ctx: {
-  readonly conversationId: string;
-  currentRequestId?: string;
-  currentTurnTrustContext?: TrustContext;
-  trustContext?: TrustContext;
-  turnCount: number;
-}): PluginTurnContext {
-  const trust: TrustContext =
-    ctx.currentTurnTrustContext ?? ctx.trustContext ?? FALLBACK_TURN_TRUST;
-  return {
-    requestId: ctx.currentRequestId ?? "circuit-breaker",
-    conversationId: ctx.conversationId,
-    turnIndex: ctx.turnCount,
-    trust,
-  };
-}
-/**
- * Run the `circuitBreaker` pipeline for the compaction circuit on this
- * conversation. When `outcome` is provided, state is updated (and transition
- * events emit via `onEvent`); when omitted the call is query-only.
- *
- * Returns the post-call decision from the pipeline. Callers gate auto-paths
- * on `!result.open` and admit forced paths regardless of the decision.
- */
-async function runCompactionCircuitPipeline(
-  ctx: {
-    readonly conversationId: string;
-    consecutiveCompactionFailures: number;
-    compactionCircuitOpenUntil: number | null;
-    currentRequestId?: string;
-    currentTurnTrustContext?: TrustContext;
-    trustContext?: TrustContext;
-    turnCount: number;
-  },
-  args: {
-    outcome?: "success" | "failure";
-    onEvent?: (msg: ServerMessage) => void;
-  },
-): Promise<CircuitBreakerResult> {
-  const turnContext = buildCircuitTurnContext(ctx);
-  return runPipeline<CircuitBreakerArgs, CircuitBreakerResult>(
-    "circuitBreaker",
-    getMiddlewaresFor("circuitBreaker"),
-    async (terminalArgs) => {
-      // No plugin in the chain produced a decision. This should be
-      // unreachable in production because the default plugin registers a
-      // `circuitBreaker` middleware that always returns a decision, but we
-      // defensively derive the state here so test setups that intentionally
-      // omit the default plugin still get a sensible response.
-      const openUntil = terminalArgs.state.compactionCircuitOpenUntil;
-      const now = Date.now();
-      if (openUntil !== null && now < openUntil) {
-        return { open: true, cooldownRemainingMs: openUntil - now };
-      }
-      return { open: false };
-    },
-    {
-      key: compactionCircuitKey(ctx.conversationId),
-      // Pass the ctx directly as the mutable state container. The
-      // `CircuitBreakerArgs.state` shape deliberately matches the subset of
-      // fields the conversation owns so plugins mutate the same object the
-      // playground routes read and write.
-      state: ctx,
-      ...(args.outcome !== undefined ? { outcome: args.outcome } : {}),
-      ...(args.onEvent ? { onEvent: args.onEvent } : {}),
-    },
-    turnContext,
-    DEFAULT_TIMEOUTS.circuitBreaker,
-  );
-}
-/**
- * Query-only: is the compaction circuit breaker currently open for this
- * conversation? Thin wrapper around {@link runCompactionCircuitPipeline}
- * with no outcome. Async because the pipeline runner is async, but the
- * default plugin resolves synchronously on its microtask.
- */
-async function isCompactionCircuitOpen(ctx: {
-  readonly conversationId: string;
-  consecutiveCompactionFailures: number;
-  compactionCircuitOpenUntil: number | null;
-  currentRequestId?: string;
-  currentTurnTrustContext?: TrustContext;
-  trustContext?: TrustContext;
-  turnCount: number;
-}): Promise<boolean> {
-  const decision = await runCompactionCircuitPipeline(ctx, {});
-  return decision.open;
-}
-/**
- * Update the compaction circuit breaker with the outcome of a `maybeCompact`
- * call and emit any transition event. A `summaryFailed` value of `undefined`
- * means the summary LLM never ran (early return) — callers must guard with
- * `summaryFailed !== undefined` before invoking this helper so early-return
- * paths don't silently reset the 3-strike counter.
- *
- * The default plugin handles threshold-based tripping and cooldown reset;
- * see `plugins/defaults/circuit-breaker.ts` for the canonical semantics.
- */
-export async function trackCompactionOutcome(
-  ctx: {
-    readonly conversationId: string;
-    consecutiveCompactionFailures: number;
-    compactionCircuitOpenUntil: number | null;
-    currentRequestId?: string;
-    currentTurnTrustContext?: TrustContext;
-    trustContext?: TrustContext;
-    turnCount: number;
-  },
-  summaryFailed: boolean,
-  onEvent: (msg: ServerMessage) => void,
-): Promise<void> {
-  await runCompactionCircuitPipeline(ctx, {
-    outcome: summaryFailed ? "failure" : "success",
-    onEvent,
-  });
-}
 // ── Plugin pipeline helpers ──────────────────────────────────────────
 //
 // Canonical {@link PluginTurnContext} builder threaded into every
-// `runPipeline` call inside `runAgentLoopImpl`. The orchestrator composes
+// `runHook` call inside `runAgentLoopImpl`. The orchestrator composes
 // the context on demand at each call site from ambient state rather than
 // carrying a persistent `TurnContext` instance across the turn.
 /**
- * Synthetic fallback trust context used when the orchestrator fires a pipeline
+ * Synthetic fallback trust context used when the orchestrator fires a hook
  * before the per-turn trust snapshot has been captured (e.g. invocations that
  * bypass `processMessage` / `drainQueue`). We bias to `unknown` rather than
  * `guardian` so a missing snapshot cannot accidentally grant elevated trust
@@ -444,14 +230,14 @@ const FALLBACK_TURN_TRUST: TrustContext = {
 };
 /**
- * Build the {@link TurnContext} passed to {@link runPipeline}.
+ * Build the {@link TurnContext} passed to {@link runHook}.
  *
- * Canonical source of truth for every pipeline call site inside the agent
- * loop. Every `runPipeline` invocation in `runAgentLoopImpl` (and in the
+ * Canonical source of truth for every hook call site inside the agent
+ * loop. Every `runHook` invocation in `runAgentLoopImpl` (and in the
  * handlers that share its ambient state) must route through this helper
  * rather than constructing a `TurnContext` literal inline — this keeps
  * `turnIndex`, trust resolution, and the `contextWindowManager` attachment
- * consistent across pipeline slots, which in turn keeps structured logs
+ * consistent across hooks, which in turn keeps structured logs
  * filtered by `conversationId`/`turnIndex` coherent across slots.
  *
  * Behavior:
@@ -463,9 +249,9 @@ const FALLBACK_TURN_TRUST: TrustContext = {
  *   level context, then {@link FALLBACK_TURN_TRUST}. The cascade matches
  *   the one inside the orchestrator's inline injection assembly so
  *   middleware reads the same trust class the runtime sees.
- * - `contextWindowManager` is attached unconditionally. Pipelines that
- *   don't need it can ignore it; the default compaction plugin reads it
- *   via the typed optional field on `TurnContext`.
+ * - `contextWindowManager` is attached unconditionally. Hooks that
+ *   don't need it can ignore it; it remains available via the typed
+ *   optional field on `TurnContext`.
  */
 function buildPluginTurnContext(
   ctx: AgentLoopConversationContext,
@@ -479,17 +265,62 @@ function buildPluginTurnContext(
     turnIndex: ctx.turnCount,
     trust,
     contextWindowManager: ctx.contextWindowManager,
+    callSite: ctx.currentCallSite,
   };
 }
+/**
+ * Trust class of the actor whose turn is in progress, for the compactor's
+ * image manifest filter. Prefers the turn-start snapshot
+ * ({@link AgentLoopConversationContext.currentTurnTrustContext}) over the live
+ * trust context so compaction running in a later tool iteration can't pick up
+ * a concurrent request's actor.
+ */
+function resolveTurnActorTrustClass(
+  ctx: AgentLoopConversationContext,
+): TrustContext["trustClass"] | undefined {
+  return (ctx.currentTurnTrustContext ?? ctx.trustContext)?.trustClass;
+}
 // ── Context Interface ────────────────────────────────────────────────
+/**
+ * Per-surface entry tracked on the current turn. Inline shape kept stable so
+ * routes and persistence helpers can consume it via a named import instead of
+ * `infer`-extracting from {@link AgentLoopConversationContext}.
+ */
+export interface AssistantSurface {
+  surfaceId: string;
+  surfaceType: SurfaceType;
+  title?: string;
+  data: SurfaceData;
+  actions?: Array<{
+    id: string;
+    label: string;
+    style?: string;
+    data?: Record<string, unknown>;
+  }>;
+  display?: string;
+  persistent?: boolean;
+  /** Id of the tool call that produced this surface (the `ui_show` proxy tool). Persisted so app previews can gate on the tool result's arrival rather than whole-turn streaming state. */
+  toolCallId?: string;
+}
 export interface AgentLoopConversationContext {
   readonly conversationId: string;
   messages: Message[];
-  processing: boolean;
+  isProcessing(): boolean;
+  setProcessing(value: boolean): void;
   abortController: AbortController | null;
   currentRequestId?: string;
+  /**
+   * The {@link LLMCallSite} of the in-flight turn, set at turn start from
+   * `options?.callSite ?? "mainAgent"`. Read by {@link buildPluginTurnContext}
+   * so pipeline/injector plugins can tell the main reply apart from
+   * background agent-loop work (compaction, subagents, …) on this same
+   * conversation. Per-turn mutable, mirroring {@link currentRequestId}.
+   */
+  currentCallSite?: LLMCallSite;
   readonly agentLoop: AgentLoop;
   readonly provider: Provider;
@@ -507,10 +338,6 @@ export interface AgentLoopConversationContext {
    * happened just before this turn).
    */
   pendingPostCompactReinject: boolean;
-  /** Tracks consecutive compaction failures (summary LLM call threw). */
-  consecutiveCompactionFailures: number;
-  /** Timestamp (ms since epoch) until which the circuit breaker is open. */
-  compactionCircuitOpenUntil: number | null;
   readonly graphMemory: ConversationGraphMemory;
@@ -533,24 +360,9 @@ export interface AgentLoopConversationContext {
   pendingSurfaceActions: Map<string, { surfaceType: SurfaceType }>;
   surfaceActionRequestIds: Set<string>;
   approvedViaPromptThisTurn?: boolean;
-  currentTurnSurfaces: Array<{
-    surfaceId: string;
-    surfaceType: SurfaceType;
-    title?: string;
-    data: SurfaceData;
-    actions?: Array<{
-      id: string;
-      label: string;
-      style?: string;
-      data?: Record<string, unknown>;
-    }>;
-    display?: string;
-    persistent?: boolean;
-  }>;
+  currentTurnSurfaces: AssistantSurface[];
   workingDir: string;
-  workspaceTopLevelContext: string | null;
-  workspaceTopLevelDirty: boolean;
   channelCapabilities?: ChannelCapabilities;
   /** Per-turn snapshot of trustContext, frozen at message-processing start. */
   currentTurnTrustContext?: TrustContext;
@@ -624,9 +436,11 @@ export interface AgentLoopConversationContext {
       | "message_complete"
       | "generation_cancelled"
       | "error_terminal",
-    anchor?: "assistant_turn" | "user_turn" | "global",
-    requestId?: string,
-    statusText?: string,
+    options?: {
+      anchor?: "assistant_turn" | "user_turn" | "global";
+      requestId?: string;
+      statusText?: string;
+    },
   ): void;
   emitConfirmationStateChanged(
     params: ConfirmationStateChanged extends {
@@ -644,14 +458,12 @@ export interface AgentLoopConversationContext {
   onConfirmationOutcome?: (
     requestId: string,
     state: string,
-    toolName?: string,
     toolUseId?: string,
   ) => void;
   getWorkspaceGitService?: (workspaceDir: string) => GitServiceInitializer;
   commitTurnChanges?: typeof commitTurnChanges;
-  refreshWorkspaceTopLevelContextIfNeeded(): void;
   markWorkspaceTopLevelDirty(): void;
   getQueueDepth(): number;
   hasQueuedMessages(): boolean;
@@ -712,6 +524,13 @@ export async function runAgentLoopImpl(
   });
   let yieldedForHandoff = false;
   let yieldedForBudget = false;
+  // Whether the most recent agent-loop run produced at least one new assistant
+  // message — the loop's own forward-progress signal, used by the ordering
+  // retry gate and the overflow convergence fold.
+  let lastRunAppendedNewMessages = false;
+  // The messages the most recent agent-loop run appended on top of its base —
+  // the loop's own new-output boundary, persisted as this turn's new messages.
+  let lastRunNewMessages: Message[] = [];
   let pendingCheckpointYield: "budget" | "handoff" | null = null;
   // Captured when the auto_compress_latest_turn rerun yields at the mid-loop
   // budget checkpoint. SSE emission happens immediately at the detection site;
@@ -730,6 +549,9 @@ export async function runAgentLoopImpl(
   // `resolveCallSiteConfig`, picking up any user overrides under
   // `llm.callSites.mainAgent` (falling back to `llm.default` when absent).
   const turnCallSite: LLMCallSite = options?.callSite ?? "mainAgent";
+  // Expose the turn's call site to plugin pipeline/injector contexts (read by
+  // buildPluginTurnContext) so plugins can scope behaviour to the main reply.
+  ctx.currentCallSite = turnCallSite;
   // Read the conversation row once for both the override-profile derivation
   // below and the title-replaceability check at turn start. Later reads in
@@ -859,6 +681,25 @@ export async function runAgentLoopImpl(
       preflightBudget: Math.floor(providerMaxTokens * (1 - safetyMargin)),
     };
   };
+  /**
+   * The agent loop's window into the orchestrator's current effective
+   * context window. The loop reads `maxInputTokens` for tool-result
+   * truncation and `overflowRecovery` for its mid-loop budget gate, applying
+   * the long-history safety-margin bump itself off its own running history.
+   * Resolved fresh on each access so a mid-turn profile change is reflected.
+   */
+  const resolveContextWindow = (): {
+    maxInputTokens: number;
+    overflowRecovery: { enabled: boolean; safetyMarginRatio: number };
+  } => {
+    refreshCurrentProfileState();
+    const { enabled, safetyMarginRatio } =
+      currentEffectiveContextWindow.overflowRecovery;
+    return {
+      maxInputTokens: currentEffectiveContextWindow.maxInputTokens,
+      overflowRecovery: { enabled, safetyMarginRatio },
+    };
+  };
   // Initial value for `createToolExecutor` to read into
   // `ToolContext.overrideProfile`. `resolveCurrentOverrideProfile` refreshes
@@ -924,10 +765,6 @@ export async function runAgentLoopImpl(
         : null,
     },
   );
-  const diskPressureContext =
-    diskPressureDecision.action === "allow-cleanup-mode"
-      ? { cleanupModeActive: true }
-      : null;
   ctx.diskPressureCleanupModeActive =
     diskPressureDecision.action === "allow-cleanup-mode";
@@ -968,7 +805,10 @@ export async function runAgentLoopImpl(
         { reason: diskPressureDecision.reason },
         "Blocked turn during disk pressure cleanup mode",
       );
-      ctx.emitActivityState("idle", "error_terminal", "global", reqId);
+      ctx.emitActivityState("idle", "error_terminal", {
+        anchor: "global",
+        requestId: reqId,
+      });
       ctx.traceEmitter.emit("request_error", message, {
         requestId: reqId,
         status: "error",
@@ -1027,55 +867,6 @@ export async function runAgentLoopImpl(
       }
     }
-    // Generate title early — the user message alone is sufficient context.
-    // Firing before the main LLM call removes the delay of waiting for the
-    // full assistant response. The second-pass regeneration at turn 3 will
-    // refine the title with more context.
-    // No abort signal — title generation should complete even if the user
-    // cancels the response, since the user message is already persisted.
-    // Deferred via setTimeout so the main agent loop LLM call enqueues
-    // first, avoiding rate-limit slot contention on strict configs.
-    if (isReplaceableTitle(turnStartConversation?.title ?? null)) {
-      // TurnContext routed through the canonical builder so the pipeline's
-      // log record reports the same `conversationId`/`turnIndex` shape as
-      // every other slot in this turn. Title generation does not depend on
-      // the context-window manager attached by the builder, but sharing the
-      // builder keeps the invariant enforced in one place.
-      const titlePipelineCtx = buildPluginTurnContext(ctx, reqId);
-      const titleArgs = {
-        conversationId: ctx.conversationId,
-        provider: ctx.provider,
-        userMessage: options?.titleText ?? content,
-        onTitleUpdated: (title: string) => {
-          onEvent({
-            type: "conversation_title_updated",
-            conversationId: ctx.conversationId,
-            title,
-          });
-          onEvent({
-            type: "sync_changed",
-            tags: [conversationMetadataSyncTag(ctx.conversationId)],
-          });
-        },
-      };
-      setTimeout(() => {
-        runPipeline(
-          "titleGenerate",
-          getMiddlewaresFor("titleGenerate"),
-          defaultTitleGenerateTerminal,
-          titleArgs,
-          titlePipelineCtx,
-          DEFAULT_TIMEOUTS.titleGenerate,
-        ).catch((err) => {
-          // Fire-and-forget — keep previous non-propagating semantics.
-          // queueGenerateConversationTitle already swallows internal
-          // errors; this catch covers pipeline-layer errors (timeouts,
-          // middleware throws) without surfacing them to the agent loop.
-          rlog.warn({ err }, "titleGenerate pipeline failed (non-fatal)");
-        });
-      }, 0);
-    }
     const isFirstMessage = ctx.messages.length === 1;
     // Promote a pending post-compaction re-inject signal (e.g. from `/compact`)
     // into `compactedThisTurn` so NOW.md / PKB / v2 static blocks land on this
@@ -1083,7 +874,6 @@ export async function runAgentLoopImpl(
     // so this fires exactly once per `/compact` event.
     const consumedPostCompactReinject = ctx.pendingPostCompactReinject;
     ctx.pendingPostCompactReinject = false;
-    let shouldInjectWorkspace = isFirstMessage || consumedPostCompactReinject;
     let compactedThisTurn = consumedPostCompactReinject;
     let slackCompactedThisTurn = false;
     const isSlackConversation = ctx.channelCapabilities?.channel === "slack";
@@ -1220,74 +1010,42 @@ export async function runAgentLoopImpl(
     );
     // Skip auto-compaction while the circuit breaker is open. Force paths
     // and user-initiated /compact bypass this check.
-    const autoCompactAllowed = !(await isCompactionCircuitOpen(ctx));
+    const autoCompactAllowed =
+      !(await ctx.agentLoop.compactionCircuit.isOpen());
     if (compactCheck.needed && autoCompactAllowed) {
-      ctx.emitActivityState(
-        "thinking",
-        "context_compacting",
-        "assistant_turn",
-        reqId,
-      );
+      ctx.emitActivityState("thinking", "context_compacting", {
+        requestId: reqId,
+      });
     }
-    const compactionOptions = {
-      lastCompactedAt: ctx.contextCompactedAt ?? undefined,
-      precomputedEstimate: compactCheck.estimatedTokens,
-      conversationOriginChannel:
-        getConversationOriginChannel(ctx.conversationId) ?? undefined,
-      overrideProfile: resolveCurrentOverrideProfile() ?? null,
-    };
     let compacted: Awaited<
       ReturnType<typeof ctx.contextWindowManager.maybeCompact>
     > | null = null;
     if (autoCompactAllowed) {
-      try {
-        compacted = (await runPipeline<CompactionArgs, CompactionResult>(
-          "compaction",
-          getMiddlewaresFor("compaction"),
-          (args) =>
-            defaultCompactionTerminal(args, buildPluginTurnContext(ctx, reqId)),
-          {
-            messages: messagesForStartOfTurnCompaction,
-            signal: abortController.signal,
-            options: compactionOptions,
-          },
-          buildPluginTurnContext(ctx, reqId),
-          DEFAULT_TIMEOUTS.compaction,
-        )) as Awaited<ReturnType<typeof ctx.contextWindowManager.maybeCompact>>;
-      } catch (err) {
-        if (err instanceof PluginTimeoutError) {
-          // Pipeline exceeded its budget. Record the failure so the circuit
-          // breaker tracks consecutive timeouts (it trips after three),
-          // then degrade gracefully by skipping compaction this turn —
-          // the turn proceeds with the un-compacted history rather than
-          // hard-failing. The inner summary call has been aborted by the
-          // runner's signal-linking, so updateSummary's local fallback
-          // also ran before this catch block is reached.
-          rlog.warn(
-            { err, phase: "start-of-turn-compaction" },
-            "Compaction pipeline timed out — skipping compaction this turn",
-          );
-          await trackCompactionOutcome(ctx, true, onEvent);
-          compacted = null;
-        } else {
-          throw err;
-        }
-      }
+      compacted = await defaultCompact({
+        manager: ctx.contextWindowManager,
+        messages: messagesForStartOfTurnCompaction,
+        signal: abortController.signal,
+        precomputedEstimate: compactCheck.estimatedTokens,
+        overrideProfile: resolveCurrentOverrideProfile() ?? null,
+        actorTrustClass: resolveTurnActorTrustClass(ctx),
+      });
     }
     // Only track circuit-breaker state when a summary LLM call actually ran.
     // `summaryFailed` is `undefined` on early returns (compaction disabled,
-    // below threshold, cooldown active, no eligible messages, truncation-only
+    // below threshold, no eligible messages, truncation-only
     // path) — treating those as "successful" compactions would silently reset
     // the 3-strike counter and break the invariant.
     if (compacted && compacted.summaryFailed !== undefined) {
-      await trackCompactionOutcome(ctx, compacted.summaryFailed, onEvent);
+      await ctx.agentLoop.compactionCircuit.recordOutcome(
+        compacted.summaryFailed,
+        onEvent,
+      );
     }
     if (compacted?.compacted) {
       await applySuccessfulCompaction(
         compacted,
         messagesForStartOfTurnCompaction,
       );
-      shouldInjectWorkspace = true;
       if (compacted.compactedPersistedMessages > 0) {
         compactedThisTurn = true;
       }
@@ -1295,12 +1053,7 @@ export async function runAgentLoopImpl(
     // Register confirmation outcome tracker so the agent loop can link
     // confirmation decisions to tool_use_ids for persistence.
-    ctx.onConfirmationOutcome = (
-      requestId,
-      confirmationState,
-      toolName,
-      toolUseId,
-    ) => {
+    ctx.onConfirmationOutcome = (requestId, confirmationState, toolUseId) => {
       if (confirmationState === "pending") {
         // Use the toolUseId passed from the prompter (which knows which tool
         // requested confirmation) instead of the ambient state.currentToolUseId,
@@ -1317,7 +1070,7 @@ export async function runAgentLoopImpl(
         const resolvedId =
           state.requestIdToToolUseId.get(requestId) ?? toolUseId;
         if (resolvedId) {
-          const name = state.toolUseIdToName.get(resolvedId) ?? toolName ?? "";
+          const name = state.toolUseIdToName.get(resolvedId) ?? "";
           // Build a friendly label from the tool name
           const label =
             TOOL_FRIENDLY_LABEL[name] ??
@@ -1330,213 +1083,10 @@ export async function runAgentLoopImpl(
       }
     };
-    let runMessages = ctx.messages;
-    // Memory retrieval pipeline — fetches PKB, NOW.md, and memory-graph
-    // outputs through a single `memoryRetrieval` pipeline. Plugins may
-    // replace the terminal behavior by registering a middleware that
-    // short-circuits with its own `MemoryResult`; the default terminal
-    // below runs `runDefaultMemoryRetrieval` which reproduces the prior
-    // in-lined behavior (PKB/NOW reads + gated graph call).
-    const isTrustedActor = resolveTrustClass(ctx.trustContext) === "guardian";
-    // Canonical builder — pulls trust from per-turn snapshot, then
-    // conversation-level, then the synthetic fallback. Memory retrieval
-    // does not need the context-window handle the builder attaches, but
-    // keeping every call site on one helper is load-bearing for log
-    // coherence across pipeline slots.
-    const memoryPluginTurnCtx = buildPluginTurnContext(ctx, reqId);
-    const memoryArgs: MemoryArgs = {
-      conversationId: ctx.conversationId,
-      trustContext: ctx.trustContext,
-      turnIndex: ctx.turnCount,
-      // Pass the abort signal via `args` (not `deps`) so the pipeline
-      // runner's `linkAbortSignal` can swap it for a signal linked to the
-      // pipeline's internal controller — on a plugin-set timeout or
-      // external cancel, the linked signal aborts and `prepareMemory`
-      // stops mutating graph state / emitting events after the pipeline
-      // has already errored.
-      signal: abortController.signal,
-    };
-    const memoryDeps: DefaultMemoryRetrievalDeps = {
-      messages: ctx.messages,
-      graphMemory: ctx.graphMemory,
-      config: getConfig(),
-      onEvent,
-      isTrustedActor,
-    };
-    const memoryResult: MemoryResult = await runPipeline(
-      "memoryRetrieval",
-      getMiddlewaresFor("memoryRetrieval"),
-      (args) => runDefaultMemoryRetrieval(args, memoryDeps),
-      memoryArgs,
-      memoryPluginTurnCtx,
-      DEFAULT_TIMEOUTS.memoryRetrieval,
-    );
-    // Consume the memory-graph block when the default retriever emitted
-    // one. Custom plugins that substitute their own blocks without the
-    // default discriminator are expected to handle their own side effects
-    // (event emission, metric persistence) inside their middleware; this
-    // block short-circuits to the original no-op behavior in that case.
-    const defaultGraphPayload: GraphMemoryPayload | null =
-      asDefaultGraphPayload(memoryResult.memoryGraphBlocks);
-    let pkbQueryVector: number[] | undefined;
-    let pkbSparseVector: QdrantSparseVector | undefined;
-    if (defaultGraphPayload) {
-      const graphResult = defaultGraphPayload.result;
-      runMessages = graphResult.runMessages;
-      // Select dense+sparse as a matched pair so RRF fusion combines two
-      // signals aligned to the same query text:
-      //   1. Context-load with a user query: user-query dense + user-query
-      //      sparse — the cleanest pairing.
-      //   2. Otherwise (context-load without a user query, or per-turn):
-      //      whatever `queryVector` / `sparseVector` the retriever produced,
-      //      which are themselves co-aligned (both summary-derived in
-      //      context-load, both user-last-message-derived in per-turn).
-      // Never pair a user-query dense with a summary-aligned sparse.
-      if (graphResult.userQueryVector) {
-        pkbQueryVector = graphResult.userQueryVector;
-        pkbSparseVector = graphResult.userQuerySparseVector;
-      } else {
-        pkbQueryVector = graphResult.queryVector;
-        pkbSparseVector = graphResult.sparseVector;
-      }
-      // Persist the injected block text in message metadata so it survives
-      // conversation reloads (eviction, restart, fork). loadFromDb re-injects
-      // from metadata. Routed through the `persistence` pipeline so plugins
-      // can observe or override metadata updates alongside add/delete.
-      if (graphResult.injectedBlockText) {
-        try {
-          await runPipeline<PersistArgs, PersistResult>(
-            "persistence",
-            getMiddlewaresFor("persistence"),
-            defaultPersistenceTerminal,
-            {
-              op: "update",
-              messageId: userMessageId,
-              updates: {
-                memoryInjectedBlock: graphResult.injectedBlockText,
-              },
-            },
-            buildPluginTurnContext(ctx, reqId),
-            DEFAULT_TIMEOUTS.persistence,
-          );
-        } catch (err) {
-          rlog.warn(
-            { err },
-            "Failed to persist memory injection to metadata (non-fatal)",
-          );
-        }
-      }
-      const m = graphResult.metrics;
-      try {
-        recordMemoryRecallLog({
-          conversationId: ctx.conversationId,
-          enabled: true,
-          degraded: false,
-          provider: m?.embeddingProvider ?? undefined,
-          model: m?.embeddingModel ?? undefined,
-          semanticHits: m?.semanticHits ?? 0,
-          mergedCount: m?.mergedCount ?? 0,
-          selectedCount: m?.selectedCount ?? 0,
-          tier1Count: m?.tier1Count ?? 0,
-          tier2Count: m?.tier2Count ?? 0,
-          hybridSearchLatencyMs: m?.hybridSearchLatencyMs ?? 0,
-          sparseVectorUsed: m?.sparseVectorUsed ?? false,
-          injectedTokens: graphResult.injectedTokens,
-          latencyMs: graphResult.latencyMs,
-          topCandidatesJson: (m?.topCandidates ?? []).map((c) => ({
-            key: c.nodeId,
-            type: c.type,
-            kind: "graph",
-            finalScore: c.score,
-            semantic: c.semanticSimilarity,
-            recency: c.recencyBoost,
-          })),
-          injectedText: graphResult.injectedBlockText ?? undefined,
-          reason: `graph:${graphResult.mode}`,
-          queryContext: m?.queryContext ?? undefined,
-        });
-      } catch (err) {
-        log.warn({ err }, "Failed to persist memory recall log (non-fatal)");
-      }
-      if (m) {
-        const memoryRecalledEvent: MemoryRecalled = {
-          type: "memory_recalled",
-          provider: m.embeddingProvider ?? "unknown",
-          model: m.embeddingModel ?? "unknown",
-          semanticHits: m.semanticHits,
-          mergedCount: m.mergedCount,
-          selectedCount: m.selectedCount,
-          tier1Count: m.tier1Count,
-          tier2Count: m.tier2Count,
-          hybridSearchLatencyMs: m.hybridSearchLatencyMs,
-          sparseVectorUsed: m.sparseVectorUsed,
-          injectedTokens: graphResult.injectedTokens,
-          latencyMs: graphResult.latencyMs,
-          topCandidates: m.topCandidates.map((c) => ({
-            key: c.nodeId,
-            type: c.type,
-            kind: "graph",
-            finalScore: c.score,
-            semantic: c.semanticSimilarity,
-            recency: c.recencyBoost,
-          })),
-        };
-        onEvent(memoryRecalledEvent);
-      }
-    }
-    // Build active surface context
-    let activeSurface: ActiveSurfaceContext | null = null;
-    if (ctx.currentActiveSurfaceId) {
-      const stored = ctx.surfaceState.get(ctx.currentActiveSurfaceId);
-      if (stored && stored.surfaceType === "dynamic_page") {
-        const data = stored.data as DynamicPageSurfaceData;
-        activeSurface = {
-          surfaceId: ctx.currentActiveSurfaceId,
-          html: data.html,
-          currentPage: ctx.currentPage,
-        };
-        if (data.appId) {
-          const app = getApp(data.appId);
-          if (app) {
-            activeSurface.appId = app.id;
-            activeSurface.appName = app.name;
-            activeSurface.appDirName = resolveAppDir(app.id).dirName;
-            activeSurface.appSchemaJson = app.schemaJson;
-            activeSurface.appFiles = listAppFiles(app.id);
-            if (app.pages && Object.keys(app.pages).length > 0) {
-              activeSurface.appPages = app.pages;
-            }
-          }
-        }
-      }
-    }
-    // Query active documents for this conversation so the injector chain
-    // can surface them to the assistant (prevents duplicate document_create
-    // calls when existing documents should be targeted with document_update).
-    const conversationDocs = getDocumentsForConversation(ctx.conversationId);
-    const activeDocuments =
-      conversationDocs.length > 0
-        ? conversationDocs.map((d) => ({
-            surfaceId: d.surfaceId,
-            title: d.title,
-            wordCount: d.wordCount,
-            updatedAt: d.updatedAt,
-          }))
-        : null;
-    ctx.refreshWorkspaceTopLevelContextIfNeeded();
-    // Compute fresh turn timestamp for date grounding.
-    // Absolute "now" is always anchored to assistant host clock, while local
-    // date semantics prefer configured user timezone, then device timezones.
+    // Resolve the turn's timezone cascade up front. It depends only on config
+    // and the inbound request — never on retrieval output — so it can be
+    // settled before context assembly. Local date semantics prefer the
+    // configured user timezone, then device timezones, then the host clock.
     const hostTimeZone = Intl.DateTimeFormat().resolvedOptions().timeZone;
     const timezoneContext = resolveTurnTimezoneContext({
       configuredUserTimeZone: config.ui.userTimezone ?? null,
@@ -1544,9 +1094,6 @@ export async function runAgentLoopImpl(
       detectedTimezone: config.ui.detectedTimezone ?? null,
       hostTimeZone,
     });
-    const timestamp = formatTurnTimestamp({
-      timeZone: timezoneContext.effectiveTimezone,
-    });
     // Resolve the inbound actor context for the unified <turn_context> block.
     // When the conversation carries enough identity info, use the unified
@@ -1570,8 +1117,10 @@ export async function runAgentLoopImpl(
       }
     }
-    // Build unified turn context block that replaces the separate temporal,
-    // channel, interface, and actor context blocks.
+    // Resolve the channel/interface labels and the guardian flag for this
+    // turn. These derive only from the captured turn context and the resolved
+    // actor trust class — never from retrieval — so they settle before context
+    // assembly.
     const interfaceName =
       capturedTurnInterfaceContext.userMessageInterface ?? undefined;
     const channelName =
@@ -1616,9 +1165,54 @@ export async function runAgentLoopImpl(
       });
       const label = profileEntry?.label ?? effectiveProfileKey;
       modelProfileStr = resolved.model ? `${label} (${resolved.model})` : label;
-      setLastNotifiedInferenceProfile(ctx.conversationId, effectiveProfileKey);
+      // Record the notification for persistence on delivery rather than here:
+      // the model only "learns" the profile once it receives this turn
+      // context, signalled by the first `message_complete`. Persisting inline
+      // would mark the profile notified even if the turn is cancelled or fails
+      // before the model ever sees the notice.
+      state.pendingNotifiedInferenceProfile = effectiveProfileKey;
     }
+    // Memory retrieval — fetches PKB, NOW.md, and memory-graph outputs and
+    // persists the retrieval's own side effects (injected-block metadata,
+    // recall log, `memory_recalled` event). Runs at the early "prompt
+    // submitted, before context assembly" moment because its outputs feed the
+    // injection and overflow-reduction transforms below. It is shaped as the
+    // `user-prompt-submit-temp` hook handler but invoked directly for now: it
+    // must run early, while the canonical late `user-prompt-submit` hook
+    // (history repair, title) runs after those transforms, so the two cannot
+    // share a fire site until compaction is cleared from the gap between them.
+    const isTrustedActor = resolveTrustClass(ctx.trustContext) === "guardian";
+    const memoryCtx: MemoryRetrievalHookContext = {
+      graphMemory: ctx.graphMemory,
+      config: getConfig(),
+      onEvent,
+      isTrustedActor,
+      conversationId: ctx.conversationId,
+      userMessageId,
+      logger: rlog,
+      // An external cancel aborts `prepareMemory` instead of letting it run
+      // to completion after the turn has already been torn down.
+      signal: abortController.signal,
+      latestMessages: ctx.messages,
+    };
+    await userPromptSubmitMemoryRetrieval(memoryCtx);
+    // The retriever owns its side effects (injected-block metadata, recall
+    // log, `memory_recalled` event) and records the dense/sparse PKB query
+    // pair on the graph handle for the PKB-reminder injector to read back; the
+    // loop only reuses the injected message list downstream.
+    let runMessages = memoryCtx.latestMessages;
+    // Capture wall-clock "now" at its point of use, after the blocking memory
+    // retrieval, so the injected `<turn_context>` timestamp reflects current
+    // time rather than the moment the turn began.
+    const timestamp = formatTurnTimestamp({
+      timeZone: timezoneContext.effectiveTimezone,
+    });
+    // Build unified turn context block that replaces the separate temporal,
+    // channel, interface, and actor context blocks.
     const baseTurnContext = {
       timestamp,
       interfaceName,
@@ -1640,64 +1234,6 @@ export async function runAgentLoopImpl(
     // The `remember` tool handles scratchpad-style memory writes directly to the graph.
-    // Personal-memory trust gate: PKB, NOW.md, and v2 static blocks all
-    // hold private user content. Block exposure to non-guardian actors
-    // arriving over a remote channel; internal/local flows pass through.
-    // See `shouldExposePersonalMemory` for the threat model.
-    const personalMemoryAllowed = shouldExposePersonalMemory({
-      sourceChannel: ctx.trustContext?.sourceChannel,
-      isTrustedActor,
-    });
-    // Inject NOW.md and PKB content only on the first turn (or after
-    // compaction re-strips them).  Old injections persist in history and
-    // are never stripped on normal turns — this preserves the cached prefix.
-    // PKB/NOW content is sourced from the `memoryRetrieval` pipeline above
-    // so plugins can override either source without touching the agent loop.
-    // NOW.md injection can be disabled via `memory.retrieval.scratchpadInjection.enabled`.
-    const scratchpadInjectionEnabled =
-      getConfig().memory.retrieval.scratchpadInjection.enabled;
-    const currentNowContent =
-      personalMemoryAllowed && scratchpadInjectionEnabled
-        ? memoryResult.nowContent
-        : null;
-    const shouldInjectNowAndPkb = isFirstMessage || compactedThisTurn;
-    const nowScratchpad = shouldInjectNowAndPkb ? currentNowContent : null;
-    const currentPkbContent = personalMemoryAllowed
-      ? memoryResult.pkbContent
-      : null;
-    const pkbContext = shouldInjectNowAndPkb ? currentPkbContent : null;
-    const pkbActive = currentPkbContent !== null;
-    // V2 static memory block (essentials/threads/recent/buffer).
-    // `currentMemoryV2Static` is the trust-gated content reused by every
-    // re-injection path — it stays non-null on non-full-mode turns so
-    // that mid-turn reducer compaction (which strips the prior `<info>`
-    // block) can restore the freshest content. `memoryV2Static` is the
-    // first-turn / post-compaction cadence-gated value for initial
-    // injection only. `readMemoryV2StaticContent` self-gates on the v2
-    // flag + config and returns null when v2 is off.
-    const currentMemoryV2Static = personalMemoryAllowed
-      ? readMemoryV2StaticContent()
-      : null;
-    const memoryV2Static = shouldInjectNowAndPkb ? currentMemoryV2Static : null;
-    // PKB relevance-hint inputs. Resolved once per turn and reused across
-    // re-injections so post-compaction rebuilds pick up fresh hints against
-    // the updated conversation history.
-    const pkbRoot = pkbActive ? join(getWorkspaceDir(), "pkb") : undefined;
-    const pkbAutoInjectList = pkbRoot
-      ? getPkbAutoInjectList(pkbRoot)
-      : undefined;
-    // Pass `ctx` directly — `PkbContextConversation` is structural and
-    // `getInContextPkbPaths` re-reads `conversation.messages` on each call,
-    // so post-compaction re-injects see the updated history.
-    const pkbConversation = pkbActive ? ctx : undefined;
-    // PKB points live under a single workspace sentinel scope.
-    // See `PKB_WORKSPACE_SCOPE` for why.
-    const pkbScopeId = pkbActive ? PKB_WORKSPACE_SCOPE : undefined;
     // Subagent status injection — gives the parent LLM visibility into active/completed children.
     // Skipped when this conversation IS a subagent (no nesting) or has no children.
     const subagentStatusBlock = ctx.isSubagent
@@ -1752,36 +1288,23 @@ export async function runAgentLoopImpl(
         )
       : null;
-    // Guards the chronological-transcript override on re-injection after
-    // the reducer compacts `ctx.messages`. The captured transcript is the
-    // full persisted history; blindly replaying it on every re-inject would
-    // overwrite the reducer's compacted messages and undo compaction. Flip
-    // to `true` after any compaction so subsequent re-injections fall back
-    // to the reduced `ctx.messages`.
-    let reducerCompacted = compactedThisTurn;
+    state.reducerCompacted = compactedThisTurn;
+    // memory-v3-live: when on, the provider anchors its long-TTL cache
+    // breakpoint on the most recent STABLE user message, since the latest user
+    // message now carries the volatile per-turn `<memory>` block the v3
+    // injector emits. The matching v2-suppression strip is owned by
+    // `applyRuntimeInjections`, which reads the same flag itself. Flag off →
+    // bit-for-bit identical to today's v2 path.
+    const memoryV3Live = isAssistantFeatureFlagEnabled(
+      "memory-v3-live",
+      getConfig(),
+    );
     // Shared injection options — reused whenever we need to re-inject after reduction.
     const injectionOpts = {
-      diskPressureContext,
-      activeSurface,
-      activeDocuments,
-      workspaceTopLevelContext: shouldInjectWorkspace
-        ? ctx.workspaceTopLevelContext
-        : null,
-      channelCapabilities: ctx.channelCapabilities ?? null,
       channelCommandContext: ctx.commandIntent ?? null,
       unifiedTurnContext: unifiedTurnContextStr,
-      pkbContext,
-      pkbActive,
-      pkbQueryVector,
-      pkbSparseVector,
-      pkbScopeId,
-      pkbConversation,
-      pkbAutoInjectList,
-      pkbRoot,
-      pkbWorkingDir: pkbActive ? ctx.workingDir : undefined,
-      memoryV2Static,
-      nowScratchpad,
       voiceCallControlPrompt: ctx.voiceCallControlPrompt ?? null,
       transportHints: ctx.transportHints ?? null,
       isNonInteractive: !isInteractiveResolved,
@@ -1803,7 +1326,7 @@ export async function runAgentLoopImpl(
     const injection = await applyRuntimeInjections(runMessages, {
       ...injectionOpts,
-      slackChronologicalMessages: reducerCompacted
+      slackChronologicalMessages: state.reducerCompacted
         ? null
         : injectionOpts.slackChronologicalMessages,
       mode: currentInjectionMode,
@@ -1849,18 +1372,7 @@ export async function runAgentLoopImpl(
           metadataUpdates.memoryV2StaticBlock =
             injection.blocks.memoryV2StaticBlock;
         }
-        await runPipeline<PersistArgs, PersistResult>(
-          "persistence",
-          getMiddlewaresFor("persistence"),
-          defaultPersistenceTerminal,
-          {
-            op: "update",
-            messageId: userMessageId,
-            updates: metadataUpdates,
-          },
-          buildPluginTurnContext(ctx, reqId),
-          DEFAULT_TIMEOUTS.persistence,
-        );
+        updateMessageMetadata(userMessageId, metadataUpdates);
       } catch (err) {
         rlog.warn({ err }, "Failed to persist injection metadata (non-fatal)");
       }
@@ -1876,51 +1388,18 @@ export async function runAgentLoopImpl(
     let reducerState: ReducerState | undefined;
     const toolTokenBudget = ctx.agentLoop.getToolTokenBudget(runMessages);
-    // Canonical calibration key — passed to the `tokenEstimate` pipeline for
-    // every preflight/mid-loop estimate, the overflow reducer config, and the
-    // convergence-path `estimatePromptTokens` call. Matches the key recorded
-    // by `handleUsage` for wrapper providers (OpenRouter routing to
-    // Anthropic → key is `"anthropic"`).
+    // Canonical calibration key — used by the preflight estimate, the
+    // overflow reducer config, and the convergence-path `estimatePromptTokens`
+    // call. Matches the key recorded by `handleUsage` for wrapper providers
+    // (OpenRouter routing to Anthropic → key is `"anthropic"`).
     const estimationProviderName = getCalibrationProviderKey(ctx.provider);
-    // Shared `TurnContext` for every `tokenEstimate` pipeline invocation in
-    // this turn. The pipeline is the extension point for plugins that want
-    // to substitute an alternate estimator (e.g. provider-native tokenization)
-    // without touching orchestrator code.
-    //
-    // Routed through the canonical builder — `turnIndex` is `ctx.turnCount`,
-    // trust cascades through per-turn/conversation-level/fallback, and the
-    // context-window handle rides along so any middleware that wants to
-    // reuse the manager (e.g. to compute compaction-aware estimates) can.
-    const pipelineTurnCtx = buildPluginTurnContext(ctx, reqId);
-    const runTokenEstimatePipeline = (
-      history: Message[],
-    ): Promise<EstimateResult> =>
-      runPipeline<EstimateArgs, EstimateResult>(
-        "tokenEstimate",
-        getMiddlewaresFor("tokenEstimate"),
-        defaultTokenEstimateTerminal,
-        {
-          // Shallow-frozen copies so a misbehaving middleware that mutates
-          // `args.history` or `args.tools` in place (e.g. trims the array
-          // before calling next) can't silently strip prompt context from
-          // the orchestrator's live `runMessages` / resolved-tools arrays.
-          // TypeScript `readonly` on `EstimateArgs` does not prevent
-          // `push`/`splice` at runtime; the frozen wrapper throws in strict
-          // mode and isolates any mutation attempts from the call-site state.
-          history: Object.freeze([...history]) as Message[],
-          systemPrompt: ctx.systemPrompt,
-          tools: Object.freeze([
-            ...ctx.agentLoop.getResolvedTools(history),
-          ]) as ToolDefinition[],
-          providerName: estimationProviderName,
-        },
-        pipelineTurnCtx,
-        DEFAULT_TIMEOUTS.tokenEstimate,
-      );
-    const preflightTokens = await runTokenEstimatePipeline(runMessages);
+    const preflightTokens = estimatePromptTokensWithTools(
+      runMessages,
+      ctx.systemPrompt,
+      ctx.agentLoop.getResolvedTools(runMessages),
+      estimationProviderName,
+    );
     if (overflowRecovery.enabled && preflightTokens > preflightBudget) {
       rlog.warn(
@@ -1932,16 +1411,12 @@ export async function runAgentLoopImpl(
         "Preflight budget exceeded — running overflow reducer before provider call",
       );
-      // Overflow reduction runs through the plugin pipeline. The default
-      // middleware (`default-overflow-reduce`, registered at bootstrap)
-      // contains the historical tier loop — forced compaction → tool-result
-      // truncation → media stubbing → injection downgrade — plus the
-      // re-inject/re-estimate convergence check. The callbacks below are
-      // the orchestrator-specific side effects that the plugin coordinates
-      // per iteration (activity emission, compaction application, runtime
-      // injection reassembly, token re-estimation). Registered plugins that
-      // wrap the `overflowReduce` slot see each iteration through their own
-      // middleware `next` callback.
+      // `runOverflowReductionLoop` drives the tier loop — forced compaction →
+      // tool-result truncation → media stubbing → injection downgrade — plus
+      // the re-inject/re-estimate convergence check. The callbacks below are
+      // the orchestrator-specific side effects it coordinates per iteration
+      // (activity emission, compaction application, runtime injection
+      // reassembly, token re-estimation).
       const messagesForPreflightOverflowReduction =
         slackChronologicalContext?.messages ?? ctx.messages;
       const overflowArgs: OverflowReduceArgs = {
@@ -1955,75 +1430,23 @@ export async function runAgentLoopImpl(
         maxAttempts: resolveCurrentContextBudget().overflowRecovery.maxAttempts,
         abortSignal: abortController.signal,
         compactFn: async (msgs, signal, opts) => {
-          // Route the reducer's forced-compaction tier through the
-          // `compaction` pipeline so registered plugins observe these
-          // invocations. Without this, custom compaction middleware only
-          // sees the three orchestrator-owned call sites and misses the
-          // reducer-initiated forced compactions entirely.
-          //
-          // Pipeline timeouts must be caught locally — a `PluginTimeoutError`
-          // bubbling out of here would abort the overflow-reducer tier loop
-          // entirely, skipping fallback tiers (tool-result truncation, media
-          // stubbing, injection downgrade) and bypassing circuit-breaker
-          // bookkeeping. On timeout, record the failure and return a
-          // `compacted: false` result so the reducer falls through to the
-          // next tier.
-          try {
-            return (await runPipeline<CompactionArgs, CompactionResult>(
-              "compaction",
-              getMiddlewaresFor("compaction"),
-              (args) =>
-                defaultCompactionTerminal(
-                  args,
-                  buildPluginTurnContext(ctx, reqId),
-                ),
-              {
-                messages: msgs,
-                signal,
-                options: {
-                  ...(opts ?? {}),
-                  overrideProfile: resolveCurrentOverrideProfile() ?? null,
-                },
-              },
-              buildPluginTurnContext(ctx, reqId),
-              DEFAULT_TIMEOUTS.compaction,
-            )) as Awaited<
-              ReturnType<typeof ctx.contextWindowManager.maybeCompact>
-            >;
-          } catch (err) {
-            if (err instanceof PluginTimeoutError) {
-              rlog.warn(
-                { err, phase: "overflow-reducer-forced-compaction" },
-                "Compaction pipeline timed out — falling through to next reducer tier",
-              );
-              await trackCompactionOutcome(ctx, true, onEvent);
-              return {
-                messages: msgs,
-                compacted: false,
-                previousEstimatedInputTokens: 0,
-                estimatedInputTokens: 0,
-                maxInputTokens: 0,
-                thresholdTokens: 0,
-                compactedMessages: 0,
-                compactedPersistedMessages: 0,
-                summaryCalls: 0,
-                summaryInputTokens: 0,
-                summaryOutputTokens: 0,
-                summaryModel: "",
-                summaryText: "",
-                reason: "compaction pipeline timed out",
-              };
-            }
-            throw err;
-          }
+          // Delegate the reducer's forced-compaction tier to the default
+          // compaction plugin, overlaying the turn's resolved inference
+          // profile and actor trust class onto the reducer-supplied options.
+          const reducerOptions = (opts ?? {}) as ContextWindowCompactOptions;
+          return defaultCompact({
+            manager: ctx.contextWindowManager,
+            messages: msgs,
+            signal,
+            ...reducerOptions,
+            overrideProfile: resolveCurrentOverrideProfile() ?? null,
+            actorTrustClass: resolveTurnActorTrustClass(ctx),
+          });
         },
         emitActivityState: () => {
-          ctx.emitActivityState(
-            "thinking",
-            "context_compacting",
-            "assistant_turn",
-            reqId,
-          );
+          ctx.emitActivityState("thinking", "context_compacting", {
+            requestId: reqId,
+          });
         },
         onCompactionResult: async (result, compactedBasis) => {
           // Track circuit-breaker state whenever the reducer invoked
@@ -2036,11 +1459,13 @@ export async function runAgentLoopImpl(
           // truncation-only path, etc.) that shouldn't influence the
           // breaker.
           if (result.summaryFailed !== undefined) {
-            await trackCompactionOutcome(ctx, result.summaryFailed, onEvent);
+            await ctx.agentLoop.compactionCircuit.recordOutcome(
+              result.summaryFailed,
+              onEvent,
+            );
           }
           if (result.compacted) {
             await applySuccessfulCompaction(result, compactedBasis);
-            shouldInjectWorkspace = true;
           }
         },
         reinjectForMode: async (
@@ -2051,27 +1476,25 @@ export async function runAgentLoopImpl(
         ) => {
           // Mirror the pre-PR-23 behavior: `ctx.messages` must track the
           // reducer's latest output before re-injection runs, because other
-          // sites consulted through `injectionOpts` (`workspaceTopLevelContext`,
-          // slack history, etc.) depend on it and `applyCompactionResult`
-          // only updates `ctx.messages` on a compaction tier. Assigning here
+          // sites consulted through `injectionOpts` (slack history, etc.) and
+          // the injectors' own message-presence scans depend on it, and
+          // `applyCompactionResult` only updates `ctx.messages` on a
+          // compaction tier. Assigning here
           // keeps non-compaction tiers (tool-result truncation, media
           // stubbing, injection downgrade) observable to downstream
           // injection assembly on the same turn.
           ctx.messages = reducedMessages;
-          // When THIS iteration compacted, it stripped existing NOW.md /
-          // PKB blocks — so we re-inject current content. A later iteration
-          // that only truncates or downgrades must NOT re-force PKB/NOW,
+          // When THIS iteration compacted, it stripped the existing
+          // memory-static block — so we re-inject current content. A later
+          // iteration that only truncates or downgrades must NOT re-force it,
           // or each round would grow the token count.
           // Gate: only the iteration that actually compacted re-injects.
+          // (The `<knowledge_base>`, NOW.md, and v2 static `<info>` blocks
+          // self-gate inside their injectors on whether they are already
+          // present in `reducedMessages`.)
           const injection = await applyRuntimeInjections(reducedMessages, {
             ...injectionOpts,
-            ...(stepCompacted && { pkbContext: currentPkbContent }),
-            ...(stepCompacted && { memoryV2Static: currentMemoryV2Static }),
-            ...(stepCompacted && { nowScratchpad: currentNowContent }),
-            workspaceTopLevelContext: shouldInjectWorkspace
-              ? ctx.workspaceTopLevelContext
-              : null,
             // Once ANY iteration has compacted `ctx.messages`, the captured
             // `slackChronologicalMessages` snapshot (built from the full
             // persisted transcript) would overwrite the compacted history
@@ -2097,86 +1520,14 @@ export async function runAgentLoopImpl(
           }),
       };
-      const overflowResult = await runPipeline<
-        OverflowReduceArgs,
-        OverflowReduceResult
-      >(
-        "overflowReduce",
-        getMiddlewaresFor("overflowReduce"),
-        // Terminal — only reached when every registered middleware calls
-        // `next` and delegates past the innermost layer. The default plugin
-        // is a terminal itself (it doesn't call `next`), so in practice
-        // this fallback fires only when the default has been explicitly
-        // deregistered (tests) and no user plugin replaces it. Strict-fail
-        // semantics: throw so the missing terminal surfaces as a visible
-        // error instead of silently returning the history untouched.
-        async () => {
-          throw new PluginExecutionError(
-            "overflowReduce pipeline has no terminal handler — every reducer middleware called next() without providing a replacement",
-            "overflowReduce",
-          );
-        },
-        overflowArgs,
-        buildPluginTurnContext(ctx, reqId),
-        DEFAULT_TIMEOUTS.overflowReduce,
-      );
+      const overflowResult = await runOverflowReductionLoop(overflowArgs);
       ctx.messages = overflowResult.messages;
       runMessages = overflowResult.runMessages;
       currentInjectionMode = overflowResult.injectionMode;
       reducerState = overflowResult.reducerState;
       if (overflowResult.reducerCompacted) {
-        reducerCompacted = true;
-      }
-    }
-    // Pre-run repair — routed through the `historyRepair` plugin pipeline so
-    // plugins can observe or override repair behavior. The default plugin's
-    // middleware is a passthrough; the actual repair runs in the terminal
-    // (`defaultHistoryRepairTerminal`).
-    let preRepairMessages = runMessages;
-    let preRunRepair: HistoryRepairResult | null = null;
-    try {
-      preRunRepair = await runPipeline<HistoryRepairArgs, HistoryRepairResult>(
-        "historyRepair",
-        getMiddlewaresFor("historyRepair"),
-        async (args) => defaultHistoryRepairTerminal(args),
-        { history: runMessages, provider: ctx.provider.name },
-        buildPluginTurnContext(ctx, reqId),
-        DEFAULT_TIMEOUTS.historyRepair,
-      );
-    } catch (err) {
-      if (err instanceof PluginTimeoutError) {
-        // Pipeline exceeded its budget — likely a misbehaving third-party
-        // middleware. Degrade gracefully by proceeding with the un-repaired
-        // history rather than turn-fatal-erroring; un-repaired history is
-        // strictly better than no turn at all, and the provider call itself
-        // will still error visibly if the drift is unrecoverable.
-        rlog.warn(
-          { err, phase: "pre_run" },
-          "historyRepair pipeline timed out — proceeding with un-repaired history",
-        );
-      } else {
-        throw err;
-      }
-    }
-    if (preRunRepair !== null) {
-      // Always adopt the pipeline's output history — a user `historyRepair`
-      // middleware may rewrite `messages` (e.g. provider-specific
-      // normalization) without incrementing any of the built-in repair
-      // counters. Gating the assignment on `stats` would silently discard
-      // those edits and send the un-rewritten history to the provider.
-      runMessages = preRunRepair.messages;
-      if (
-        preRunRepair.stats.assistantToolResultsMigrated > 0 ||
-        preRunRepair.stats.missingToolResultsInserted > 0 ||
-        preRunRepair.stats.orphanToolResultsDowngraded > 0 ||
-        preRunRepair.stats.consecutiveSameRoleMerged > 0
-      ) {
-        rlog.warn(
-          { phase: "pre_run", ...preRunRepair.stats },
-          "Repaired runtime history before provider call",
-        );
+        state.reducerCompacted = true;
       }
     }
@@ -2195,22 +1546,22 @@ export async function runAgentLoopImpl(
     }
     // user-prompt-submit hook: plugins may transform `runMessages` right
-    // before the agent loop receives them. Fires once per user turn at
-    // the primary `agentLoop.run` only — the re-entry / retry calls
-    // further down in this function do not refire it (they're not new
-    // user submissions). Plugins may mutate `ctx.latestMessages` in place
-    // OR return a new context with a fresh array; `runHook` forwards
-    // whichever the chain settles on. Order is plugin registration order.
+    // before the agent loop receives them. Fires once per user turn at the
+    // primary `agentLoop.run` only — the re-entry / retry calls further down
+    // in this function do not refire it (they're not new user submissions).
+    // Plugins may mutate `ctx.latestMessages` in place OR return a new
+    // context with a fresh array; `runHook` forwards whichever the chain
+    // settles on. Order is plugin registration order.
     //
-    // Fires BEFORE `preRunHistoryLength` is captured so the boundary
-    // between pre-existing and hook-emitted messages — consumed by the
-    // ordering-error retry gate, the post-run reconcile loop, and the
-    // new-message extraction for persistence — reflects exactly what
-    // `agentLoop.run` receives.
+    // Fires BEFORE the agent loop runs so the hook-emitted messages are part
+    // of the loop's input; the loop then reports its own appended output via
+    // `AgentLoopRunResult.newMessages`, which is what persistence consumes.
     const userPromptCtx: UserPromptSubmitContext = {
       conversationId: ctx.conversationId,
+      prompt: options?.titleText ?? content,
       originalMessages: ctx.messages,
       latestMessages: runMessages,
+      logger: rlog,
     };
     const finalUserPromptCtx = await runHook(
       HOOKS.USER_PROMPT_SUBMIT,
@@ -2218,8 +1569,6 @@ export async function runAgentLoopImpl(
     );
     runMessages = finalUserPromptCtx.latestMessages;
-    let preRunHistoryLength = runMessages.length;
     const shouldGenerateTitle = isReplaceableTitle(
       getConversation(ctx.conversationId)?.title ?? null,
     );
@@ -2233,42 +1582,18 @@ export async function runAgentLoopImpl(
       rlog,
       turnChannelContext: capturedTurnChannelContext,
       turnInterfaceContext: capturedTurnInterfaceContext,
+      applyCompaction: applySuccessfulCompaction,
     };
-    const eventHandler = (event: AgentEvent) =>
+    const eventHandler = (event: AgentEvent): Promise<void> =>
       dispatchAgentEvent(state, deps, event);
     emitTerminalExit = async (reason: AgentLoopExitReason): Promise<void> => {
       await eventHandler({ type: "agent_loop_exit", reason });
     };
-    const onCheckpoint = async (
-      checkpoint: CheckpointInfo,
-    ): Promise<CheckpointDecision> => {
-      state.currentTurnToolNames = [];
+    const onCheckpoint = async (): Promise<CheckpointDecision> => {
       if (ctx.canHandoffAtCheckpoint()) {
-        yieldedForHandoff = true;
-        pendingCheckpointYield = "handoff";
-        return "yield";
+        return "handoff";
       }
-      // Mid-loop token budget check: estimate current context size and
-      // yield if we're approaching the preflight budget. This lets the
-      // conversation-agent-loop run compaction before the provider rejects.
-      if (overflowRecovery.enabled) {
-        const midLoopThreshold =
-          resolveCurrentContextBudget().preflightBudget * 0.85;
-        const estimated = await runTokenEstimatePipeline(checkpoint.history);
-        if (estimated > midLoopThreshold) {
-          rlog.warn(
-            { phase: "mid-loop", estimated, threshold: midLoopThreshold },
-            "Token estimate approaching budget — yielding for compaction",
-          );
-          yieldedForBudget = true;
-          pendingCheckpointYield = "budget";
-          return "yield";
-        }
-      }
       return "continue";
     };
@@ -2277,26 +1602,83 @@ export async function runAgentLoopImpl(
     rlog.info({ callSite: turnCallSite }, "Starting agent loop run");
     // Thread the orchestrator's canonical per-turn context into the agent
-    // loop so its internal pipeline invocations (llmCall, emptyResponse,
-    // toolError, toolResultTruncate, toolExecute) see the real
-    // conversation identity / trust / contextWindowManager instead of the
-    // synthesized `"agent-loop"` placeholder. The loop clones this value
+    // loop so its internal pipeline invocations (e.g. compaction) see the
+    // real conversation identity / trust / contextWindowManager instead of
+    // the synthesized `"agent-loop"` placeholder. The loop clones this value
     // and overwrites `turnIndex` with its own tool-use iteration counter.
     const loopTurnCtx = buildPluginTurnContext(ctx, reqId);
-    let updatedHistory = await ctx.agentLoop.run(
-      runMessages,
-      eventHandler,
-      abortController.signal,
-      reqId,
-      onCheckpoint,
-      turnCallSite,
-      loopTurnCtx,
-      turnOverrideProfile,
-      resolveCurrentMaxInputTokens(),
-      resolveCurrentOverrideProfile,
-      resolveCurrentMaxInputTokens,
-    );
+    // Hook for the loop-owned mid-loop compaction. The agent loop owns the
+    // trigger (its budget gate), the `compaction` pipeline call, the result
+    // interpretation (circuit-breaker bookkeeping + the exhaustion decision),
+    // and the inline continue; this callback bridges the injection state the
+    // loop is intentionally blind to. Durable persistence is signalled via
+    // events; re-injection stays orchestrator-supplied for now.
+    const midLoopCompaction: MidLoopCompaction = {
+      postCompactionHook: async ({ history, turnContext }) => {
+        // stripInjectionsForCompaction() unconditionally removed the existing
+        // memory-static block, so re-inject the current content regardless of
+        // whether compaction actually ran. The `<knowledge_base>`, NOW.md, and
+        // v2 static `<info>` blocks self-gate inside their injectors on block
+        // presence.
+        const injection = await postCompactReinject({
+          ...injectionOpts,
+          // Suppress the chronological-transcript snapshot once the reducer
+          // has collapsed `ctx.messages`; the captured snapshot reflects the
+          // full persisted transcript and would overwrite compaction.
+          slackChronologicalMessages: state.reducerCompacted
+            ? null
+            : injectionOpts.slackChronologicalMessages,
+          mode: currentInjectionMode,
+          turnContext,
+          history,
+          logger: rlog,
+        });
+        return injection.messages;
+      },
+    };
+    /**
+     * Shared closure: runs the agent loop with the orchestrator's turn
+     * context and maps the loop's returned checkpoint pause-reason into the
+     * orchestrator's yield bookkeeping. Returns the updated history so call
+     * sites consume it exactly as before. Pass `compaction` only for the
+     * primary run, where the loop compacts in place when its budget gate
+     * trips; reruns omit it and keep yielding for budget.
+     */
+    const runAgentLoop = async (
+      msgs: Message[],
+      compaction?: MidLoopCompaction,
+    ): Promise<Message[]> => {
+      const { history, exitReason, appendedNewMessages, newMessages } =
+        await ctx.agentLoop.run(msgs, eventHandler, {
+          signal: abortController.signal,
+          requestId: reqId,
+          onCheckpoint,
+          callSite: turnCallSite,
+          turnContext: loopTurnCtx,
+          overrideProfile: turnOverrideProfile,
+          resolveOverrideProfile: resolveCurrentOverrideProfile,
+          resolveContextWindow,
+          compaction,
+          // memory-v3-live: the latest user message carries the volatile v3
+          // `<memory>` block, so anchor the provider's long-TTL cache breakpoint
+          // on the most recent stable message instead.
+          mutableLatestUserMessage: memoryV3Live,
+        });
+      lastRunAppendedNewMessages = appendedNewMessages;
+      lastRunNewMessages = newMessages;
+      if (exitReason === "handoff") {
+        yieldedForHandoff = true;
+        pendingCheckpointYield = "handoff";
+      } else if (exitReason === "budget") {
+        yieldedForBudget = true;
+        pendingCheckpointYield = "budget";
+      }
+      return history;
+    };
+    let updatedHistory = await runAgentLoop(runMessages, midLoopCompaction);
     rlog.info(
       { resultMessageCount: updatedHistory.length },
@@ -2308,211 +1690,43 @@ export async function runAgentLoopImpl(
       pendingCheckpointYield = null;
     }
-    // ── Proactive mid-loop compaction ───────────────────────────────
-    // When the agent loop yielded because the token budget check in
-    // onCheckpoint detected approaching limits, run compaction on the
-    // accumulated history and re-enter the agent loop. This is distinct
-    // from the reactive convergence loop below that fires after a
-    // provider rejection — here we compact *before* hitting the limit.
-    let midLoopCompactAttempts = 0;
-    while (
-      yieldedForBudget &&
-      midLoopCompactAttempts <
-        resolveCurrentContextBudget().overflowRecovery.maxAttempts &&
-      !state.contextTooLargeDetected &&
-      !abortController.signal.aborted
-    ) {
-      midLoopCompactAttempts++;
-      yieldedForBudget = false;
-      pendingCheckpointYield = null;
-      rlog.info(
-        { phase: "mid-loop-compact" },
-        "Running compaction after checkpoint yield",
-      );
-      // Strip injected context from updated history before compacting,
-      // so we compact the "raw" persistent messages.
-      const rawHistory = stripInjectionsForCompaction(updatedHistory);
-      ctx.messages = rawHistory;
-      markHistoryStrippedBestEffort(ctx.conversationId, Date.now(), rlog);
-      ctx.emitActivityState(
-        "thinking",
-        "context_compacting",
-        "assistant_turn",
-        reqId,
-        "Compacting context",
-      );
-      let midLoopCompact: Awaited<
-        ReturnType<typeof ctx.contextWindowManager.maybeCompact>
-      >;
-      try {
-        midLoopCompact = (await runPipeline<CompactionArgs, CompactionResult>(
-          "compaction",
-          getMiddlewaresFor("compaction"),
-          (args) =>
-            defaultCompactionTerminal(args, buildPluginTurnContext(ctx, reqId)),
-          {
-            messages: ctx.messages,
-            signal: abortController.signal,
-            options: {
-              lastCompactedAt: ctx.contextCompactedAt ?? undefined,
-              force: true,
-              targetInputTokensOverride:
-                resolveCurrentContextBudget().preflightBudget,
-              conversationOriginChannel:
-                getConversationOriginChannel(ctx.conversationId) ?? undefined,
-              overrideProfile: resolveCurrentOverrideProfile() ?? null,
-            },
-          },
-          buildPluginTurnContext(ctx, reqId),
-          DEFAULT_TIMEOUTS.compaction,
-        )) as Awaited<ReturnType<typeof ctx.contextWindowManager.maybeCompact>>;
-      } catch (err) {
-        if (err instanceof PluginTimeoutError) {
-          // Mid-loop compaction timed out. Record the failure for the
-          // circuit breaker and escalate to the convergence loop's more
-          // aggressive reducer tiers (tool-result truncation, media
-          // stubbing, injection downgrade) by flipping the overflow flag
-          // and breaking out of the mid-loop retry. The existing
-          // "exhausted all attempts" block further down handles the
-          // escalation.
-          rlog.warn(
-            { err, phase: "mid-loop-compact" },
-            "Compaction pipeline timed out — escalating to convergence loop",
-          );
-          await trackCompactionOutcome(ctx, true, onEvent);
-          state.contextTooLargeDetected = true;
-          break;
-        }
-        throw err;
-      }
-      // `force: true` bypasses the cooldown/threshold gates but early returns
-      // for "no eligible messages" / "insufficient messages" still leave
-      // `summaryFailed` undefined. Only track when the summary LLM actually ran.
-      if (midLoopCompact.summaryFailed !== undefined) {
-        await trackCompactionOutcome(
-          ctx,
-          midLoopCompact.summaryFailed,
-          onEvent,
-        );
-      }
-      if (midLoopCompact.compacted) {
-        await applySuccessfulCompaction(midLoopCompact, rawHistory);
-        reducerCompacted = true;
-        shouldInjectWorkspace = true;
-      }
-      // Re-inject runtime context and re-enter the agent loop.
-      // stripInjectionsForCompaction() unconditionally removed the existing
-      // NOW.md block from ctx.messages above, so we must always re-inject
-      // the current content regardless of whether compaction actually ran.
-      const injection = await applyRuntimeInjections(ctx.messages, {
-        ...injectionOpts,
-        pkbContext: currentPkbContent,
-        memoryV2Static: currentMemoryV2Static,
-        nowScratchpad: currentNowContent,
-        workspaceTopLevelContext: shouldInjectWorkspace
-          ? ctx.workspaceTopLevelContext
-          : null,
-        // Suppress the chronological-transcript snapshot once the reducer
-        // has collapsed `ctx.messages`; the captured snapshot reflects the
-        // full persisted transcript and would overwrite compaction.
-        slackChronologicalMessages: reducerCompacted
-          ? null
-          : injectionOpts.slackChronologicalMessages,
-        mode: currentInjectionMode,
-        turnContext: buildPluginTurnContext(ctx, reqId),
-      });
-      runMessages = injection.messages;
-      if (isTrustedActor && currentInjectionMode !== "minimal") {
-        ctx.graphMemory.retrackCachedNodes();
-      }
-      const midLoopCompactStrip = stripHistoricalWebSearchResults(runMessages);
-      if (midLoopCompactStrip.stats.blocksStripped > 0) {
-        rlog.info(
-          { phase: "mid-loop-compact", ...midLoopCompactStrip.stats },
-          "Converted historical web_search_tool_result blocks to text summaries",
-        );
-        runMessages = midLoopCompactStrip.messages;
-      }
-      preRepairMessages = runMessages;
-      preRunHistoryLength = runMessages.length;
-      updatedHistory = await ctx.agentLoop.run(
-        runMessages,
-        eventHandler,
-        abortController.signal,
-        reqId,
-        onCheckpoint,
-        turnCallSite,
-        loopTurnCtx,
-        turnOverrideProfile,
-        resolveCurrentMaxInputTokens(),
-        resolveCurrentOverrideProfile,
-        resolveCurrentMaxInputTokens,
-      );
-    }
-    // If mid-loop compaction exhausted all attempts but the agent loop
-    // still yielded (yieldedForBudget is true), the turn is incomplete.
-    // Escalate to the convergence loop's more aggressive reducer tiers
-    // (tool-result truncation, media stubbing, injection downgrade)
-    // instead of silently treating an incomplete turn as done.
+    // The loop compacts in place when its budget gate trips and only yields
+    // `exitReason = "budget"` when that inline compaction timed out or
+    // exhausted its retry budget (the `postCompactionHook` has already restored
+    // runtime context for the productive case). Escalate to the convergence
+    // loop's more aggressive reducer tiers so a half-finished turn doesn't
+    // reach the user.
     if (yieldedForBudget && !abortController.signal.aborted) {
       rlog.warn(
-        {
-          phase: "mid-loop-compact",
-          midLoopCompactAttempts,
-          maxAttempts:
-            resolveCurrentContextBudget().overflowRecovery.maxAttempts,
-        },
-        "Mid-loop compaction exhausted all attempts — escalating to convergence loop",
+        { phase: "mid-loop-compact" },
+        "Inline compaction could not get under budget — escalating to convergence loop",
       );
       state.contextTooLargeDetected = true;
     }
     // One-shot ordering error retry
-    if (
-      state.orderingErrorDetected &&
-      updatedHistory.length === preRunHistoryLength
-    ) {
+    if (state.orderingErrorDetected && !lastRunAppendedNewMessages) {
       rlog.warn(
         { phase: "retry" },
         "Provider ordering error detected, attempting one-shot deep-repair retry",
       );
-      // Design note: deep-repair intentionally bypasses the `historyRepair`
-      // plugin pipeline. Deep-repair is a recovery-only path triggered by a
-      // provider ordering error — it must be deterministic and unaffected by
-      // user middleware that might have caused (or be unable to recover from)
-      // the original drift. Plugins can already observe / override the
-      // pre-run repair via the `historyRepair` pipeline above; widening that
-      // surface to deep-repair is intentionally deferred until there's a
-      // concrete plugin-level use case. Do not route this call through
-      // `runPipeline` without first revisiting that contract.
-      const retryRepair = deepRepairHistory(runMessages);
+      // Design note: deep-repair intentionally stays a direct call rather
+      // than running through the `user-prompt-submit` hook chain. Deep-repair
+      // is a recovery-only path triggered by a provider ordering error — it
+      // must be deterministic and unaffected by user hooks that might have
+      // caused (or be unable to recover from) the original drift. Plugins can
+      // already observe / transform the pre-run repair via the
+      // `user-prompt-submit` hook (the default history-repair plugin runs
+      // `repairHistory` there); widening that surface to deep-repair is
+      // intentionally deferred until there's a concrete plugin-level use case.
+      const retryRepair = deepRepairHistory(updatedHistory);
       runMessages = retryRepair.messages;
       const retryStrip = stripHistoricalWebSearchResults(runMessages);
       runMessages = retryStrip.messages;
-      preRepairMessages = runMessages;
-      preRunHistoryLength = runMessages.length;
       state.orderingErrorDetected = false;
       state.deferredOrderingError = null;
-      updatedHistory = await ctx.agentLoop.run(
-        runMessages,
-        eventHandler,
-        abortController.signal,
-        reqId,
-        onCheckpoint,
-        turnCallSite,
-        loopTurnCtx,
-        turnOverrideProfile,
-        resolveCurrentMaxInputTokens(),
-        resolveCurrentOverrideProfile,
-        resolveCurrentMaxInputTokens,
-      );
+      updatedHistory = await runAgentLoop(runMessages);
       if (state.orderingErrorDetected) {
         rlog.error(
@@ -2561,29 +1775,31 @@ export async function runAgentLoopImpl(
             }
             // Can't resize — replace with a text annotation so the model
             // can explain the situation rather than silently dropping context
-            return [
-              {
-                type: "text" as const,
-                text: "(An image was attached but could not be sent — its dimensions exceed the provider limit and automatic resize was not available. Please resize the image and try again.)",
-              },
-            ];
+            return [{ type: "text" as const, text: UNSENDABLE_IMAGE_NOTE }];
           }),
         };
       });
+      // The transform above only mutates ctx.messages for the current retry.
+      // Persist the downgrade for images that can never be sent so the rejected
+      // upload doesn't rehydrate from the DB and resurface on later turns. This
+      // is cleanup for future turns, so a persistence failure must never abort
+      // the retry that is about to run — log it and continue.
+      try {
+        const rewritten = persistUnsendableImageDowngrades(ctx.conversationId);
+        if (rewritten > 0) {
+          rlog.info(
+            { phase: "image-recovery", rewritten },
+            "Persisted unsendable-image downgrades so they cannot resurface",
+          );
+        }
+      } catch (err) {
+        rlog.warn(
+          { phase: "image-recovery", err },
+          "Failed to persist unsendable-image downgrade; continuing with in-memory recovery",
+        );
+      }
       runMessages = ctx.messages;
-      updatedHistory = await ctx.agentLoop.run(
-        runMessages,
-        eventHandler,
-        abortController.signal,
-        reqId,
-        onCheckpoint,
-        turnCallSite,
-        loopTurnCtx,
-        turnOverrideProfile,
-        resolveCurrentMaxInputTokens(),
-        resolveCurrentOverrideProfile,
-        resolveCurrentMaxInputTokens,
-      );
+      updatedHistory = await runAgentLoop(runMessages);
       if (state.imageTooLargeDetected) {
         rlog.error(
           { phase: "image-recovery" },
@@ -2610,19 +1826,9 @@ export async function runAgentLoopImpl(
     // limit), incorporate those new messages into ctx.messages so the
     // convergence loop operates on the full (larger) history.
     if (state.contextTooLargeDetected) {
-      // Detect whether ctx.messages currently lacks NOW.md so we know if
-      // it needs to be re-injected.  Mid-loop compaction (line ~1067) may
-      // have already stripped injections before escalating here, so we
-      // check actual message state rather than tracking mutation sites.
-      let convergenceStripped =
-        findLastInjectedNowContent(ctx.messages) === null;
-      if (updatedHistory.length > preRunHistoryLength) {
+      if (lastRunAppendedNewMessages) {
         ctx.messages = stripInjectionsForCompaction(updatedHistory);
-        markHistoryStrippedBestEffort(ctx.conversationId, Date.now(), rlog);
-        convergenceStripped = true;
-        preRepairMessages = updatedHistory;
-        preRunHistoryLength = updatedHistory.length;
+        markHistoryStrippedBestEffort(ctx.conversationId);
       }
       if (!reducerState) {
         reducerState = createInitialReducerState();
@@ -2703,15 +1909,13 @@ export async function runAgentLoopImpl(
               "Emergency mid-turn compaction succeeded — bypassing reducer tiers",
             );
             if (emergencyResult.summaryFailed !== undefined) {
-              await trackCompactionOutcome(
-                ctx,
+              await ctx.agentLoop.compactionCircuit.recordOutcome(
                 emergencyResult.summaryFailed,
                 onEvent,
               );
             }
             if (emergencyResult.compacted) {
               await applySuccessfulCompaction(emergencyResult, ctx.messages);
-              shouldInjectWorkspace = true;
             }
             // Clear the overflow flag and re-run the agent loop with
             // the compacted context.
@@ -2744,12 +1948,9 @@ export async function runAgentLoopImpl(
           "Context too large — applying next reducer tier",
         );
-        ctx.emitActivityState(
-          "thinking",
-          "context_compacting",
-          "assistant_turn",
-          reqId,
-        );
+        ctx.emitActivityState("thinking", "context_compacting", {
+          requestId: reqId,
+        });
         const convergenceCompactionBasis = ctx.messages;
         const step = await reduceContextOverflow(
           convergenceCompactionBasis,
@@ -2765,6 +1966,7 @@ export async function runAgentLoopImpl(
             ctx.contextWindowManager.maybeCompact(msgs, signal!, {
               ...(opts ?? {}),
               overrideProfile: resolveCurrentOverrideProfile() ?? null,
+              actorTrustClass: resolveTurnActorTrustClass(ctx),
             }),
           abortController.signal,
         );
@@ -2781,8 +1983,7 @@ export async function runAgentLoopImpl(
           step.compactionResult &&
           step.compactionResult.summaryFailed !== undefined
         ) {
-          await trackCompactionOutcome(
-            ctx,
+          await ctx.agentLoop.compactionCircuit.recordOutcome(
             step.compactionResult.summaryFailed,
             onEvent,
           );
@@ -2793,22 +1994,17 @@ export async function runAgentLoopImpl(
             step.compactionResult,
             convergenceCompactionBasis,
           );
-          shouldInjectWorkspace = true;
-          reducerCompacted = true;
+          state.reducerCompacted = true;
         }
-        // Only re-inject NOW.md when ctx.messages was actually stripped;
-        // otherwise the existing NOW.md block is still present and
-        // re-injecting would duplicate it.
+        // Only re-inject the memory-static block when ctx.messages was
+        // actually stripped; otherwise the existing block is still present and
+        // re-injecting would duplicate it. (The `<knowledge_base>` and NOW.md
+        // blocks self-gate inside their injectors on whether they are already
+        // present in `ctx.messages`.)
         const injection = await applyRuntimeInjections(ctx.messages, {
           ...injectionOpts,
-          pkbContext: currentPkbContent,
-          memoryV2Static: convergenceStripped ? currentMemoryV2Static : null,
-          nowScratchpad: convergenceStripped ? currentNowContent : null,
-          workspaceTopLevelContext: shouldInjectWorkspace
-            ? ctx.workspaceTopLevelContext
-            : null,
-          slackChronologicalMessages: reducerCompacted
+          slackChronologicalMessages: state.reducerCompacted
             ? null
             : injectionOpts.slackChronologicalMessages,
           mode: currentInjectionMode,
@@ -2826,24 +2022,10 @@ export async function runAgentLoopImpl(
           );
           runMessages = convergenceStrip.messages;
         }
-        preRepairMessages = runMessages;
-        preRunHistoryLength = runMessages.length;
         state.contextTooLargeDetected = false;
         yieldedForBudget = false;
-        updatedHistory = await ctx.agentLoop.run(
-          runMessages,
-          eventHandler,
-          abortController.signal,
-          reqId,
-          onCheckpoint,
-          turnCallSite,
-          loopTurnCtx,
-          turnOverrideProfile,
-          resolveCurrentMaxInputTokens(),
-          resolveCurrentOverrideProfile,
-          resolveCurrentMaxInputTokens,
-        );
+        updatedHistory = await runAgentLoop(runMessages);
         // If the rerun still yields at checkpoint, the turn is still
         // incomplete — continue reducing through the remaining tiers
@@ -2862,12 +2044,9 @@ export async function runAgentLoopImpl(
           // Fold rerun progress into ctx.messages so the next reducer
           // tier operates on up-to-date history instead of stale
           // pre-rerun messages.
-          if (updatedHistory.length > preRunHistoryLength) {
+          if (lastRunAppendedNewMessages) {
             ctx.messages = stripInjectionsForCompaction(updatedHistory);
-            markHistoryStrippedBestEffort(ctx.conversationId, Date.now(), rlog);
-            convergenceStripped = true;
-            preRepairMessages = updatedHistory;
-            preRunHistoryLength = updatedHistory.length;
+            markHistoryStrippedBestEffort(ctx.conversationId);
           }
         }
       }
@@ -2884,88 +2063,38 @@ export async function runAgentLoopImpl(
         if (action === "auto_compress_latest_turn") {
           // Auto-compress without asking — users opt out via the "drop" policy.
-          ctx.emitActivityState(
-            "thinking",
-            "context_compacting",
-            "assistant_turn",
-            reqId,
-          );
-          let emergencyCompact: Awaited<
-            ReturnType<typeof ctx.contextWindowManager.maybeCompact>
-          > | null = null;
-          try {
-            emergencyCompact = (await runPipeline<
-              CompactionArgs,
-              CompactionResult
-            >(
-              "compaction",
-              getMiddlewaresFor("compaction"),
-              (args) =>
-                defaultCompactionTerminal(
-                  args,
-                  buildPluginTurnContext(ctx, reqId),
-                ),
-              {
-                messages: ctx.messages,
-                signal: abortController.signal,
-                options: {
-                  lastCompactedAt: ctx.contextCompactedAt ?? undefined,
-                  force: true,
-                  minKeepRecentUserTurns: 0,
-                  targetInputTokensOverride: correctedTarget,
-                  overrideProfile: resolveCurrentOverrideProfile() ?? null,
-                },
-              },
-              buildPluginTurnContext(ctx, reqId),
-              DEFAULT_TIMEOUTS.compaction,
-            )) as Awaited<
-              ReturnType<typeof ctx.contextWindowManager.maybeCompact>
-            >;
-          } catch (err) {
-            if (err instanceof PluginTimeoutError) {
-              // Emergency compaction timed out. Record the circuit-breaker
-              // failure and fall through to the graceful-error path below
-              // (the unsuccessful-compaction fallback) rather than hard-
-              // failing the turn.
-              rlog.warn(
-                { err, phase: "emergency-compaction" },
-                "Emergency compaction pipeline timed out — continuing with overflow fallback",
-              );
-              await trackCompactionOutcome(ctx, true, onEvent);
-              emergencyCompact = null;
-            } else {
-              throw err;
-            }
-          }
+          ctx.emitActivityState("thinking", "context_compacting", {
+            requestId: reqId,
+          });
+          const emergencyCompact = await defaultCompact({
+            manager: ctx.contextWindowManager,
+            messages: ctx.messages,
+            signal: abortController.signal,
+            force: true,
+            minKeepRecentUserTurns: 0,
+            overrideProfile: resolveCurrentOverrideProfile() ?? null,
+          });
           // Only track when the summary LLM actually ran; `force: true`
-          // bypasses the cooldown but not the early-return paths.
-          if (
-            emergencyCompact &&
-            emergencyCompact.summaryFailed !== undefined
-          ) {
-            await trackCompactionOutcome(
-              ctx,
+          // bypasses the auto-threshold gate but not the early-return paths.
+          if (emergencyCompact.summaryFailed !== undefined) {
+            await ctx.agentLoop.compactionCircuit.recordOutcome(
               emergencyCompact.summaryFailed,
               onEvent,
             );
           }
-          if (emergencyCompact?.compacted) {
+          if (emergencyCompact.compacted) {
             await applySuccessfulCompaction(emergencyCompact, ctx.messages);
-            reducerCompacted = true;
-            shouldInjectWorkspace = true;
+            state.reducerCompacted = true;
           }
-          // Only re-inject NOW.md when ctx.messages was actually stripped;
-          // otherwise the existing block is still present.
+          // Only re-inject the memory-static block when ctx.messages was
+          // actually stripped; otherwise the existing block is still present.
+          // (The `<knowledge_base>`, NOW.md, and v2 static `<info>` blocks
+          // self-gate inside their injectors on whether they are already
+          // present in `ctx.messages`.)
           const injection = await applyRuntimeInjections(ctx.messages, {
             ...injectionOpts,
-            pkbContext: currentPkbContent,
-            memoryV2Static: convergenceStripped ? currentMemoryV2Static : null,
-            nowScratchpad: convergenceStripped ? currentNowContent : null,
-            workspaceTopLevelContext: shouldInjectWorkspace
-              ? ctx.workspaceTopLevelContext
-              : null,
-            slackChronologicalMessages: reducerCompacted
+            slackChronologicalMessages: state.reducerCompacted
               ? null
               : injectionOpts.slackChronologicalMessages,
             mode: currentInjectionMode,
@@ -2983,23 +2112,9 @@ export async function runAgentLoopImpl(
             );
             runMessages = fallbackStrip.messages;
           }
-          preRepairMessages = runMessages;
-          preRunHistoryLength = runMessages.length;
           state.contextTooLargeDetected = false;
-          updatedHistory = await ctx.agentLoop.run(
-            runMessages,
-            eventHandler,
-            abortController.signal,
-            reqId,
-            onCheckpoint,
-            turnCallSite,
-            loopTurnCtx,
-            turnOverrideProfile,
-            resolveCurrentMaxInputTokens(),
-            resolveCurrentOverrideProfile,
-            resolveCurrentMaxInputTokens,
-          );
+          updatedHistory = await runAgentLoop(runMessages);
         }
         // action === "fail_gracefully" falls through to the final error below
       }
@@ -3050,44 +2165,11 @@ export async function runAgentLoopImpl(
       onEvent(buildConversationErrorMessage(ctx.conversationId, classified));
     }
-    // Reconcile synthesized cancellation tool_results
-    for (let i = preRunHistoryLength; i < updatedHistory.length; i++) {
-      const msg = updatedHistory[i];
-      if (msg.role === "user") {
-        for (const block of msg.content) {
-          if (
-            block.type === "tool_result" &&
-            !state.pendingToolResults.has(block.tool_use_id) &&
-            !state.persistedToolUseIds.has(block.tool_use_id)
-          ) {
-            state.pendingToolResults.set(block.tool_use_id, {
-              content: block.content,
-              isError: block.is_error ?? false,
-            });
-          }
-        }
-      }
-    }
-    // Flush remaining tool results
+    // Flush remaining tool results. On a normal turn these drain at the next
+    // `message_complete`; an aborted or yielded loop exits with them still
+    // buffered, so finalize the (possibly already on-arrival-reserved) grouped
+    // row here rather than writing a duplicate.
     if (state.pendingToolResults.size > 0) {
-      const toolResultBlocks = Array.from(
-        state.pendingToolResults.entries(),
-      ).map(([toolUseId, result]) => ({
-        type: "tool_result",
-        tool_use_id: toolUseId,
-        content: redactSecrets(result.content),
-        is_error: result.isError,
-        ...(result.contentBlocks
-          ? {
-              contentBlocks: result.contentBlocks.map((block) =>
-                block.type === "text"
-                  ? { ...block, text: redactSecrets(block.text) }
-                  : block,
-              ),
-            }
-          : {}),
-      }));
       const toolResultMetadata = {
         ...provenanceFromTrustContext(ctx.trustContext),
         userMessageChannel: capturedTurnChannelContext.userMessageChannel,
@@ -3097,21 +2179,12 @@ export async function runAgentLoopImpl(
         assistantMessageInterface:
           capturedTurnInterfaceContext.assistantMessageInterface,
       };
-      await runPipeline<PersistArgs, PersistResult>(
-        "persistence",
-        getMiddlewaresFor("persistence"),
-        defaultPersistenceTerminal,
-        {
-          op: "add",
-          conversationId: ctx.conversationId,
-          role: "user",
-          content: JSON.stringify(toolResultBlocks),
-          metadata: toolResultMetadata,
-        },
-        buildPluginTurnContext(ctx, reqId),
-        DEFAULT_TIMEOUTS.persistence,
+      await finalizePendingToolResultRow(
+        state,
+        ctx.conversationId,
+        toolResultMetadata,
+        rlog,
       );
-      state.pendingToolResults.clear();
     }
     // Persist the budget_yield_unrecovered notice now that any pending
@@ -3135,24 +2208,13 @@ export async function runAgentLoopImpl(
       };
       let yieldNoticePersistedId: string | null = null;
       try {
-        const yieldPersistResult = (await runPipeline<
-          PersistArgs,
-          PersistResult
-        >(
-          "persistence",
-          getMiddlewaresFor("persistence"),
-          defaultPersistenceTerminal,
-          {
-            op: "add",
-            conversationId: ctx.conversationId,
-            role: "assistant",
-            content: JSON.stringify(yieldNoticeMessage.content),
-            metadata: yieldNoticeMetadata,
-          },
-          buildPluginTurnContext(ctx, reqId),
-          DEFAULT_TIMEOUTS.persistence,
-        )) as PersistAddResult;
-        yieldNoticePersistedId = yieldPersistResult.message.id;
+        const yieldRow = await addMessage(
+          ctx.conversationId,
+          "assistant",
+          JSON.stringify(yieldNoticeMessage.content),
+          { metadata: yieldNoticeMetadata },
+        );
+        yieldNoticePersistedId = yieldRow.id;
       } catch (err) {
         // Non-fatal — a DB hiccup must not escalate a budget-yield exit into
         // a turn-level throw. The live SSE event was already emitted, so the
@@ -3208,7 +2270,7 @@ export async function runAgentLoopImpl(
     }
     // Reconstruct history
-    const newMessages = updatedHistory.slice(preRunHistoryLength).map((msg) => {
+    const newMessages = lastRunNewMessages.map((msg) => {
       if (msg.role !== "assistant") return msg;
       const { cleanedContent } = cleanAssistantContent(msg.content);
       const cleanedBlocks = cleanedContent as ContentBlock[];
@@ -3239,10 +2301,6 @@ export async function runAgentLoopImpl(
         state.assistantRowAwaitingFinalization &&
         state.lastAssistantMessageId
       ) {
-        // Direct `deleteMessageById` (not via the `persistence` pipeline):
-        // see the same rationale on the matching cleanup in
-        // `handleLlmCallStarted` — an unfinalized reservation has no
-        // observable history for plugins.
         try {
           deleteMessageById(state.lastAssistantMessageId);
         } catch (err) {
@@ -3264,20 +2322,12 @@ export async function runAgentLoopImpl(
       const errorAssistantMessage = createAssistantMessage(
         state.providerErrorUserMessage,
       );
-      const errorPersistResult = (await runPipeline<PersistArgs, PersistResult>(
-        "persistence",
-        getMiddlewaresFor("persistence"),
-        defaultPersistenceTerminal,
-        {
-          op: "add",
-          conversationId: ctx.conversationId,
-          role: "assistant",
-          content: JSON.stringify(errorAssistantMessage.content),
-          metadata: errChannelMeta,
-        },
-        buildPluginTurnContext(ctx, reqId),
-        DEFAULT_TIMEOUTS.persistence,
-      )) as PersistAddResult;
+      const errorRow = await addMessage(
+        ctx.conversationId,
+        "assistant",
+        JSON.stringify(errorAssistantMessage.content),
+        { metadata: errChannelMeta },
+      );
       persistedErrorAssistantMessage = true;
       // Repoint `lastAssistantMessageId` at the synthetic error row so the
       // post-loop sync, attachment resolution, and `message_complete`/
@@ -3286,7 +2336,7 @@ export async function runAgentLoopImpl(
       // above. Mark finalization complete so the next LLM call in this run
       // (or a downstream handler) doesn't try to clean up an id that
       // already corresponds to a finalized row.
-      state.lastAssistantMessageId = errorPersistResult.message.id;
+      state.lastAssistantMessageId = errorRow.id;
       state.assistantRowAwaitingFinalization = false;
       newMessages.push(errorAssistantMessage);
       // Pipe the just-assigned message id into any orphaned LLM request log
@@ -3300,10 +2350,7 @@ export async function runAgentLoopImpl(
       // other conversations cannot collide. Non-fatal — a DB hiccup must
       // not escalate a provider rejection into a turn-level throw.
       try {
-        backfillMessageIdOnLogs(
-          ctx.conversationId,
-          errorPersistResult.message.id,
-        );
+        backfillMessageIdOnLogs(ctx.conversationId, errorRow.id);
       } catch (err) {
         rlog.warn(
           { err },
@@ -3316,7 +2363,16 @@ export async function runAgentLoopImpl(
       // would create a duplicate plain-text bubble below the alert card.
     }
-    let restoredHistory = [...preRepairMessages, ...newMessages];
+    // Base persisted into `ctx.messages` is the loop's own returned history
+    // (minus the tail it appended this run), with the cleaned `newMessages`
+    // re-appended on top. Sourcing the base from the loop keeps it in lockstep
+    // with any in-loop compaction without the orchestrator maintaining a
+    // parallel snapshot across re-entry sites.
+    const loopBase = updatedHistory.slice(
+      0,
+      updatedHistory.length - lastRunNewMessages.length,
+    );
+    let restoredHistory = [...loopBase, ...newMessages];
     // Post-turn tool result truncation: save large results to disk and
     // replace in-context content with a prefix/suffix stub + file pointer.
@@ -3389,7 +2445,10 @@ export async function runAgentLoopImpl(
     // so the client can re-enable the UI without delay.
     if (abortController.signal.aborted) {
       syncLastAssistantMessageToDisk();
-      ctx.emitActivityState("idle", "generation_cancelled", "global", reqId);
+      ctx.emitActivityState("idle", "generation_cancelled", {
+        anchor: "global",
+        requestId: reqId,
+      });
       ctx.traceEmitter.emit(
         "generation_cancelled",
         "Generation cancelled by user",
@@ -3433,7 +2492,10 @@ export async function runAgentLoopImpl(
           await emitTerminalExit?.("aborted_after_checkpoint");
           pendingCheckpointYield = null;
         }
-        ctx.emitActivityState("idle", "generation_cancelled", "global", reqId);
+        ctx.emitActivityState("idle", "generation_cancelled", {
+          anchor: "global",
+          requestId: reqId,
+        });
         ctx.traceEmitter.emit(
           "generation_cancelled",
           "Generation cancelled by user",
@@ -3474,7 +2536,10 @@ export async function runAgentLoopImpl(
         });
         publishLoopMessagesChanged();
       } else {
-        ctx.emitActivityState("idle", "message_complete", "global", reqId);
+        ctx.emitActivityState("idle", "message_complete", {
+          anchor: "global",
+          requestId: reqId,
+        });
         ctx.traceEmitter.emit(
           "message_complete",
           "Message processing complete",
@@ -3497,68 +2562,8 @@ export async function runAgentLoopImpl(
             : {}),
         });
         publishLoopMessagesChanged();
-        // Proactive artifact: fire once when the processed turn was the 4th user message.
-        // Only trigger for real user-authored turns (not subagent/system messages).
-        {
-          const paConv = getConversation(ctx.conversationId);
-          if (
-            paConv &&
-            paConv.conversationType === "standard" &&
-            options?.isUserMessage
-          ) {
-            void (async () => {
-              try {
-                if (hasProactiveArtifactCompleted()) return;
-                const userMsg = getMessageById(
-                  userMessageId,
-                  ctx.conversationId,
-                );
-                if (!userMsg) return;
-                if (!tryClaimProactiveArtifactTrigger(userMsg.createdAt))
-                  return;
-                await runProactiveArtifactJob({
-                  conversationId: ctx.conversationId,
-                  userMessageCutoff: userMsg.createdAt,
-                  assistantMessageId: state.lastAssistantMessageId,
-                  suppressAppBuild: state.appBuildToolUsedThisRun,
-                  broadcastMessage,
-                });
-              } catch (err) {
-                log.warn(
-                  { err, conversationId: ctx.conversationId },
-                  "Proactive artifact trigger failed",
-                );
-              }
-            })();
-          }
-        }
       }
     }
-    // Second title pass: after 3 completed turns, re-generate the title
-    // using the last 3 messages for better context. Only fires when the
-    // current title was auto-generated (isAutoTitle = 1) and the user
-    // has not opted out via `conversations.skipAutoRetitling`.
-    if (ctx.turnCount === 2 && !getConfig().conversations.skipAutoRetitling) {
-      // turnCount is 0-indexed, incremented in finally; 2 = about to become 3rd turn
-      queueRegenerateConversationTitle({
-        conversationId: ctx.conversationId,
-        provider: ctx.provider,
-        onTitleUpdated: (title) => {
-          onEvent({
-            type: "conversation_title_updated",
-            conversationId: ctx.conversationId,
-            title,
-          });
-          onEvent({
-            type: "sync_changed",
-            tags: [conversationMetadataSyncTag(ctx.conversationId)],
-          });
-        },
-        signal: abortController.signal,
-      });
-    }
   } catch (err) {
     const errorCtx = {
       phase: "agent_loop" as const,
@@ -3569,7 +2574,10 @@ export async function runAgentLoopImpl(
         await emitTerminalExit?.("aborted_after_checkpoint");
         pendingCheckpointYield = null;
       }
-      ctx.emitActivityState("idle", "generation_cancelled", "global", reqId);
+      ctx.emitActivityState("idle", "generation_cancelled", {
+        anchor: "global",
+        requestId: reqId,
+      });
       rlog.info("Generation cancelled by user");
       ctx.traceEmitter.emit(
         "generation_cancelled",
@@ -3585,7 +2593,10 @@ export async function runAgentLoopImpl(
       });
       publishLoopMessagesChanged();
     } else {
-      ctx.emitActivityState("idle", "error_terminal", "global", reqId);
+      ctx.emitActivityState("idle", "error_terminal", {
+        anchor: "global",
+        requestId: reqId,
+      });
       const message = err instanceof Error ? err.message : String(err);
       const errorClass = err instanceof Error ? err.constructor.name : "Error";
       rlog.error({ err }, "Conversation processing error");
@@ -3612,8 +2623,6 @@ export async function runAgentLoopImpl(
     }
   } finally {
     if (turnStarted) {
-      cleanupBootstrapAfterTurnThreshold(ctx.conversationId);
       ctx.turnCount++;
       const config = getConfig();
       const maxWait = config.workspaceGit?.turnCommitMaxWaitMs ?? 4000;
@@ -3651,7 +2660,7 @@ export async function runAgentLoopImpl(
     ctx.profiler.emitSummary(ctx.traceEmitter, reqId);
     ctx.abortController = null;
-    ctx.processing = false;
+    ctx.setProcessing(false);
     ctx.onConfirmationOutcome = undefined;
     ctx.surfaceActionRequestIds.delete(ctx.currentRequestId ?? "");
     ctx.approvedViaPromptThisTurn = false;
@@ -3798,7 +2807,7 @@ export async function applyCompactionResult(
     result.summaryText,
     ctx.contextCompactedMessageCount,
   );
-  markHistoryStrippedBestEffort(ctx.conversationId, compactedAt, log);
+  markHistoryStrippedBestEffort(ctx.conversationId);
   if (options.slackContextCompactionWatermarkTs) {
     updateConversationSlackContextWatermark(
       ctx.conversationId,