npm - @vellumai/assistant - Versions diffs - 0.8.7 → 0.8.8 - Mend

@vellumai/assistant 0.8.7 → 0.8.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (387)

package/Dockerfile +20 -4
package/docker-entrypoint.sh +4 -2
package/docker-init-apt-root.sh +3 -1
package/docker-kata-apt-env.sh +3 -1
package/docker-kata-runtime-family.sh +12 -0
package/docs/architecture/memory.md +1 -1
package/docs/plugins.md +75 -79
package/examples/plugins/echo/README.md +6 -12
package/examples/plugins/echo/register.ts +0 -41
package/node_modules/@vellumai/skill-host-contracts/src/server-message.ts +3 -3
package/openapi.yaml +3381 -348
package/package.json +1 -1
package/scripts/generate-openapi.ts +68 -41
package/src/__tests__/agent-loop-exit-reason.test.ts +34 -39
package/src/__tests__/agent-loop-provider-error-recording.test.ts +1 -1
package/src/__tests__/agent-loop.test.ts +37 -87
package/src/__tests__/agent-wake-disk-pressure-callsite.test.ts +2 -0
package/src/__tests__/annotate-activity-metadata.test.ts +262 -0
package/src/__tests__/annotate-risk-options.test.ts +2 -3
package/src/__tests__/anthropic-provider.test.ts +95 -2
package/src/__tests__/assistant-event-hub.test.ts +25 -0
package/src/__tests__/assistant-events-sse-shed.test.ts +8 -0
package/src/__tests__/{conversation-stream-state.test.ts → assistant-stream-state.test.ts} +252 -91
package/src/__tests__/auth-fallback-events-store.test.ts +116 -0
package/src/__tests__/background-workers-disk-pressure.test.ts +6 -0
package/src/__tests__/btw-routes.test.ts +62 -3
package/src/__tests__/build-persisted-content.test.ts +184 -0
package/src/__tests__/catalog-files.test.ts +1 -1
package/src/__tests__/clawhub-files.test.ts +1 -1
package/src/__tests__/compaction-pipeline.test.ts +1 -1
package/src/__tests__/compaction.benchmark.test.ts +0 -30
package/src/__tests__/config-watcher.test.ts +1 -1
package/src/__tests__/conversation-abort-tool-results.test.ts +57 -19
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +6 -2
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +10 -4
package/src/__tests__/conversation-agent-loop-overflow.test.ts +313 -1136
package/src/__tests__/conversation-agent-loop.test.ts +596 -1616
package/src/__tests__/conversation-analysis-routes.test.ts +6 -0
package/src/__tests__/conversation-history-web-search.test.ts +11 -1
package/src/__tests__/conversation-pairing.test.ts +4 -31
package/src/__tests__/conversation-process-app-control-preactivation.test.ts +6 -0
package/src/__tests__/conversation-provider-retry-repair.test.ts +26 -5
package/src/__tests__/conversation-queue.test.ts +2 -0
package/src/__tests__/conversation-routes-disk-view.test.ts +3 -0
package/src/__tests__/conversation-routes-slash-commands.test.ts +6 -5
package/src/__tests__/conversation-runtime-assembly.test.ts +170 -229
package/src/__tests__/conversation-runtime-workspace.test.ts +3 -24
package/src/__tests__/conversation-slash-commands.test.ts +8 -42
package/src/__tests__/conversation-slash-queue.test.ts +6 -1
package/src/__tests__/conversation-surfaces-action-delivery.test.ts +84 -0
package/src/__tests__/conversation-sync-tags.test.ts +27 -15
package/src/__tests__/conversation-title-service.test.ts +135 -2
package/src/__tests__/conversation-workspace-injection.test.ts +6 -1
package/src/__tests__/cross-provider-web-search.test.ts +214 -1
package/src/__tests__/db-schedule-syntax-migration.test.ts +5 -0
package/src/__tests__/dm-persistence.test.ts +5 -1
package/src/__tests__/empty-response-hook.test.ts +304 -0
package/src/__tests__/feature-flag-test-helpers.ts +2 -2
package/src/__tests__/gemini-image-service.test.ts +13 -0
package/src/__tests__/helpers/mock-provider.ts +110 -0
package/src/__tests__/helpers/native-web-search-harness.ts +129 -0
package/src/__tests__/history-repair-hook.test.ts +1 -0
package/src/__tests__/identity-intro-cache.test.ts +12 -100
package/src/__tests__/identity-routes.test.ts +248 -7
package/src/__tests__/inbound-slack-persistence.test.ts +5 -1
package/src/__tests__/injector-background-turn.test.ts +2 -8
package/src/__tests__/injector-chain.test.ts +106 -270
package/src/__tests__/injector-disk-pressure.test.ts +3 -12
package/src/__tests__/injector-document-comments.test.ts +2 -2
package/src/__tests__/injector-pkb-v2-silenced.test.ts +30 -22
package/src/__tests__/injector-v3-suppression.test.ts +31 -37
package/src/__tests__/internal-telemetry-routes.test.ts +109 -0
package/src/__tests__/list-messages-page-latest.test.ts +60 -0
package/src/__tests__/list-messages-tool-merge.test.ts +20 -0
package/src/__tests__/llm-usage-store.test.ts +223 -1
package/src/__tests__/memory-retrieval-hook.test.ts +297 -0
package/src/__tests__/memory-v2-static-injector.test.ts +103 -35
package/src/__tests__/native-web-search.test.ts +191 -0
package/src/__tests__/onboarding-template-contract.test.ts +2 -0
package/src/__tests__/openai-image-service.test.ts +17 -0
package/src/__tests__/openai-provider.test.ts +31 -1
package/src/__tests__/persist-unsendable-image.test.ts +215 -0
package/src/__tests__/persistence-secret-redaction.test.ts +1 -0
package/src/__tests__/pipeline-runner.test.ts +29 -39
package/src/__tests__/pkb-autoinject.test.ts +2 -5
package/src/__tests__/plugin-bootstrap.test.ts +13 -28
package/src/__tests__/plugin-registry.test.ts +0 -27
package/src/__tests__/plugin-types.test.ts +2 -125
package/src/__tests__/process-message-display-content.test.ts +6 -2
package/src/__tests__/regenerate-fire-and-forget-trace.test.ts +5 -1
package/src/__tests__/resolve-trust-class.test.ts +4 -4
package/src/__tests__/runtime-events-sse-reconnect.test.ts +60 -23
package/src/__tests__/schedule-routes.test.ts +603 -2
package/src/__tests__/schedule-store.test.ts +41 -0
package/src/__tests__/schedule-tools.test.ts +35 -0
package/src/__tests__/server-history-render.test.ts +314 -1
package/src/__tests__/skillssh-files.test.ts +1 -1
package/src/__tests__/system-prompt.test.ts +20 -0
package/src/__tests__/task-scheduler.test.ts +162 -1
package/src/__tests__/terminal-tools.test.ts +6 -1
package/src/__tests__/title-generate-hook.test.ts +319 -0
package/src/__tests__/tool-error-hook.test.ts +278 -0
package/src/__tests__/tool-preview-lifecycle.test.ts +468 -5
package/src/__tests__/tool-result-metadata-plumbing.test.ts +1 -0
package/src/__tests__/tool-result-truncate-hook.test.ts +127 -0
package/src/__tests__/tool-result-truncation.test.ts +0 -2
package/src/__tests__/ui-choice-copy-surfaces.test.ts +254 -0
package/src/__tests__/ui-work-result-surface.test.ts +159 -0
package/src/__tests__/usage-routes.test.ts +285 -1
package/src/__tests__/user-plugin-loader.test.ts +2 -2
package/src/__tests__/voice-session-bridge.test.ts +6 -3
package/src/__tests__/web-search-backend-failure.test.ts +166 -0
package/src/agent/loop.ts +346 -442
package/src/api/events/assistant-thinking-delta.ts +33 -0
package/src/api/events/tool-output-chunk.ts +45 -0
package/src/api/events/tool-use-preview-start.ts +32 -0
package/src/api/events/trace-event.ts +69 -0
package/src/api/index.ts +48 -13
package/src/api/responses/conversation-message.ts +368 -0
package/src/avatar/__tests__/avatar-store.test.ts +34 -29
package/src/cli/commands/__tests__/notifications.test.ts +58 -14
package/src/cli/commands/notifications.ts +112 -60
package/src/config/assistant-feature-flags.ts +22 -11
package/src/config/bundled-skills/app-builder/SKILL.md +3 -20
package/src/config/bundled-skills/app-builder/references/examples/README.md +17 -0
package/src/config/bundled-skills/app-builder/references/examples/expense-tracker.md +515 -0
package/src/config/bundled-skills/app-builder/references/examples/focus-timer.md +342 -0
package/src/config/bundled-skills/app-builder/references/examples/habit-tracker.md +490 -0
package/src/config/bundled-skills/document-editor/SKILL.md +1 -1
package/src/config/bundled-skills/messaging/SKILL.md +0 -7
package/src/config/feature-flag-cache.ts +3 -3
package/src/config/feature-flag-registry.json +35 -3
package/src/config/schemas/__tests__/memory-v2.test.ts +1 -0
package/src/config/schemas/__tests__/memory-v3.test.ts +25 -0
package/src/config/schemas/llm.ts +1 -0
package/src/config/schemas/memory-v2.ts +8 -0
package/src/config/schemas/memory-v3.ts +8 -0
package/src/config/schemas/platform.ts +8 -0
package/src/config/seed-inference-profiles.ts +2 -2
package/src/config/skills.ts +13 -0
package/src/context/compactor.ts +1 -1
package/src/context/strip-injections.ts +122 -0
package/src/context/token-estimator.ts +23 -0
package/src/context/tool-result-truncation.ts +0 -23
package/src/context/window-manager.ts +3 -6
package/src/credential-execution/executable-discovery.ts +16 -0
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +6 -0
package/src/daemon/__tests__/inference-profile-notification.test.ts +153 -0
package/src/daemon/__tests__/native-web-search-metadata.test.ts +10 -8
package/src/daemon/assistant-attachments.ts +1 -1
package/src/daemon/config-watcher.ts +2 -2
package/src/daemon/context-overflow-reducer.ts +0 -1
package/src/daemon/conversation-agent-loop-handlers.ts +605 -153
package/src/daemon/conversation-agent-loop.ts +281 -760
package/src/daemon/conversation-history.ts +5 -4
package/src/daemon/conversation-lifecycle.ts +3 -4
package/src/daemon/conversation-messaging.ts +7 -6
package/src/daemon/conversation-process.ts +11 -16
package/src/daemon/conversation-runtime-assembly.ts +130 -347
package/src/daemon/conversation-slash.ts +6 -25
package/src/daemon/conversation-surfaces.ts +222 -4
package/src/daemon/conversation-tool-setup.ts +2 -29
package/src/daemon/conversation.ts +32 -14
package/src/daemon/external-plugins-bootstrap.ts +9 -10
package/src/daemon/handlers/config-a2a.ts +51 -36
package/src/daemon/handlers/config-slack-channel.ts +20 -14
package/src/daemon/handlers/config-telegram.ts +16 -2
package/src/daemon/handlers/shared.ts +156 -84
package/src/daemon/handlers/skills.ts +39 -10
package/src/daemon/lifecycle.ts +4 -0
package/src/daemon/message-types/apps.ts +1 -29
package/src/daemon/message-types/messages.ts +9 -57
package/src/daemon/message-types/skills.ts +2 -0
package/src/daemon/message-types/surfaces.ts +136 -3
package/src/daemon/now-scratchpad.ts +21 -0
package/src/daemon/orphan-reaper.test.ts +210 -0
package/src/daemon/orphan-reaper.ts +240 -0
package/src/daemon/persist-unsendable-image.ts +117 -0
package/src/daemon/process-message.ts +1 -3
package/src/daemon/trace-emitter.ts +6 -4
package/src/daemon/trust-context.ts +19 -0
package/src/daemon/wake-target-adapter.ts +3 -1
package/src/home/home-greeting-cache.ts +24 -1
package/src/ipc/gateway-client.test.ts +2 -2
package/src/ipc/gateway-client.ts +3 -3
package/src/media/gemini-image-service.ts +15 -0
package/src/media/openai-image-service.ts +14 -0
package/src/media/types.ts +34 -0
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +56 -0
package/src/memory/auth-fallback-events-store.ts +94 -0
package/src/memory/conversation-title-service.ts +65 -41
package/src/memory/db-init.ts +4 -0
package/src/memory/graph/__tests__/conversation-graph-memory-registry.test.ts +119 -0
package/src/memory/graph/conversation-graph-memory.ts +65 -0
package/src/memory/jobs-store.ts +33 -0
package/src/memory/jobs-worker.ts +31 -4
package/src/memory/llm-usage-store.ts +224 -50
package/src/memory/migrations/222-strip-placeholder-sentinels-from-messages.ts +6 -5
package/src/memory/migrations/270-schedule-source-conversation.ts +13 -0
package/src/memory/migrations/271-create-auth-fallback-events.ts +21 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/pkb/autoinject.ts +61 -0
package/src/memory/pkb/context.ts +50 -0
package/src/memory/pkb/types.ts +14 -0
package/src/memory/schedule-attribution-sql.ts +104 -0
package/src/memory/schema/infrastructure.ts +16 -0
package/src/memory/usage-grouped-buckets.ts +6 -1
package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -1
package/src/memory/v2/consolidation-job.ts +1 -1
package/src/memory/v3/__tests__/health.test.ts +16 -0
package/src/memory/v3/__tests__/orchestrate.test.ts +45 -9
package/src/memory/v3/__tests__/provider-blocks.test.ts +13 -0
package/src/memory/v3/__tests__/router.test.ts +101 -29
package/src/memory/v3/__tests__/selector.test.ts +93 -27
package/src/memory/v3/__tests__/shadow-plugin.test.ts +23 -5
package/src/memory/v3/health.ts +0 -0
package/src/memory/v3/llm-retry.ts +32 -0
package/src/memory/v3/orchestrate.ts +26 -14
package/src/memory/v3/provider-blocks.ts +15 -5
package/src/memory/v3/router.ts +48 -42
package/src/memory/v3/selector.ts +57 -42
package/src/memory/v3/shadow-plugin.ts +47 -15
package/src/memory/v3/types.ts +8 -0
package/src/notifications/conversation-pairing.ts +8 -15
package/src/notifications/decision-engine.ts +6 -3
package/src/notifications/home-feed-side-effect.ts +12 -1
package/src/permissions/prompter.ts +4 -0
package/src/plugin-api/constants.ts +4 -0
package/src/plugin-api/index.ts +8 -1
package/src/plugin-api/types.ts +151 -1
package/src/plugins/defaults/empty-response/hooks/stop.ts +126 -0
package/src/plugins/defaults/empty-response/register.ts +8 -13
package/src/plugins/defaults/index.ts +1 -15
package/src/plugins/defaults/injectors/register.ts +243 -74
package/src/plugins/defaults/memory-retrieval/hooks/post-compact.ts +91 -0
package/src/plugins/defaults/memory-retrieval/hooks/user-prompt-submit-temp.ts +216 -0
package/src/plugins/defaults/memory-retrieval/injector-chain.ts +35 -0
package/src/plugins/defaults/title-generate/hooks/stop.ts +75 -0
package/src/plugins/defaults/title-generate/hooks/user-prompt-submit.ts +35 -0
package/src/plugins/defaults/title-generate/package.json +1 -1
package/src/plugins/defaults/title-generate/register.ts +18 -18
package/src/plugins/defaults/tool-error/hooks/post-tool-use.ts +118 -0
package/src/plugins/defaults/tool-error/package.json +1 -1
package/src/plugins/defaults/tool-error/register.ts +9 -21
package/src/plugins/defaults/tool-result-truncate/hooks/post-tool-use.ts +32 -0
package/src/plugins/defaults/tool-result-truncate/register.ts +10 -21
package/src/plugins/defaults/tool-result-truncate/terminal.ts +37 -18
package/src/plugins/pipeline.ts +6 -18
package/src/plugins/registry.ts +8 -25
package/src/plugins/types.ts +43 -474
package/src/proactive-artifact/aux-message-injector.ts +3 -3
package/src/proactive-artifact/job.test.ts +7 -12
package/src/prompts/__tests__/system-prompt.test.ts +36 -0
package/src/prompts/templates/BOOTSTRAP-ACTIVATION-RAIL.md +62 -0
package/src/prompts/templates/BOOTSTRAP.md +2 -2
package/src/prompts/templates/system-sections.ts +15 -0
package/src/providers/anthropic/client.ts +37 -29
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +112 -0
package/src/providers/openai/chat-completions-provider.ts +44 -0
package/src/providers/openrouter/client.ts +1 -0
package/src/providers/placeholder-sentinels.ts +35 -0
package/src/runtime/__tests__/agent-wake.test.ts +5 -1
package/src/runtime/agent-wake.ts +2 -2
package/src/runtime/assistant-event-hub.ts +36 -6
package/src/runtime/{conversation-stream-state.ts → assistant-stream-state.ts} +132 -58
package/src/runtime/http-router.ts +16 -21
package/src/runtime/http-types.ts +16 -70
package/src/runtime/pending-interactions.ts +1 -0
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +265 -2
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +31 -1
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +6 -2
package/src/runtime/routes/__tests__/tts-routes.test.ts +6 -2
package/src/runtime/routes/app-management-routes.ts +6 -117
package/src/runtime/routes/app-routes.ts +13 -15
package/src/runtime/routes/attachment-routes.ts +26 -15
package/src/runtime/routes/avatar-routes.ts +26 -0
package/src/runtime/routes/btw-routes.ts +29 -23
package/src/runtime/routes/consolidation-routes.ts +120 -20
package/src/runtime/routes/conversation-query-routes.ts +2 -0
package/src/runtime/routes/conversation-routes.ts +358 -184
package/src/runtime/routes/documents-routes.ts +4 -0
package/src/runtime/routes/domain-routes.ts +51 -37
package/src/runtime/routes/epoch-millis-range.ts +34 -0
package/src/runtime/routes/events-routes.ts +28 -34
package/src/runtime/routes/gateway-log-routes.ts +26 -4
package/src/runtime/routes/heartbeat-routes.ts +32 -12
package/src/runtime/routes/identity-intro-cache.ts +11 -34
package/src/runtime/routes/identity-routes.ts +208 -17
package/src/runtime/routes/image-generation-routes.ts +40 -2
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/integrations/a2a.ts +12 -10
package/src/runtime/routes/integrations/slack/__tests__/channel.test.ts +16 -0
package/src/runtime/routes/integrations/slack/channel.ts +4 -0
package/src/runtime/routes/integrations/slack/share.ts +27 -6
package/src/runtime/routes/integrations/telegram.ts +6 -0
package/src/runtime/routes/integrations/twilio.ts +42 -0
package/src/runtime/routes/internal-telemetry-routes.ts +88 -0
package/src/runtime/routes/log-export-routes.ts +8 -0
package/src/runtime/routes/memory-v2-routes.ts +15 -8
package/src/runtime/routes/memory-v3-routes.ts +50 -28
package/src/runtime/routes/oauth-apps.ts +66 -12
package/src/runtime/routes/oauth-providers.ts +44 -5
package/src/runtime/routes/platform-routes.ts +81 -5
package/src/runtime/routes/playground/__tests__/force-compact.test.ts +6 -4
package/src/runtime/routes/playground/force-compact.ts +1 -1
package/src/runtime/routes/rename-conversation-routes.ts +5 -0
package/src/runtime/routes/schedule-routes.ts +152 -42
package/src/runtime/routes/secret-routes.ts +14 -2
package/src/runtime/routes/skills-routes.ts +43 -14
package/src/runtime/routes/tool-call-confirmation-enrichment.test.ts +161 -0
package/src/runtime/routes/tool-call-confirmation-enrichment.ts +107 -0
package/src/runtime/routes/trust-rules-routes.ts +26 -2
package/src/runtime/routes/tts-routes.ts +35 -0
package/src/runtime/routes/types.ts +66 -8
package/src/runtime/routes/usage-routes.ts +47 -39
package/src/runtime/routes/webhook-routes.ts +41 -2
package/src/runtime/routes/workspace-routes.ts +4 -0
package/src/runtime/services/__tests__/analyze-conversation.test.ts +6 -0
package/src/runtime/services/analyze-conversation.ts +2 -2
package/src/schedule/schedule-store.ts +20 -1
package/src/schedule/schedule-usage-store.ts +83 -0
package/src/schedule/scheduler.ts +12 -5
package/src/skills/catalog-files.ts +2 -2
package/src/skills/catalog-install.ts +3 -0
package/src/skills/categories-cache.ts +118 -0
package/src/skills/clawhub-files.ts +1 -2
package/src/skills/skillssh-files.ts +1 -2
package/src/telemetry/types.ts +29 -1
package/src/telemetry/usage-telemetry-reporter.test.ts +112 -3
package/src/telemetry/usage-telemetry-reporter.ts +57 -2
package/src/tools/executor.ts +1 -53
package/src/tools/network/__tests__/web-search-metadata.test.ts +7 -1
package/src/tools/network/__tests__/web-search.test.ts +11 -3
package/src/tools/network/web-search-error.test.ts +248 -0
package/src/tools/network/web-search-error.ts +267 -0
package/src/tools/network/web-search.ts +207 -48
package/src/tools/schedule/create.ts +2 -0
package/src/tools/terminal/safe-env.ts +10 -1
package/src/tools/ui-surface/definitions.ts +9 -1
package/src/tts/__tests__/provider-catalog-consistency.test.ts +85 -1
package/src/tts/provider-catalog.ts +76 -1
package/src/util/mutex.ts +47 -0
package/src/workspace/git-service.ts +1 -42
package/src/workspace/migrations/095-bump-heartbeat-interval-30m-to-60m.ts +51 -0
package/src/workspace/migrations/096-reduce-quality-profile-effort.ts +72 -0
package/src/workspace/migrations/097-enable-adaptive-thinking-managed-profiles.ts +93 -0
package/src/workspace/migrations/registry.ts +6 -0
package/src/__tests__/bootstrap-turn-cleanup.test.ts +0 -44
package/src/__tests__/empty-response-pipeline.test.ts +0 -423
package/src/__tests__/llm-call-pipeline.test.ts +0 -287
package/src/__tests__/memory-retrieval-pipeline.test.ts +0 -418
package/src/__tests__/persistence-pipeline.test.ts +0 -503
package/src/__tests__/title-generate-pipeline.test.ts +0 -211
package/src/__tests__/token-estimate-pipeline.test.ts +0 -479
package/src/__tests__/tool-error-pipeline.test.ts +0 -241
package/src/__tests__/tool-execute-pipeline.test.ts +0 -417
package/src/__tests__/tool-result-truncate-pipeline.test.ts +0 -341
package/src/daemon/bootstrap-turn-cleanup.ts +0 -45
package/src/gallery/default-gallery.ts +0 -1359
package/src/gallery/gallery-manifest.ts +0 -28
package/src/home/feature-gate.ts +0 -22
package/src/plugins/defaults/empty-response/middlewares/emptyResponse.ts +0 -22
package/src/plugins/defaults/empty-response/terminal.ts +0 -106
package/src/plugins/defaults/injectors/package.json +0 -15
package/src/plugins/defaults/llm-call/middlewares/llmCall.ts +0 -17
package/src/plugins/defaults/llm-call/package.json +0 -15
package/src/plugins/defaults/llm-call/register.ts +0 -45
package/src/plugins/defaults/memory-retrieval/middlewares/memoryRetrieval.ts +0 -17
package/src/plugins/defaults/memory-retrieval/package.json +0 -15
package/src/plugins/defaults/memory-retrieval/register.ts +0 -181
package/src/plugins/defaults/persistence/middlewares/persistence.ts +0 -19
package/src/plugins/defaults/persistence/package.json +0 -15
package/src/plugins/defaults/persistence/register.ts +0 -38
package/src/plugins/defaults/persistence/terminal.ts +0 -83
package/src/plugins/defaults/title-generate/terminal.ts +0 -31
package/src/plugins/defaults/token-estimate/middlewares/tokenEstimate.ts +0 -23
package/src/plugins/defaults/token-estimate/package.json +0 -15
package/src/plugins/defaults/token-estimate/register.ts +0 -34
package/src/plugins/defaults/token-estimate/terminal.ts +0 -40
package/src/plugins/defaults/tool-error/middlewares/toolError.ts +0 -21
package/src/plugins/defaults/tool-error/terminal.ts +0 -47
package/src/plugins/defaults/tool-execute/middlewares/toolExecute.ts +0 -23
package/src/plugins/defaults/tool-execute/package.json +0 -15
package/src/plugins/defaults/tool-execute/register.ts +0 -49
package/src/plugins/defaults/tool-result-truncate/middlewares/toolResultTruncate.ts +0 -23
package/src/plugins/defaults/tool-result-truncate/types.ts +0 -22
package/src/skills/category-inference.ts +0 -111

package/src/proactive-artifact/job.test.ts CHANGED Viewed

@@ -190,7 +190,7 @@ mock.module("../runtime/sync/resource-sync-events.js", () => ({
 // findConversation mock
 type MockConversation = {
-  processing: boolean;
+  isProcessing(): boolean;
   messages: unknown[];
   getMessages: () => unknown[];
 };
@@ -426,7 +426,7 @@ describe("runProactiveArtifactJob", () => {
       // Set up an idle conversation so injection works fully
       const convMessages: unknown[] = [];
       mockConversations.set("conv-1", {
-        processing: false,
+        isProcessing: () => false,
         messages: convMessages,
         getMessages: () => convMessages,
       });
@@ -510,7 +510,7 @@ describe("runProactiveArtifactJob", () => {
         "MESSAGE: I created a monthly budget guide tailored to your needs.";
       mockConversations.set("conv-1", {
-        processing: false,
+        isProcessing: () => false,
         messages: [],
         getMessages: () => [],
       });
@@ -646,7 +646,7 @@ describe("runProactiveArtifactJob", () => {
       ];
       mockConversations.set("conv-1", {
-        processing: false,
+        isProcessing: () => false,
         messages: [],
         getMessages: () => [],
       });
@@ -710,7 +710,7 @@ describe("injectAuxAssistantMessage", () => {
   test("idle conversation: persists with skipIndexing, pushes to getMessages(), broadcasts delta + complete(aux) + list sync", async () => {
     const messages: unknown[] = [];
     mockConversations.set("conv-inject-1", {
-      processing: false,
+      isProcessing: () => false,
       messages,
       getMessages: () => messages,
     });
@@ -767,12 +767,7 @@ describe("injectAuxAssistantMessage", () => {
     const messages: unknown[] = [];
     let processingFlag = true;
     const conv: MockConversation = {
-      get processing() {
-        return processingFlag;
-      },
-      set processing(v: boolean) {
-        processingFlag = v;
-      },
+      isProcessing: () => processingFlag,
       messages,
       getMessages: () => messages,
     };
@@ -801,7 +796,7 @@ describe("injectAuxAssistantMessage", () => {
     const messages: unknown[] = [];
     // Conversation stays processing permanently — never becomes idle
     const conv: MockConversation = {
-      processing: true,
+      isProcessing: () => true,
       messages,
       getMessages: () => messages,
     };

package/src/prompts/__tests__/system-prompt.test.ts CHANGED Viewed

@@ -114,3 +114,39 @@ describe("maybeReseedBootstrap — content-automation template", () => {
     expect(content).toContain("VOICE.md");
   });
 });
+describe("maybeReseedBootstrap — activation rail template", () => {
+  const templatesDir = join(import.meta.dirname!, "..", "templates");
+  beforeEach(() => {
+    mkdirSync(TEST_DIR, { recursive: true });
+    copyFileSync(
+      join(templatesDir, "BOOTSTRAP.md"),
+      join(TEST_DIR, "BOOTSTRAP.md"),
+    );
+  });
+  test("replaces generic bootstrap with the activation rail template", () => {
+    maybeReseedBootstrap("BOOTSTRAP-ACTIVATION-RAIL.md");
+    const content = readFileSync(join(TEST_DIR, "BOOTSTRAP.md"), "utf-8");
+    expect(content).toContain("BOOTSTRAP — Activation Rail");
+    expect(content).toContain("People don't read");
+    expect(content).toContain("Speed wins");
+    // Propose: anti-speculation boundary on what "unstated" means.
+    expect(content).toContain("status word");
+    expect(content).toContain("don't say it");
+    // Propose: infer-first framing — recommendation bound to the click.
+    expect(content).toContain("You didn't say this");
+    expect(content).toContain("the recommendation IS the click");
+    // Propose: a surviving extract-and-offer mechanic.
+    expect(content).toContain("clickable component, strongest first");
+    // Propose: the extract-shape vs infer-shape example block.
+    expect(content).toContain("extract-shape");
+    expect(content).toContain("infer-shape");
+  });
+});

package/src/prompts/templates/BOOTSTRAP-ACTIVATION-RAIL.md ADDED Viewed

@@ -0,0 +1,62 @@
+_Replaces BOOTSTRAP.md for users in cohort experiment-activation-flow-2026-06-03._ _Same delete-on-wrap lifecycle as BOOTSTRAP.md._
+# BOOTSTRAP — Activation Rail
+The user just finished pre-chat. You know their name and vibe; maybe their Google. Your job in this conversation is to get them to a real first-run. Something they actually use, not a demo.
+## The shape
+Four moves. Goals, not steps.
+**Port.** Pull their existing assistant context with two pastes — about a minute, no upload, no export. You write a prompt, they paste it into Claude or ChatGPT, they paste the response back. Cheap signal, real signal.
+The prompt should be one-click copyable. Inline paragraph text the user has to select isn't. Neither is a custom-built widget with a fake copy button. If the affordance needs you to build an app or a new surface to render, you've over-built the move. Use what chat already gives you.
+**Propose.** Don't organize what they already told you — infer what they didn't. Name the unstated thing sitting in their context and say *why* you think it: point at the specific surface that made you say it. "You didn't say this, but —". Then recommend, and lean one way; the recommendation IS the click, not a neutral menu of equally-weighted options.
+"Unstated" is inference, not invention. Read only three surfaces, each a positive signal you can point at in the paste: dates / recency / time gaps; entities that recur (people, projects, accounts named more than once); and status words ("stuck", "behind", "waiting on", "still"). If you can't point to the surface that made you say it, don't say it — no free-speculating about goals, feelings, or facts that aren't traceable to the paste, and no "you didn't mention X" absence-inference.
+Surface the outcome as a clickable component, strongest first. The component is the question — don't follow it with a prose "or something else?" Pick from skills you already have loaded first; fall back to `vellum-skills-catalog` `skill_search` for what's missing. Compose the offer in their language, not in skill names.
+- ✗ extract-shape: "I see three meetings in your paste — want help with one?"
+- ✓ infer-shape (dates/recency): "Two of these are with the same client and the last was 3 weeks ago — looks stalled; I'd send a re-engage note." (The recommendation lands as the clickable surface — no trailing "want me to?")
+- ✗ extract-shape: "You mentioned a launch and a hiring plan — which one?"
+- ✓ infer-shape (repeated entity + status word): "Acme comes up four times and you said you're 'waiting on' them — that's the thing actually blocking the launch; I'd chase it first."
+**Run.** Do it. Real tools, real data. The user watches something happen.
+**Follow-through.** Offer the next concrete thing. One primary recommendation.
+If the user opens with a task instead of a conversation, do the task. You're already at Follow-through. Backfill the Port move at the first natural lull, or skip it.
+Pick. Be wrong recoverably. Move. The user can tell when you're hedging.
+## People don't read
+Brevity is the product. Lead with the move, not the rationale for the move. If the rationale takes more than one short sentence, cut it. Meta-narration about what you're trying to do ("I want to make this useful...") is rationale. Cut it harder.
+One CTA per turn. If your CTA is a clickable surface, don't follow it with a prose "or..." / "unless..." / "is there something else?" — the surface IS the menu. Open-ended questions after a structured offer are the most common version of a stacked CTA.
+No hedging the offer. Not "worth doing if you have history to bring." Make the move and let them say no.
+If an action requires the user to type a path or remember a string, the affordance is wrong. Move it inside a surface they can click.
+Every CTA surface must commit on the surface. If the user can select but can't confirm, the surface is broken. "They can just type a reply" doesn't count. Either selecting must commit the choice on click, or there must be a visible submit button below the options. The most common version of this bug: a radio or checkbox list with nothing clickable underneath.
+## Feeling seen
+The summary after the Port move is the first place the user can feel like you actually heard them. The follow-through in the final move is the second. In both, the bar is the same surface-grounded inference Propose already runs: notice what they hedged, point at the mechanism behind what they described, reframe what they're really asking for. Specific observations earn the rest of the conversation. Generic recap loses it.
+## What to defer
+Identity writes (IDENTITY.md, SOUL.md), user-profile writes, journal entries: all wait until the rail produces real signal, which is Moment 1 output at the earliest. None of them delay a user-visible response. None of them happen alongside the opening turn.
+The base BOOTSTRAP task_preferences fallback is not on this rail. Your opener is the Port pitch.
+## Wrap
+When the user is clearly done with this conversation, write one journal entry: what they needed, which outcome they accepted, what follow-through they took. Update NOW.md. Delete this file.
+The rail-completion shape in your journal is the dataset for v2 tuning. Which outcome they took at Propose, whether they bounced to "what else?", which follow-through they picked. Write it so the next iteration has signal to learn from.
+Speed wins until the rail produces real signal. Trust yourself.

package/src/prompts/templates/BOOTSTRAP.md CHANGED Viewed

@@ -26,9 +26,9 @@ Private setup waits until there is enough signal to justify it. Low-signal bante
 ## Opening move
-The first message in your conversation context is a system trigger used to generate the canned greeting. Don't reference it, quote it, or respond to it as if the user said it.
+Some first conversations include an internal opener such as "Wake up, my friend!" only to generate the canned greeting. If you see that system trigger, don't reference it, quote it, or respond to it as if the user said it. If the first visible user turn is an onboarding self-introduction like "Hi <assistant>, I'm <user>. Nice to meet you.", treat it as the real first user turn: answer it briefly without re-introducing yourself, and if there is no task yet include the migration offer from `## Assistant migration`.
-If an `onboarding` JSON context is present, treat it as known — not as a briefing. Don't surface the selections as a list. Don't say "you mentioned" or "I see you use." Just apply the knowledge. Tools and tasks selected are context for how you respond, not content to recap. The canned first greeting already introduced you by name, so don't repeat introductions.
+If an `onboarding` JSON context is present, treat it as known — not as a briefing. Don't surface the selections as a list. Don't say "you mentioned" or "I see you use." Just apply the knowledge. Tools and tasks selected are context for how you respond, not content to recap. If the opener already introduced names, don't repeat introductions.
 If there's no onboarding context, pick a working name for yourself ("I'll go by Pax") and get to work. Their name can come up later, or never.

package/src/prompts/templates/system-sections.ts CHANGED Viewed

@@ -230,6 +230,21 @@ export const BUNDLED_SYSTEM_SECTIONS: readonly BundledSection[] = [
     body: "",
     enabled: "!excludeCustomPrefix",
   },
+  {
+    id: "01-communication",
+    body: `## Communication
+Keep your reasoning, planning, and deliberation in your private thinking — never in user-facing text. A user-facing message is only ever: an optional one-line acknowledgement when starting longer work, the actual answer or question the user needs, and a single concise summary when you're done.
+Keep reasoning and tool calls adjacent (think, call a tool, think, call a tool) with no user-facing prose between them, so one stream of work renders as one block.
+Meet your user where they are. If they are nontechnical, prefer "Gmail needs reconnecting," not "the OAuth token expired". You can use more acronyms and industry-specific jargon if your user is a subject matter expert in the domain you are working together on. This applies for marketers, engineers, consultants, entrepreneurs, etc.
+Err toward brevity; expand only when the user follows up or their style calls for more.
+These are default guidelines. Always prioritize communication preferences that you've established through your relationship with your human.
+`,
+  },
   {
     id: "01-parallel-tool-calls",
     body: `<use_parallel_tool_calls>

package/src/providers/anthropic/client.ts CHANGED Viewed

@@ -5,6 +5,11 @@ import { ProviderError } from "../../util/errors.js";
 import { getLogger } from "../../util/logger.js";
 import { extractRetryAfterMs } from "../../util/retry.js";
 import { stripOrphanedSurrogatesDeep } from "../../util/unicode.js";
+import {
+  isPlaceholderSentinelText,
+  PLACEHOLDER_BLOCKS_OMITTED,
+  PLACEHOLDER_EMPTY_TURN,
+} from "../placeholder-sentinels.js";
 import { createStreamTimeout } from "../stream-timeout.js";
 import type {
   ContentBlock,
@@ -161,33 +166,6 @@ function sanitizeToolId(id: string): string {
 const SYNTHETIC_RESULT =
   "<synthesized_result>tool result missing from history</synthesized_result>";
-// Null-byte prefix makes these placeholders impossible to produce via normal
-// model output or user input, preventing false positives in isPlaceholder().
-export const PLACEHOLDER_EMPTY_TURN =
-  "\x00__PLACEHOLDER__[empty assistant turn]";
-export const PLACEHOLDER_BLOCKS_OMITTED =
-  "\x00__PLACEHOLDER__[internal blocks omitted]";
-// Compared against the payload with any leading `\x00` stripped, so the check
-// matches both the prefixed sentinel we emit and any bare variant that lost
-// the null byte in transit (e.g. the model echoing the text back without
-// reproducing the control character).
-const PLACEHOLDER_SENTINEL_BARE: ReadonlySet<string> = new Set([
-  PLACEHOLDER_EMPTY_TURN.slice(1),
-  PLACEHOLDER_BLOCKS_OMITTED.slice(1),
-]);
-/**
- * True when the text is one of the provider's internal alternation-preserving
- * sentinels, with or without the null-byte prefix. These must never be
- * persisted or rendered to users — they exist only in outbound Anthropic API
- * request bodies.
- */
-export function isPlaceholderSentinelText(text: string): boolean {
-  const normalized = text.startsWith("\x00") ? text.slice(1) : text;
-  return PLACEHOLDER_SENTINEL_BARE.has(normalized);
-}
 /**
  * Synthetic placeholder injected as user-message content when Anthropic API
  * alternation requires a user turn but no real user content exists. Uses the
@@ -1230,6 +1208,23 @@ export class AnthropicProvider implements Provider {
         sentMessages = params.messages;
       }
+      // Haiku does not support the extended-cache-ttl beta, so it must never
+      // receive a `ttl` on any cache_control. The client's own breakpoints
+      // already omit it for Haiku, but callers (e.g. v3's `cachedTextBlock`)
+      // can stamp a `ttl` on message blocks before the provider sees them —
+      // strip it here so the request stays valid on Haiku models.
+      if (isHaiku) {
+        for (const msg of sentMessages) {
+          if (!Array.isArray(msg.content)) continue;
+          for (const block of msg.content) {
+            if (typeof block === "string") continue;
+            const cc = (block as { cache_control?: { ttl?: unknown } })
+              .cache_control;
+            if (cc && "ttl" in cc) delete cc.ttl;
+          }
+        }
+      }
       const { signal: timeoutSignal, cleanup: cleanupTimeout } =
         createStreamTimeout(this.streamTimeoutMs, signal);
       innerTimeoutSignal = timeoutSignal;
@@ -1650,8 +1645,21 @@ export class AnthropicProvider implements Provider {
     block: ContentBlock,
   ): Anthropic.ContentBlockParam | null {
     switch (block.type) {
-      case "text":
-        return { type: "text", text: block.text };
+      case "text": {
+        // Preserve a caller-stamped cache_control breakpoint (e.g. v3's
+        // `cachedTextBlock`, which marks a stable per-leaf / leaf-tree prefix
+        // that should be cached on its own rather than only as part of the
+        // per-turn anchor prefix). The internal ContentBlock type omits the
+        // field, so reach for it via cast. The Haiku ttl-strip downstream still
+        // applies. Only v3 stamps this today, so the per-request breakpoint
+        // budget (≤4) is unaffected for other callers.
+        const cacheControl = (
+          block as { cache_control?: Anthropic.CacheControlEphemeral }
+        ).cache_control;
+        return cacheControl
+          ? { type: "text", text: block.text, cache_control: cacheControl }
+          : { type: "text", text: block.text };
+      }
       case "thinking":
         if (!block.signature) {
           return null;

package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts CHANGED Viewed

@@ -1,6 +1,8 @@
 import { describe, expect, test } from "bun:test";
+import { isPlaceholderSentinelText } from "../../placeholder-sentinels.js";
 import {
+  EMPTY_ASSISTANT_TURN_PLACEHOLDER,
   OpenAIChatCompletionsProvider,
   type OpenAIChatCompletionsProviderOptions,
 } from "../chat-completions-provider.js";
@@ -348,6 +350,116 @@ describe("OpenAIChatCompletionsProvider reasoning parsing", () => {
     expect(assistantMsg.reasoning_content).toBeUndefined();
   });
+  test("backfills placeholder content for a reasoning-only assistant turn when enabled", async () => {
+    const { provider, requests } = stubProvider(
+      [
+        {
+          choices: [{ delta: { content: "ok" }, finish_reason: "stop" }],
+          usage: { prompt_tokens: 2, completion_tokens: 1 },
+        },
+      ],
+      {
+        assistantReasoningField: "reasoning",
+        backfillEmptyAssistantContent: true,
+      },
+    );
+    await provider.sendMessage([
+      { role: "user", content: [{ type: "text", text: "question" }] },
+      {
+        role: "assistant",
+        content: [
+          {
+            type: "thinking",
+            thinking: "truncated chain of thought",
+            signature: "",
+          },
+        ],
+      },
+    ]);
+    const params = requests[0] as {
+      messages: Array<{
+        role: string;
+        content: string | null;
+        reasoning?: string;
+        tool_calls?: unknown;
+      }>;
+    };
+    const assistantMsg = params.messages.find((m) => m.role === "assistant")!;
+    // content or tool_calls must be set; reasoning alone does not satisfy it.
+    expect(assistantMsg.content).toBe(EMPTY_ASSISTANT_TURN_PLACEHOLDER);
+    expect(assistantMsg.tool_calls).toBeUndefined();
+    expect(assistantMsg.reasoning).toBe("truncated chain of thought");
+    // The placeholder is a recognized sentinel, so it is stripped from
+    // persisted/rendered history if a model echoes it back, and it carries no
+    // control characters that a strict OpenAI-compatible backend might reject.
+    expect(isPlaceholderSentinelText(EMPTY_ASSISTANT_TURN_PLACEHOLDER)).toBe(
+      true,
+    );
+    expect(EMPTY_ASSISTANT_TURN_PLACEHOLDER).not.toContain("\x00");
+  });
+  test("leaves reasoning-only assistant content null when backfill is disabled", async () => {
+    const { provider, requests } = stubProvider(
+      [
+        {
+          choices: [{ delta: { content: "ok" }, finish_reason: "stop" }],
+          usage: { prompt_tokens: 2, completion_tokens: 1 },
+        },
+      ],
+      { assistantReasoningField: "reasoning_content" },
+    );
+    await provider.sendMessage([
+      { role: "user", content: [{ type: "text", text: "question" }] },
+      {
+        role: "assistant",
+        content: [
+          {
+            type: "thinking",
+            thinking: "truncated chain of thought",
+            signature: "",
+          },
+        ],
+      },
+    ]);
+    const params = requests[0] as {
+      messages: Array<{ role: string; content: string | null }>;
+    };
+    const assistantMsg = params.messages.find((m) => m.role === "assistant")!;
+    // Backfill is off by default, so providers that tolerate null assistant
+    // content (e.g. OpenAI proper) are unaffected by the OpenRouter-only guard.
+    expect(assistantMsg.content).toBeNull();
+  });
+  test("does not backfill content when tool calls are present", async () => {
+    const { provider, requests } = stubProvider([
+      {
+        choices: [{ delta: { content: "ok" }, finish_reason: "stop" }],
+        usage: { prompt_tokens: 2, completion_tokens: 1 },
+      },
+    ]);
+    await provider.sendMessage([
+      {
+        role: "assistant",
+        content: [
+          { type: "tool_use", id: "call_1", name: "search", input: { q: "x" } },
+        ],
+      },
+    ]);
+    const params = requests[0] as {
+      messages: Array<{ role: string; content: string | null }>;
+    };
+    // Tool-call-only assistant messages keep null content (preferred by
+    // Anthropic-proxy/Bedrock backends); the placeholder is only for the
+    // neither-content-nor-tool_calls case.
+    expect(params.messages[0].content).toBeNull();
+  });
   test("skips Anthropic-originated thinking blocks (with signatures)", async () => {
     const { provider, requests } = stubProvider(
       [

package/src/providers/openai/chat-completions-provider.ts CHANGED Viewed

@@ -4,6 +4,7 @@ import { isAbortReason } from "../../util/abort-reasons.js";
 import { ProviderError } from "../../util/errors.js";
 import { extractRetryAfterMs } from "../../util/retry.js";
 import { escapeXmlAttr } from "../../util/xml.js";
+import { PLACEHOLDER_EMPTY_TURN } from "../placeholder-sentinels.js";
 import { createStreamTimeout } from "../stream-timeout.js";
 import type {
   ContentBlock,
@@ -100,6 +101,26 @@ export function extractApiErrorDetail(
  *  OpenRouter's `error.metadata.raw` strings, which are typically <1KB. */
 const MAX_API_ERROR_DETAIL_CHARS = 2000;
+/**
+ * Fallback `content` for an assistant turn that has neither visible text nor
+ * tool calls (e.g. a reasoning-only turn truncated at the output-token limit).
+ *
+ * The OpenAI chat-completions schema requires an assistant message to carry
+ * `content` or `tool_calls`. OpenAI itself tolerates `content: null`/`""` here,
+ * but strict OpenAI-compatible backends do not: DeepSeek via OpenRouter rejects
+ * the request with `Invalid assistant message: content or tool_calls must be
+ * set`, and vLLM-style validators coerce empty-string content back to null and
+ * reject it the same way. The placeholder must therefore be a non-empty string.
+ *
+ * We reuse the shared empty-turn sentinel so `isPlaceholderSentinelText` /
+ * `cleanAssistantContent` strip it from persisted and rendered history if a
+ * model ever echoes it back. The null-byte prefix is dropped (`slice(1)`)
+ * because some OpenAI-compatible backends reject control characters in message
+ * content; the bare form, `__PLACEHOLDER__[empty assistant turn]`, is still
+ * recognized by `isPlaceholderSentinelText`.
+ */
+export const EMPTY_ASSISTANT_TURN_PLACEHOLDER = PLACEHOLDER_EMPTY_TURN.slice(1);
 /**
  * Read the first matching header from an SDK error's headers object,
  * tolerating both Map-like (`Headers.get()`) and plain-object shapes.
@@ -153,6 +174,13 @@ export interface OpenAIChatCompletionsProviderOptions {
    *  DeepSeek/Fireworks use `"reasoning_content"`; OpenRouter uses `"reasoning"`.
    *  When unset, thinking blocks are dropped from outbound assistant messages. */
   assistantReasoningField?: "reasoning" | "reasoning_content";
+  /** Backfill a non-empty placeholder for assistant turns that would otherwise
+   *  serialize with neither `content` nor `tool_calls` (e.g. reasoning-only
+   *  turns). Off by default; enabled for OpenRouter, whose downstream providers
+   *  (e.g. DeepSeek) reject such messages with `Invalid assistant message:
+   *  content or tool_calls must be set`. See {@link
+   *  EMPTY_ASSISTANT_TURN_PLACEHOLDER}. */
+  backfillEmptyAssistantContent?: boolean;
 }
 /** Wire-level reasoning_effort values. The OpenAI SDK type doesn't include
@@ -228,6 +256,7 @@ export class OpenAIChatCompletionsProvider implements Provider {
     | "reasoning"
     | "reasoning_content"
     | undefined;
+  private backfillEmptyAssistantContent: boolean;
   constructor(
     apiKey: string,
@@ -251,6 +280,8 @@ export class OpenAIChatCompletionsProvider implements Provider {
     this.requestHeaders = options.requestHeaders ?? {};
     this.parseThinkTags = options.parseThinkTags ?? false;
     this.assistantReasoningField = options.assistantReasoningField;
+    this.backfillEmptyAssistantContent =
+      options.backfillEmptyAssistantContent ?? false;
   }
   async sendMessage(
@@ -794,6 +825,19 @@ export class OpenAIChatCompletionsProvider implements Provider {
       result.tool_calls = toolCalls;
     }
+    // An assistant message must carry `content` or `tool_calls`. A turn with
+    // neither (e.g. reasoning-only) would serialize to null/empty content with
+    // no tool calls, which strict OpenAI-compatible backends reject. Reasoning
+    // lives in a separate field and does not satisfy this constraint. Scoped to
+    // providers that need it (OpenRouter) via `backfillEmptyAssistantContent`.
+    if (
+      this.backfillEmptyAssistantContent &&
+      !result.tool_calls &&
+      (result.content === null || result.content === "")
+    ) {
+      result.content = EMPTY_ASSISTANT_TURN_PLACEHOLDER;
+    }
     return result;
   }

package/src/providers/openrouter/client.ts CHANGED Viewed

@@ -122,6 +122,7 @@ export class OpenRouterProvider extends OpenAIChatCompletionsProvider {
       streamTimeoutMs: options.streamTimeoutMs,
       requestHeaders: OPENROUTER_APP_ATTRIBUTION_HEADERS,
       assistantReasoningField: "reasoning",
+      backfillEmptyAssistantContent: true,
     });
     this.openRouterApiKey = apiKey;
     this.defaultModel = model;

package/src/providers/placeholder-sentinels.ts ADDED Viewed

@@ -0,0 +1,35 @@
+// Internal placeholder sentinels injected as assistant-message content when a
+// turn would otherwise serialize with neither text nor tool calls. Provider
+// request bodies must keep a non-empty content slot (Anthropic to preserve
+// role alternation; strict OpenAI-compatible backends to satisfy the
+// "content or tool_calls must be set" constraint), but these markers must
+// never be persisted or rendered to users.
+//
+// The null-byte prefix makes the prefixed form impossible to produce via
+// normal model output or user input, preventing false positives. Some
+// OpenAI-compatible backends reject control characters in message content, so
+// the OpenAI path emits the bare (prefix-stripped) form, which
+// `isPlaceholderSentinelText` still recognizes.
+export const PLACEHOLDER_EMPTY_TURN =
+  "\x00__PLACEHOLDER__[empty assistant turn]";
+export const PLACEHOLDER_BLOCKS_OMITTED =
+  "\x00__PLACEHOLDER__[internal blocks omitted]";
+// Compared against the payload with any leading `\x00` stripped, so the check
+// matches both the prefixed sentinel we emit and any bare variant that lost
+// the null byte in transit (e.g. the model echoing the text back without
+// reproducing the control character).
+const PLACEHOLDER_SENTINEL_BARE: ReadonlySet<string> = new Set([
+  PLACEHOLDER_EMPTY_TURN.slice(1),
+  PLACEHOLDER_BLOCKS_OMITTED.slice(1),
+]);
+/**
+ * True when the text is exactly one of this module's placeholder sentinels,
+ * with or without the null-byte prefix. These must never be persisted or
+ * rendered to users — they exist only in outbound provider request bodies.
+ */
+export function isPlaceholderSentinelText(text: string): boolean {
+  const normalized = text.startsWith("\x00") ? text.slice(1) : text;
+  return PLACEHOLDER_SENTINEL_BARE.has(normalized);
+}

package/src/runtime/__tests__/agent-wake.test.ts CHANGED Viewed

@@ -136,6 +136,10 @@ import {
 const runResult = (history: Message[]): AgentLoopRunResult => ({
   history,
   exitReason: null,
+  appendedNewMessages: true,
+  // The wake path slices its own new-message boundary off the returned
+  // history (it never destructures `newMessages`), so this is type-only.
+  newMessages: [],
 });
 interface MockTarget extends WakeTarget {
@@ -1077,7 +1081,7 @@ describe("wakeAgentForOpportunity", () => {
     expect(target.drainQueueCalls).toBe(1);
     // Critical ordering invariant: drain runs after processing=false.
     // If drain ran while processing was still true,
-    // `enqueueMessage`'s `if (!ctx.processing) return ...` gate would
+    // `enqueueMessage`'s `if (!ctx.isProcessing()) return ...` gate would
     // see processing=true and the drained item would itself just
     // re-enqueue — no progress. Snapshot the live flag *inside* drain
     // (rather than inferring from toggle order) so a future regression

package/src/runtime/agent-wake.ts CHANGED Viewed

@@ -140,7 +140,7 @@ export interface WakeTarget {
    * The wake invokes this in its `finally` block AFTER
    * `markProcessing(false)`. Order matters: if drain ran while
    * processing was still true, `enqueueMessage`'s gate
-   * (`if (!ctx.processing) return ...`) would still see processing=true
+   * (`if (!ctx.isProcessing()) return ...`) would still see processing=true
    * and the drain itself would be a no-op against any racy late sends.
    * Running drain after processing is released matches the canonical
    * user-turn finally path in `conversation-agent-loop.ts`.
@@ -963,7 +963,7 @@ export async function wakeAgentForOpportunity(
       // Run completed cleanly. The canonical user-turn pattern
       // (conversation-agent-loop.ts:1860, 2106-2126) updates
-      // `ctx.messages` first, then resets `ctx.processing = false`, then
+      // `ctx.messages` first, then clears the flag via `ctx.setProcessing(false)`, then
       // calls `ctx.drainQueue(...)`. We mirror that order so a message
       // queued during the wake dequeues against an already-updated
       // history — otherwise `drainSingleMessage` reads `ctx.messages`