npm - @vellumai/assistant - Versions diffs - 0.4.56 → 0.4.57 - Mend

@vellumai/assistant 0.4.56 → 0.4.57

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (450)

package/ARCHITECTURE.md +10 -10
package/Dockerfile +3 -0
package/README.md +11 -11
package/docs/architecture/integrations.md +2 -2
package/docs/architecture/memory.md +3 -4
package/docs/credential-execution-service.md +13 -20
package/node_modules/@vellumai/ces-contracts/src/error.ts +5 -4
package/package.json +1 -1
package/src/__tests__/actor-token-service.test.ts +7 -7
package/src/__tests__/anthropic-provider.test.ts +172 -0
package/src/__tests__/app-builder-tool-scripts.test.ts +15 -1
package/src/__tests__/approval-cascade.test.ts +2 -2
package/src/__tests__/approval-routes-http.test.ts +3 -4
package/src/__tests__/asset-materialize-tool.test.ts +5 -5
package/src/__tests__/asset-search-tool.test.ts +1 -1
package/src/__tests__/assistant-attachments.test.ts +5 -5
package/src/__tests__/assistant-events-sse-hardening.test.ts +1 -1
package/src/__tests__/assistant-feature-flags-integration.test.ts +50 -38
package/src/__tests__/attachments-store.test.ts +2 -2
package/src/__tests__/avatar-e2e.test.ts +5 -3
package/src/__tests__/browser-skill-endstate.test.ts +0 -1
package/src/__tests__/call-routes-http.test.ts +2 -2
package/src/__tests__/callback-handoff-copy.test.ts +1 -1
package/src/__tests__/cancel-resolves-conversation-key.test.ts +158 -0
package/src/__tests__/channel-readiness-routes.test.ts +0 -1
package/src/__tests__/channel-readiness-service.test.ts +0 -1
package/src/__tests__/checker.test.ts +31 -32
package/src/__tests__/chrome-cdp.test.ts +47 -18
package/src/__tests__/claude-code-skill-regression.test.ts +2 -2
package/src/__tests__/config-schema-cmd.test.ts +2 -2
package/src/__tests__/config-schema.test.ts +9 -18
package/src/__tests__/confirmation-request-guardian-bridge.test.ts +1 -1
package/src/__tests__/conversation-abort-tool-results.test.ts +4 -4
package/src/__tests__/conversation-agent-loop-overflow.test.ts +2 -2
package/src/__tests__/conversation-agent-loop.test.ts +11 -4
package/src/__tests__/conversation-attachments.test.ts +1 -1
package/src/__tests__/conversation-confirmation-signals.test.ts +2 -2
package/src/__tests__/conversation-error.test.ts +33 -0
package/src/__tests__/conversation-init.benchmark.test.ts +0 -1
package/src/__tests__/conversation-load-history-repair.test.ts +1 -1
package/src/__tests__/conversation-pairing.test.ts +1 -1
package/src/__tests__/conversation-pre-run-repair.test.ts +4 -4
package/src/__tests__/conversation-provider-retry-repair.test.ts +4 -4
package/src/__tests__/conversation-queue.test.ts +23 -14
package/src/__tests__/conversation-routes-slash-commands.test.ts +3 -3
package/src/__tests__/conversation-runtime-assembly.test.ts +185 -173
package/src/__tests__/conversation-seed-composer.test.ts +1 -1
package/src/__tests__/conversation-slash-queue.test.ts +4 -4
package/src/__tests__/conversation-slash-unknown.test.ts +4 -4
package/src/__tests__/conversation-starter-routes.test.ts +291 -0
package/src/__tests__/conversation-wipe.test.ts +438 -0
package/src/__tests__/conversation-workspace-cache-state.test.ts +2 -3
package/src/__tests__/conversation-workspace-injection.test.ts +4 -5
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +4 -5
package/src/__tests__/credential-security-e2e.test.ts +20 -0
package/src/__tests__/credential-security-invariants.test.ts +1 -0
package/src/__tests__/credential-vault-unit.test.ts +227 -0
package/src/__tests__/credentials-cli.test.ts +3 -0
package/src/__tests__/date-context.test.ts +59 -377
package/src/__tests__/drop-capability-card-state-migration.test.ts +169 -0
package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +11 -45
package/src/__tests__/emit-signal-routing-intent.test.ts +3 -3
package/src/__tests__/encrypted-store.test.ts +237 -15
package/src/__tests__/ephemeral-permissions.test.ts +4 -5
package/src/__tests__/event-bus.test.ts +3 -3
package/src/__tests__/gateway-only-enforcement.test.ts +2 -2
package/src/__tests__/gateway-only-guard.test.ts +1 -0
package/src/__tests__/gemini-image-service.test.ts +4 -4
package/src/__tests__/gemini-provider.test.ts +6 -9
package/src/__tests__/guardian-binding-drift-heal.test.ts +128 -0
package/src/__tests__/guardian-dispatch.test.ts +0 -1
package/src/__tests__/host-shell-tool.test.ts +6 -6
package/src/__tests__/http-user-message-parity.test.ts +2 -2
package/src/__tests__/intent-routing.test.ts +51 -99
package/src/__tests__/invite-routes-http.test.ts +5 -0
package/src/__tests__/list-messages-attachments.test.ts +1 -1
package/src/__tests__/managed-proxy-context.test.ts +2 -5
package/src/__tests__/managed-skill-lifecycle.test.ts +8 -8
package/src/__tests__/media-generate-image.test.ts +32 -15
package/src/__tests__/media-reuse-story.e2e.test.ts +1 -1
package/src/__tests__/memory-context-benchmark.benchmark.test.ts +1 -1
package/src/__tests__/memory-lifecycle-e2e.test.ts +24 -18
package/src/__tests__/memory-recall-quality.test.ts +4 -3
package/src/__tests__/memory-regressions.test.ts +86 -90
package/src/__tests__/migration-cross-version-compatibility.test.ts +32 -32
package/src/__tests__/migration-export-http.test.ts +26 -27
package/src/__tests__/migration-import-commit-http.test.ts +165 -37
package/src/__tests__/migration-import-preflight-http.test.ts +81 -20
package/src/__tests__/migration-validate-http.test.ts +16 -16
package/src/__tests__/model-intents.test.ts +1 -1
package/src/__tests__/no-domain-routing-in-prompt-guard.test.ts +1 -1
package/src/__tests__/notification-broadcaster.test.ts +1 -1
package/src/__tests__/notification-decision-fallback.test.ts +2 -2
package/src/__tests__/notification-decision-identity.test.ts +8 -9
package/src/__tests__/notification-decision-strategy.test.ts +1 -1
package/src/__tests__/notification-deep-link.test.ts +1 -1
package/src/__tests__/notification-guardian-path.test.ts +0 -1
package/src/__tests__/notification-schedule-dedup.test.ts +7 -7
package/src/__tests__/oauth-store.test.ts +1 -3
package/src/__tests__/oauth2-gateway-transport.test.ts +6 -1
package/src/__tests__/onboarding-template-contract.test.ts +23 -59
package/src/__tests__/provider-error-scenarios.test.ts +154 -0
package/src/__tests__/provider-fail-open-selection.test.ts +2 -2
package/src/__tests__/provider-managed-proxy-integration.test.ts +8 -9
package/src/__tests__/provider-registry-ollama.test.ts +5 -2
package/src/__tests__/qdrant-manager.test.ts +7 -7
package/src/__tests__/ratelimit.test.ts +0 -74
package/src/__tests__/recording-handler.test.ts +0 -1
package/src/__tests__/require-fresh-approval.test.ts +1 -1
package/src/__tests__/runtime-attachment-metadata.test.ts +1 -1
package/src/__tests__/runtime-events-sse-parity.test.ts +1 -1
package/src/__tests__/runtime-events-sse.test.ts +1 -1
package/src/__tests__/scheduler-recurrence.test.ts +46 -2
package/src/__tests__/schema-transforms.test.ts +114 -54
package/src/__tests__/secret-onetime-send.test.ts +20 -0
package/src/__tests__/secret-routes-managed-proxy.test.ts +5 -2
package/src/__tests__/secret-scanner-executor.test.ts +1 -2
package/src/__tests__/send-endpoint-busy.test.ts +63 -4
package/src/__tests__/send-notification-tool.test.ts +2 -2
package/src/__tests__/shell-credential-ref.test.ts +0 -1
package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -2
package/src/__tests__/skill-memory.test.ts +547 -0
package/src/__tests__/skill-script-runner-sandbox.test.ts +1 -2
package/src/__tests__/slack-app-setup-skill-regression.test.ts +37 -0
package/src/__tests__/slack-channel-config.test.ts +109 -94
package/src/__tests__/swarm-conversation-integration.test.ts +2 -2
package/src/__tests__/swarm-recursion.test.ts +2 -2
package/src/__tests__/swarm-tool.test.ts +2 -2
package/src/__tests__/system-prompt.test.ts +19 -66
package/src/__tests__/telegram-config.test.ts +121 -0
package/src/__tests__/terminal-tools.test.ts +1 -1
package/src/__tests__/tool-execution-abort-cleanup.test.ts +1 -2
package/src/__tests__/tool-executor-lifecycle-events.test.ts +1 -1
package/src/__tests__/tool-executor-shell-integration.test.ts +1 -1
package/src/__tests__/tool-executor.test.ts +1 -1
package/src/__tests__/trace-emitter.test.ts +8 -1
package/src/__tests__/trust-store.test.ts +7 -8
package/src/__tests__/twilio-routes.test.ts +1 -18
package/src/__tests__/user-reference.test.ts +82 -2
package/src/__tests__/vbundle-pax-and-symlink.test.ts +196 -0
package/src/__tests__/verification-control-plane-policy.test.ts +1 -1
package/src/approvals/guardian-request-resolvers.ts +3 -3
package/src/avatar/ascii-renderer.ts +2 -2
package/src/avatar/png-renderer.ts +2 -2
package/src/avatar/resvg-lazy.ts +21 -0
package/src/calls/guardian-dispatch.ts +1 -1
package/src/calls/relay-access-wait.ts +2 -2
package/src/calls/twilio-rest.ts +0 -248
package/src/cli/AGENTS.md +5 -8
package/src/cli/__tests__/notifications.test.ts +5 -5
package/src/cli/commands/avatar.ts +64 -2
package/src/cli/commands/conversations.ts +131 -1
package/src/cli/commands/credentials.ts +2 -0
package/src/cli/commands/notifications.ts +3 -3
package/src/cli.ts +10 -0
package/src/config/bundled-skills/acp/SKILL.md +5 -5
package/src/config/bundled-skills/acp/TOOLS.json +6 -6
package/src/config/bundled-skills/app-builder/SKILL.md +42 -42
package/src/config/bundled-skills/app-builder/TOOLS.json +10 -10
package/src/config/bundled-skills/browser/SKILL.md +15 -15
package/src/config/bundled-skills/browser/TOOLS.json +14 -14
package/src/config/bundled-skills/chatgpt-import/SKILL.md +2 -2
package/src/config/bundled-skills/chatgpt-import/TOOLS.json +1 -1
package/src/config/bundled-skills/chatgpt-import/tools/chatgpt-import.ts +1 -1
package/src/config/bundled-skills/claude-code/SKILL.md +5 -5
package/src/config/bundled-skills/computer-use/SKILL.md +2 -2
package/src/config/bundled-skills/computer-use/TOOLS.json +15 -15
package/src/config/bundled-skills/contacts/SKILL.md +3 -3
package/src/config/bundled-skills/contacts/TOOLS.json +4 -4
package/src/config/bundled-skills/document/SKILL.md +4 -4
package/src/config/bundled-skills/document/TOOLS.json +2 -2
package/src/config/bundled-skills/followups/TOOLS.json +3 -3
package/src/config/bundled-skills/gmail/SKILL.md +32 -32
package/src/config/bundled-skills/gmail/TOOLS.json +16 -16
package/src/config/bundled-skills/gmail/tools/gmail-archive.ts +1 -1
package/src/config/bundled-skills/gmail/tools/gmail-sender-digest.ts +1 -1
package/src/config/bundled-skills/google-calendar/SKILL.md +1 -1
package/src/config/bundled-skills/google-calendar/TOOLS.json +5 -5
package/src/config/bundled-skills/google-calendar/types.ts +1 -1
package/src/config/bundled-skills/heartbeat/SKILL.md +43 -0
package/src/config/bundled-skills/image-studio/SKILL.md +3 -3
package/src/config/bundled-skills/image-studio/TOOLS.json +2 -3
package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +16 -12
package/src/config/bundled-skills/media-processing/SKILL.md +40 -40
package/src/config/bundled-skills/media-processing/TOOLS.json +8 -8
package/src/config/bundled-skills/media-processing/__tests__/concurrency-pool.test.ts +2 -2
package/src/config/bundled-skills/media-processing/__tests__/preprocess.test.ts +1 -1
package/src/config/bundled-skills/media-processing/services/gemini-map.ts +5 -5
package/src/config/bundled-skills/media-processing/services/gemini-video.ts +2 -2
package/src/config/bundled-skills/media-processing/services/preprocess.ts +2 -2
package/src/config/bundled-skills/media-processing/services/processing-pipeline.ts +2 -2
package/src/config/bundled-skills/media-processing/services/reduce.ts +3 -3
package/src/config/bundled-skills/media-processing/tools/generate-clip.ts +2 -2
package/src/config/bundled-skills/media-processing/tools/query-media-events.ts +1 -1
package/src/config/bundled-skills/messaging/SKILL.md +29 -25
package/src/config/bundled-skills/messaging/TOOLS.json +11 -11
package/src/config/bundled-skills/messaging/tools/messaging-send.ts +1 -1
package/src/config/bundled-skills/messaging/tools/shared.ts +1 -1
package/src/config/bundled-skills/notifications/SKILL.md +3 -3
package/src/config/bundled-skills/notifications/TOOLS.json +2 -2
package/src/config/bundled-skills/notifications/tools/send-notification.ts +3 -3
package/src/config/bundled-skills/orchestration/SKILL.md +1 -1
package/src/config/bundled-skills/orchestration/TOOLS.json +1 -1
package/src/config/bundled-skills/phone-calls/SKILL.md +18 -14
package/src/config/bundled-skills/phone-calls/TOOLS.json +3 -3
package/src/config/bundled-skills/phone-calls/references/CONFIG.md +2 -2
package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +2 -2
package/src/config/bundled-skills/phone-calls/references/TROUBLESHOOTING.md +1 -1
package/src/config/bundled-skills/playbooks/TOOLS.json +4 -4
package/src/config/bundled-skills/schedule/SKILL.md +26 -26
package/src/config/bundled-skills/schedule/TOOLS.json +5 -5
package/src/config/bundled-skills/screen-watch/SKILL.md +3 -3
package/src/config/bundled-skills/screen-watch/TOOLS.json +1 -1
package/src/config/bundled-skills/sequences/SKILL.md +2 -2
package/src/config/bundled-skills/sequences/TOOLS.json +10 -10
package/src/config/bundled-skills/sequences/tools/sequence-analytics.ts +2 -2
package/src/config/bundled-skills/sequences/tools/sequence-enroll.ts +2 -2
package/src/config/bundled-skills/sequences/tools/sequence-enrollment-list.ts +1 -1
package/src/config/bundled-skills/sequences/tools/sequence-get.ts +1 -1
package/src/config/bundled-skills/sequences/tools/sequence-import.ts +3 -3
package/src/config/bundled-skills/sequences/tools/sequence-list.ts +1 -1
package/src/config/bundled-skills/sequences/tools/sequence-update.ts +1 -1
package/src/config/bundled-skills/settings/TOOLS.json +3 -3
package/src/config/bundled-skills/settings/tools/open-system-settings.ts +1 -1
package/src/config/bundled-skills/skill-management/TOOLS.json +5 -5
package/src/config/bundled-skills/skills-catalog/SKILL.md +84 -0
package/src/config/bundled-skills/slack/SKILL.md +2 -2
package/src/config/bundled-skills/slack/TOOLS.json +8 -8
package/src/config/bundled-skills/slack/tools/slack-scan-digest.ts +3 -3
package/src/config/bundled-skills/subagent/TOOLS.json +5 -5
package/src/config/bundled-skills/tasks/SKILL.md +1 -1
package/src/config/bundled-skills/tasks/TOOLS.json +9 -9
package/src/config/bundled-skills/transcribe/SKILL.md +5 -5
package/src/config/bundled-skills/transcribe/TOOLS.json +1 -1
package/src/config/bundled-skills/transcribe/tools/transcribe-media.ts +10 -10
package/src/config/bundled-skills/watcher/SKILL.md +4 -4
package/src/config/bundled-skills/watcher/TOOLS.json +5 -5
package/src/config/feature-flag-registry.json +33 -17
package/src/config/schemas/sandbox.ts +1 -1
package/src/config/schemas/services.ts +13 -3
package/src/config/schemas/timeouts.ts +0 -10
package/src/contacts/contact-store.ts +63 -0
package/src/contacts/contacts-write.ts +1 -1
package/src/daemon/assistant-attachments.ts +2 -2
package/src/daemon/conversation-agent-loop-handlers.ts +2 -2
package/src/daemon/conversation-agent-loop.ts +7 -30
package/src/daemon/conversation-error.ts +24 -0
package/src/daemon/conversation-memory.ts +8 -7
package/src/daemon/conversation-runtime-assembly.ts +139 -274
package/src/daemon/conversation-slash.ts +7 -26
package/src/daemon/conversation-surfaces.ts +14 -0
package/src/daemon/conversation-tool-setup.ts +9 -8
package/src/daemon/conversation.ts +2 -0
package/src/daemon/daemon-control.ts +1 -1
package/src/daemon/date-context.ts +10 -83
package/src/daemon/handlers/config-channels.ts +12 -2
package/src/daemon/handlers/config-slack-channel.ts +7 -1
package/src/daemon/handlers/config-telegram.ts +6 -1
package/src/daemon/handlers/conversations.ts +2 -2
package/src/daemon/handlers/skills.ts +4 -0
package/src/daemon/lifecycle.ts +28 -4
package/src/daemon/providers-setup.ts +1 -1
package/src/daemon/server.ts +1 -5
package/src/daemon/shutdown-handlers.ts +9 -3
package/src/daemon/tool-side-effects.ts +40 -0
package/src/daemon/trace-emitter.ts +25 -2
package/src/events/domain-events.ts +1 -1
package/src/events/tool-permission-telemetry-listener.ts +46 -0
package/src/inbound/platform-callback-registration.ts +0 -18
package/src/media/app-icon-generator.ts +15 -8
package/src/media/avatar-router.ts +15 -8
package/src/media/gemini-image-service.ts +125 -21
package/src/memory/attachments-store.ts +3 -3
package/src/memory/channel-verification-sessions.ts +6 -6
package/src/memory/conversation-crud.ts +196 -1
package/src/memory/{thread-starters-cadence.ts → conversation-starters-cadence.ts} +9 -42
package/src/memory/conversation-title-service.ts +2 -3
package/src/memory/db-init.ts +25 -1
package/src/memory/invite-store.ts +4 -4
package/src/memory/items-extractor.ts +4 -4
package/src/memory/job-handlers/{thread-starters.ts → conversation-starters.ts} +123 -38
package/src/memory/jobs-store.ts +3 -2
package/src/memory/jobs-worker.ts +7 -5
package/src/memory/lifecycle-events-store.ts +63 -0
package/src/memory/migrations/172-rename-created-by-session-id.ts +27 -0
package/src/memory/migrations/173-rename-source-session-id.ts +16 -0
package/src/memory/migrations/174-rename-thread-starters-table.ts +52 -0
package/src/memory/migrations/175-create-lifecycle-events.ts +15 -0
package/src/memory/migrations/176-drop-capability-card-state.ts +36 -0
package/src/memory/migrations/177-create-trace-events-table.ts +40 -0
package/src/memory/migrations/index.ts +6 -0
package/src/memory/migrations/registry.ts +13 -0
package/src/memory/retriever.test.ts +223 -96
package/src/memory/retriever.ts +115 -138
package/src/memory/schema/calls.ts +1 -1
package/src/memory/schema/contacts.ts +1 -1
package/src/memory/schema/infrastructure.ts +29 -0
package/src/memory/schema/memory-core.ts +7 -17
package/src/memory/schema/notifications.ts +1 -1
package/src/memory/search/formatting.ts +23 -6
package/src/memory/search/lexical.ts +2 -0
package/src/memory/search/semantic.ts +2 -0
package/src/memory/search/staleness.ts +1 -0
package/src/memory/search/types.ts +4 -0
package/src/memory/task-memory-cleanup.ts +96 -6
package/src/memory/trace-event-store.ts +148 -0
package/src/notifications/README.md +1 -1
package/src/notifications/decision-engine.ts +2 -2
package/src/notifications/emit-signal.ts +4 -4
package/src/notifications/events-store.ts +4 -4
package/src/notifications/signal.ts +1 -1
package/src/oauth/manual-token-connection.ts +49 -25
package/src/permissions/checker.ts +6 -5
package/src/permissions/defaults.ts +4 -4
package/src/prompts/__tests__/build-cli-reference-section.test.ts +9 -90
package/src/prompts/cache-boundary.ts +8 -0
package/src/prompts/system-prompt.ts +105 -634
package/src/prompts/templates/BOOTSTRAP.md +166 -33
package/src/prompts/templates/IDENTITY.md +8 -23
package/src/prompts/templates/SOUL.md +20 -41
package/src/prompts/templates/USER.md +3 -19
package/src/prompts/user-reference.ts +14 -16
package/src/providers/anthropic/client.ts +46 -2
package/src/providers/gemini/client.ts +6 -9
package/src/providers/managed-proxy/constants.ts +1 -7
package/src/providers/managed-proxy/context.ts +0 -1
package/src/providers/model-intents.ts +5 -5
package/src/providers/openai/client.ts +10 -1
package/src/providers/openrouter/client.ts +1 -0
package/src/providers/ratelimit.ts +0 -35
package/src/providers/registry.ts +3 -5
package/src/providers/retry.ts +18 -1
package/src/runtime/access-request-helper.ts +1 -1
package/src/runtime/auth/route-policy.ts +7 -0
package/src/runtime/channel-verification-service.ts +1 -1
package/src/runtime/confirmation-request-guardian-bridge.ts +1 -1
package/src/runtime/guardian-vellum-migration.ts +63 -1
package/src/runtime/http-server.ts +8 -4
package/src/runtime/migrations/vbundle-builder.ts +212 -32
package/src/runtime/migrations/vbundle-import-analyzer.ts +74 -8
package/src/runtime/migrations/vbundle-importer.ts +66 -1
package/src/runtime/migrations/vbundle-validator.ts +17 -3
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +4 -4
package/src/runtime/routes/attachment-routes.ts +2 -2
package/src/runtime/routes/btw-routes.ts +9 -0
package/src/runtime/routes/channel-verification-routes.ts +19 -2
package/src/runtime/routes/conversation-management-routes.ts +55 -1
package/src/runtime/routes/conversation-query-routes.ts +1 -1
package/src/runtime/routes/conversation-routes.ts +49 -5
package/src/runtime/routes/conversation-starter-routes.ts +207 -0
package/src/runtime/routes/guardian-bootstrap-routes.ts +13 -9
package/src/runtime/routes/inbound-stages/escalation-intercept.ts +1 -1
package/src/runtime/routes/inbound-stages/verification-intercept.ts +1 -1
package/src/runtime/routes/migration-routes.ts +25 -13
package/src/runtime/routes/secret-routes.ts +18 -0
package/src/runtime/routes/settings-routes.ts +8 -8
package/src/runtime/routes/telemetry-routes.ts +53 -0
package/src/runtime/routes/trace-event-routes.ts +62 -0
package/src/runtime/tool-grant-request-helper.ts +1 -1
package/src/runtime/verification-outbound-actions.ts +47 -31
package/src/security/encrypted-store.ts +263 -78
package/src/skills/catalog-install.ts +10 -0
package/src/skills/managed-store.ts +2 -0
package/src/skills/skill-memory.ts +220 -0
package/src/subagent/manager.ts +1 -4
package/src/telemetry/types.ts +10 -1
package/src/telemetry/usage-telemetry-reporter.test.ts +1 -1
package/src/telemetry/usage-telemetry-reporter.ts +51 -4
package/src/tools/AGENTS.md +11 -11
package/src/tools/acp/spawn.ts +1 -1
package/src/tools/apps/executors.ts +8 -8
package/src/tools/apps/registry.ts +1 -1
package/src/tools/assets/materialize.ts +6 -6
package/src/tools/assets/search.ts +10 -10
package/src/tools/browser/__tests__/auth-cache.test.ts +2 -2
package/src/tools/browser/__tests__/auth-detector.test.ts +4 -4
package/src/tools/browser/auth-detector.ts +6 -6
package/src/tools/browser/browser-execution.ts +13 -13
package/src/tools/browser/browser-manager.ts +3 -3
package/src/tools/browser/chrome-cdp.ts +5 -5
package/src/tools/browser/jit-auth.ts +2 -2
package/src/tools/browser/network-recorder.test.ts +2 -2
package/src/tools/browser/network-recorder.ts +3 -3
package/src/tools/browser/runtime-check.ts +3 -3
package/src/tools/claude-code/claude-code.ts +2 -2
package/src/tools/computer-use/definitions.ts +18 -18
package/src/tools/credential-execution/make-authenticated-request.ts +4 -4
package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -3
package/src/tools/credential-execution/run-authenticated-command.ts +4 -4
package/src/tools/credentials/broker-types.ts +5 -5
package/src/tools/credentials/broker.ts +15 -15
package/src/tools/credentials/metadata-store.ts +2 -2
package/src/tools/credentials/resolve.ts +1 -1
package/src/tools/credentials/selection.ts +1 -1
package/src/tools/credentials/tool-policy.ts +1 -1
package/src/tools/credentials/vault.ts +115 -25
package/src/tools/execution-target.ts +2 -2
package/src/tools/executor.ts +7 -7
package/src/tools/filesystem/edit.ts +2 -2
package/src/tools/filesystem/read.ts +1 -1
package/src/tools/filesystem/write.ts +1 -1
package/src/tools/host-filesystem/edit.ts +2 -1
package/src/tools/host-filesystem/read.ts +2 -1
package/src/tools/host-filesystem/write.ts +1 -1
package/src/tools/host-terminal/host-shell.ts +9 -8
package/src/tools/mcp/mcp-tool-factory.ts +7 -6
package/src/tools/memory/definitions.ts +6 -5
package/src/tools/memory/handlers.test.ts +1 -1
package/src/tools/network/__tests__/web-search.test.ts +3 -3
package/src/tools/network/domain-normalize.ts +2 -2
package/src/tools/network/script-proxy/session-manager.ts +10 -10
package/src/tools/network/web-fetch.ts +1 -1
package/src/tools/network/web-search.ts +3 -3
package/src/tools/permission-checker.ts +8 -8
package/src/tools/registry.ts +7 -7
package/src/tools/schedule/list.ts +2 -2
package/src/tools/schema-transforms.ts +31 -21
package/src/tools/secret-detection-handler.ts +1 -1
package/src/tools/sensitive-output-placeholders.ts +1 -1
package/src/tools/shared/filesystem/edit-engine.ts +1 -1
package/src/tools/shared/filesystem/file-ops-service.ts +3 -3
package/src/tools/shared/filesystem/image-read.ts +25 -5
package/src/tools/shared/filesystem/path-policy.ts +2 -2
package/src/tools/shared/shell-output.ts +1 -1
package/src/tools/side-effects.ts +1 -1
package/src/tools/skills/execute.ts +1 -1
package/src/tools/skills/load.ts +3 -3
package/src/tools/skills/sandbox-runner.ts +3 -3
package/src/tools/subagent/read.ts +1 -1
package/src/tools/subagent/spawn.ts +2 -2
package/src/tools/swarm/delegate.ts +3 -3
package/src/tools/system/request-permission.ts +5 -4
package/src/tools/terminal/backends/native.ts +4 -4
package/src/tools/terminal/parser.ts +6 -6
package/src/tools/terminal/sandbox-diagnostics.ts +1 -1
package/src/tools/terminal/shell.ts +16 -16
package/src/tools/tool-approval-handler.ts +21 -12
package/src/tools/tool-manifest.ts +4 -4
package/src/tools/types.ts +3 -3
package/src/tools/ui-surface/definitions.ts +9 -37
package/src/tools/watcher/list.ts +1 -1
package/src/util/logger.ts +7 -2
package/src/util/retry.ts +29 -1
package/src/workspace/migrations/007-web-search-provider-rename.ts +37 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/cli-help-reference-sync.test.ts +0 -26
package/src/__tests__/onboarding-starter-tasks.test.ts +0 -190
package/src/cli/reference.ts +0 -38
package/src/memory/job-handlers/capability-cards.ts +0 -420
package/src/runtime/routes/thread-starter-routes.ts +0 -294

package/ARCHITECTURE.md CHANGED Viewed

@@ -4,11 +4,11 @@ This document owns assistant-runtime architecture details. The repo-level archit
 ### Channel Onboarding Playbook Bootstrap
-- Transport metadata arrives via `session_create.transport` (HTTP) or `/channels/inbound` (`channelId`, optional `hints`, optional `uxBrief`).
+- Transport metadata arrives via `conversation_create.transport` (HTTP) or `/channels/inbound` (`channelId`, optional `hints`, optional `uxBrief`).
 - Telegram webhook ingress injects deterministic channel-safe transport metadata (`hints` + `uxBrief`) so non-dashboard channels defer dashboard-only UI tasks cleanly.
 - `OnboardingPlaybookManager` resolves `<channel>_onboarding.md`, checks `onboarding/playbooks/registry.json`, and applies per-channel first-time fast-path onboarding.
 - `OnboardingOrchestrator` derives onboarding-mode guidance (post-hatch sequence, USER.md capture) from playbook + transport context.
-- Session runtime assembly injects both `<channel_onboarding_playbook>` and `<onboarding_mode>` context before provider calls, then strips both from persisted conversation history.
+- Conversation runtime assembly injects both `<channel_onboarding_playbook>` and `<onboarding_mode>` context before provider calls, then strips both from persisted conversation history.
 - Permission setup remains user-initiated and hatch + first-conversation flows avoid proactive permission asks.
 ### Guardian Actor Context (Unified Across Channels)
@@ -17,7 +17,7 @@ This document owns assistant-runtime architecture details. The repo-level archit
 - The same resolver is used by:
   - `/channels/inbound` (Telegram/WhatsApp path) before run orchestration.
   - Inbound Twilio voice setup (`RelayConnection.handleSetup`) to seed call-time actor context.
-- Runtime channel runs pass this as `trustContext`, and session runtime assembly injects `<inbound_actor_context>` (via `inboundActorContextFromTrustContext()`) into provider-facing prompts.
+- Runtime channel runs pass this as `trustContext`, and conversation runtime assembly injects `<inbound_actor_context>` (via `inboundActorContextFromTrustContext()`) into provider-facing prompts.
 - Voice calls mirror the same prompt contract: `CallController` receives guardian context on setup and refreshes it immediately after successful voice challenge verification, so the first post-verification turn is grounded as `actor_role: guardian`.
 - Voice-specific behavior (DTMF/speech verification flow, relay state machine) remains voice-local; only actor-role resolution is shared.
@@ -138,7 +138,7 @@ All guardian approval decisions — regardless of how they arrive — route thro
 | `src/runtime/routes/guardian-action-routes.ts` | HTTP route handlers for `GET /v1/guardian-actions/pending` and `POST /v1/guardian-actions/decision`                                               |
 | `src/runtime/channel-approval-types.ts`        | Channel-facing approval action types and `toApprovalActionOptions` bridge                                                                         |
-### Temporary Approval Modes (Session-Scoped Overrides)
+### Temporary Approval Modes (Conversation-Scoped Overrides)
 In addition to persistent trust rules (`always_allow` / `always_deny`), the approval system supports two **temporary** approval modes that auto-approve tool confirmations for the duration of a conversation or a fixed time window. These exist to reduce prompt fatigue during intensive sessions without permanently altering the trust configuration.
@@ -147,7 +147,7 @@ In addition to persistent trust rules (`always_allow` / `always_deny`), the appr
 1. **`allow_conversation`** — Auto-approve all tool confirmations for the remainder of the current conversation. The override persists until the session ends, the conversation is closed, or the mode is explicitly cleared.
 2. **`allow_10m`** — Auto-approve all tool confirmations for 10 minutes (configurable). The override expires lazily on the next read after the TTL elapses — no background sweep runs.
-**Session-scoped, in-memory only:** Overrides are keyed by `conversationId` and stored in an in-memory `Map` inside `conversation-approval-overrides.ts`. They do not survive daemon restarts, which is intentional — temporary approvals should not outlive the session that created them.
+**Conversation-scoped, in-memory only:** Overrides are keyed by `conversationId` and stored in an in-memory `Map` inside `conversation-approval-overrides.ts`. They do not survive daemon restarts, which is intentional — temporary approvals should not outlive the conversation that created them.
 **Integration with the permission pipeline:** The permission checker (`src/tools/permission-checker.ts`) checks for an active temporary override via `getEffectiveMode()` before prompting the user. If an active override exists for the current conversation, the confirmation is auto-approved without surfacing a prompt. This check runs after persistent trust rules, so a persistent `deny` rule still takes precedence.
@@ -783,10 +783,10 @@ All client-server communication uses HTTP for request/response operations and Se
 The daemon emits two distinct error message types via SSE:
-| Message type         | Scope          | Purpose                                                                                                        | Payload                                                                       |
-| -------------------- | -------------- | -------------------------------------------------------------------------------------------------------------- | ----------------------------------------------------------------------------- |
-| `conversation_error` | Session-scoped | Typed, actionable failures during chat/session runtime (e.g., provider network error, rate limit, API failure) | `sessionId`, `code` (typed enum), `userMessage`, `retryable`, `debugDetails?` |
-| `error`              | Global         | Generic, non-session failures (e.g., daemon startup errors, unknown message types)                             | `message` (string)                                                            |
+| Message type         | Scope               | Purpose                                                                                                        | Payload                                                                       |
+| -------------------- | ------------------- | -------------------------------------------------------------------------------------------------------------- | ----------------------------------------------------------------------------- |
+| `conversation_error` | Conversation-scoped | Typed, actionable failures during conversation runtime (e.g., provider network error, rate limit, API failure) | `sessionId`, `code` (typed enum), `userMessage`, `retryable`, `debugDetails?` |
+| `error`              | Global              | Generic, non-session failures (e.g., daemon startup errors, unknown message types)                             | `message` (string)                                                            |
 **Design rationale:** `conversation_error` carries structured metadata (error code, retryable flag, debug details) so the client can present actionable UI — a toast with retry/dismiss buttons — rather than a generic error banner. The older `error` type is retained for backward compatibility with non-session contexts.
@@ -845,7 +845,7 @@ sequenceDiagram
     end
 ```
-1. **Daemon** encounters a session-scoped failure, classifies it via `classifyConversationError()`, and sends a `conversation_error` SSE event with the session ID, typed error code, user-facing message, retryable flag, and optional debug details. Session-scoped failures emit _only_ `conversation_error` (never the generic `error` type) to prevent cross-session bleed.
+1. **Daemon** encounters a conversation-scoped failure, classifies it via `classifyConversationError()`, and sends a `conversation_error` SSE event with the conversation ID, typed error code, user-facing message, retryable flag, and optional debug details. Conversation-scoped failures emit _only_ `conversation_error` (never the generic `error` type) to prevent cross-conversation bleed.
 2. **ChatViewModel** receives the error via DaemonClient's `subscribe()` stream (each view model gets an independent stream), sets the `conversationError` property, and transitions out of the streaming/loading state so the UI is interactive. If the error arrives during an active cancel (`wasCancelling == true`), it is suppressed — cancel only shows `generation_cancelled` behavior.
 3. **ChatView** observes the published `conversationError` and displays an actionable toast with a category-specific icon and accent color:
    - **Retry** (shown when `retryable` is true): calls `retryAfterConversationError()`, which clears the error and sends a `regenerate` message to the daemon.

package/Dockerfile CHANGED Viewed

@@ -89,6 +89,9 @@ RUN echo 'Dir::State "/data/dpkg";' > /etc/apt/apt.conf.d/99data-dir && \
 ENV PATH="/data/usr/bin:/data/usr/sbin:${PATH}"
 ENV LD_LIBRARY_PATH="/data/usr/lib:/data/usr/lib/x86_64-linux-gnu:/data/usr/lib/aarch64-linux-gnu"
+# Ensure the CES bootstrap socket volume is writable by the non-root CES user.
+RUN mkdir -p /run/ces-bootstrap && chmod 777 /run/ces-bootstrap
 USER root
 EXPOSE 3001

package/README.md CHANGED Viewed

@@ -77,17 +77,17 @@ bun run src/index.ts                # interactive CLI session
 ### CLI commands
-| Command                                       | Description                                      |
-| --------------------------------------------- | ------------------------------------------------ |
-| `vellum wake`                                 | Start assistant + gateway from current checkout  |
-| `vellum sleep`                                | Stop assistant + gateway processes               |
-| `vellum ps`                                   | List assistants and per-assistant process status |
-| `assistant`                                   | Launch interactive CLI session                   |
-| `assistant sessions list\|new\|export\|clear` | Manage conversation sessions                     |
-| `assistant config set\|get\|list`             | Manage configuration                             |
-| `assistant keys set\|list\|delete`            | Manage API keys in secure storage                |
-| `assistant trust list\|remove\|clear`         | Manage trust rules                               |
-| `assistant doctor`                            | Run diagnostic checks                            |
+| Command                                            | Description                                      |
+| -------------------------------------------------- | ------------------------------------------------ |
+| `vellum wake`                                      | Start assistant + gateway from current checkout  |
+| `vellum sleep`                                     | Stop assistant + gateway processes               |
+| `vellum ps`                                        | List assistants and per-assistant process status |
+| `assistant`                                        | Launch interactive CLI session                   |
+| `assistant conversations list\|new\|export\|clear` | Manage conversations                             |
+| `assistant config set\|get\|list`                  | Manage configuration                             |
+| `assistant keys set\|list\|delete`                 | Manage API keys in secure storage                |
+| `assistant trust list\|remove\|clear`              | Manage trust rules                               |
+| `assistant doctor`                                 | Run diagnostic checks                            |
 ## Project Structure

package/docs/architecture/integrations.md CHANGED Viewed

@@ -542,7 +542,7 @@ sequenceDiagram
     Materialize->>DB: load attachment (including base64 data)
     Materialize->>Visibility: isAttachmentVisible(attachmentCtx, currentCtx)
     Note over Visibility: Second visibility check at materialize time<br/>prevents TOCTOU between search and materialize
-    Materialize->>Materialize: size check (max 50 MB)
+    Materialize->>Materialize: size check (max 100 MB)
     Materialize->>Sandbox: write decoded bytes to destination
     Materialize-->>Model: "Materialized 'photo.jpg' to /workspace/media/photo.jpg"
 ```
@@ -586,7 +586,7 @@ graph TB
 ### Materialize Safeguards
 - **Sandbox path enforcement**: Destination path must resolve inside the sandbox working directory
-- **Size limit**: 50 MB ceiling prevents materializing excessively large attachments
+- **Size limit**: 100 MB ceiling prevents materializing excessively large attachments
 - **Double visibility check**: Both `asset_search` and `asset_materialize` independently verify visibility, preventing TOCTOU races between search and use
 - **Risk level**: Both tools are `RiskLevel.Low` since they read existing data and write only within the sandbox

package/docs/architecture/memory.md CHANGED Viewed

@@ -250,7 +250,7 @@ The recall pipeline runs on every turn that passes the `needsMemory` gate (skips
 9. **Two-layer XML injection** (`formatting.ts`): Budget-aware rendering into four XML sections:
    ```xml
-   <memory_context>
+   <memory_context __injected>
    <user_identity>
    <!-- identity-kind tier 1 items (plain statements) -->
@@ -273,7 +273,7 @@ The recall pipeline runs on every turn that passes the `needsMemory` gate (skips
    Empty sections are omitted. Each section has a per-item token budget (150 tokens for tier 1, 100 for tier 2). Tier 1 sections consume budget first; tier 2 uses the remainder.
-10. **Injection strategy**: The rendered `<memory_context>` block is injected as a separate user + assistant acknowledgment message pair before the last user message (`injectMemoryRecallAsSeparateMessage`). This separates memory context from the user's actual query.
+10. **Injection strategy**: The rendered `<memory_context __injected>` block is prepended as a text content block to the last user message (`injectMemoryRecallAsUserBlock`), following the same pattern as workspace, temporal, and other runtime injections. Stripping is handled by the generic `stripUserTextBlocksByPrefix` mechanism matching the `<memory_context __injected>` prefix (with a backward-compat entry for the legacy `<memory_context>` prefix from older history). This avoids synthetic message pairs and preserves prompt prefix caching between turns.
 ### Internal-Only Trust Gating
@@ -464,7 +464,7 @@ The Anthropic provider places `cache_control: { type: 'ephemeral' }` on the **la
 ## Temporal Context Injection — Date Grounding
-The session injects a `<temporal_context>` block into every user message at runtime, giving the model awareness of the current date, current local time, current UTC time, timezone source metadata, upcoming weekend/work week windows, and a 14-day horizon of labelled future dates. This enables reliable reasoning about future dates (e.g. "plan a trip for next weekend") without persisting volatile temporal data in conversation history.
+The session injects a `<temporal_context>` block into every user message at runtime, giving the model awareness of the current date, current local time, current UTC time, and timezone source metadata. This enables reliable reasoning about dates and times without persisting volatile temporal data in conversation history.
 ### Per-turn flow
@@ -488,7 +488,6 @@ graph TB
 - **Clock source invariant**: Absolute time (`now`) always comes from the assistant host clock (`Date.now()`), never from channel/client clocks.
 - **Timezone precedence**: If `ui.userTimezone` is configured, temporal context uses it for local-date interpretation. Otherwise it falls back to memory-stored timezone, then assistant host timezone.
 - **Timezone-aware**: Uses `Intl.DateTimeFormat` APIs for DST-safe date arithmetic and timezone validation/canonicalization.
-- **Bounded output**: Hard-capped at 1500 characters and 14 horizon entries to prevent prompt bloat.
 - **Runtime-only**: The injected `<temporal_context>` block is stripped from `this.messages` after the agent loop completes via `stripTemporalContext`. It never persists in conversation history.
 - **Specific strip prefix**: The strip function matches the exact injected prefix (`<temporal_context>\nToday:`) to avoid accidentally removing user-authored text that starts with `<temporal_context>`.
 - **Retry paths**: Temporal context is included in all three `applyRuntimeInjections` call sites (main path, compact retry, media-trim retry).

package/docs/credential-execution-service.md CHANGED Viewed

@@ -60,36 +60,29 @@ The existing `host_bash` tool executes commands on the host machine without any
 **Implication**: `host_bash` represents a weaker security tier. Agents that require the strong secrecy guarantee must use `run_authenticated_command` instead. Trust rules and permission policies should reflect this distinction — managed deployments may deny `host_bash` entirely for untrusted agents while allowing `run_authenticated_command`.
-### 2. Local static secrets are local-mode only — by design
+### 2. Local static secrets are local-mode only — by policy
-For the initial implementation, local static secrets (API keys, tokens stored via the credential store in `~/.vellum/protected/`) are only accessible to CES in **local mode**, where CES runs as a child process of the assistant as the same OS user. CES reads them at materialization time via direct filesystem access.
+For the current implementation, local static secrets (API keys, tokens stored via the credential store in `~/.vellum/protected/`) are only accessible to CES in **local mode**, where CES runs as a child process of the assistant. CES reads them at materialization time via direct filesystem access.
-In **managed mode**, `local_static` handles are not supported and the CES returns a clear error for any `local_static` handle. Managed deployments use `platform_oauth` handles exclusively. This is a deliberate architectural decision, not a temporary limitation.
+In **managed mode**, `local_static` handles are not supported and the CES returns a clear error for any `local_static` handle. Managed deployments use `platform_oauth` handles exclusively. With v2 `store.key`, this is a **policy choice** (simpler lifecycle, centralized token management) rather than a technical limitation — the UID-independent key file could be shared via volume mount.
-#### Why `local_static` cannot work in managed mode
+#### Historical: v1 key derivation blocker (resolved in v2)
-The original design considered having managed deployments share static secrets via the assistant data volume. This is technically impossible due to how the encrypted key store works.
+The v1 encrypted key store uses PBKDF2 key derivation where the encryption key is derived from `userInfo().username` and `userInfo().homedir`. In managed deployments the assistant and CES sidecar run as different OS users, producing different derived keys — making it impossible for CES to decrypt secrets stored by the assistant.
-The `local-secure-key-backend.ts` module uses PBKDF2 key derivation where the encryption key is derived from `userInfo().username` and `userInfo().homedir`. In managed deployments:
+v2 stores replaced PBKDF2 derivation with a random 32-byte key stored at `<vellumRoot>/protected/store.key`. This key is UID-independent and can be shared via volume mount, removing the technical barrier to `local_static` in managed mode.
-- The **assistant container** runs as `root` (homedir `/root`)
-- The **CES sidecar container** runs as `ces` / uid 1001 (homedir `/home/ces`)
+The policy decision to use `platform_oauth` exclusively in managed mode still stands for operational reasons: simpler credential lifecycle, centralized token management, and no need to synchronize key files across containers. Future iterations may enable `local_static` in managed mode via shared `store.key` volume mounts if there is a compelling use case.
-These produce different PBKDF2-derived AES keys. Even if the encrypted key store file (`keys.enc`) were mounted as a shared volume, CES would derive a different decryption key and silently fail to decrypt the secrets.
+#### Rejected alternatives (v1-era, historical context)
-#### Rejected alternatives
+These alternatives were evaluated for the v1 key store and rejected. They are retained for historical context — the v2 `store.key` format resolves the underlying issue without hitting these trade-offs.
-Three alternatives were evaluated and rejected because each breaks a core security invariant:
+1. **Mount decrypted secrets into the CES container** — Breaks the "secrets never in assistant process memory" boundary (Boundary Invariant #2).
-1. **Mount decrypted secrets into the CES container** — This would require decrypting secrets in the assistant container and writing plaintext to a shared volume, breaking the "secrets never in assistant process memory" boundary (Boundary Invariant #2).
+2. **Use shared key derivation independent of UID** — Was rejected for v1 because it weakened the encrypted-at-rest model. The v2 `store.key` approach achieves UID-independent decryption without the per-user identity trade-off, since the random key file is protected by filesystem permissions rather than derivation entropy.
-2. **Use shared key derivation independent of UID** — Deriving the encryption key from a shared secret (e.g., a pod-level token) rather than per-user identity would weaken the encrypted-at-rest security model. The UID-based derivation ensures that only the user who stored the credential can decrypt it, which is a fundamental property of the local credential store.
-3. **Pre-decrypt and pass via the RPC socket** — Having the assistant decrypt the secret and send it to CES over the Unix socket would mean the assistant process handles plaintext credential values, directly violating the CES process-boundary isolation guarantee.
-Since all alternatives break security invariants that CES exists to enforce, managed deployments route credential access through `platform_oauth` where the platform manages token lifecycle and CES requests materialized tokens via the platform proxy endpoint.
-Future iterations may move secret storage to a dedicated secret manager (e.g., cloud KMS, Vault) with CES as the only authorized reader, which would enable static secrets in managed mode without compromising the process-boundary isolation.
+3. **Pre-decrypt and pass via the RPC socket** — Violates the CES process-boundary isolation guarantee.
 ### 3. Platform OAuth materialization stays on the platform
@@ -396,7 +389,7 @@ This means the helper is subject to the same cooperative egress limitation as th
 The following capabilities are intentionally deferred beyond v1:
-- **`local_static` handles in managed mode** — Structurally unsupported due to PBKDF2 key derivation depending on per-container UID (see Locked Decision #2 for full rationale and rejected alternatives). Managed mode returns a clear error and requires `platform_oauth` handles exclusively.
+- **`local_static` handles in managed mode** — Technically feasible with v2 `store.key` (UID-independent), but managed mode currently uses `platform_oauth` exclusively as a policy choice (see Locked Decision #2). May be enabled in the future via shared `store.key` volume mount if there is a compelling use case.
 - **Cloud KMS/Vault integration for secret storage** — v1 reads secrets from filesystem (`~/.vellum/protected/` locally, `/ces-data` in managed). Moving to a dedicated secrets manager is a future enhancement.
 - **Multi-CES-instance support** — Each assistant pod runs exactly one CES sidecar. Horizontal scaling of CES within a pod is not supported.
 - **Cross-pod credential sharing** — CES grants are scoped to a single pod. There is no grant federation across pods or assistant instances.

package/node_modules/@vellumai/ces-contracts/src/error.ts CHANGED Viewed

@@ -15,10 +15,11 @@ export type RpcError = z.infer<typeof RpcErrorSchema>;
 /**
  * Error returned when a local_static credential handle is used in managed
- * mode. The encrypted key store uses PBKDF2 key derivation from user
- * identity (username, homedir), but the assistant container runs as root
- * while CES runs as ces — different derived keys make decryption silently
- * fail. Managed deployments must use platform_oauth handles exclusively.
+ * mode. v2 stores use a UID-independent `store.key` file that removes the
+ * technical barrier (legacy v1 relied on PBKDF2 key derivation from user
+ * identity, which broke across container users). The restriction is now a
+ * policy choice: managed deployments use platform_oauth handles exclusively
+ * for simpler lifecycle and centralized token management.
  */
 export const MANAGED_LOCAL_STATIC_REJECTION_ERROR =
   "local_static credential handles are not supported in managed mode. " +

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@vellumai/assistant",
-  "version": "0.4.56",
+  "version": "0.4.57",
   "type": "module",
   "exports": {
     ".": "./src/index.ts"

package/src/__tests__/actor-token-service.test.ts CHANGED Viewed

@@ -93,8 +93,8 @@ function mockServer(address: string): ServerWithRequestIP {
 /** Mock loopback server -- returns 127.0.0.1 for all requests. */
 const loopbackServer = mockServer("127.0.0.1");
-/** Mock non-loopback server -- returns a LAN IP for all requests. */
-const nonLoopbackServer = mockServer("192.168.1.50");
+/** Mock non-loopback server -- returns a public IP for all requests. */
+const nonLoopbackServer = mockServer("203.0.113.50");
 initializeDb();
@@ -676,11 +676,11 @@ describe("pairing credential flow", () => {
 });
 // ---------------------------------------------------------------------------
-// Bootstrap loopback guard tests
+// Bootstrap private-network guard tests
 // ---------------------------------------------------------------------------
-describe("bootstrap loopback guard", () => {
-  test("rejects bootstrap request with X-Forwarded-For header", async () => {
+describe("bootstrap private-network guard", () => {
+  test("rejects bootstrap request with public X-Forwarded-For", async () => {
     const { handleGuardianBootstrap } =
       await import("../runtime/routes/guardian-bootstrap-routes.js");
@@ -688,7 +688,7 @@ describe("bootstrap loopback guard", () => {
       method: "POST",
       headers: {
         "Content-Type": "application/json",
-        "X-Forwarded-For": "10.0.0.1",
+        "X-Forwarded-For": "203.0.113.1",
       },
       body: JSON.stringify({ platform: "macos", deviceId: "test-device" }),
     });
@@ -699,7 +699,7 @@ describe("bootstrap loopback guard", () => {
     expect(body.error.message).toContain("local-only");
   });
-  test("rejects bootstrap request from non-loopback IP", async () => {
+  test("rejects bootstrap request from public IP peer", async () => {
     const { handleGuardianBootstrap } =
       await import("../runtime/routes/guardian-bootstrap-routes.js");

package/src/__tests__/anthropic-provider.test.ts CHANGED Viewed

@@ -62,6 +62,7 @@ mock.module("@anthropic-ai/sdk", () => ({
 }));
 // Import after mocking
+import { SYSTEM_PROMPT_CACHE_BOUNDARY } from "../prompts/system-prompt.js";
 import {
   AnthropicProvider,
   PLACEHOLDER_BLOCKS_OMITTED,
@@ -155,6 +156,25 @@ describe("AnthropicProvider — Cache-Control Characterization", () => {
     expect(lastStreamParams!.system).toBeUndefined();
   });
+  test("splits system prompt into two cache blocks on boundary marker", async () => {
+    const staticBlock = "You are a helpful assistant.";
+    const dynamicBlock = "User workspace files here.";
+    const prompt = staticBlock + SYSTEM_PROMPT_CACHE_BOUNDARY + dynamicBlock;
+    await provider.sendMessage([userMsg("Hi")], undefined, prompt);
+    const system = lastStreamParams!.system as Array<{
+      type: string;
+      text: string;
+      cache_control?: { type: string };
+    }>;
+    expect(system).toHaveLength(2);
+    expect(system[0].text).toBe(staticBlock);
+    expect(system[0].cache_control).toEqual({ type: "ephemeral" });
+    expect(system[1].text).toBe(dynamicBlock);
+    expect(system[1].cache_control).toEqual({ type: "ephemeral" });
+  });
   // -----------------------------------------------------------------------
   // Tool cache control
   // -----------------------------------------------------------------------
@@ -1307,6 +1327,158 @@ describe("AnthropicProvider — Cache-Control Characterization", () => {
     expect(userMsgs[2].content[0].cache_control).toBeUndefined();
     expect(userMsgs[2].content[1].cache_control).toBeUndefined();
   });
+  // -----------------------------------------------------------------------
+  // is_error + contentBlocks — non-text blocks must be stripped
+  // -----------------------------------------------------------------------
+  test("is_error tool_result strips non-text contentBlocks (images)", async () => {
+    const messages: Message[] = [
+      userMsg("Do something"),
+      toolUseMsg("tu_img", "file_read"),
+      {
+        role: "user",
+        content: [
+          {
+            type: "tool_result",
+            tool_use_id: "tu_img",
+            content: "Error: file not found",
+            is_error: true,
+            contentBlocks: [
+              {
+                type: "image",
+                source: {
+                  type: "base64",
+                  media_type: "image/png",
+                  data: "iVBOR",
+                },
+              },
+              { type: "text", text: "extra error detail" },
+            ],
+          },
+        ],
+      },
+    ];
+    await provider.sendMessage(messages);
+    const sent = lastStreamParams!.messages as Array<{
+      role: string;
+      content: Array<{
+        type: string;
+        tool_use_id?: string;
+        is_error?: boolean;
+        content?: unknown;
+      }>;
+    }>;
+    const toolResult = sent[2].content.find(
+      (b) => b.type === "tool_result" && b.tool_use_id === "tu_img",
+    )!;
+    expect(toolResult.is_error).toBe(true);
+    // Content should be an array with only text blocks (no images)
+    const parts = toolResult.content as Array<{ type: string }>;
+    expect(Array.isArray(parts)).toBe(true);
+    expect(parts.every((p) => p.type === "text")).toBe(true);
+    // Original text + the extra text contentBlock
+    expect(parts).toHaveLength(2);
+  });
+  test("is_error tool_result with only image contentBlocks falls back to text-only", async () => {
+    const messages: Message[] = [
+      userMsg("Do something"),
+      toolUseMsg("tu_img2", "file_read"),
+      {
+        role: "user",
+        content: [
+          {
+            type: "tool_result",
+            tool_use_id: "tu_img2",
+            content: "Error: file not found",
+            is_error: true,
+            contentBlocks: [
+              {
+                type: "image",
+                source: {
+                  type: "base64",
+                  media_type: "image/png",
+                  data: "iVBOR",
+                },
+              },
+            ],
+          },
+        ],
+      },
+    ];
+    await provider.sendMessage(messages);
+    const sent = lastStreamParams!.messages as Array<{
+      role: string;
+      content: Array<{
+        type: string;
+        tool_use_id?: string;
+        is_error?: boolean;
+        content?: unknown;
+      }>;
+    }>;
+    const toolResult = sent[2].content.find(
+      (b) => b.type === "tool_result" && b.tool_use_id === "tu_img2",
+    )!;
+    expect(toolResult.is_error).toBe(true);
+    // All images stripped → no usable blocks → falls back to text-only content
+    expect(toolResult.content).toBe("Error: file not found");
+  });
+  test("non-error tool_result preserves image contentBlocks", async () => {
+    const messages: Message[] = [
+      userMsg("Do something"),
+      toolUseMsg("tu_img3", "file_read"),
+      {
+        role: "user",
+        content: [
+          {
+            type: "tool_result",
+            tool_use_id: "tu_img3",
+            content: "Success",
+            is_error: false,
+            contentBlocks: [
+              {
+                type: "image",
+                source: {
+                  type: "base64",
+                  media_type: "image/png",
+                  data: "iVBOR",
+                },
+              },
+            ],
+          },
+        ],
+      },
+    ];
+    await provider.sendMessage(messages);
+    const sent = lastStreamParams!.messages as Array<{
+      role: string;
+      content: Array<{
+        type: string;
+        tool_use_id?: string;
+        is_error?: boolean;
+        content?: unknown;
+      }>;
+    }>;
+    const toolResult = sent[2].content.find(
+      (b) => b.type === "tool_result" && b.tool_use_id === "tu_img3",
+    )!;
+    expect(toolResult.is_error).toBe(false);
+    // Non-error: images should be preserved in the content array
+    const parts = toolResult.content as Array<{ type: string }>;
+    expect(Array.isArray(parts)).toBe(true);
+    expect(parts.some((p) => p.type === "image")).toBe(true);
+  });
 });
 // ---------------------------------------------------------------------------

package/src/__tests__/app-builder-tool-scripts.test.ts CHANGED Viewed

@@ -63,7 +63,21 @@ function makeContext(overrides: Partial<ToolContext> = {}): ToolContext {
 const mockStore = makeMockStore();
-mock.module("../memory/app-store.js", () => mockStore);
+mock.module("../memory/app-store.js", () => ({
+  ...mockStore,
+  getAppsDir: () => "/tmp/test-apps",
+  isMultifileApp: (app: AppDefinition) => app.formatVersion === 2,
+}));
+// Mock compileApp for multifile scaffold path
+mock.module("../bundler/app-compiler.js", () => ({
+  compileApp: async () => ({
+    ok: true,
+    errors: [],
+    warnings: [],
+    durationMs: 0,
+  }),
+}));
 // ---------------------------------------------------------------------------
 // Import skill scripts (after mocking)

package/src/__tests__/approval-cascade.test.ts CHANGED Viewed

@@ -76,7 +76,7 @@ mock.module("../config/loader.js", () => ({
       summaryModel: "mock-model",
       maxSummaryTokens: 512,
     },
-    rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
+    rateLimit: { maxRequestsPerMinute: 0 },
     timeouts: { permissionTimeoutSec: 300 },
     skills: { entries: {}, allowBundled: true },
     permissions: { mode: "workspace" },
@@ -166,7 +166,7 @@ mock.module("../memory/retriever.js", () => ({
     injectedTokens: 0,
     latencyMs: 0,
   }),
-  stripMemoryRecallMessages: (msgs: Message[]) => msgs,
+  injectMemoryRecallAsUserBlock: (msgs: Message[]) => msgs,
 }));
 mock.module("../context/window-manager.js", () => ({

package/src/__tests__/approval-routes-http.test.ts CHANGED Viewed

@@ -42,9 +42,8 @@ mock.module("../config/loader.js", () => ({
     model: "test",
     provider: "test",
     memory: { enabled: false },
-    rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
+    rateLimit: { maxRequestsPerMinute: 0 },
     secretDetection: { enabled: false },
-    sandbox: { enabled: false },
     contextWindow: { maxInputTokens: 200000 },
     services: {
       inference: {
@@ -55,9 +54,9 @@ mock.module("../config/loader.js", () => ({
       "image-generation": {
         mode: "your-own",
         provider: "gemini",
-        model: "gemini-2.5-flash-image",
+        model: "gemini-3.1-flash-image-preview",
       },
-      "web-search": { mode: "your-own", provider: "anthropic-native" },
+      "web-search": { mode: "your-own", provider: "inference-provider-native" },
     },
   }),
 }));

package/src/__tests__/asset-materialize-tool.test.ts CHANGED Viewed

@@ -34,7 +34,7 @@ mock.module("../config/loader.js", () => ({
     model: "test",
     provider: "test",
     memory: { enabled: false },
-    rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
+    rateLimit: { maxRequestsPerMinute: 0 },
   }),
 }));
@@ -263,7 +263,7 @@ describe("AssetMaterializeTool materialization", () => {
 describe("AssetMaterializeTool size limit", () => {
   beforeEach(resetTables);
-  test("rejects attachment exceeding 50MB limit", async () => {
+  test("rejects attachment exceeding 100MB limit", async () => {
     // Simulate a large attachment by inserting directly into the DB
     // with a sizeBytes value over the limit
     const db = getDb();
@@ -271,7 +271,7 @@ describe("AssetMaterializeTool size limit", () => {
     db.run(
       `INSERT INTO attachments (id, original_filename, mime_type, size_bytes, kind, data_base64, created_at)
        VALUES ('${fakeId}', 'huge.bin', 'application/octet-stream', ${
-         51 * 1024 * 1024
+         101 * 1024 * 1024
        }, 'document', 'AAAA', ${Date.now()})`,
     );
@@ -314,8 +314,8 @@ describe("AssetMaterializeTool metadata", () => {
     ).toHaveProperty("destination_path");
   });
-  test("tool has MEDIUM risk level", () => {
-    expect(assetMaterializeTool.defaultRiskLevel).toBe(RiskLevel.Medium);
+  test("tool has LOW risk level", () => {
+    expect(assetMaterializeTool.defaultRiskLevel).toBe(RiskLevel.Low);
   });
   test("tool category is assets", () => {

package/src/__tests__/asset-search-tool.test.ts CHANGED Viewed

@@ -33,7 +33,7 @@ mock.module("../config/loader.js", () => ({
     model: "test",
     provider: "test",
     memory: { enabled: false },
-    rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
+    rateLimit: { maxRequestsPerMinute: 0 },
   }),
 }));