@vellumai/assistant 0.9.0 → 0.10.0-staging.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/ARCHITECTURE.md +18 -34
- package/bun.lock +7 -8
- package/docs/activation-funnel-telemetry.md +28 -22
- package/docs/architecture/security.md +29 -28
- package/docs/stt-provider-onboarding.md +3 -5
- package/docs/workflows-testing.md +13 -44
- package/docs/workflows.md +3 -5
- package/node_modules/@vellumai/ces-client/src/__tests__/ces-client.test.ts +47 -0
- package/node_modules/@vellumai/ces-client/src/rpc-client.ts +28 -5
- package/node_modules/@vellumai/environments/src/seeds.ts +2 -5
- package/node_modules/@vellumai/gateway-client/src/admission-policy-contract.ts +97 -0
- package/node_modules/@vellumai/gateway-client/src/inbound-contract.ts +10 -0
- package/node_modules/@vellumai/gateway-client/src/index.ts +32 -6
- package/node_modules/@vellumai/gateway-client/src/outbound-contract.ts +119 -0
- package/node_modules/@vellumai/gateway-client/src/types.ts +15 -84
- package/openapi.yaml +976 -63
- package/package.json +2 -1
- package/scripts/sync-llm-catalog.ts +6 -15
- package/scripts/sync-web-search-catalog.ts +3 -11
- package/src/__tests__/access-request-card-view.test.ts +98 -0
- package/src/__tests__/access-request-seed-content-blocks.test.ts +2 -4
- package/src/__tests__/actor-trust-resolver-address-fallback.test.ts +72 -32
- package/src/__tests__/agent-loop-compaction-strip.test.ts +241 -0
- package/src/__tests__/agent-loop-mutable-latest-user-message.test.ts +16 -13
- package/src/__tests__/agent-loop-output-hooks.test.ts +69 -0
- package/src/__tests__/agent-loop-override-profile.test.ts +25 -0
- package/src/__tests__/always-loaded-tools-guard.test.ts +2 -3
- package/src/__tests__/app-compiler.test.ts +15 -1
- package/src/__tests__/app-dir-path-guard.test.ts +0 -1
- package/src/__tests__/assistant-feature-flag-guard.test.ts +1 -4
- package/src/__tests__/assistant-feature-flag-guardrails.test.ts +0 -2
- package/src/__tests__/auth-fallback-events-store.test.ts +6 -14
- package/src/__tests__/avatar-identity-sync.test.ts +2 -27
- package/src/__tests__/btw-routes.test.ts +6 -8
- package/src/__tests__/call-pointer-messages.test.ts +28 -0
- package/src/__tests__/cancel-clears-processing.test.ts +89 -0
- package/src/__tests__/channel-approval-routes.test.ts +0 -4
- package/src/__tests__/channel-inbound-disk-pressure.test.ts +5 -15
- package/src/__tests__/checker.test.ts +0 -3
- package/src/__tests__/cli-memory-v2-reembed-skills.test.ts +3 -4
- package/src/__tests__/compactor-image-manifest-trust.test.ts +21 -1
- package/src/__tests__/compactor-summary-call-truncation.test.ts +223 -0
- package/src/__tests__/config-loader-backfill.test.ts +268 -27
- package/src/__tests__/config-schema.test.ts +35 -0
- package/src/__tests__/config-watcher.test.ts +0 -18
- package/src/__tests__/confirmation-request-guardian-bridge.test.ts +2 -2
- package/src/__tests__/contact-store-user-file.test.ts +0 -6
- package/src/__tests__/contacts-tools.test.ts +29 -0
- package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +22 -0
- package/src/__tests__/conversation-agent-loop-overflow.test.ts +1 -0
- package/src/__tests__/conversation-agent-loop.test.ts +58 -0
- package/src/__tests__/conversation-attention-telegram.test.ts +0 -1
- package/src/__tests__/conversation-lifecycle.test.ts +7 -9
- package/src/__tests__/conversation-load-history-repair.test.ts +101 -0
- package/src/__tests__/conversation-routes-guardian-reply.test.ts +15 -12
- package/src/__tests__/conversation-surfaces-activation-emit.test.ts +6 -3
- package/src/__tests__/conversation-title-service.test.ts +62 -0
- package/src/__tests__/credential-broker.test.ts +449 -1
- package/src/__tests__/credential-execution-shell-lockdown.test.ts +18 -11
- package/src/__tests__/credential-execution-tools.test.ts +0 -1
- package/src/__tests__/credential-prompt-route.test.ts +4 -4
- package/src/__tests__/credential-routes.test.ts +360 -0
- package/src/__tests__/credential-security-invariants.test.ts +4 -13
- package/src/__tests__/disk-pressure-policy.test.ts +12 -0
- package/src/__tests__/disk-usage.test.ts +65 -0
- package/src/__tests__/dynamic-page-surface.test.ts +152 -1
- package/src/__tests__/fixtures/credential-security-fixtures.ts +2 -33
- package/src/__tests__/gateway-flag-listener.test.ts +110 -1
- package/src/__tests__/gateway-only-guard.test.ts +3 -7
- package/src/__tests__/guardian-binding-drift-heal.test.ts +1 -1
- package/src/__tests__/guardian-card-withdrawal.test.ts +403 -0
- package/src/__tests__/guardian-decision-primitive-canonical.test.ts +5 -3
- package/src/__tests__/guardian-grant-minting.test.ts +3 -35
- package/src/__tests__/guardian-routing-invariants.test.ts +64 -26
- package/src/__tests__/guardian-routing-state.test.ts +0 -1
- package/src/__tests__/headless-browser-mode.test.ts +10 -0
- package/src/__tests__/headless-browser-navigate.test.ts +8 -3
- package/src/__tests__/helpers/create-guardian-binding.ts +0 -1
- package/src/__tests__/host-browser-proxy.test.ts +87 -0
- package/src/__tests__/identity-routes.test.ts +0 -189
- package/src/__tests__/inbound-invite-redemption.test.ts +4 -4
- package/src/__tests__/injector-v3-suppression.test.ts +27 -20
- package/src/__tests__/internal-telemetry-routes.test.ts +6 -14
- package/src/__tests__/invite-redemption-service.test.ts +4 -7
- package/src/__tests__/llm-callsite-catalog.test.ts +5 -6
- package/src/__tests__/llm-catalog-parity.test.ts +30 -23
- package/src/__tests__/llm-resolver.test.ts +70 -24
- package/src/__tests__/llm-schema.test.ts +1 -0
- package/src/__tests__/managed-profile-guard.test.ts +163 -4
- package/src/__tests__/mcp-health-check.test.ts +6 -7
- package/src/__tests__/media-stream-server-integration.test.ts +317 -13
- package/src/__tests__/oauth-provider-seed-logos.test.ts +4 -6
- package/src/__tests__/onboarding-persona-write.test.ts +1 -1
- package/src/__tests__/path-policy.test.ts +34 -0
- package/src/__tests__/persona-resolver.test.ts +49 -14
- package/src/__tests__/plugin-api-model-profiles.test.ts +178 -0
- package/src/__tests__/plugin-api-provider.test.ts +24 -0
- package/src/__tests__/plugin-tool-contribution.test.ts +6 -3
- package/src/__tests__/post-compaction-reinjection-idempotency.test.ts +214 -0
- package/src/__tests__/provider-send-message-override-profile.test.ts +76 -0
- package/src/__tests__/reaction-persistence.test.ts +150 -29
- package/src/__tests__/registry.test.ts +2 -7
- package/src/__tests__/relay-server.test.ts +285 -0
- package/src/__tests__/runtime-attachment-metadata.test.ts +0 -1
- package/src/__tests__/schedule-routes-workflow-validation.test.ts +1 -10
- package/src/__tests__/schedule-routes.test.ts +0 -30
- package/src/__tests__/schedule-tools.test.ts +2 -18
- package/src/__tests__/scheduler-reuse-conversation.test.ts +8 -5
- package/src/__tests__/skill-execute-input.test.ts +51 -1
- package/src/__tests__/skill-runtime-path.test.ts +2 -3
- package/src/__tests__/skills.test.ts +51 -0
- package/src/__tests__/slack-notification-approval-card.test.ts +176 -0
- package/src/__tests__/slack-reaction-canonical-approval.test.ts +285 -0
- package/src/__tests__/subagent-tools.test.ts +266 -0
- package/src/__tests__/surface-completion-nudge-hook.test.ts +367 -0
- package/src/__tests__/task-progress-nudge-hook.test.ts +1 -1
- package/src/__tests__/title-generate-hook.test.ts +100 -3
- package/src/__tests__/token-estimator-accuracy.benchmark.test.ts +1 -29
- package/src/__tests__/token-manager.test.ts +519 -0
- package/src/__tests__/tool-approval-seed-content-blocks.test.ts +1 -1
- package/src/__tests__/tool-audit-listener.test.ts +7 -7
- package/src/__tests__/tool-executor-lifecycle-events.test.ts +6 -3
- package/src/__tests__/tool-executor.test.ts +0 -79
- package/src/__tests__/trusted-contact-approval-notifier.test.ts +4 -2
- package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +220 -3
- package/src/__tests__/trusted-contact-multichannel.test.ts +3 -3
- package/src/__tests__/trusted-contact-verification.test.ts +8 -10
- package/src/__tests__/twilio-routes.test.ts +81 -1
- package/src/__tests__/voice-invite-redemption.test.ts +2 -3
- package/src/__tests__/weak-open-model.test.ts +30 -0
- package/src/__tests__/web-search-catalog-parity.test.ts +6 -25
- package/src/__tests__/workspace-greetings.test.ts +152 -0
- package/src/__tests__/workspace-migration-105-enable-memory-v3-live-for-new-workspaces.test.ts +149 -0
- package/src/__tests__/workspace-migration-108-drop-balanced-economy-profile.test.ts +285 -0
- package/src/__tests__/workspace-migration-add-send-diagnostics.test.ts +1 -1
- package/src/__tests__/workspace-migration-drop-collect-usage-data.test.ts +118 -0
- package/src/__tests__/workspace-migration-drop-send-diagnostics.test.ts +118 -0
- package/src/a2a/__tests__/e2e-a2a-channel.test.ts +0 -4
- package/src/agent/loop.ts +49 -29
- package/src/api/README.md +6 -6
- package/src/api/events/tool-result.ts +6 -0
- package/src/api/events/workflow-completed.ts +53 -0
- package/src/api/events/workflow-leaf-finished.ts +38 -0
- package/src/api/events/workflow-leaf-started.ts +35 -0
- package/src/api/events/workflow-progress.ts +32 -0
- package/src/api/events/workflow-started.ts +31 -0
- package/src/api/index.ts +40 -0
- package/src/api/responses/conversation-message.ts +28 -4
- package/src/api/responses/home.ts +26 -4
- package/src/api/responses/workflow-journal.ts +53 -0
- package/src/approvals/guardian-card-withdrawal.ts +145 -0
- package/src/approvals/guardian-decision-primitive.ts +26 -3
- package/src/approvals/guardian-request-resolvers.ts +183 -80
- package/src/calls/__tests__/channel-admission-reader.test.ts +132 -0
- package/src/calls/__tests__/relay-setup-router.test.ts +350 -0
- package/src/calls/call-pointer-messages.ts +10 -4
- package/src/calls/channel-admission-reader.ts +104 -0
- package/src/calls/guardian-dispatch.ts +17 -45
- package/src/calls/media-stream-server.ts +84 -2
- package/src/calls/relay-access-wait.ts +1 -1
- package/src/calls/relay-server.ts +66 -0
- package/src/calls/relay-setup-router.ts +82 -1
- package/src/calls/twilio-routes.ts +17 -8
- package/src/calls/voice-session-bridge.ts +2 -2
- package/src/cli/commands/clients.ts +3 -0
- package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v2-compare-render.test.ts +1 -1
- package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v2.test.ts +8 -7
- package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v3.test.ts +5 -4
- package/src/cli/commands/memory/index.ts +30 -0
- package/src/cli/commands/{memory-v2-compare-render.ts → memory/memory-v2-compare-render.ts} +1 -1
- package/src/cli/commands/{memory-v2.ts → memory/memory-v2.ts} +6 -15
- package/src/cli/commands/{memory-v3.ts → memory/memory-v3.ts} +97 -11
- package/src/cli/commands/oauth/status.test.ts +36 -0
- package/src/cli/commands/oauth/status.ts +23 -3
- package/src/cli/commands/plugins.ts +197 -4
- package/src/cli/lib/__tests__/diff-plugin.test.ts +443 -0
- package/src/cli/lib/__tests__/inspect-plugin.test.ts +54 -0
- package/src/cli/lib/__tests__/merge-plugin-tree.test.ts +443 -0
- package/src/cli/lib/__tests__/plugin-surfaces.test.ts +111 -0
- package/src/cli/lib/__tests__/upgrade-plugin.test.ts +295 -2
- package/src/cli/lib/diff-plugin.ts +346 -0
- package/src/cli/lib/inspect-plugin.ts +12 -1
- package/src/cli/lib/install-from-github.ts +105 -17
- package/src/cli/lib/merge-plugin-tree.ts +328 -0
- package/src/cli/lib/plugin-fingerprint.ts +14 -0
- package/src/cli/lib/plugin-surfaces.ts +104 -0
- package/src/cli/lib/upgrade-plugin.ts +298 -10
- package/src/cli/program.ts +2 -6
- package/src/config/__tests__/sync-gated-profiles.test.ts +368 -0
- package/src/config/assistant-feature-flags.ts +22 -7
- package/src/config/bundled-skills/contacts/tools/contact-search.ts +0 -1
- package/src/config/bundled-skills/messaging/SKILL.md +6 -4
- package/src/config/bundled-skills/messaging/tools/messaging-archive-by-sender.ts +9 -8
- package/src/config/bundled-skills/subagent/SKILL.md +4 -0
- package/src/config/bundled-skills/subagent/TOOLS.json +4 -0
- package/src/config/bundled-skills/workflows/SKILL.md +14 -8
- package/src/config/bundled-tool-registry.ts +2 -7
- package/src/config/call-site-defaults.ts +15 -2
- package/src/config/feature-flag-registry.json +46 -31
- package/src/config/inference-profile-validation.ts +26 -0
- package/src/config/llm-resolver.ts +3 -0
- package/src/config/loader.ts +4 -0
- package/src/config/memory-v3-gate.ts +11 -0
- package/src/config/profile-order.ts +28 -0
- package/src/config/schema.ts +8 -6
- package/src/config/schemas/__tests__/memory-v3.test.ts +1 -0
- package/src/config/schemas/call-site-catalog.ts +7 -0
- package/src/config/schemas/channels.ts +11 -0
- package/src/config/schemas/elevenlabs.ts +0 -1
- package/src/config/schemas/llm.ts +31 -0
- package/src/config/schemas/memory-lifecycle.ts +3 -7
- package/src/config/schemas/memory-v3.ts +6 -0
- package/src/config/schemas/platform.ts +0 -8
- package/src/config/schemas/services.ts +18 -0
- package/src/config/seed-inference-profiles.ts +109 -44
- package/src/config/skills.ts +21 -0
- package/src/config/sync-gated-profiles.ts +220 -0
- package/src/contacts/contact-store.ts +89 -106
- package/src/contacts/contacts-write.ts +5 -22
- package/src/contacts/types.ts +0 -1
- package/src/context/compactor.ts +88 -54
- package/src/context/strip-injections.ts +58 -10
- package/src/context/token-estimator.ts +1 -1
- package/src/credential-execution/process-manager.ts +55 -14
- package/src/credential-execution/prompted-credential.ts +2 -3
- package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -2
- package/src/daemon/config-watcher.ts +0 -4
- package/src/daemon/conversation-agent-loop-handlers.ts +2 -0
- package/src/daemon/conversation-agent-loop.ts +114 -22
- package/src/daemon/conversation-history.ts +1 -1
- package/src/daemon/conversation-lifecycle.ts +3 -5
- package/src/daemon/conversation-process.ts +13 -5
- package/src/daemon/conversation-runtime-assembly.ts +13 -15
- package/src/daemon/conversation-slash.ts +2 -23
- package/src/daemon/conversation-surfaces.ts +26 -0
- package/src/daemon/conversation-tool-setup.ts +27 -14
- package/src/daemon/conversation.ts +66 -14
- package/src/daemon/disk-pressure-policy.ts +5 -3
- package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +0 -1
- package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +0 -1
- package/src/daemon/handlers/config-a2a.ts +0 -2
- package/src/daemon/handlers/config-channels.ts +15 -16
- package/src/daemon/handlers/config-slack-channel.ts +22 -3
- package/src/daemon/handlers/conversations.ts +107 -0
- package/src/daemon/host-browser-proxy.ts +41 -0
- package/src/daemon/lifecycle.ts +55 -27
- package/src/daemon/message-provenance.ts +2 -0
- package/src/daemon/message-types/contacts.ts +0 -1
- package/src/daemon/message-types/conversations.ts +3 -3
- package/src/daemon/message-types/sync.ts +0 -1
- package/src/daemon/message-types/web-activity.ts +7 -1
- package/src/daemon/message-types/workflows.ts +83 -1
- package/src/daemon/orphan-reaper.test.ts +0 -19
- package/src/daemon/orphan-reaper.ts +2 -24
- package/src/daemon/server.ts +0 -10
- package/src/daemon/tool-setup-types.ts +4 -0
- package/src/daemon/trust-context.ts +1 -1
- package/src/events/tool-audit-listener.ts +2 -2
- package/src/home/feed-source-enrichment.test.ts +151 -0
- package/src/home/feed-source-enrichment.ts +176 -0
- package/src/home/relationship-state.ts +2 -4
- package/src/instrument.ts +18 -6
- package/src/ipc/__tests__/binary-result-ipc.test.ts +81 -0
- package/src/ipc/__tests__/clients-list-ipc.test.ts +20 -0
- package/src/ipc/assistant-server.ts +37 -4
- package/src/ipc/gateway-flag-listener.ts +18 -2
- package/src/memory/__tests__/auto-analysis-enqueue.test.ts +5 -16
- package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +7 -11
- package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +37 -7
- package/src/memory/__tests__/memory-retrospective-job.test.ts +229 -401
- package/src/memory/__tests__/onboarding-events-store.test.ts +7 -7
- package/src/memory/auth-fallback-events-store.ts +2 -2
- package/src/memory/auto-analysis-enqueue.ts +3 -5
- package/src/memory/bookmark-crud.ts +1 -2
- package/src/memory/canonical-guardian-store.ts +39 -1
- package/src/memory/conversation-crud.ts +9 -4
- package/src/memory/conversation-key-store.ts +17 -2
- package/src/memory/conversation-title-service.ts +64 -7
- package/src/memory/db-init.ts +17 -17
- package/src/memory/embedding-backend.ts +38 -1
- package/src/memory/embedding-billing-breaker.ts +96 -0
- package/src/memory/jobs-store.ts +25 -13
- package/src/memory/jobs-worker.ts +54 -1
- package/src/memory/lifecycle-events-store.ts +2 -2
- package/src/memory/memory-retrospective-constants.ts +4 -4
- package/src/memory/memory-retrospective-enqueue.ts +31 -6
- package/src/memory/memory-retrospective-job.ts +28 -227
- package/src/memory/migrations/129-contact-channels-access-fields.ts +18 -9
- package/src/memory/migrations/131-drop-legacy-member-guardian-tables.ts +14 -2
- package/src/memory/migrations/289-contact-channels-unique-ext-user.ts +10 -0
- package/src/memory/migrations/291-contact-channels-renormalize-addresses.ts +72 -0
- package/src/memory/migrations/292-schedule-default-no-reuse-conversation.test.ts +67 -0
- package/src/memory/migrations/292-schedule-default-no-reuse-conversation.ts +25 -0
- package/src/memory/migrations/293-workflow-journal-leaf-tokens.ts +32 -0
- package/src/memory/migrations/294-drop-external-user-id.ts +31 -0
- package/src/memory/migrations/295-drop-approval-prompt-ts-tracker.ts +20 -0
- package/src/memory/migrations/296-rewrite-balanced-economy-profile-pins.test.ts +110 -0
- package/src/memory/migrations/296-rewrite-balanced-economy-profile-pins.ts +68 -0
- package/src/memory/migrations/__tests__/131-drop-legacy-member-guardian-tables.test.ts +154 -0
- package/src/memory/migrations/__tests__/289-contact-channels-unique-ext-user.test.ts +31 -0
- package/src/memory/migrations/__tests__/291-contact-channels-renormalize-addresses.test.ts +341 -0
- package/src/memory/migrations/__tests__/run-migrations.test.ts +52 -0
- package/src/memory/migrations/index.ts +6 -0
- package/src/memory/migrations/run-migrations.ts +41 -0
- package/src/memory/migrations/validate-migration-state.ts +1 -1
- package/src/memory/onboarding-events-store.ts +3 -3
- package/src/memory/schema/contacts.ts +0 -5
- package/src/memory/skill-loaded-events-store.test.ts +7 -15
- package/src/memory/skill-loaded-events-store.ts +2 -2
- package/src/memory/tool-executed-events-store.test.ts +7 -7
- package/src/memory/turn-trace-store.test.ts +736 -0
- package/src/memory/turn-trace-store.ts +364 -0
- package/src/memory/v2/__tests__/consolidation-job.test.ts +8 -0
- package/src/memory/v2/__tests__/skill-content.test.ts +30 -0
- package/src/memory/v2/consolidation-job.ts +2 -2
- package/src/memory/v2/skill-content.ts +25 -7
- package/src/memory/v2/skill-store.ts +7 -1
- package/src/memory/v3-eval/__tests__/eval-packets.test.ts +248 -0
- package/src/memory/v3-eval/eval-packets.ts +546 -0
- package/src/messaging/providers/slack/adapter.ts +1 -1
- package/src/messaging/providers/slack/api.ts +31 -0
- package/src/messaging/providers/slack/send.test.ts +114 -2
- package/src/messaging/providers/slack/send.ts +30 -7
- package/src/messaging/providers/slack/withdraw.test.ts +200 -0
- package/src/messaging/providers/slack/withdraw.ts +161 -0
- package/src/notifications/AGENTS.md +2 -0
- package/src/notifications/access-request-copy.ts +72 -59
- package/src/notifications/adapters/shared.ts +29 -0
- package/src/notifications/adapters/slack.ts +58 -103
- package/src/notifications/adapters/telegram.ts +2 -20
- package/src/notifications/approval-card-data.ts +333 -0
- package/src/notifications/broadcaster.ts +16 -3
- package/src/notifications/canonical-delivery-recorder.ts +139 -0
- package/src/notifications/copy-composer.ts +3 -3
- package/src/notifications/decision-engine.ts +4 -2
- package/src/notifications/destination-resolver.ts +4 -6
- package/src/notifications/guardian-question-mode.ts +10 -0
- package/src/notifications/home-feed-side-effect.ts +7 -16
- package/src/notifications/notification-utils.ts +19 -20
- package/src/notifications/signal.ts +79 -43
- package/src/notifications/types.ts +98 -121
- package/src/oauth/AGENTS.md +5 -24
- package/src/permissions/checker.test.ts +51 -0
- package/src/permissions/checker.ts +185 -26
- package/src/permissions/ipc-risk-types.ts +24 -0
- package/src/permissions/question-prompter.test.ts +27 -0
- package/src/permissions/question-prompter.ts +4 -0
- package/src/platform/client.test.ts +119 -0
- package/src/platform/client.ts +66 -0
- package/src/platform/consent-cache.test.ts +267 -0
- package/src/platform/consent-cache.ts +174 -0
- package/src/plugin-api/constants.ts +1 -1
- package/src/plugin-api/index.ts +33 -1
- package/src/plugin-api/model-profiles.ts +33 -0
- package/src/plugin-api/types.ts +50 -2
- package/src/plugins/defaults/advisor/__tests__/advisor-gate.test.ts +56 -0
- package/src/plugins/defaults/advisor/__tests__/advisor-state-store.test.ts +43 -0
- package/src/plugins/defaults/advisor/__tests__/agent-loop-integration.test.ts +137 -0
- package/src/plugins/defaults/advisor/__tests__/consult.test.ts +153 -0
- package/src/plugins/defaults/advisor/__tests__/hooks.test.ts +138 -0
- package/src/plugins/defaults/advisor/__tests__/transcript.test.ts +147 -0
- package/src/plugins/defaults/advisor/advisor-gate.ts +29 -0
- package/src/plugins/defaults/advisor/advisor-state-store.ts +94 -0
- package/src/plugins/defaults/advisor/config.ts +21 -0
- package/src/plugins/defaults/advisor/consult.ts +93 -0
- package/src/plugins/defaults/advisor/hooks/post-model-call.ts +34 -0
- package/src/plugins/defaults/advisor/hooks/pre-model-call.ts +30 -0
- package/src/plugins/defaults/advisor/hooks/user-prompt-submit.ts +19 -0
- package/src/plugins/defaults/advisor/package.json +14 -0
- package/src/plugins/defaults/advisor/steering.ts +67 -0
- package/src/plugins/defaults/advisor/tools/advisor.ts +65 -0
- package/src/plugins/defaults/advisor/transcript.ts +76 -0
- package/src/plugins/defaults/index.ts +60 -0
- package/src/plugins/defaults/memory-retrieval/hooks/post-compact.ts +22 -9
- package/src/plugins/defaults/memory-retrieval/hooks/user-prompt-submit.ts +2 -2
- package/src/plugins/defaults/memory-retrieval/tail-reinjection-strip.ts +64 -0
- package/src/plugins/defaults/memory-retrieval/unified-turn-context.ts +29 -21
- package/src/plugins/defaults/memory-v3-shadow/__tests__/carry-integration.test.ts +1 -0
- package/src/plugins/defaults/memory-v3-shadow/__tests__/injection.test.ts +1 -0
- package/src/plugins/defaults/memory-v3-shadow/__tests__/maintain-job.test.ts +129 -9
- package/src/plugins/defaults/memory-v3-shadow/__tests__/orchestrate.test.ts +31 -4
- package/src/plugins/defaults/memory-v3-shadow/__tests__/selection-log-store.test.ts +77 -2
- package/src/plugins/defaults/memory-v3-shadow/__tests__/shadow-plugin.test.ts +1 -0
- package/src/plugins/defaults/memory-v3-shadow/injector.ts +7 -10
- package/src/plugins/defaults/memory-v3-shadow/maintain-job.ts +144 -11
- package/src/plugins/defaults/memory-v3-shadow/orchestrate.ts +32 -20
- package/src/plugins/defaults/memory-v3-shadow/selection-log-store.ts +56 -3
- package/src/plugins/defaults/memory-v3-shadow/shadow-plugin.ts +23 -2
- package/src/plugins/defaults/surface-completion-nudge/hooks/post-model-call.ts +276 -0
- package/src/plugins/defaults/surface-completion-nudge/hooks/stop.ts +22 -0
- package/src/plugins/defaults/surface-completion-nudge/nudge-state-store.ts +46 -0
- package/src/plugins/defaults/surface-completion-nudge/package.json +14 -0
- package/src/plugins/defaults/task-progress-nudge/hooks/post-tool-use.ts +3 -13
- package/src/plugins/defaults/title-generate/hooks/stop.ts +56 -21
- package/src/prompts/persona-resolver.ts +14 -4
- package/src/prompts/templates/system-sections.ts +7 -2
- package/src/providers/__tests__/provider-env-vars.test.ts +6 -0
- package/src/providers/__tests__/provider-secret-catalog.test.ts +1 -0
- package/src/providers/__tests__/retry-callsite.test.ts +176 -0
- package/src/providers/atlascloud/client.ts +85 -0
- package/src/providers/fetch-provider-catalog.ts +85 -0
- package/src/providers/inference/adapter-factory.ts +3 -0
- package/src/providers/model-catalog.ts +58 -0
- package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +33 -0
- package/src/providers/openai/chat-completions-provider.ts +7 -0
- package/src/providers/openai/responses-provider.ts +10 -0
- package/src/providers/provider-send-message.ts +11 -3
- package/src/providers/retry.ts +53 -12
- package/src/providers/search-provider-catalog.ts +10 -0
- package/src/providers/weak-open-model.ts +22 -0
- package/src/runtime/AGENTS.md +0 -1
- package/src/runtime/__tests__/agent-wake.test.ts +181 -0
- package/src/runtime/__tests__/client-health.test.ts +44 -0
- package/src/runtime/access-request-helper.ts +21 -53
- package/src/runtime/actor-trust-resolver.ts +59 -63
- package/src/runtime/agent-wake.ts +52 -0
- package/src/runtime/assistant-event-hub.ts +18 -4
- package/src/runtime/auth/__tests__/route-policy.test.ts +12 -0
- package/src/runtime/auth/require-bound-guardian.ts +1 -4
- package/src/runtime/btw-sidechain.ts +3 -6
- package/src/runtime/capabilities.test.ts +120 -0
- package/src/runtime/capabilities.ts +197 -0
- package/src/runtime/channel-approval-types.ts +22 -45
- package/src/runtime/channel-invite-transports/telegram.ts +4 -4
- package/src/runtime/channel-retry-sweep.ts +1 -0
- package/src/runtime/channel-verification-service.ts +3 -3
- package/src/runtime/client-health.ts +26 -0
- package/src/runtime/confirmation-request-guardian-bridge.ts +38 -29
- package/src/runtime/effective-capabilities.test.ts +128 -0
- package/src/runtime/effective-capabilities.ts +84 -0
- package/src/runtime/guardian-reply-router.ts +106 -21
- package/src/runtime/invite-redemption-service.ts +9 -25
- package/src/runtime/migrations/__tests__/vbundle-builder-fd-leak.test.ts +123 -0
- package/src/runtime/migrations/vbundle-builder.ts +49 -20
- package/src/runtime/pending-interactions.ts +15 -0
- package/src/runtime/routes/__tests__/client-routes.test.ts +13 -0
- package/src/runtime/routes/__tests__/conversation-management-routes.test.ts +67 -0
- package/src/runtime/routes/__tests__/plugins-routes.test.ts +240 -1
- package/src/runtime/routes/app-routes.ts +1 -1
- package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +2 -2
- package/src/runtime/routes/assets/vellum-design-system.css +1959 -0
- package/src/runtime/routes/browser-tabs-routes.ts +9 -0
- package/src/runtime/routes/btw-routes.ts +1 -27
- package/src/runtime/routes/canonical-guardian-expiry-sweep.ts +17 -8
- package/src/runtime/routes/client-routes.ts +10 -0
- package/src/runtime/routes/contact-routes.ts +31 -8
- package/src/runtime/routes/conversation-compaction-routes.ts +1 -1
- package/src/runtime/routes/conversation-management-routes.ts +80 -1
- package/src/runtime/routes/conversation-query-routes.ts +68 -22
- package/src/runtime/routes/conversation-routes.ts +39 -14
- package/src/runtime/routes/credential-routes.ts +40 -16
- package/src/runtime/routes/empty-state-greeting-cache.ts +1 -2
- package/src/runtime/routes/events-routes.ts +1 -3
- package/src/runtime/routes/guardian-approval-interception.ts +14 -73
- package/src/runtime/routes/guardian-approval-prompt.ts +22 -4
- package/src/runtime/routes/home-feed-routes.ts +8 -3
- package/src/runtime/routes/identity-routes.ts +1 -296
- package/src/runtime/routes/inbound-message-handler.ts +214 -228
- package/src/runtime/routes/inbound-stages/acl-enforcement.ts +89 -7
- package/src/runtime/routes/inbound-stages/admission-policy.test.ts +154 -0
- package/src/runtime/routes/inbound-stages/admission-policy.ts +140 -0
- package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +3 -3
- package/src/runtime/routes/inbound-stages/background-dispatch.ts +11 -6
- package/src/runtime/routes/inbound-stages/escalation-intercept.ts +1 -2
- package/src/runtime/routes/inbound-stages/guardian-activation-intercept.ts +1 -2
- package/src/runtime/routes/inbound-stages/guardian-reply-intercept.test.ts +7 -7
- package/src/runtime/routes/inbound-stages/guardian-reply-intercept.ts +47 -28
- package/src/runtime/routes/inbound-stages/reaction-intercept.ts +358 -0
- package/src/runtime/routes/index.ts +2 -0
- package/src/runtime/routes/integrations/slack/__tests__/channel.test.ts +8 -0
- package/src/runtime/routes/integrations/slack/channel.ts +36 -0
- package/src/runtime/routes/internal-telemetry-routes.ts +1 -1
- package/src/runtime/routes/mcp-auth-routes.ts +233 -41
- package/src/runtime/routes/memory-eval-routes.ts +87 -0
- package/src/runtime/routes/notification-routes.ts +122 -133
- package/src/runtime/routes/platform-routes.ts +2 -2
- package/src/runtime/routes/plugins-routes.ts +202 -3
- package/src/runtime/routes/schedule-routes.ts +0 -22
- package/src/runtime/routes/secret-routes.ts +10 -0
- package/src/runtime/routes/surface-action-routes.ts +2 -1
- package/src/runtime/routes/tool-call-question-enrichment.test.ts +146 -0
- package/src/runtime/routes/tool-call-question-enrichment.ts +66 -0
- package/src/runtime/routes/workflow-routes.test.ts +229 -44
- package/src/runtime/routes/workflow-routes.ts +131 -29
- package/src/runtime/routes/workspace-greetings.ts +55 -0
- package/src/runtime/sync/resource-sync-events.ts +1 -11
- package/src/runtime/tool-grant-request-helper.ts +18 -16
- package/src/runtime/trust-context-resolver.ts +8 -5
- package/src/schedule/inference-profile.ts +2 -14
- package/src/schedule/schedule-store.ts +1 -1
- package/src/schedule/scheduler-types.ts +5 -1
- package/src/security/__tests__/provider-key-env-fallback.test.ts +6 -0
- package/src/security/secret-patterns.ts +3 -0
- package/src/subagent/manager.ts +17 -4
- package/src/subagent/types.ts +6 -0
- package/src/telemetry/trace-collection-policy.test.ts +28 -0
- package/src/telemetry/trace-collection-policy.ts +30 -0
- package/src/telemetry/types.ts +89 -0
- package/src/telemetry/usage-telemetry-reporter.test.ts +586 -36
- package/src/telemetry/usage-telemetry-reporter.ts +148 -41
- package/src/tools/AGENTS.md +3 -3
- package/src/tools/browser/__tests__/browser-execution-acquire.test.ts +31 -0
- package/src/tools/browser/browser-execution.ts +30 -19
- package/src/tools/document/document-tool.ts +2 -3
- package/src/tools/executor.ts +5 -3
- package/src/tools/host-terminal/host-shell.ts +5 -4
- package/src/tools/memory/register.ts +2 -2
- package/src/tools/network/__tests__/web-fetch-firecrawl.test.ts +360 -0
- package/src/tools/network/__tests__/web-search.test.ts +143 -0
- package/src/tools/network/web-fetch.ts +372 -1
- package/src/tools/network/web-search-error.ts +1 -1
- package/src/tools/network/web-search.ts +213 -10
- package/src/tools/permission-checker.ts +4 -3
- package/src/tools/registry.ts +20 -0
- package/src/tools/schedule/create.ts +7 -12
- package/src/tools/schedule/update.ts +4 -11
- package/src/tools/shared/filesystem/path-policy.ts +39 -13
- package/src/tools/side-effects.ts +2 -17
- package/src/tools/skills/execute.ts +33 -0
- package/src/tools/subagent/spawn.ts +61 -12
- package/src/tools/terminal/shell.ts +10 -4
- package/src/tools/tool-approval-handler.ts +18 -13
- package/src/tools/tool-manifest.ts +0 -2
- package/src/tools/types.ts +9 -0
- package/src/tools/ui-surface/definitions.ts +64 -3
- package/src/tools/verification-control-plane-policy.ts +3 -1
- package/src/tools/workflows/run-workflow.test.ts +8 -18
- package/src/tools/workflows/run-workflow.ts +1 -0
- package/src/util/disk-usage.ts +78 -23
- package/src/util/platform.ts +10 -3
- package/src/watcher/telemetry.ts +2 -2
- package/src/workflows/capabilities.ts +2 -3
- package/src/workflows/engine.test.ts +175 -1
- package/src/workflows/engine.ts +82 -0
- package/src/workflows/journal-store.test.ts +70 -0
- package/src/workflows/journal-store.ts +18 -3
- package/src/workflows/run-manager.test.ts +171 -28
- package/src/workflows/run-manager.ts +66 -24
- package/src/workspace/migrations/105-enable-memory-v3-live-for-new-workspaces.ts +63 -0
- package/src/workspace/migrations/106-drop-collect-usage-data.ts +47 -0
- package/src/workspace/migrations/107-drop-send-diagnostics.ts +47 -0
- package/src/workspace/migrations/108-drop-balanced-economy-profile.ts +129 -0
- package/src/workspace/migrations/registry.ts +8 -0
- package/src/__tests__/app-control-no-global-cgevent.test.ts +0 -98
- package/src/__tests__/credential-security-e2e.test.ts +0 -362
- package/src/__tests__/credential-vault-unit.test.ts +0 -1528
- package/src/__tests__/credential-vault.test.ts +0 -1706
- package/src/__tests__/identity-intro-cache.test.ts +0 -315
- package/src/__tests__/secret-onetime-send.test.ts +0 -182
- package/src/cli/commands/__tests__/task.test.ts +0 -914
- package/src/cli/commands/task.ts +0 -771
- package/src/config/bundled-skills/personal-page/SKILL.md +0 -57
- package/src/config/bundled-skills/personal-page/TOOLS.json +0 -27
- package/src/config/bundled-skills/personal-page/tools/app-refresh.ts +0 -17
- package/src/config/preloaded-apps/personal-page/src/components/About.tsx +0 -22
- package/src/config/preloaded-apps/personal-page/src/components/App.tsx +0 -16
- package/src/config/preloaded-apps/personal-page/src/components/Features.tsx +0 -77
- package/src/config/preloaded-apps/personal-page/src/components/Hero.tsx +0 -57
- package/src/config/preloaded-apps/personal-page/src/components/Pending.tsx +0 -28
- package/src/config/preloaded-apps/personal-page/src/components/animations.tsx +0 -234
- package/src/config/preloaded-apps/personal-page/src/components/icons.tsx +0 -48
- package/src/config/preloaded-apps/personal-page/src/components/media.ts +0 -16
- package/src/config/preloaded-apps/personal-page/src/index.html +0 -20
- package/src/config/preloaded-apps/personal-page/src/main.tsx +0 -7
- package/src/config/preloaded-apps/personal-page/src/profile-data.ts +0 -82
- package/src/config/preloaded-apps/personal-page/src/styles.css +0 -759
- package/src/memory/__tests__/preloaded-apps.test.ts +0 -85
- package/src/memory/preloaded-apps.ts +0 -116
- package/src/notifications/tool-approval-copy.ts +0 -142
- package/src/runtime/routes/approval-prompt-ts-tracker.ts +0 -78
- package/src/runtime/routes/identity-intro-cache.ts +0 -172
- package/src/tools/credentials/vault.ts +0 -712
|
@@ -6,6 +6,28 @@ import { describe, expect, mock, test } from "bun:test";
|
|
|
6
6
|
let mockGetMessages: (
|
|
7
7
|
conversationId: string,
|
|
8
8
|
) => Array<{ role: string; content: string }> | null = () => null;
|
|
9
|
+
const mockProfiles = {
|
|
10
|
+
balanced: {},
|
|
11
|
+
"cost-optimized": {},
|
|
12
|
+
disabled: { status: "disabled" },
|
|
13
|
+
"quality-optimized": {},
|
|
14
|
+
};
|
|
15
|
+
mock.module("../config/loader.js", () => ({
|
|
16
|
+
getConfigReadOnly: () => ({
|
|
17
|
+
llm: { profiles: mockProfiles },
|
|
18
|
+
}),
|
|
19
|
+
getConfig: () => ({
|
|
20
|
+
llm: {
|
|
21
|
+
default: {
|
|
22
|
+
provider: "anthropic",
|
|
23
|
+
provider_connection: "anthropic-managed",
|
|
24
|
+
model: "claude-opus-4-7",
|
|
25
|
+
},
|
|
26
|
+
profiles: mockProfiles,
|
|
27
|
+
},
|
|
28
|
+
rateLimit: { maxRequestsPerMinute: 0 },
|
|
29
|
+
}),
|
|
30
|
+
}));
|
|
9
31
|
mock.module("../memory/conversation-crud.js", () => ({
|
|
10
32
|
setConversationOriginChannelIfUnset: () => {},
|
|
11
33
|
updateConversationContextWindow: () => {},
|
|
@@ -140,6 +162,7 @@ describe("Subagent tool definitions", () => {
|
|
|
140
162
|
const def = findTool("subagent_spawn");
|
|
141
163
|
expect(def).toBeDefined();
|
|
142
164
|
expect(def.input_schema.required).toEqual(["label", "objective"]);
|
|
165
|
+
expect(def.input_schema.properties.inference_profile).toBeDefined();
|
|
143
166
|
});
|
|
144
167
|
|
|
145
168
|
test("abort tool has correct definition", () => {
|
|
@@ -422,6 +445,249 @@ describe("Subagent spawn success and failure", () => {
|
|
|
422
445
|
}
|
|
423
446
|
});
|
|
424
447
|
|
|
448
|
+
test("spawn passes explicit inference_profile to manager over inherited override", async () => {
|
|
449
|
+
const manager = getSubagentManager();
|
|
450
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
451
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
452
|
+
|
|
453
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
454
|
+
capturedConfig = config;
|
|
455
|
+
return "profile-subagent-id";
|
|
456
|
+
};
|
|
457
|
+
|
|
458
|
+
try {
|
|
459
|
+
const result = await executeSubagentSpawn(
|
|
460
|
+
{
|
|
461
|
+
label: "Profile test",
|
|
462
|
+
objective: "Do it with a chosen model profile",
|
|
463
|
+
inference_profile: "quality-optimized",
|
|
464
|
+
},
|
|
465
|
+
makeContext("sess-spawn-profile", {
|
|
466
|
+
sendToClient: () => {},
|
|
467
|
+
overrideProfile: "balanced",
|
|
468
|
+
}),
|
|
469
|
+
);
|
|
470
|
+
|
|
471
|
+
expect(result.isError).toBe(false);
|
|
472
|
+
expect(capturedConfig).toBeDefined();
|
|
473
|
+
expect(capturedConfig!.overrideProfile).toBe("quality-optimized");
|
|
474
|
+
expect(capturedConfig!.forceOverrideProfile).toBe(true);
|
|
475
|
+
} finally {
|
|
476
|
+
manager.spawn = originalSpawn;
|
|
477
|
+
}
|
|
478
|
+
});
|
|
479
|
+
|
|
480
|
+
test("spawn inherits the invoking call site's default profile when no override is present", async () => {
|
|
481
|
+
const manager = getSubagentManager();
|
|
482
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
483
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
484
|
+
|
|
485
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
486
|
+
capturedConfig = config;
|
|
487
|
+
return "inherit-default-id";
|
|
488
|
+
};
|
|
489
|
+
|
|
490
|
+
try {
|
|
491
|
+
const result = await executeSubagentSpawn(
|
|
492
|
+
{ label: "Inherit default", objective: "Do it" },
|
|
493
|
+
makeContext("sess-inherit-default", {
|
|
494
|
+
sendToClient: () => {},
|
|
495
|
+
invokingCallSite: "mainAgent",
|
|
496
|
+
}),
|
|
497
|
+
);
|
|
498
|
+
|
|
499
|
+
expect(result.isError).toBe(false);
|
|
500
|
+
// No explicit profile and no per-turn override → the child matches the
|
|
501
|
+
// invoking call site's resolved default profile (balanced for mainAgent
|
|
502
|
+
// in the test config).
|
|
503
|
+
expect(capturedConfig!.overrideProfile).toBe("balanced");
|
|
504
|
+
expect(capturedConfig!.forceOverrideProfile).toBeUndefined();
|
|
505
|
+
} finally {
|
|
506
|
+
manager.spawn = originalSpawn;
|
|
507
|
+
}
|
|
508
|
+
});
|
|
509
|
+
|
|
510
|
+
test("spawn inherits a non-main invoker's call-site default profile", async () => {
|
|
511
|
+
const manager = getSubagentManager();
|
|
512
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
513
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
514
|
+
|
|
515
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
516
|
+
capturedConfig = config;
|
|
517
|
+
return "inherit-heartbeat-id";
|
|
518
|
+
};
|
|
519
|
+
|
|
520
|
+
try {
|
|
521
|
+
const result = await executeSubagentSpawn(
|
|
522
|
+
{ label: "Heartbeat child", objective: "Do it" },
|
|
523
|
+
makeContext("sess-inherit-heartbeat", {
|
|
524
|
+
sendToClient: () => {},
|
|
525
|
+
invokingCallSite: "heartbeatAgent",
|
|
526
|
+
}),
|
|
527
|
+
);
|
|
528
|
+
|
|
529
|
+
expect(result.isError).toBe(false);
|
|
530
|
+
// A subagent spawned from a heartbeat turn matches heartbeatAgent's own
|
|
531
|
+
// cost-optimized default, not the mainAgent default.
|
|
532
|
+
expect(capturedConfig!.overrideProfile).toBe("cost-optimized");
|
|
533
|
+
} finally {
|
|
534
|
+
manager.spawn = originalSpawn;
|
|
535
|
+
}
|
|
536
|
+
});
|
|
537
|
+
|
|
538
|
+
test("spawn prefers a per-turn override profile over the invoker default", async () => {
|
|
539
|
+
const manager = getSubagentManager();
|
|
540
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
541
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
542
|
+
|
|
543
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
544
|
+
capturedConfig = config;
|
|
545
|
+
return "inherit-override-id";
|
|
546
|
+
};
|
|
547
|
+
|
|
548
|
+
try {
|
|
549
|
+
const result = await executeSubagentSpawn(
|
|
550
|
+
{ label: "Override child", objective: "Do it" },
|
|
551
|
+
makeContext("sess-inherit-override", {
|
|
552
|
+
sendToClient: () => {},
|
|
553
|
+
invokingCallSite: "mainAgent",
|
|
554
|
+
overrideProfile: "quality-optimized",
|
|
555
|
+
}),
|
|
556
|
+
);
|
|
557
|
+
|
|
558
|
+
expect(result.isError).toBe(false);
|
|
559
|
+
// The live per-turn override (per-conversation or tool-routed) wins over
|
|
560
|
+
// the call-site default, and is forwarded non-forced.
|
|
561
|
+
expect(capturedConfig!.overrideProfile).toBe("quality-optimized");
|
|
562
|
+
expect(capturedConfig!.forceOverrideProfile).toBeUndefined();
|
|
563
|
+
} finally {
|
|
564
|
+
manager.spawn = originalSpawn;
|
|
565
|
+
}
|
|
566
|
+
});
|
|
567
|
+
|
|
568
|
+
test("spawn skips the auto profile so the child keeps its own default", async () => {
|
|
569
|
+
const manager = getSubagentManager();
|
|
570
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
571
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
572
|
+
|
|
573
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
574
|
+
capturedConfig = config;
|
|
575
|
+
return "inherit-auto-id";
|
|
576
|
+
};
|
|
577
|
+
|
|
578
|
+
try {
|
|
579
|
+
const result = await executeSubagentSpawn(
|
|
580
|
+
{ label: "Auto child", objective: "Do it" },
|
|
581
|
+
makeContext("sess-inherit-auto", {
|
|
582
|
+
sendToClient: () => {},
|
|
583
|
+
invokingCallSite: "mainAgent",
|
|
584
|
+
// "auto" is metadata-only; forwarding it would collapse the child to
|
|
585
|
+
// llm.default, so the inherited path drops it and the child keeps its
|
|
586
|
+
// own subagentSpawn default.
|
|
587
|
+
overrideProfile: "auto",
|
|
588
|
+
}),
|
|
589
|
+
);
|
|
590
|
+
|
|
591
|
+
expect(result.isError).toBe(false);
|
|
592
|
+
expect(capturedConfig!.overrideProfile).toBeUndefined();
|
|
593
|
+
} finally {
|
|
594
|
+
manager.spawn = originalSpawn;
|
|
595
|
+
}
|
|
596
|
+
});
|
|
597
|
+
|
|
598
|
+
test("spawn still forces an explicit inference_profile over the invoker default", async () => {
|
|
599
|
+
const manager = getSubagentManager();
|
|
600
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
601
|
+
let capturedConfig: Record<string, unknown> | undefined;
|
|
602
|
+
|
|
603
|
+
manager.spawn = async (config: Record<string, unknown>) => {
|
|
604
|
+
capturedConfig = config;
|
|
605
|
+
return "inherit-explicit-id";
|
|
606
|
+
};
|
|
607
|
+
|
|
608
|
+
try {
|
|
609
|
+
const result = await executeSubagentSpawn(
|
|
610
|
+
{
|
|
611
|
+
label: "Explicit child",
|
|
612
|
+
objective: "Do it",
|
|
613
|
+
inference_profile: "cost-optimized",
|
|
614
|
+
},
|
|
615
|
+
makeContext("sess-inherit-explicit", {
|
|
616
|
+
sendToClient: () => {},
|
|
617
|
+
invokingCallSite: "mainAgent",
|
|
618
|
+
}),
|
|
619
|
+
);
|
|
620
|
+
|
|
621
|
+
expect(result.isError).toBe(false);
|
|
622
|
+
expect(capturedConfig!.overrideProfile).toBe("cost-optimized");
|
|
623
|
+
expect(capturedConfig!.forceOverrideProfile).toBe(true);
|
|
624
|
+
} finally {
|
|
625
|
+
manager.spawn = originalSpawn;
|
|
626
|
+
}
|
|
627
|
+
});
|
|
628
|
+
|
|
629
|
+
test("spawn returns error for unknown inference_profile", async () => {
|
|
630
|
+
const manager = getSubagentManager();
|
|
631
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
632
|
+
let spawnCalled = false;
|
|
633
|
+
|
|
634
|
+
manager.spawn = async () => {
|
|
635
|
+
spawnCalled = true;
|
|
636
|
+
return "profile-subagent-id";
|
|
637
|
+
};
|
|
638
|
+
|
|
639
|
+
try {
|
|
640
|
+
const result = await executeSubagentSpawn(
|
|
641
|
+
{
|
|
642
|
+
label: "Bad profile",
|
|
643
|
+
objective: "Do it",
|
|
644
|
+
inference_profile: "does-not-exist",
|
|
645
|
+
},
|
|
646
|
+
makeContext("sess-spawn-bad-profile", { sendToClient: () => {} }),
|
|
647
|
+
);
|
|
648
|
+
|
|
649
|
+
expect(result.isError).toBe(true);
|
|
650
|
+
expect(result.content).toContain(
|
|
651
|
+
'Inference profile "does-not-exist" is not defined',
|
|
652
|
+
);
|
|
653
|
+
expect(spawnCalled).toBe(false);
|
|
654
|
+
} finally {
|
|
655
|
+
manager.spawn = originalSpawn;
|
|
656
|
+
}
|
|
657
|
+
});
|
|
658
|
+
|
|
659
|
+
test("spawn returns error for disabled inference_profile", async () => {
|
|
660
|
+
const manager = getSubagentManager();
|
|
661
|
+
const originalSpawn = manager.spawn.bind(manager);
|
|
662
|
+
let spawnCalled = false;
|
|
663
|
+
|
|
664
|
+
manager.spawn = async () => {
|
|
665
|
+
spawnCalled = true;
|
|
666
|
+
return "profile-subagent-id";
|
|
667
|
+
};
|
|
668
|
+
|
|
669
|
+
try {
|
|
670
|
+
const result = await executeSubagentSpawn(
|
|
671
|
+
{
|
|
672
|
+
label: "Disabled profile",
|
|
673
|
+
objective: "Do it",
|
|
674
|
+
inference_profile: "disabled",
|
|
675
|
+
},
|
|
676
|
+
makeContext("sess-spawn-disabled-profile", {
|
|
677
|
+
sendToClient: () => {},
|
|
678
|
+
}),
|
|
679
|
+
);
|
|
680
|
+
|
|
681
|
+
expect(result.isError).toBe(true);
|
|
682
|
+
expect(result.content).toContain(
|
|
683
|
+
'Inference profile "disabled" is disabled',
|
|
684
|
+
);
|
|
685
|
+
expect(spawnCalled).toBe(false);
|
|
686
|
+
} finally {
|
|
687
|
+
manager.spawn = originalSpawn;
|
|
688
|
+
}
|
|
689
|
+
});
|
|
690
|
+
|
|
425
691
|
test("spawn handles non-Error throws gracefully", async () => {
|
|
426
692
|
const manager = getSubagentManager();
|
|
427
693
|
const originalSpawn = manager.spawn.bind(manager);
|
|
@@ -0,0 +1,367 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Tests for the default `surface-completion-nudge` plugin's hooks.
|
|
3
|
+
*
|
|
4
|
+
* Covers:
|
|
5
|
+
* - The `post-model-call` hook nudges (continue + canonical text appended as a
|
|
6
|
+
* `user` message) when a turn ends with a progress surface left open: a
|
|
7
|
+
* `task_progress` card shown and never advanced to a terminal status, and a
|
|
8
|
+
* `work_result` shown `in_progress`.
|
|
9
|
+
* - It does NOT nudge when the surface was completed via `ui_update`, dismissed
|
|
10
|
+
* via `ui_dismiss`, or was never a progress surface (a plain card / a form).
|
|
11
|
+
* - Outcomes it does not own are ignored: a provider rejection, a tool-bearing
|
|
12
|
+
* turn, and a non-main-agent call site.
|
|
13
|
+
* - The signal is scoped to the current response cycle — a surface left open in
|
|
14
|
+
* a prior cycle (before the last genuine user prompt) does not trigger it.
|
|
15
|
+
* - The one-shot bound is split across the two hooks: `post-model-call` marks it
|
|
16
|
+
* (nudging at most once per run) and `stop` clears it so the next run nudges
|
|
17
|
+
* afresh.
|
|
18
|
+
*
|
|
19
|
+
* The loop's actual continuation side-effects live in `agent/loop.ts` and are
|
|
20
|
+
* covered by integration tests. This file isolates the hook.
|
|
21
|
+
*/
|
|
22
|
+
|
|
23
|
+
import { beforeEach, describe, expect, test } from "bun:test";
|
|
24
|
+
|
|
25
|
+
import type {
|
|
26
|
+
PluginLogger,
|
|
27
|
+
PostModelCallContext,
|
|
28
|
+
} from "../plugin-api/types.js";
|
|
29
|
+
import postModelCall, {
|
|
30
|
+
SURFACE_COMPLETION_NUDGE_TEXT,
|
|
31
|
+
} from "../plugins/defaults/surface-completion-nudge/hooks/post-model-call.js";
|
|
32
|
+
import stop from "../plugins/defaults/surface-completion-nudge/hooks/stop.js";
|
|
33
|
+
import {
|
|
34
|
+
isSurfaceCompletionNudged,
|
|
35
|
+
resetSurfaceCompletionNudgeStoreForTests,
|
|
36
|
+
} from "../plugins/defaults/surface-completion-nudge/nudge-state-store.js";
|
|
37
|
+
import type { ContentBlock, Message } from "../providers/types.js";
|
|
38
|
+
|
|
39
|
+
// ─── Fixtures ────────────────────────────────────────────────────────────────
|
|
40
|
+
|
|
41
|
+
const noopLogger: PluginLogger = {
|
|
42
|
+
info: () => {},
|
|
43
|
+
warn: () => {},
|
|
44
|
+
error: () => {},
|
|
45
|
+
debug: () => {},
|
|
46
|
+
};
|
|
47
|
+
|
|
48
|
+
const finalText: ContentBlock = { type: "text", text: "All set." };
|
|
49
|
+
|
|
50
|
+
let surfaceCounter = 0;
|
|
51
|
+
|
|
52
|
+
/**
|
|
53
|
+
* An assistant `ui_show` turn paired with its `{ surfaceId }` tool result.
|
|
54
|
+
* Returns both messages plus the assigned surface id.
|
|
55
|
+
*/
|
|
56
|
+
function showSurface(input: Record<string, unknown>): {
|
|
57
|
+
messages: Message[];
|
|
58
|
+
surfaceId: string;
|
|
59
|
+
} {
|
|
60
|
+
surfaceCounter += 1;
|
|
61
|
+
const toolUseId = `tu_show_${surfaceCounter}`;
|
|
62
|
+
const surfaceId = `surface-${surfaceCounter}`;
|
|
63
|
+
return {
|
|
64
|
+
surfaceId,
|
|
65
|
+
messages: [
|
|
66
|
+
{
|
|
67
|
+
role: "assistant",
|
|
68
|
+
content: [{ type: "tool_use", id: toolUseId, name: "ui_show", input }],
|
|
69
|
+
},
|
|
70
|
+
{
|
|
71
|
+
role: "user",
|
|
72
|
+
content: [
|
|
73
|
+
{
|
|
74
|
+
type: "tool_result",
|
|
75
|
+
tool_use_id: toolUseId,
|
|
76
|
+
content: JSON.stringify({ surfaceId }),
|
|
77
|
+
},
|
|
78
|
+
],
|
|
79
|
+
},
|
|
80
|
+
],
|
|
81
|
+
};
|
|
82
|
+
}
|
|
83
|
+
|
|
84
|
+
function updateSurface(
|
|
85
|
+
surfaceId: string,
|
|
86
|
+
data: Record<string, unknown>,
|
|
87
|
+
): Message {
|
|
88
|
+
return {
|
|
89
|
+
role: "assistant",
|
|
90
|
+
content: [
|
|
91
|
+
{
|
|
92
|
+
type: "tool_use",
|
|
93
|
+
id: `tu_update_${surfaceId}`,
|
|
94
|
+
name: "ui_update",
|
|
95
|
+
input: { surface_id: surfaceId, data },
|
|
96
|
+
},
|
|
97
|
+
],
|
|
98
|
+
};
|
|
99
|
+
}
|
|
100
|
+
|
|
101
|
+
function dismissSurface(surfaceId: string): Message {
|
|
102
|
+
return {
|
|
103
|
+
role: "assistant",
|
|
104
|
+
content: [
|
|
105
|
+
{
|
|
106
|
+
type: "tool_use",
|
|
107
|
+
id: `tu_dismiss_${surfaceId}`,
|
|
108
|
+
name: "ui_dismiss",
|
|
109
|
+
input: { surface_id: surfaceId },
|
|
110
|
+
},
|
|
111
|
+
],
|
|
112
|
+
};
|
|
113
|
+
}
|
|
114
|
+
|
|
115
|
+
function userPrompt(text: string): Message {
|
|
116
|
+
return { role: "user", content: [{ type: "text", text }] };
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
const taskProgressShow = (status?: string): Record<string, unknown> => ({
|
|
120
|
+
surface_type: "card",
|
|
121
|
+
title: "Working on X",
|
|
122
|
+
data: {
|
|
123
|
+
template: "task_progress",
|
|
124
|
+
templateData: {
|
|
125
|
+
title: "Working on X",
|
|
126
|
+
...(status ? { status } : {}),
|
|
127
|
+
steps: [{ label: "Step 1", status: status ?? "in_progress" }],
|
|
128
|
+
},
|
|
129
|
+
},
|
|
130
|
+
});
|
|
131
|
+
|
|
132
|
+
function makeCtx(
|
|
133
|
+
overrides: Partial<PostModelCallContext> = {},
|
|
134
|
+
): PostModelCallContext {
|
|
135
|
+
return {
|
|
136
|
+
conversationId: "conv-scn",
|
|
137
|
+
callSite: "mainAgent",
|
|
138
|
+
content: [finalText],
|
|
139
|
+
messages: [],
|
|
140
|
+
stopReason: null,
|
|
141
|
+
decision: "stop",
|
|
142
|
+
logger: noopLogger,
|
|
143
|
+
...overrides,
|
|
144
|
+
};
|
|
145
|
+
}
|
|
146
|
+
|
|
147
|
+
beforeEach(() => {
|
|
148
|
+
resetSurfaceCompletionNudgeStoreForTests();
|
|
149
|
+
surfaceCounter = 0;
|
|
150
|
+
});
|
|
151
|
+
|
|
152
|
+
// ─── Nudges when a progress surface is left open ──────────────────────────────
|
|
153
|
+
|
|
154
|
+
describe("surface-completion-nudge — nudges on a dangling progress surface", () => {
|
|
155
|
+
test("task_progress card shown and never completed → continue with nudge", async () => {
|
|
156
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
157
|
+
const ctx = makeCtx({
|
|
158
|
+
messages: [userPrompt("do the thing"), ...shown.messages],
|
|
159
|
+
});
|
|
160
|
+
|
|
161
|
+
await postModelCall(ctx);
|
|
162
|
+
|
|
163
|
+
expect(ctx.decision).toBe("continue");
|
|
164
|
+
const last = ctx.messages[ctx.messages.length - 1];
|
|
165
|
+
expect(last.role).toBe("user");
|
|
166
|
+
expect(last.content[0]).toEqual({
|
|
167
|
+
type: "text",
|
|
168
|
+
text: SURFACE_COMPLETION_NUDGE_TEXT,
|
|
169
|
+
});
|
|
170
|
+
expect(isSurfaceCompletionNudged("conv-scn")).toBe(true);
|
|
171
|
+
});
|
|
172
|
+
|
|
173
|
+
test("task_progress card shown with no explicit status → continue with nudge", async () => {
|
|
174
|
+
const shown = showSurface(taskProgressShow());
|
|
175
|
+
const ctx = makeCtx({
|
|
176
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
177
|
+
});
|
|
178
|
+
|
|
179
|
+
await postModelCall(ctx);
|
|
180
|
+
|
|
181
|
+
expect(ctx.decision).toBe("continue");
|
|
182
|
+
});
|
|
183
|
+
|
|
184
|
+
test("work_result shown in_progress → continue with nudge", async () => {
|
|
185
|
+
const shown = showSurface({
|
|
186
|
+
surface_type: "work_result",
|
|
187
|
+
data: { status: "in_progress", summary: "Crunching" },
|
|
188
|
+
});
|
|
189
|
+
const ctx = makeCtx({
|
|
190
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
191
|
+
});
|
|
192
|
+
|
|
193
|
+
await postModelCall(ctx);
|
|
194
|
+
|
|
195
|
+
expect(ctx.decision).toBe("continue");
|
|
196
|
+
});
|
|
197
|
+
});
|
|
198
|
+
|
|
199
|
+
// ─── Stays quiet when there is nothing to close ───────────────────────────────
|
|
200
|
+
|
|
201
|
+
describe("surface-completion-nudge — no nudge when surface is closed or absent", () => {
|
|
202
|
+
test("task_progress completed via ui_update → stop", async () => {
|
|
203
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
204
|
+
const ctx = makeCtx({
|
|
205
|
+
messages: [
|
|
206
|
+
userPrompt("go"),
|
|
207
|
+
...shown.messages,
|
|
208
|
+
updateSurface(shown.surfaceId, {
|
|
209
|
+
templateData: { status: "completed" },
|
|
210
|
+
}),
|
|
211
|
+
],
|
|
212
|
+
});
|
|
213
|
+
|
|
214
|
+
await postModelCall(ctx);
|
|
215
|
+
|
|
216
|
+
expect(ctx.decision).toBe("stop");
|
|
217
|
+
expect(isSurfaceCompletionNudged("conv-scn")).toBe(false);
|
|
218
|
+
});
|
|
219
|
+
|
|
220
|
+
test("progress surface dismissed via ui_dismiss → stop", async () => {
|
|
221
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
222
|
+
const ctx = makeCtx({
|
|
223
|
+
messages: [
|
|
224
|
+
userPrompt("go"),
|
|
225
|
+
...shown.messages,
|
|
226
|
+
dismissSurface(shown.surfaceId),
|
|
227
|
+
],
|
|
228
|
+
});
|
|
229
|
+
|
|
230
|
+
await postModelCall(ctx);
|
|
231
|
+
|
|
232
|
+
expect(ctx.decision).toBe("stop");
|
|
233
|
+
});
|
|
234
|
+
|
|
235
|
+
test("work_result shown completed → stop", async () => {
|
|
236
|
+
const shown = showSurface({
|
|
237
|
+
surface_type: "work_result",
|
|
238
|
+
data: { status: "completed", summary: "Done" },
|
|
239
|
+
});
|
|
240
|
+
const ctx = makeCtx({
|
|
241
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
242
|
+
});
|
|
243
|
+
|
|
244
|
+
await postModelCall(ctx);
|
|
245
|
+
|
|
246
|
+
expect(ctx.decision).toBe("stop");
|
|
247
|
+
});
|
|
248
|
+
|
|
249
|
+
test("plain card (not a progress surface) → stop", async () => {
|
|
250
|
+
const shown = showSurface({
|
|
251
|
+
surface_type: "card",
|
|
252
|
+
title: "Weather",
|
|
253
|
+
data: { template: "weather_forecast", body: "Sunny" },
|
|
254
|
+
});
|
|
255
|
+
const ctx = makeCtx({
|
|
256
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
257
|
+
});
|
|
258
|
+
|
|
259
|
+
await postModelCall(ctx);
|
|
260
|
+
|
|
261
|
+
expect(ctx.decision).toBe("stop");
|
|
262
|
+
});
|
|
263
|
+
|
|
264
|
+
test("no surfaces shown at all → stop", async () => {
|
|
265
|
+
const ctx = makeCtx({
|
|
266
|
+
messages: [userPrompt("go")],
|
|
267
|
+
});
|
|
268
|
+
|
|
269
|
+
await postModelCall(ctx);
|
|
270
|
+
|
|
271
|
+
expect(ctx.decision).toBe("stop");
|
|
272
|
+
});
|
|
273
|
+
});
|
|
274
|
+
|
|
275
|
+
// ─── Outcomes the hook does not own ───────────────────────────────────────────
|
|
276
|
+
|
|
277
|
+
describe("surface-completion-nudge — ignores outcomes it does not own", () => {
|
|
278
|
+
test("provider rejection (error present) → stop", async () => {
|
|
279
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
280
|
+
const ctx = makeCtx({
|
|
281
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
282
|
+
error: new Error("provider exploded"),
|
|
283
|
+
});
|
|
284
|
+
|
|
285
|
+
await postModelCall(ctx);
|
|
286
|
+
|
|
287
|
+
expect(ctx.decision).toBe("stop");
|
|
288
|
+
});
|
|
289
|
+
|
|
290
|
+
test("tool-bearing turn (model still working) → stop", async () => {
|
|
291
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
292
|
+
const ctx = makeCtx({
|
|
293
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
294
|
+
content: [
|
|
295
|
+
{ type: "tool_use", id: "tu_next", name: "read_file", input: {} },
|
|
296
|
+
],
|
|
297
|
+
});
|
|
298
|
+
|
|
299
|
+
await postModelCall(ctx);
|
|
300
|
+
|
|
301
|
+
expect(ctx.decision).toBe("stop");
|
|
302
|
+
});
|
|
303
|
+
|
|
304
|
+
test("non-main-agent call site → stop", async () => {
|
|
305
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
306
|
+
const ctx = makeCtx({
|
|
307
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
308
|
+
callSite: "heartbeatAgent",
|
|
309
|
+
});
|
|
310
|
+
|
|
311
|
+
await postModelCall(ctx);
|
|
312
|
+
|
|
313
|
+
expect(ctx.decision).toBe("stop");
|
|
314
|
+
});
|
|
315
|
+
});
|
|
316
|
+
|
|
317
|
+
// ─── Cycle scoping and the one-shot bound ─────────────────────────────────────
|
|
318
|
+
|
|
319
|
+
describe("surface-completion-nudge — cycle scoping and one-shot bound", () => {
|
|
320
|
+
test("a surface left open in a prior cycle does not trigger this cycle", async () => {
|
|
321
|
+
const priorOpen = showSurface(taskProgressShow("in_progress"));
|
|
322
|
+
const ctx = makeCtx({
|
|
323
|
+
messages: [
|
|
324
|
+
userPrompt("first task"),
|
|
325
|
+
...priorOpen.messages,
|
|
326
|
+
// New genuine user prompt opens a fresh cycle with no open surface.
|
|
327
|
+
userPrompt("second task"),
|
|
328
|
+
],
|
|
329
|
+
});
|
|
330
|
+
|
|
331
|
+
await postModelCall(ctx);
|
|
332
|
+
|
|
333
|
+
expect(ctx.decision).toBe("stop");
|
|
334
|
+
});
|
|
335
|
+
|
|
336
|
+
test("nudges at most once per run; stop clears the bound", async () => {
|
|
337
|
+
const shown = showSurface(taskProgressShow("in_progress"));
|
|
338
|
+
const firstCtx = makeCtx({
|
|
339
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
340
|
+
});
|
|
341
|
+
|
|
342
|
+
await postModelCall(firstCtx);
|
|
343
|
+
expect(firstCtx.decision).toBe("continue");
|
|
344
|
+
|
|
345
|
+
// Same run, surface still open: the one-shot bound suppresses a second nudge.
|
|
346
|
+
const secondCtx = makeCtx({
|
|
347
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
348
|
+
});
|
|
349
|
+
await postModelCall(secondCtx);
|
|
350
|
+
expect(secondCtx.decision).toBe("stop");
|
|
351
|
+
|
|
352
|
+
// Terminal stop clears the bound so the next run nudges afresh.
|
|
353
|
+
await stop({
|
|
354
|
+
conversationId: "conv-scn",
|
|
355
|
+
messages: [],
|
|
356
|
+
exitReason: "no_tool_calls",
|
|
357
|
+
logger: noopLogger,
|
|
358
|
+
});
|
|
359
|
+
expect(isSurfaceCompletionNudged("conv-scn")).toBe(false);
|
|
360
|
+
|
|
361
|
+
const thirdCtx = makeCtx({
|
|
362
|
+
messages: [userPrompt("go"), ...shown.messages],
|
|
363
|
+
});
|
|
364
|
+
await postModelCall(thirdCtx);
|
|
365
|
+
expect(thirdCtx.decision).toBe("continue");
|
|
366
|
+
});
|
|
367
|
+
});
|
|
@@ -104,7 +104,7 @@ function currentResponse(toolUseId: string): ToolResultContent {
|
|
|
104
104
|
};
|
|
105
105
|
}
|
|
106
106
|
|
|
107
|
-
/** A weak-model id that matches
|
|
107
|
+
/** A weak-model id that matches WEAK_OPEN_MODEL_PATTERN (the gated population). */
|
|
108
108
|
const WEAK_MODEL = "minimax/minimax-m3";
|
|
109
109
|
|
|
110
110
|
function makeCtx(
|