npm - @vellumai/assistant - Versions diffs - 0.3.27 → 0.4.0 - Mend

@vellumai/assistant 0.3.27 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (247) hide show

package/ARCHITECTURE.md +81 -4
package/Dockerfile +2 -2
package/bun.lock +4 -1
package/docs/trusted-contact-access.md +9 -2
package/package.json +6 -3
package/scripts/ipc/generate-swift.ts +9 -5
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +80 -0
package/src/__tests__/agent-loop-thinking.test.ts +1 -1
package/src/__tests__/agent-loop.test.ts +119 -0
package/src/__tests__/approval-routes-http.test.ts +13 -5
package/src/__tests__/asset-materialize-tool.test.ts +2 -0
package/src/__tests__/asset-search-tool.test.ts +2 -0
package/src/__tests__/assistant-events-sse-hardening.test.ts +4 -2
package/src/__tests__/attachments-store.test.ts +2 -0
package/src/__tests__/browser-skill-endstate.test.ts +3 -3
package/src/__tests__/bundled-asset.test.ts +107 -0
package/src/__tests__/call-controller.test.ts +30 -29
package/src/__tests__/call-routes-http.test.ts +34 -32
package/src/__tests__/call-start-guardian-guard.test.ts +2 -0
package/src/__tests__/canonical-guardian-store.test.ts +636 -0
package/src/__tests__/channel-approval-routes.test.ts +174 -1
package/src/__tests__/channel-invite-transport.test.ts +6 -6
package/src/__tests__/channel-reply-delivery.test.ts +19 -0
package/src/__tests__/channel-retry-sweep.test.ts +130 -0
package/src/__tests__/clarification-resolver.test.ts +2 -0
package/src/__tests__/claude-code-skill-regression.test.ts +2 -0
package/src/__tests__/claude-code-tool-profiles.test.ts +2 -0
package/src/__tests__/commit-message-enrichment-service.test.ts +9 -1
package/src/__tests__/computer-use-session-lifecycle.test.ts +2 -0
package/src/__tests__/computer-use-session-working-dir.test.ts +1 -0
package/src/__tests__/computer-use-skill-lifecycle-cleanup.test.ts +2 -0
package/src/__tests__/config-schema.test.ts +5 -5
package/src/__tests__/config-watcher.test.ts +3 -1
package/src/__tests__/connection-policy.test.ts +14 -5
package/src/__tests__/contacts-tools.test.ts +3 -1
package/src/__tests__/contradiction-checker.test.ts +2 -0
package/src/__tests__/conversation-pairing.test.ts +10 -0
package/src/__tests__/conversation-routes.test.ts +1 -1
package/src/__tests__/credential-security-invariants.test.ts +16 -6
package/src/__tests__/credential-vault-unit.test.ts +2 -2
package/src/__tests__/credential-vault.test.ts +5 -4
package/src/__tests__/daemon-lifecycle.test.ts +9 -0
package/src/__tests__/daemon-server-session-init.test.ts +27 -0
package/src/__tests__/elevenlabs-config.test.ts +2 -0
package/src/__tests__/emit-signal-routing-intent.test.ts +43 -1
package/src/__tests__/encrypted-store.test.ts +10 -5
package/src/__tests__/followup-tools.test.ts +3 -1
package/src/__tests__/gateway-only-enforcement.test.ts +21 -21
package/src/__tests__/gmail-integration.test.ts +0 -1
package/src/__tests__/guardian-actions-endpoint.test.ts +205 -345
package/src/__tests__/guardian-control-plane-policy.test.ts +19 -19
package/src/__tests__/guardian-decision-primitive-canonical.test.ts +599 -0
package/src/__tests__/guardian-dispatch.test.ts +21 -19
package/src/__tests__/guardian-grant-minting.test.ts +68 -1
package/src/__tests__/guardian-outbound-http.test.ts +12 -9
package/src/__tests__/guardian-routing-invariants.test.ts +1092 -0
package/src/__tests__/handle-user-message-secret-resume.test.ts +1 -0
package/src/__tests__/handlers-slack-config.test.ts +3 -1
package/src/__tests__/handlers-telegram-config.test.ts +3 -1
package/src/__tests__/handlers-twilio-config.test.ts +3 -1
package/src/__tests__/handlers-twitter-config.test.ts +3 -1
package/src/__tests__/handlers-user-message-approval-consumption.test.ts +318 -0
package/src/__tests__/heartbeat-service.test.ts +20 -0
package/src/__tests__/inbound-invite-redemption.test.ts +33 -0
package/src/__tests__/ingress-reconcile.test.ts +3 -1
package/src/__tests__/ingress-routes-http.test.ts +231 -4
package/src/__tests__/intent-routing.test.ts +2 -0
package/src/__tests__/ipc-snapshot.test.ts +13 -0
package/src/__tests__/mcp-cli.test.ts +77 -0
package/src/__tests__/media-generate-image.test.ts +21 -0
package/src/__tests__/media-reuse-story.e2e.test.ts +2 -0
package/src/__tests__/memory-regressions.test.ts +20 -20
package/src/__tests__/non-member-access-request.test.ts +212 -36
package/src/__tests__/notification-decision-fallback.test.ts +63 -3
package/src/__tests__/notification-decision-strategy.test.ts +78 -0
package/src/__tests__/notification-guardian-path.test.ts +15 -15
package/src/__tests__/oauth-connect-handler.test.ts +3 -1
package/src/__tests__/oauth2-gateway-transport.test.ts +2 -0
package/src/__tests__/onboarding-starter-tasks.test.ts +4 -4
package/src/__tests__/onboarding-template-contract.test.ts +116 -21
package/src/__tests__/pairing-routes.test.ts +171 -0
package/src/__tests__/playbook-execution.test.ts +3 -1
package/src/__tests__/playbook-tools.test.ts +3 -1
package/src/__tests__/provider-error-scenarios.test.ts +59 -8
package/src/__tests__/proxy-approval-callback.test.ts +2 -0
package/src/__tests__/recording-handler.test.ts +11 -0
package/src/__tests__/recording-intent-handler.test.ts +15 -0
package/src/__tests__/recording-state-machine.test.ts +13 -2
package/src/__tests__/registry.test.ts +7 -3
package/src/__tests__/relay-server.test.ts +148 -28
package/src/__tests__/runtime-attachment-metadata.test.ts +4 -2
package/src/__tests__/runtime-events-sse-parity.test.ts +21 -0
package/src/__tests__/runtime-events-sse.test.ts +4 -2
package/src/__tests__/sandbox-diagnostics.test.ts +2 -0
package/src/__tests__/schedule-tools.test.ts +3 -1
package/src/__tests__/secret-scanner-executor.test.ts +59 -0
package/src/__tests__/secret-scanner.test.ts +8 -0
package/src/__tests__/send-endpoint-busy.test.ts +4 -0
package/src/__tests__/sensitive-output-placeholders.test.ts +208 -0
package/src/__tests__/session-abort-tool-results.test.ts +23 -0
package/src/__tests__/session-agent-loop.test.ts +16 -0
package/src/__tests__/session-conflict-gate.test.ts +21 -0
package/src/__tests__/session-load-history-repair.test.ts +27 -17
package/src/__tests__/session-pre-run-repair.test.ts +23 -0
package/src/__tests__/session-profile-injection.test.ts +21 -0
package/src/__tests__/session-provider-retry-repair.test.ts +20 -0
package/src/__tests__/session-queue.test.ts +23 -0
package/src/__tests__/session-runtime-assembly.test.ts +126 -59
package/src/__tests__/session-skill-tools.test.ts +27 -5
package/src/__tests__/session-slash-known.test.ts +23 -0
package/src/__tests__/session-slash-queue.test.ts +23 -0
package/src/__tests__/session-slash-unknown.test.ts +23 -0
package/src/__tests__/session-workspace-cache-state.test.ts +7 -0
package/src/__tests__/session-workspace-injection.test.ts +21 -0
package/src/__tests__/session-workspace-tool-tracking.test.ts +21 -0
package/src/__tests__/shell-credential-ref.test.ts +2 -0
package/src/__tests__/skill-feature-flags-integration.test.ts +6 -6
package/src/__tests__/skill-load-feature-flag.test.ts +5 -4
package/src/__tests__/skill-projection-feature-flag.test.ts +22 -0
package/src/__tests__/skills.test.ts +8 -4
package/src/__tests__/slack-channel-config.test.ts +3 -1
package/src/__tests__/subagent-tools.test.ts +19 -0
package/src/__tests__/swarm-recursion.test.ts +2 -0
package/src/__tests__/swarm-session-integration.test.ts +2 -0
package/src/__tests__/swarm-tool.test.ts +2 -0
package/src/__tests__/system-prompt.test.ts +3 -1
package/src/__tests__/task-compiler.test.ts +3 -1
package/src/__tests__/task-management-tools.test.ts +3 -1
package/src/__tests__/task-tools.test.ts +3 -1
package/src/__tests__/terminal-sandbox.test.ts +13 -12
package/src/__tests__/terminal-tools.test.ts +2 -0
package/src/__tests__/tool-approval-handler.test.ts +15 -15
package/src/__tests__/tool-execution-abort-cleanup.test.ts +2 -0
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -0
package/src/__tests__/tool-grant-request-escalation.test.ts +497 -0
package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +48 -0
package/src/__tests__/trusted-contact-multichannel.test.ts +22 -19
package/src/__tests__/trusted-contact-verification.test.ts +91 -0
package/src/__tests__/twilio-routes-elevenlabs.test.ts +2 -0
package/src/__tests__/twitter-auth-handler.test.ts +3 -1
package/src/__tests__/twitter-cli-routing.test.ts +3 -1
package/src/__tests__/view-image-tool.test.ts +3 -1
package/src/__tests__/voice-invite-redemption.test.ts +329 -0
package/src/__tests__/voice-scoped-grant-consumer.test.ts +7 -5
package/src/__tests__/voice-session-bridge.test.ts +10 -10
package/src/__tests__/work-item-output.test.ts +3 -1
package/src/__tests__/workspace-lifecycle.test.ts +13 -2
package/src/agent/loop.ts +46 -3
package/src/approvals/guardian-decision-primitive.ts +285 -0
package/src/approvals/guardian-request-resolvers.ts +539 -0
package/src/calls/call-controller.ts +26 -23
package/src/calls/guardian-action-sweep.ts +10 -2
package/src/calls/guardian-dispatch.ts +46 -40
package/src/calls/relay-server.ts +358 -24
package/src/calls/types.ts +1 -1
package/src/calls/voice-session-bridge.ts +3 -3
package/src/cli.ts +12 -0
package/src/config/agent-schema.ts +14 -3
package/src/config/calls-schema.ts +6 -6
package/src/config/core-schema.ts +3 -3
package/src/config/feature-flag-registry.json +8 -0
package/src/config/mcp-schema.ts +1 -1
package/src/config/memory-schema.ts +27 -19
package/src/config/schema.ts +21 -21
package/src/config/skills-schema.ts +7 -7
package/src/config/system-prompt.ts +2 -1
package/src/config/templates/BOOTSTRAP.md +47 -31
package/src/config/templates/USER.md +5 -0
package/src/config/update-bulletin-template-path.ts +4 -1
package/src/config/vellum-skills/trusted-contacts/SKILL.md +149 -21
package/src/daemon/handlers/config-inbox.ts +4 -4
package/src/daemon/handlers/guardian-actions.ts +45 -66
package/src/daemon/handlers/sessions.ts +148 -4
package/src/daemon/ipc-contract/guardian-actions.ts +7 -0
package/src/daemon/ipc-contract/messages.ts +16 -0
package/src/daemon/ipc-contract-inventory.json +1 -0
package/src/daemon/lifecycle.ts +22 -16
package/src/daemon/pairing-store.ts +86 -3
package/src/daemon/server.ts +18 -0
package/src/daemon/session-agent-loop-handlers.ts +5 -4
package/src/daemon/session-agent-loop.ts +33 -6
package/src/daemon/session-lifecycle.ts +25 -17
package/src/daemon/session-memory.ts +2 -2
package/src/daemon/session-process.ts +68 -326
package/src/daemon/session-runtime-assembly.ts +119 -25
package/src/daemon/session-tool-setup.ts +3 -2
package/src/daemon/session.ts +4 -3
package/src/home-base/prebuilt/seed.ts +2 -1
package/src/hooks/templates.ts +2 -1
package/src/memory/canonical-guardian-store.ts +586 -0
package/src/memory/channel-guardian-store.ts +2 -0
package/src/memory/conversation-crud.ts +7 -7
package/src/memory/db-init.ts +20 -0
package/src/memory/embedding-local.ts +257 -39
package/src/memory/embedding-runtime-manager.ts +471 -0
package/src/memory/guardian-action-store.ts +7 -60
package/src/memory/guardian-approvals.ts +9 -4
package/src/memory/guardian-bindings.ts +25 -1
package/src/memory/indexer.ts +3 -3
package/src/memory/ingress-invite-store.ts +45 -0
package/src/memory/job-handlers/backfill.ts +16 -9
package/src/memory/migrations/036-normalize-phone-identities.ts +289 -0
package/src/memory/migrations/037-voice-invite-columns.ts +16 -0
package/src/memory/migrations/118-reminder-routing-intent.ts +3 -3
package/src/memory/migrations/121-canonical-guardian-requests.ts +59 -0
package/src/memory/migrations/122-canonical-guardian-requester-chat-id.ts +15 -0
package/src/memory/migrations/123-canonical-guardian-deliveries-destination-index.ts +15 -0
package/src/memory/migrations/index.ts +5 -0
package/src/memory/migrations/registry.ts +5 -0
package/src/memory/qdrant-client.ts +31 -22
package/src/memory/schema-migration.ts +1 -0
package/src/memory/schema.ts +56 -0
package/src/notifications/copy-composer.ts +31 -4
package/src/notifications/decision-engine.ts +57 -0
package/src/permissions/defaults.ts +2 -0
package/src/runtime/access-request-helper.ts +173 -0
package/src/runtime/actor-trust-resolver.ts +221 -0
package/src/runtime/channel-guardian-service.ts +12 -4
package/src/runtime/channel-invite-transports/voice.ts +58 -0
package/src/runtime/channel-retry-sweep.ts +18 -6
package/src/runtime/guardian-context-resolver.ts +38 -71
package/src/runtime/guardian-decision-types.ts +6 -0
package/src/runtime/guardian-reply-router.ts +717 -0
package/src/runtime/http-server.ts +8 -0
package/src/runtime/ingress-service.ts +80 -3
package/src/runtime/invite-redemption-service.ts +141 -2
package/src/runtime/routes/canonical-guardian-expiry-sweep.ts +116 -0
package/src/runtime/routes/channel-route-shared.ts +1 -1
package/src/runtime/routes/channel-routes.ts +1 -1
package/src/runtime/routes/conversation-routes.ts +20 -2
package/src/runtime/routes/guardian-action-routes.ts +100 -109
package/src/runtime/routes/guardian-approval-interception.ts +17 -6
package/src/runtime/routes/inbound-message-handler.ts +205 -529
package/src/runtime/routes/ingress-routes.ts +52 -4
package/src/runtime/routes/pairing-routes.ts +3 -0
package/src/runtime/tool-grant-request-helper.ts +195 -0
package/src/tools/executor.ts +13 -1
package/src/tools/guardian-control-plane-policy.ts +2 -2
package/src/tools/sensitive-output-placeholders.ts +203 -0
package/src/tools/tool-approval-handler.ts +53 -10
package/src/tools/types.ts +13 -2
package/src/util/bundled-asset.ts +31 -0
package/src/util/canonicalize-identity.ts +52 -0
package/src/util/logger.ts +20 -8
package/src/util/platform.ts +10 -0
package/src/util/voice-code.ts +29 -0
package/src/daemon/guardian-invite-intent.ts +0 -124

package/ARCHITECTURE.md CHANGED Viewed

@@ -18,7 +18,7 @@ This document owns assistant-runtime architecture details. The repo-level archit
 - The same resolver is used by:
   - `/channels/inbound` (Telegram/SMS/WhatsApp path) before run orchestration.
   - Inbound Twilio voice setup (`RelayConnection.handleSetup`) to seed call-time actor context.
-- Runtime channel runs pass this as `guardianContext`, and session runtime assembly injects `<guardian_context>` into provider-facing prompts.
+- Runtime channel runs pass this as `guardianContext`, and session runtime assembly injects `<inbound_actor_context>` (via `inboundActorContextFromGuardian()`) into provider-facing prompts.
 - Voice calls mirror the same prompt contract: `CallController` receives guardian context on setup and refreshes it immediately after successful voice challenge verification, so the first post-verification turn is grounded as `actor_role: guardian`.
 - Voice-specific behavior (DTMF/speech verification flow, relay state machine) remains voice-local; only actor-role resolution is shared.
@@ -62,6 +62,41 @@ All guardian approval decisions — regardless of how they arrive — route thro
 | `src/daemon/ipc-contract/guardian-actions.ts` | IPC message type definitions for guardian action requests/responses |
 | `src/runtime/channel-approval-types.ts` | Channel-facing approval action types and `toApprovalActionOptions` bridge |
+### Canonical Guardian Request System
+The canonical guardian request system provides a channel-agnostic, unified domain for all guardian approval and question flows. It replaces the fragmented per-channel storage with a single source of truth that works identically for voice calls, Telegram/SMS/WhatsApp, and desktop UI.
+**Architecture layers:**
+1. **Canonical domain (single source of truth):** All guardian requests — tool approvals, pending questions, access requests — are persisted in the `canonical_guardian_requests` table (`src/memory/canonical-guardian-store.ts`). Each request has a unique ID, a short human-readable request code, and a status that follows a CAS (compare-and-swap) lifecycle: `pending` -> `approved` | `denied` | `expired` | `cancelled`. Deliveries (notifications sent to guardians) are tracked in `canonical_guardian_deliveries`.
+2. **Unified apply primitive (single write path):** `applyCanonicalGuardianDecision()` in `src/approvals/guardian-decision-primitive.ts` is the single write path for all guardian decisions. It enforces identity validation, expiry checks, CAS resolution, `approve_always` downgrade (guardian-on-behalf invariant), kind-specific resolver dispatch via the resolver registry, and scoped grant minting. All callers — HTTP API, IPC handlers, inbound channel router, desktop session — route decisions through this function.
+3. **Shared reply router (priority-ordered routing):** `routeGuardianReply()` in `src/runtime/guardian-reply-router.ts` provides a single entry point for all inbound guardian reply processing across channels. It routes through a priority-ordered pipeline: (a) deterministic callback parsing (button presses with `apr:<requestId>:<action>`), (b) request code parsing (6-char alphanumeric prefix), (c) NL classification via the conversational approval engine. All decisions flow through `applyCanonicalGuardianDecision`.
+4. **Deterministic API (prompt listing and decision endpoints):** Desktop clients and API consumers use `GET /v1/guardian-actions/pending` and `POST /v1/guardian-actions/decision` (HTTP) or the equivalent IPC messages. These endpoints surface canonical requests alongside legacy pending interactions and channel approval records, with deduplication to avoid double-rendering.
+5. **Dual-mode (deterministic + conversational):** Guardians can respond via structured button UIs (deterministic path) or free-text conversation (NL path). Both paths converge on the same canonical primitive. Code-only messages (just a request code without decision text) return clarification instead of auto-approving. Disambiguation with multiple pending requests stays fail-closed — no auto-resolve when the target is ambiguous.
+**Resolver registry:** Kind-specific resolvers (`src/approvals/guardian-request-resolvers.ts`) handle side effects after CAS resolution. Built-in resolvers: `tool_approval` (channel/desktop approval path) and `pending_question` (voice call question path). New request kinds register resolvers without touching the core primitive.
+**Expiry sweeps:** Three complementary sweeps run on 60-second intervals to clean up stale requests:
+- `src/calls/guardian-action-sweep.ts` — voice call guardian action requests
+- `src/runtime/routes/guardian-expiry-sweep.ts` — channel guardian approval requests
+- `src/runtime/routes/canonical-guardian-expiry-sweep.ts` — canonical guardian requests (CAS-safe)
+**Key source files:**
+| File | Purpose |
+|------|---------|
+| `src/memory/canonical-guardian-store.ts` | Canonical request and delivery persistence (CRUD, CAS resolve, list with filters) |
+| `src/approvals/guardian-decision-primitive.ts` | Unified decision primitive: `applyCanonicalGuardianDecision` (canonical) and `applyGuardianDecision` (legacy) |
+| `src/approvals/guardian-request-resolvers.ts` | Resolver registry: kind-specific side-effect dispatch after CAS resolution |
+| `src/runtime/guardian-reply-router.ts` | Shared inbound router: callback -> code -> NL classification pipeline |
+| `src/runtime/routes/guardian-action-routes.ts` | HTTP endpoints for prompt listing and decision submission |
+| `src/daemon/handlers/guardian-actions.ts` | IPC handlers for desktop socket clients |
+| `src/runtime/routes/canonical-guardian-expiry-sweep.ts` | Canonical request expiry sweep |
 ### Outbound Guardian Verification (HTTP Endpoints)
 Guardian verification can be initiated through gateway HTTP endpoints (which forward to runtime handlers) as an alternative to the legacy IPC-only flow. This enables chat-first verification where the assistant guides the user through guardian setup via normal conversation.
@@ -357,26 +392,56 @@ A complementary access-granting flow where the guardian proactively creates a sh
 **Inbound intercept points:** Invite token extraction runs early in the inbound handler, before ACL denial, so valid invites short-circuit the membership check. Two intercept branches handle: (a) non-members — the invite creates their first member record; (b) inactive members (revoked/pending) — the invite reactivates them.
-**Deferred channel adapters:**
+**Channel adapter status:**
 | Channel | Status | Prerequisites |
 |---------|--------|--------------|
 | Telegram | Shipped | Bot username resolved from credential metadata or `TELEGRAM_BOT_USERNAME` env |
+| Voice | Shipped | Identity-bound voice code redemption via DTMF/speech in the relay state machine. Gated behind `feature_flags.voice-invite-redemption.enabled` (default OFF). |
 | SMS | Deferred | Needs a deep-link strategy compatible with SMS (short URL or web redemption page) |
 | Slack | Deferred | Needs DM-safe ingress — Socket Mode handles channel messages but DM-initiated invite flows need routing |
-| Voice | Deferred | Needs DTMF or speech-based token capture integrated with the voice relay state machine |
+### Voice Invite Flow (invite_redemption_pending)
+Voice invites use a short numeric code (4-10 digits, default 6) instead of a URL token. The guardian creates an invite bound to the invitee's E.164 phone number; the invitee redeems it by entering the code during an inbound voice call.
+**Creation flow:**
+1. Guardian creates a voice invite via `POST /v1/ingress/invites` with `sourceChannel: "voice"` and `expectedExternalUserId` (E.164 phone).
+2. `ingress-service.ts` generates a cryptographically random numeric code (`generateVoiceCode`), hashes it with SHA-256 (`hashVoiceCode`), and stores only the hash.
+3. The one-time plaintext `voiceCode` is returned in the creation response. The raw token is NOT returned for voice invites — redemption uses the identity-bound code flow exclusively.
+4. Guardian communicates the code to the invitee out-of-band.
+**Call-time redemption subflow (`invite_redemption_pending`):**
+1. Unknown caller dials in. `relay-server.ts` resolves trust via `resolveActorTrust`. Caller is `unknown`, no pending guardian challenge.
+2. If `feature_flags.voice-invite-redemption.enabled` is ON, the relay checks `findActiveVoiceInvites` for invites bound to the caller's phone number.
+3. If active, non-expired invites exist, the relay enters the `invite_redemption_pending` state (reuses the `verification_pending` connection state) and prompts the caller to enter their invite code via DTMF or speech.
+4. `redeemVoiceInviteCode` validates: identity match, code hash match, expiry, use count. On success, an active member record is upserted and the call transitions to the normal call flow.
+5. On failure, the caller gets up to 3 attempts. After max attempts, the call is terminated.
+**Security invariants:**
+- The plaintext voice code is returned exactly once at creation time and never stored.
+- Voice invites are identity-bound: `expectedExternalUserId` must match the caller's E.164 number. An attacker with the code but the wrong phone number cannot redeem.
+- Failure responses are intentionally generic (`invalid_or_expired`) to prevent oracle attacks.
+- Blocked members cannot bypass the guardian's explicit block via invite redemption.
+**Feature flag:** `feature_flags.voice-invite-redemption.enabled` (default OFF). When disabled, unknown callers with active voice invites are denied normally — the invite check is skipped entirely.
 **Key source files:**
 | File | Purpose |
 |------|---------|
-| `src/runtime/invite-redemption-service.ts` | Core redemption engine — token validation, member creation, discriminated-union outcomes |
+| `src/runtime/invite-redemption-service.ts` | Core redemption engine — token validation, voice code redemption, member creation, discriminated-union outcomes |
 | `src/runtime/invite-redemption-templates.ts` | Deterministic reply templates for each redemption outcome |
 | `src/runtime/channel-invite-transport.ts` | Transport adapter registry with `buildShareableInvite` / `extractInboundToken` interface |
 | `src/runtime/channel-invite-transports/telegram.ts` | Telegram adapter — `t.me/<bot>?start=iv_<token>` deep links, `/start iv_<token>` extraction |
+| `src/runtime/channel-invite-transports/voice.ts` | Voice transport adapter — code-based redemption metadata |
 | `src/daemon/guardian-invite-intent.ts` | Intent detection — routes create/list/revoke requests into the trusted-contacts skill |
 | `src/runtime/ingress-service.ts` | Shared business logic for invite/member operations (used by both HTTP routes and IPC) |
+| `src/runtime/routes/ingress-routes.ts` | HTTP API handlers for member/invite management including voice invite creation and redemption |
 | `src/runtime/routes/inbound-message-handler.ts` | Invite token intercept in the inbound flow (non-member and inactive-member branches) |
+| `src/calls/relay-server.ts` | Voice relay state machine — `invite_redemption_pending` subflow, feature flag gate |
+| `src/util/voice-code.ts` | Cryptographic voice code generation and SHA-256 hashing |
+| `src/memory/ingress-invite-store.ts` | Invite persistence including `findActiveVoiceInvites` for identity-bound lookup |
 ### Update Bulletin System
@@ -1874,6 +1939,18 @@ Connected channels are resolved at signal emission time: vellum is always includ
+### Sensitive Tool Output Placeholder Substitution
+Some tool outputs contain values that must reach the user's final reply but should never be visible to the LLM (e.g., invite tokens). The system handles this with a three-stage pipeline:
+1. **Directive extraction** (`src/tools/sensitive-output-placeholders.ts`): Tool output may include `<vellum-sensitive-output kind="invite_code" value="<raw>" />` directives. The executor strips directives, replaces raw values with deterministic placeholders (`VELLUM_ASSISTANT_INVITE_CODE_<shortId>`), and attaches `sensitiveBindings` metadata to the tool result.
+2. **Placeholder-only model context**: The agent loop stores placeholder->value bindings in a per-run `substitutionMap`. Tool results sent to the LLM contain only placeholders — the model generates conversational text referencing them without ever seeing the real values.
+3. **Post-generation substitution** (`src/agent/loop.ts`): Before emitting streamed `text_delta` events and before building the final `assistantMessage`, all placeholders are deterministically replaced with their real values. The substitution is chunk-safe for streaming (buffering partial placeholder prefixes across deltas).
+Key files: `src/tools/sensitive-output-placeholders.ts`, `src/tools/executor.ts` (extraction hook), `src/agent/loop.ts` (substitution), `src/config/vellum-skills/trusted-contacts/SKILL.md` (invite flow adoption).
 ### Notifications
 For full notification developer guidance and lifecycle details, see [`assistant/src/notifications/README.md`](src/notifications/README.md).

package/Dockerfile CHANGED Viewed

@@ -1,5 +1,5 @@
 # Use debian as base image
-FROM debian:bookworm AS builder
+FROM debian:trixie@sha256:3615a749858a1cba49b408fb49c37093db813321355a9ab7c1f9f4836341e9db AS builder
 WORKDIR /app
@@ -26,7 +26,7 @@ RUN bun install --frozen-lockfile
 COPY . .
 # Final stage
-FROM debian:bookworm AS runner
+FROM debian:trixie@sha256:3615a749858a1cba49b408fb49c37093db813321355a9ab7c1f9f4836341e9db AS runner
 WORKDIR /app

package/bun.lock CHANGED Viewed

@@ -8,7 +8,6 @@
         "@anthropic-ai/claude-agent-sdk": "^0.2.42",
         "@anthropic-ai/sdk": "^0.39.0",
         "@google/genai": "^1.40.0",
-        "@huggingface/transformers": "^3.8.1",
         "@modelcontextprotocol/sdk": "^1.15.1",
         "@qdrant/js-client-rest": "^1.16.2",
         "@sentry/node": "^10.38.0",
@@ -35,6 +34,7 @@
         "zod": "^4.3.6",
       },
       "devDependencies": {
+        "@huggingface/transformers": "^3.8.1",
         "@pydantic/logfire-node": "^0.13.0",
         "@types/archiver": "^7.0.0",
         "@types/bun": "^1.2.4",
@@ -46,6 +46,7 @@
         "eslint-plugin-simple-import-sort": "^12.1.1",
         "fast-check": "^4.5.3",
         "knip": "^5.83.1",
+        "prettier": "^3.8.1",
         "quicktype-core": "^23.2.6",
         "typescript": "^5.7.3",
         "typescript-eslint": "^8.54.0",
@@ -1136,6 +1137,8 @@
     "prelude-ls": ["prelude-ls@1.2.1", "", {}, "sha512-vkcDPrRZo1QZLbn5RLGPpg/WmIQ65qoWWhcGKf/b5eplkkarX0m9z8ppCat4mlOqUsWpyNuYgO3VRyrYHSzX5g=="],
+    "prettier": ["prettier@3.8.1", "", { "bin": { "prettier": "bin/prettier.cjs" } }, "sha512-UOnG6LftzbdaHZcKoPFtOcCKztrQ57WkHDeRD9t/PTQtmT0NHSeWWepj6pS0z/N7+08BHFDQVUrfmfMRcZwbMg=="],
     "process": ["process@0.11.10", "", {}, "sha512-cdGef/drWFoydD1JsMzuFf8100nZl+GT+yacc2bEced5f9Rjk4z+WtFUTBu9PhOi9j/jfmBPu0mMEY4wIdAF8A=="],
     "process-nextick-args": ["process-nextick-args@2.0.1", "", {}, "sha512-3ouUOpQhtgrbOa17J7+uxOTpITYWaGP7/AhoR3+A+/1e9skrzelGi/dXzEYyvbxubEF6Wn2ypscTKiKJFFn1ag=="],

package/docs/trusted-contact-access.md CHANGED Viewed

@@ -13,8 +13,15 @@ Design doc defining how unknown users gain access to a Vellum assistant via chan
 ## User Journey
 1. **Unknown user messages the assistant** on Telegram (or SMS, or any channel).
-2. **Assistant rejects the message** via the ingress ACL in `inbound-message-handler.ts`. The user has no `assistant_ingress_members` record, so the handler replies: *"Sorry, you haven't been approved to message this assistant. You can ask its Guardian for an invite."* and returns `{ denied: true, reason: 'not_a_member' }`.
-3. **Notification pipeline alerts the guardian.** The rejection triggers `emitNotificationSignal()` with `sourceEventName: 'ingress.access_request'`, routing through the decision engine to all connected channels (vellum macOS app, Telegram, etc.). The guardian sees who is requesting access.
+2. **Assistant rejects the message** via the ingress ACL in `inbound-message-handler.ts`. The user has no `assistant_ingress_members` record, so the handler replies: *"Hmm looks like you don't have access to talk to me. I'll let them know you tried talking to me and get back to you."* and returns `{ denied: true, reason: 'not_a_member' }`.
+3. **Notification pipeline alerts the guardian.** The rejection triggers `notifyGuardianOfAccessRequest()` which creates a canonical access request and calls `emitNotificationSignal()` with `sourceEventName: 'ingress.access_request'`. The notification routes through the decision engine to all connected channels (vellum macOS app, Telegram, etc.). The guardian sees who is requesting access, including a request code for approve/reject and an `open invite flow` option to start the Trusted Contacts invite flow.
+   **Guardian binding resolution for access requests** uses a fallback strategy:
+   1. Source-channel active binding first (e.g., Telegram binding for a Telegram access request).
+   2. Any active binding for the assistant on another channel (deterministic: most recently verified first, then alphabetical by channel).
+   3. No guardian identity — the notification pipeline delivers via trusted/vellum channels even when no channel binding exists.
+   This ensures unknown inbound access attempts always trigger guardian notification, even when the requester's source channel has no guardian binding.
 4. **Guardian approves the request.** The guardian responds to the notification (via Telegram inline button, macOS app, or IPC). On approval, the assistant creates a verification session via `createOutboundSession()` and generates a 6-digit verification code.
 5. **Guardian receives the verification code.** The assistant delivers the code to the guardian's verified channel (Telegram chat, SMS, etc.).
 6. **Guardian gives the code to the requester out-of-band** (in person, text message, phone call, etc.). This out-of-band transfer is the trust anchor: it proves the requester has a real-world relationship with the guardian.

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@vellumai/assistant",
-  "version": "0.3.27",
+  "version": "0.4.0",
   "type": "module",
   "bin": {
     "vellum": "./src/index.ts"
@@ -14,6 +14,8 @@
     "ipc:inventory:update": "bun run scripts/ipc/check-contract-inventory.ts --update",
     "generate:ipc": "bun run scripts/ipc/generate-swift.ts",
     "check:ipc-generated": "bun run scripts/ipc/generate-swift.ts --check",
+    "format": "prettier --write .",
+    "format:check": "prettier --check .",
     "ipc:check-swift-drift": "bun run scripts/ipc/check-swift-decoder-drift.ts",
     "lint": "eslint",
     "typecheck": "bunx tsc --noEmit",
@@ -28,7 +30,6 @@
     "@anthropic-ai/sdk": "^0.39.0",
     "@google/genai": "^1.40.0",
     "@modelcontextprotocol/sdk": "^1.15.1",
-    "@huggingface/transformers": "^3.8.1",
     "@qdrant/js-client-rest": "^1.16.2",
     "@sentry/node": "^10.38.0",
     "agentmail": "^0.1.0",
@@ -65,9 +66,11 @@
     "eslint-plugin-simple-import-sort": "^12.1.1",
     "fast-check": "^4.5.3",
     "knip": "^5.83.1",
+    "prettier": "^3.8.1",
     "quicktype-core": "^23.2.6",
     "typescript": "^5.7.3",
     "typescript-eslint": "^8.54.0",
-    "typescript-json-schema": "^0.67.1"
+    "typescript-json-schema": "^0.67.1",
+    "@huggingface/transformers": "^3.8.1"
   }
 }

package/scripts/ipc/generate-swift.ts CHANGED Viewed

@@ -94,9 +94,9 @@ function generateSchemas(): Record<string, SchemaDef> {
   const program = TJS.getProgramFromFiles(contractFiles, {
     strict: true,
-    target: 99,
-    module: 199,
-    moduleResolution: 99,
+    target: 'es2022',
+    module: 'commonjs',
+    moduleResolution: 'node',
     skipLibCheck: true,
   });
@@ -411,14 +411,18 @@ function emitStruct(s: SwiftStruct): string {
   const lines: string[] = [];
   if (s.doc) {
-    lines.push(`/// ${s.doc}`);
+    for (const docLine of s.doc.split('\n')) {
+      lines.push(`/// ${docLine}`);
+    }
   }
   lines.push(`public struct ${s.name}: Codable, Sendable {`);
   for (const p of s.properties) {
     if (p.doc) {
-      lines.push(`    /// ${p.doc}`);
+      for (const docLine of p.doc.split('\n')) {
+        lines.push(`    /// ${docLine}`);
+      }
     }
     lines.push(`    public let ${p.swiftName}: ${p.swiftType}`);
   }

package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap CHANGED Viewed

@@ -1302,6 +1302,15 @@ exports[`IPC message snapshots ServerMessage types message_complete serializes t
 }
 `;
+exports[`IPC message snapshots ServerMessage types message_request_complete serializes to expected JSON 1`] = `
+{
+  "requestId": "req-inline-001",
+  "runStillActive": true,
+  "sessionId": "sess-001",
+  "type": "message_request_complete",
+}
+`;
 exports[`IPC message snapshots ServerMessage types session_info serializes to expected JSON 1`] = `
 {
   "correlationId": "corr-001",
@@ -3112,3 +3121,74 @@ exports[`IPC message snapshots ServerMessage types generate_avatar_response seri
   "type": "generate_avatar_response",
 }
 `;
+exports[`IPC message snapshots ClientMessage types guardian_actions_pending_request serializes to expected JSON 1`] = `
+{
+  "conversationId": "conv-guardian-001",
+  "type": "guardian_actions_pending_request",
+}
+`;
+exports[`IPC message snapshots ClientMessage types guardian_action_decision serializes to expected JSON 1`] = `
+{
+  "action": "approve_once",
+  "conversationId": "conv-guardian-001",
+  "requestId": "req-guardian-001",
+  "type": "guardian_action_decision",
+}
+`;
+exports[`IPC message snapshots ClientMessage types reorder_threads serializes to expected JSON 1`] = `
+{
+  "type": "reorder_threads",
+  "updates": [
+    {
+      "displayOrder": 0,
+      "isPinned": false,
+      "sessionId": "sess-001",
+    },
+    {
+      "displayOrder": 1,
+      "isPinned": true,
+      "sessionId": "sess-002",
+    },
+  ],
+}
+`;
+exports[`IPC message snapshots ServerMessage types guardian_actions_pending_response serializes to expected JSON 1`] = `
+{
+  "conversationId": "conv-guardian-001",
+  "prompts": [
+    {
+      "actions": [
+        {
+          "action": "approve_once",
+          "label": "Approve once",
+        },
+        {
+          "action": "reject",
+          "label": "Reject",
+        },
+      ],
+      "callSessionId": null,
+      "conversationId": "conv-guardian-001",
+      "expiresAt": 1700100000000,
+      "questionText": "Approve tool: bash",
+      "requestCode": "REQ-GU",
+      "requestId": "req-guardian-001",
+      "state": "pending",
+      "toolName": "bash",
+    },
+  ],
+  "type": "guardian_actions_pending_response",
+}
+`;
+exports[`IPC message snapshots ServerMessage types guardian_action_decision_response serializes to expected JSON 1`] = `
+{
+  "applied": true,
+  "requestId": "req-guardian-001",
+  "type": "guardian_action_decision_response",
+}
+`;

package/src/__tests__/agent-loop-thinking.test.ts CHANGED Viewed

@@ -44,7 +44,7 @@ describe('AgentLoop thinking budget clamping', () => {
     const config = lastConfig()!;
     const thinking = config.thinking as { type: string; budget_tokens: number };
     expect(thinking.type).toBe('enabled');
-    expect(thinking.budget_tokens).toBe(4095); // clamped to maxTokens - 1
+    expect(thinking.budget_tokens).toBe(3072); // clamped to floor(maxTokens * 0.75)
   });
   test('does not clamp when budget_tokens is within max_tokens', async () => {

package/src/__tests__/agent-loop.test.ts CHANGED Viewed

@@ -1167,4 +1167,123 @@ describe('AgentLoop', () => {
     expect(sentBlock).toBeDefined();
     expect(sentBlock!.content).toBe(smallContent);
   });
+  // ---------------------------------------------------------------------------
+  // Sensitive output placeholder substitution tests
+  // ---------------------------------------------------------------------------
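+  // 32. Tool results with sensitiveBindings populate the substitution map, but
+  //     the final assistant message (in history and in message_complete) and the
+  //     tool result sent to the provider keep the placeholder, never the real value.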
+  test('resolves sensitive output placeholders in final assistant message', async () => {
+    const placeholder = 'VELLUM_ASSISTANT_INVITE_CODE_TEST1234';
+    const realToken = 'realInviteToken999';
+    const { provider, calls } = createMockProvider([
+      toolUseResponse('t1', 'bash', { command: 'create invite' }),
+      // The LLM responds using the placeholder (it never saw the real token)
+      textResponse(`Here is your invite link: https://t.me/bot?start=iv_${placeholder}`),
+    ]);
+    const toolExecutor = async () => ({
+      content: `https://t.me/bot?start=iv_${placeholder}`,
+      isError: false,
+      sensitiveBindings: [{ kind: 'invite_code' as const, placeholder, value: realToken }],
+    });
+    const loop = new AgentLoop(provider, 'system', {}, dummyTools, toolExecutor);
+    const events: AgentEvent[] = [];
+    const history = await loop.run([userMessage], collectEvents(events));
+    // The final assistant message in HISTORY should retain placeholders
+    // (so the model never sees real values on subsequent turns)
+    const lastAssistant = history[history.length - 1];
+    expect(lastAssistant.role).toBe('assistant');
+    const historyTextBlock = lastAssistant.content.find(
+      (b): b is Extract<ContentBlock, { type: 'text' }> => b.type === 'text',
+    );
+    expect(historyTextBlock).toBeDefined();
+    expect(historyTextBlock!.text).toContain(placeholder);
+    expect(historyTextBlock!.text).not.toContain(realToken);
+    // The message_complete EVENT should also retain placeholders (persisted
+    // to conversation store; real values leak on session reload otherwise)
+    const completeEvents = events.filter(
+      (e): e is Extract<AgentEvent, { type: 'message_complete' }> => e.type === 'message_complete',
+    );
+    const lastComplete = completeEvents[completeEvents.length - 1];
+    const completeText = lastComplete.message.content.find(
+      (b): b is Extract<ContentBlock, { type: 'text' }> => b.type === 'text',
+    );
+    expect(completeText!.text).toContain(placeholder);
+    expect(completeText!.text).not.toContain(realToken);
+    // The tool result content in provider history should contain the PLACEHOLDER,
+    // NOT the raw token (model never sees the real value)
+    const secondCallMessages = calls[1].messages;
+    const toolResultMsg = secondCallMessages.find(
+      (m) => m.role === 'user' && m.content.some((b) => b.type === 'tool_result'),
+    );
+    expect(toolResultMsg).toBeDefined();
+    const toolResultBlock = toolResultMsg!.content.find(
+      (b): b is Extract<ContentBlock, { type: 'tool_result' }> => b.type === 'tool_result',
+    );
+    expect(toolResultBlock!.content).toContain(placeholder);
+    expect(toolResultBlock!.content).not.toContain(realToken);
+  });
+  // 33. Streamed text_delta events have placeholders resolved to real values
+  test('resolves sensitive output placeholders in streamed text_delta events', async () => {
+    const placeholder = 'VELLUM_ASSISTANT_INVITE_CODE_STRM5678';
+    const realToken = 'streamedRealToken';
+    const { provider } = createMockProvider([
+      toolUseResponse('t1', 'bash', { command: 'invite' }),
+      // Response text includes the placeholder
+      textResponse(`Link: https://t.me/bot?start=iv_${placeholder}`),
+    ]);
+    const toolExecutor = async () => ({
+      content: `https://t.me/bot?start=iv_${placeholder}`,
+      isError: false,
+      sensitiveBindings: [{ kind: 'invite_code' as const, placeholder, value: realToken }],
+    });
+    const loop = new AgentLoop(provider, 'system', {}, dummyTools, toolExecutor);
+    const events: AgentEvent[] = [];
+    await loop.run([userMessage], collectEvents(events));
+    // Collect every text_delta event emitted during the run (the filter is not
+    // restricted to the turn after the tool result)
+    const textDeltas = events.filter(
+      (e): e is Extract<AgentEvent, { type: 'text_delta' }> => e.type === 'text_delta',
+    );
+    const allStreamedText = textDeltas.map((e) => e.text).join('');
+    // Streamed text should contain the real token, not the placeholder
+    expect(allStreamedText).toContain(realToken);
+    expect(allStreamedText).not.toContain(placeholder);
+  });
+  // 34. Without sensitive bindings, text passes through unchanged
+  test('text passes through unchanged when no sensitive bindings exist', async () => {
+    const { provider } = createMockProvider([
+      toolUseResponse('t1', 'read_file', { path: '/test.txt' }),
+      textResponse('Normal response with no placeholders.'),
+    ]);
+    const toolExecutor = async () => ({
+      content: 'file contents',
+      isError: false,
+      // No sensitiveBindings
+    });
+    const loop = new AgentLoop(provider, 'system', {}, dummyTools, toolExecutor);
+    const events: AgentEvent[] = [];
+    const history = await loop.run([userMessage], collectEvents(events));
+    const lastAssistant = history[history.length - 1];
+    const textBlock = lastAssistant.content.find(
+      (b): b is Extract<ContentBlock, { type: 'text' }> => b.type === 'text',
+    );
+    expect(textBlock!.text).toBe('Normal response with no placeholders.');
+  });
 });

package/src/__tests__/approval-routes-http.test.ts CHANGED Viewed

@@ -36,6 +36,8 @@ mock.module('../util/logger.js', () => ({
 mock.module('../config/loader.js', () => ({
   getConfig: () => ({
+    ui: {},
     model: 'test',
     provider: 'test',
     apiKeys: {},
@@ -79,8 +81,11 @@ function makeIdleSession(opts?: {
     setAssistantId: () => {},
     setGuardianContext: () => {},
     setCommandIntent: () => {},
+    setTurnChannelContext: () => {},
+    setTurnInterfaceContext: () => {},
     updateClient: () => {},
     enqueueMessage: () => ({ queued: false, requestId: 'noop' }),
+    hasAnyPendingConfirmation: () => false,
     runAgentLoop: async (_content: string, _messageId: string, onEvent: (msg: ServerMessage) => void) => {
       onEvent({ type: 'assistant_text_delta', text: 'Hello!' });
       onEvent({ type: 'message_complete', sessionId: 'test-session' });
@@ -118,8 +123,11 @@ function makeConfirmationEmittingSession(opts?: {
     setAssistantId: () => {},
     setGuardianContext: () => {},
     setCommandIntent: () => {},
+    setTurnChannelContext: () => {},
+    setTurnInterfaceContext: () => {},
     updateClient: () => {},
     enqueueMessage: () => ({ queued: false, requestId: 'noop' }),
+    hasAnyPendingConfirmation: () => false,
     runAgentLoop: async (_content: string, _messageId: string, onEvent: (msg: ServerMessage) => void) => {
       // Emit confirmation_request — this triggers the hub publisher to register
       // the pending interaction
@@ -549,8 +557,8 @@ describe('standalone approval endpoints — HTTP layer', () => {
       });
       expect(res.status).toBe(403);
-      const body = await res.json() as { error: string };
-      expect(body.error).toContain('pattern');
+      const body = await res.json() as { error: { message: string; code?: string } };
+      expect(body.error.message).toContain('pattern');
       await stopServer();
     });
@@ -579,8 +587,8 @@ describe('standalone approval endpoints — HTTP layer', () => {
       });
       expect(res.status).toBe(403);
-      const body = await res.json() as { error: string };
-      expect(body.error).toContain('scope');
+      const body = await res.json() as { error: { message: string; code?: string } };
+      expect(body.error.message).toContain('scope');
       await stopServer();
     });
@@ -637,7 +645,7 @@ describe('standalone approval endpoints — HTTP layer', () => {
       const res = await fetch(url('messages'), {
         method: 'POST',
         headers: { 'Content-Type': 'application/json', ...AUTH_HEADERS },
-        body: JSON.stringify({ conversationKey: 'conv-auto', content: 'Run ls', sourceChannel: 'vellum' }),
+        body: JSON.stringify({ conversationKey: 'conv-auto', content: 'Run ls', sourceChannel: 'vellum', interface: 'macos' }),
       });
       expect(res.status).toBe(202);

package/src/__tests__/asset-materialize-tool.test.ts CHANGED Viewed

@@ -30,6 +30,8 @@ mock.module('../util/logger.js', () => ({
 mock.module('../config/loader.js', () => ({
   getConfig: () => ({
+    ui: {},
     model: 'test',
     provider: 'test',
     apiKeys: {},

package/src/__tests__/asset-search-tool.test.ts CHANGED Viewed

@@ -29,6 +29,8 @@ mock.module('../util/logger.js', () => ({
 mock.module('../config/loader.js', () => ({
   getConfig: () => ({
+    ui: {},
     model: 'test',
     provider: 'test',
     apiKeys: {},

package/src/__tests__/assistant-events-sse-hardening.test.ts CHANGED Viewed

@@ -37,6 +37,8 @@ mock.module('../util/logger.js', () => ({
 mock.module('../config/loader.js', () => ({
   getConfig: () => ({
+    ui: {},
     model: 'test',
     provider: 'test',
     apiKeys: {},
@@ -181,8 +183,8 @@ describe('SSE route — capacity limit', () => {
     const response = handleSubscribeAssistantEvents(req, new URL(req.url), { hub });
     expect(response.status).toBe(503);
-    const body = await response.json() as { error: string };
-    expect(body.error).toMatch(/Too many concurrent connections/);
+    const body = await response.json() as { error: { message: string; code?: string } };
+    expect(body.error.message).toMatch(/Too many concurrent connections/);
   });
   test('returns 200 when hub has remaining capacity', () => {

package/src/__tests__/attachments-store.test.ts CHANGED Viewed

@@ -27,6 +27,8 @@ mock.module('../util/logger.js', () => ({
 mock.module('../config/loader.js', () => ({
   getConfig: () => ({
+    ui: {},
     model: 'test',
     provider: 'test',
     apiKeys: {},

package/src/__tests__/browser-skill-endstate.test.ts CHANGED Viewed

@@ -64,10 +64,10 @@ describe('browser skill migration end-state', () => {
   test('startup tool definition count is reduced (no browser tools)', () => {
     const definitions = getAllToolDefinitions();
-    // Startup has ~31 definitions (no browser tools).
+    // Startup has ~15 eager + ~11 explicit definitions (no browser tools).
     // Allow wider drift for unrelated tool additions while still failing if
-    // browser tools are reintroduced at startup (+10 definitions).
-    expect(definitions.length).toBeGreaterThanOrEqual(25);
+    // browser tools are reintroduced at startup (+14 definitions).
+    expect(definitions.length).toBeGreaterThanOrEqual(10);
     expect(definitions.length).toBeLessThanOrEqual(50);
     const defNames = definitions.map((d) => d.name);