npm - @vellumai/assistant - Versions diffs - 0.4.30 → 0.4.32 - Mend

@vellumai/assistant 0.4.30 → 0.4.32

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (194) hide show

package/ARCHITECTURE.md +1 -1
package/Dockerfile +14 -8
package/README.md +2 -2
package/docs/architecture/memory.md +28 -29
package/docs/runbook-trusted-contacts.md +1 -4
package/package.json +1 -1
package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +0 -7
package/src/__tests__/anthropic-provider.test.ts +86 -1
package/src/__tests__/assistant-feature-flags-integration.test.ts +2 -2
package/src/__tests__/checker.test.ts +37 -98
package/src/__tests__/commit-message-enrichment-service.test.ts +15 -4
package/src/__tests__/config-schema.test.ts +6 -14
package/src/__tests__/conflict-policy.test.ts +76 -0
package/src/__tests__/conflict-store.test.ts +14 -20
package/src/__tests__/contacts-tools.test.ts +8 -61
package/src/__tests__/contradiction-checker.test.ts +5 -1
package/src/__tests__/credential-security-invariants.test.ts +1 -0
package/src/__tests__/daemon-server-session-init.test.ts +1 -19
package/src/__tests__/followup-tools.test.ts +0 -30
package/src/__tests__/gemini-provider.test.ts +79 -1
package/src/__tests__/guardian-decision-primitive-canonical.test.ts +5 -3
package/src/__tests__/guardian-routing-invariants.test.ts +6 -4
package/src/__tests__/ipc-snapshot.test.ts +0 -4
package/src/__tests__/managed-proxy-context.test.ts +163 -0
package/src/__tests__/memory-lifecycle-e2e.test.ts +13 -12
package/src/__tests__/memory-regressions.test.ts +6 -6
package/src/__tests__/openai-provider.test.ts +82 -0
package/src/__tests__/provider-fail-open-selection.test.ts +134 -1
package/src/__tests__/provider-managed-proxy-integration.test.ts +269 -0
package/src/__tests__/recurrence-types.test.ts +0 -15
package/src/__tests__/registry.test.ts +0 -10
package/src/__tests__/schedule-tools.test.ts +28 -44
package/src/__tests__/script-proxy-session-runtime.test.ts +6 -1
package/src/__tests__/session-agent-loop.test.ts +0 -2
package/src/__tests__/session-conflict-gate.test.ts +243 -388
package/src/__tests__/session-profile-injection.test.ts +0 -2
package/src/__tests__/session-runtime-assembly.test.ts +2 -3
package/src/__tests__/session-skill-tools.test.ts +0 -49
package/src/__tests__/session-workspace-cache-state.test.ts +0 -1
package/src/__tests__/session-workspace-injection.test.ts +0 -1
package/src/__tests__/session-workspace-tool-tracking.test.ts +0 -1
package/src/__tests__/skill-feature-flags.test.ts +2 -2
package/src/__tests__/task-management-tools.test.ts +111 -0
package/src/__tests__/tool-grant-request-escalation.test.ts +2 -1
package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +2 -1
package/src/__tests__/twilio-config.test.ts +0 -3
package/src/amazon/session.ts +30 -91
package/src/approvals/guardian-decision-primitive.ts +11 -7
package/src/approvals/guardian-request-resolvers.ts +5 -3
package/src/calls/call-controller.ts +423 -571
package/src/calls/finalize-call.ts +20 -0
package/src/calls/relay-access-wait.ts +340 -0
package/src/calls/relay-server.ts +269 -899
package/src/calls/relay-setup-router.ts +307 -0
package/src/calls/relay-verification.ts +280 -0
package/src/calls/twilio-config.ts +1 -8
package/src/calls/voice-control-protocol.ts +184 -0
package/src/calls/voice-session-bridge.ts +1 -8
package/src/config/agent-schema.ts +1 -1
package/src/config/bundled-skills/contacts/SKILL.md +7 -18
package/src/config/bundled-skills/contacts/TOOLS.json +4 -20
package/src/config/bundled-skills/contacts/tools/contact-merge.ts +2 -4
package/src/config/bundled-skills/contacts/tools/contact-search.ts +6 -12
package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +3 -24
package/src/config/bundled-skills/followups/TOOLS.json +0 -4
package/src/config/bundled-skills/schedule/SKILL.md +1 -1
package/src/config/bundled-skills/schedule/TOOLS.json +2 -10
package/src/config/bundled-tool-registry.ts +0 -5
package/src/config/core-schema.ts +1 -1
package/src/config/env.ts +0 -10
package/src/config/feature-flag-registry.json +1 -1
package/src/config/loader.ts +19 -0
package/src/config/memory-schema.ts +0 -10
package/src/config/schema.ts +2 -2
package/src/config/system-prompt.ts +6 -0
package/src/contacts/contact-store.ts +36 -62
package/src/contacts/contacts-write.ts +14 -3
package/src/contacts/types.ts +9 -4
package/src/daemon/handlers/config-heartbeat.ts +1 -2
package/src/daemon/handlers/contacts.ts +2 -2
package/src/daemon/handlers/guardian-actions.ts +1 -1
package/src/daemon/handlers/session-history.ts +398 -0
package/src/daemon/handlers/session-user-message.ts +982 -0
package/src/daemon/handlers/sessions.ts +9 -1337
package/src/daemon/ipc-contract/contacts.ts +2 -2
package/src/daemon/ipc-contract/sessions.ts +0 -6
package/src/daemon/ipc-contract-inventory.json +0 -1
package/src/daemon/lifecycle.ts +0 -29
package/src/daemon/session-agent-loop.ts +1 -45
package/src/daemon/session-conflict-gate.ts +21 -82
package/src/daemon/session-memory.ts +7 -52
package/src/daemon/session-process.ts +3 -1
package/src/daemon/session-runtime-assembly.ts +18 -35
package/src/heartbeat/heartbeat-service.ts +5 -1
package/src/home-base/app-link-store.ts +0 -7
package/src/memory/conflict-intent.ts +3 -6
package/src/memory/conflict-policy.ts +34 -0
package/src/memory/conflict-store.ts +10 -18
package/src/memory/contradiction-checker.ts +2 -2
package/src/memory/conversation-attention-store.ts +1 -1
package/src/memory/conversation-store.ts +0 -51
package/src/memory/db-init.ts +8 -0
package/src/memory/job-handlers/conflict.ts +24 -7
package/src/memory/migrations/105-contacts-and-triage.ts +4 -7
package/src/memory/migrations/134-contacts-notes-column.ts +68 -0
package/src/memory/migrations/135-backfill-contact-interaction-stats.ts +31 -0
package/src/memory/migrations/index.ts +2 -0
package/src/memory/migrations/registry.ts +6 -0
package/src/memory/recall-cache.ts +0 -5
package/src/memory/schema/calls.ts +274 -0
package/src/memory/schema/contacts.ts +125 -0
package/src/memory/schema/conversations.ts +129 -0
package/src/memory/schema/guardian.ts +172 -0
package/src/memory/schema/index.ts +8 -0
package/src/memory/schema/infrastructure.ts +205 -0
package/src/memory/schema/memory-core.ts +196 -0
package/src/memory/schema/notifications.ts +191 -0
package/src/memory/schema/tasks.ts +78 -0
package/src/memory/schema.ts +1 -1402
package/src/memory/slack-thread-store.ts +0 -69
package/src/messaging/index.ts +0 -1
package/src/messaging/types.ts +0 -38
package/src/notifications/decisions-store.ts +2 -105
package/src/notifications/deliveries-store.ts +0 -11
package/src/notifications/preferences-store.ts +1 -58
package/src/permissions/checker.ts +6 -17
package/src/providers/anthropic/client.ts +6 -2
package/src/providers/gemini/client.ts +13 -2
package/src/providers/managed-proxy/constants.ts +55 -0
package/src/providers/managed-proxy/context.ts +77 -0
package/src/providers/registry.ts +112 -0
package/src/runtime/auth/__tests__/guard-tests.test.ts +51 -23
package/src/runtime/guardian-action-service.ts +3 -2
package/src/runtime/guardian-outbound-actions.ts +3 -3
package/src/runtime/guardian-reply-router.ts +4 -4
package/src/runtime/http-server.ts +83 -710
package/src/runtime/http-types.ts +0 -16
package/src/runtime/middleware/auth.ts +0 -12
package/src/runtime/routes/app-routes.ts +33 -0
package/src/runtime/routes/approval-routes.ts +32 -0
package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +6 -3
package/src/runtime/routes/attachment-routes.ts +32 -0
package/src/runtime/routes/brain-graph-routes.ts +27 -0
package/src/runtime/routes/call-routes.ts +41 -0
package/src/runtime/routes/channel-readiness-routes.ts +20 -0
package/src/runtime/routes/channel-routes.ts +70 -0
package/src/runtime/routes/contact-routes.ts +371 -29
package/src/runtime/routes/conversation-attention-routes.ts +15 -0
package/src/runtime/routes/conversation-routes.ts +192 -194
package/src/runtime/routes/debug-routes.ts +15 -0
package/src/runtime/routes/events-routes.ts +16 -0
package/src/runtime/routes/global-search-routes.ts +17 -2
package/src/runtime/routes/guardian-action-routes.ts +23 -1
package/src/runtime/routes/guardian-approval-interception.ts +2 -1
package/src/runtime/routes/guardian-bootstrap-routes.ts +26 -1
package/src/runtime/routes/guardian-refresh-routes.ts +20 -0
package/src/runtime/routes/identity-routes.ts +20 -0
package/src/runtime/routes/inbound-message-handler.ts +8 -0
package/src/runtime/routes/inbound-stages/acl-enforcement.ts +5 -1
package/src/runtime/routes/inbound-stages/guardian-reply-intercept.ts +2 -1
package/src/runtime/routes/integration-routes.ts +83 -0
package/src/runtime/routes/invite-routes.ts +31 -0
package/src/runtime/routes/migration-routes.ts +47 -17
package/src/runtime/routes/pairing-routes.ts +18 -0
package/src/runtime/routes/secret-routes.ts +20 -0
package/src/runtime/routes/surface-action-routes.ts +26 -0
package/src/runtime/routes/trust-rules-routes.ts +31 -0
package/src/runtime/routes/twilio-routes.ts +79 -0
package/src/schedule/recurrence-types.ts +1 -11
package/src/tools/followups/followup_create.ts +9 -3
package/src/tools/mcp/mcp-tool-factory.ts +0 -17
package/src/tools/memory/definitions.ts +0 -6
package/src/tools/network/script-proxy/session-manager.ts +38 -3
package/src/tools/schedule/create.ts +1 -3
package/src/tools/schedule/update.ts +9 -6
package/src/twitter/session.ts +29 -77
package/src/util/cookie-session.ts +114 -0
package/src/workspace/git-service.ts +6 -4
package/src/__tests__/conversation-routes.test.ts +0 -99
package/src/__tests__/get-weather.test.ts +0 -393
package/src/__tests__/task-tools.test.ts +0 -685
package/src/__tests__/weather-skill-regression.test.ts +0 -276
package/src/autonomy/autonomy-resolver.ts +0 -62
package/src/autonomy/autonomy-store.ts +0 -138
package/src/autonomy/disposition-mapper.ts +0 -31
package/src/autonomy/index.ts +0 -11
package/src/autonomy/types.ts +0 -43
package/src/config/bundled-skills/weather/SKILL.md +0 -38
package/src/config/bundled-skills/weather/TOOLS.json +0 -36
package/src/config/bundled-skills/weather/icon.svg +0 -24
package/src/config/bundled-skills/weather/tools/get-weather.ts +0 -12
package/src/contacts/startup-migration.ts +0 -21
package/src/messaging/triage-engine.ts +0 -344
package/src/tools/weather/service.ts +0 -712

package/ARCHITECTURE.md CHANGED Viewed

@@ -883,7 +883,7 @@ graph LR
         C5["user_message<br/>text, attachments"]
         C6["confirmation_response<br/>decision"]
         C7["cancel / undo"]
-        C8["model_get / model_set<br/>sandbox_set (deprecated no-op)"]
+        C8["model_get / model_set"]
         C9["ping"]
         C10["ipc_blob_probe<br/>probeId, nonceSha256"]
         C11["work_items_list / work_item_get<br/>work_item_create / work_item_update<br/>work_item_complete / work_item_run_task<br/>(planned)"]

package/Dockerfile CHANGED Viewed

@@ -16,16 +16,21 @@ RUN apt-get update && apt-get install -y \
 RUN curl -fsSL https://bun.sh/install | bash
 ENV PATH="/root/.bun/bin:${PATH}"
-# Copy package files
-COPY package.json bun.lock ./
+# Install assistant and CLI dependencies first for cache reuse
+COPY assistant/package.json assistant/bun.lock ./assistant/
+RUN cd /app/assistant && bun install --frozen-lockfile
-# Install dependencies
-RUN bun install --frozen-lockfile
+COPY cli/package.json cli/bun.lock ./cli/
+RUN cd /app/cli && bun install --frozen-lockfile
+# Copy source
+COPY assistant ./assistant
+COPY cli ./cli
 # Final stage
 FROM debian:trixie@sha256:3615a749858a1cba49b408fb49c37093db813321355a9ab7c1f9f4836341e9db AS runner
-WORKDIR /app
+WORKDIR /app/assistant
 # Install runtime dependencies for Playwright and tree-sitter
 RUN apt-get update && apt-get install -y \
@@ -47,6 +52,10 @@ RUN apt-get update && apt-get install -y \
 COPY --from=builder /root/.bun/bin/bun /usr/local/bin/bun
 RUN ln -sf /usr/local/bin/bun /usr/local/bin/bunx
+# Install a vellum CLI launcher backed by the bundled local cli package
+RUN printf '#!/usr/bin/env sh\nexec bun run /app/cli/src/index.ts "$@"\n' > /usr/local/bin/vellum && \
+    chmod +x /usr/local/bin/vellum
 # Create non-root user that also has sudo access so it can install additional software
 RUN groupadd --system --gid 1001 assistant && \
     useradd --system --uid 1001 --gid assistant --create-home --shell /bin/bash assistant && \
@@ -95,8 +104,5 @@ ENV IS_CONTAINERIZED=true
 # Copy from builder
 COPY --from=builder /app /app
-# Copy source
-COPY . .
 # Run the daemon + http server
 CMD ["bun", "run", "src/daemon/main.ts"]

package/README.md CHANGED Viewed

@@ -481,7 +481,7 @@ bun run db:push       # Apply migrations
 ```bash
 # Build production image
-docker build -t vellum-assistant:local assistant
+docker build -f assistant/Dockerfile -t vellum-assistant:local .
 # Run
 docker run --rm -p 3001:3001 \
@@ -489,7 +489,7 @@ docker run --rm -p 3001:3001 \
   vellum-assistant:local
 ```
-The image runs as non-root user `assistant` (uid 1001) and exposes port `3001`.
+The image exposes port `3001` and bundles the `vellum` CLI binary.
 ## Troubleshooting

package/docs/architecture/memory.md CHANGED Viewed

@@ -41,7 +41,7 @@ graph TB
     subgraph "Read Path (Memory Recall)"
         QUERY["Recall Query Builder<br/>User request + compacted context summary"]
-        CONFLICT_GATE["Soft Conflict Gate<br/>dismiss non-actionable conflicts (kind + statement policy)<br/>resolve pending conflicts from user turn<br/>relevance + cooldown + configurable ask behavior"]
+        CONFLICT_GATE["Soft Conflict Gate<br/>dismiss non-actionable conflicts (kind + statement + provenance policy)<br/>attempt internal resolution from user turn<br/>relevance-based; never produces user-facing prompts"]
         PROFILE_BUILD["Dynamic Profile Compiler<br/>active trusted profile memories<br/>user_confirmed > user_reported > assistant_inferred"]
         PROFILE_INJECT["Inject profile context block<br/>into runtime user tail<br/>(strict token cap)"]
         BUDGET["Dynamic Recall Budget<br/>computeRecallBudget()<br/>from prompt headroom"]
@@ -158,28 +158,26 @@ The key distinction: normal compaction is a cost-optimized background process th
 ### Memory Retrieval Config Knobs (Defaults)
-| Config key                                                |                                                           Default | Purpose                                                                                                                                                |
-| --------------------------------------------------------- | ----------------------------------------------------------------: | ------------------------------------------------------------------------------------------------------------------------------------------------------ |
-| `memory.retrieval.dynamicBudget.enabled`                  |                                                            `true` | Toggle per-turn recall budget calculation from live prompt headroom.                                                                                   |
-| `memory.retrieval.dynamicBudget.minInjectTokens`          |                                                            `1200` | Lower clamp for computed recall injection budget.                                                                                                      |
-| `memory.retrieval.dynamicBudget.maxInjectTokens`          |                                                           `10000` | Upper clamp for computed recall injection budget.                                                                                                      |
-| `memory.retrieval.dynamicBudget.targetHeadroomTokens`     |                                                           `10000` | Reserved headroom to keep free for response generation/tool traces.                                                                                    |
-| `memory.entity.extractRelations.enabled`                  |                                                            `true` | Enable relation edge extraction and persistence in `memory_entity_relations`.                                                                          |
-| `memory.entity.extractRelations.backfillBatchSize`        |                                                             `200` | Batch size for checkpointed `backfill_entity_relations` jobs.                                                                                          |
-| `memory.entity.relationRetrieval.enabled`                 |                                                            `true` | Enable one-hop relation expansion from matched seed entities at recall time.                                                                           |
-| `memory.entity.relationRetrieval.maxSeedEntities`         |                                                               `8` | Maximum matched seed entities from the query.                                                                                                          |
-| `memory.entity.relationRetrieval.maxNeighborEntities`     |                                                              `20` | Maximum unique neighbor entities expanded from relation edges.                                                                                         |
-| `memory.entity.relationRetrieval.maxEdges`                |                                                              `40` | Maximum relation edges traversed during expansion.                                                                                                     |
-| `memory.entity.relationRetrieval.neighborScoreMultiplier` |                                                             `0.7` | Downweight multiplier for relation-expanded candidates vs direct entity hits.                                                                          |
-| `memory.conflicts.enabled`                                |                                                            `true` | Enable soft conflict gate for unresolved `memory_item_conflicts`.                                                                                      |
-| `memory.conflicts.reaskCooldownTurns`                     |                                                               `3` | Minimum turn distance before re-asking the same conflict clarification.                                                                                |
-| `memory.conflicts.resolverLlmTimeoutMs`                   |                                                           `12000` | Timeout bound for clarification resolver LLM fallback.                                                                                                 |
-| `memory.conflicts.relevanceThreshold`                     |                                                             `0.3` | Similarity threshold for deciding whether a pending conflict is relevant to the current request.                                                       |
-| `memory.conflicts.gateMode`                               |                                                          `'soft'` | Conflict gate strategy. Currently only `'soft'` is supported (asks the user inline).                                                                   |
-| `memory.conflicts.askOnIrrelevantTurns`                   |                                                           `false` | When `true`, soft-inject irrelevant conflict clarifications into every turn. When `false` (default), only ask when the conflict is topically relevant. |
-| `memory.conflicts.conflictableKinds`                      | `['preference', 'profile', 'constraint', 'instruction', 'style']` | Memory item kinds eligible for conflict detection. Items with kinds outside this list are auto-dismissed.                                              |
-| `memory.profile.enabled`                                  |                                                            `true` | Enable dynamic profile compilation from active trusted profile/preference/constraint/instruction memories.                                             |
-| `memory.profile.maxInjectTokens`                          |                                                             `800` | Hard token cap enforced by `ProfileCompiler` when generating the runtime profile block.                                                                |
+| Config key                                                |                                                           Default | Purpose                                                                                                            |
+| --------------------------------------------------------- | ----------------------------------------------------------------: | ------------------------------------------------------------------------------------------------------------------ |
+| `memory.retrieval.dynamicBudget.enabled`                  |                                                            `true` | Toggle per-turn recall budget calculation from live prompt headroom.                                               |
+| `memory.retrieval.dynamicBudget.minInjectTokens`          |                                                            `1200` | Lower clamp for computed recall injection budget.                                                                  |
+| `memory.retrieval.dynamicBudget.maxInjectTokens`          |                                                           `10000` | Upper clamp for computed recall injection budget.                                                                  |
+| `memory.retrieval.dynamicBudget.targetHeadroomTokens`     |                                                           `10000` | Reserved headroom to keep free for response generation/tool traces.                                                |
+| `memory.entity.extractRelations.enabled`                  |                                                            `true` | Enable relation edge extraction and persistence in `memory_entity_relations`.                                      |
+| `memory.entity.extractRelations.backfillBatchSize`        |                                                             `200` | Batch size for checkpointed `backfill_entity_relations` jobs.                                                      |
+| `memory.entity.relationRetrieval.enabled`                 |                                                            `true` | Enable one-hop relation expansion from matched seed entities at recall time.                                       |
+| `memory.entity.relationRetrieval.maxSeedEntities`         |                                                               `8` | Maximum matched seed entities from the query.                                                                      |
+| `memory.entity.relationRetrieval.maxNeighborEntities`     |                                                              `20` | Maximum unique neighbor entities expanded from relation edges.                                                     |
+| `memory.entity.relationRetrieval.maxEdges`                |                                                              `40` | Maximum relation edges traversed during expansion.                                                                 |
+| `memory.entity.relationRetrieval.neighborScoreMultiplier` |                                                             `0.7` | Downweight multiplier for relation-expanded candidates vs direct entity hits.                                      |
+| `memory.conflicts.enabled`                                |                                                            `true` | Enable soft conflict gate for unresolved `memory_item_conflicts`.                                                  |
+| `memory.conflicts.resolverLlmTimeoutMs`                   |                                                           `12000` | Timeout bound for clarification resolver LLM fallback.                                                             |
+| `memory.conflicts.relevanceThreshold`                     |                                                             `0.3` | Similarity threshold for deciding whether a pending conflict is relevant to the current request.                   |
+| `memory.conflicts.gateMode`                               |                                                          `'soft'` | Conflict gate strategy. Currently only `'soft'` is supported (resolves conflicts internally without user prompts). |
+| `memory.conflicts.conflictableKinds`                      | `['preference', 'profile', 'constraint', 'instruction', 'style']` | Memory item kinds eligible for conflict detection. Items with kinds outside this list are auto-dismissed.          |
+| `memory.profile.enabled`                                  |                                                            `true` | Enable dynamic profile compilation from active trusted profile/preference/constraint/instruction memories.         |
+| `memory.profile.maxInjectTokens`                          |                                                             `800` | Hard token cap enforced by `ProfileCompiler` when generating the runtime profile block.                            |
 ### Memory Recall Debugging Playbook
@@ -211,7 +209,7 @@ The key distinction: normal compaction is a cost-optimized background process th
 stateDiagram-v2
     [*] --> ActiveItems : extract_items/check_contradictions
     ActiveItems --> PendingConflict : ambiguous_contradiction\n(candidate -> pending_clarification)
-    PendingConflict --> PendingConflict : soft gate ask\n(reask cooldown + relevance + askOnIrrelevantTurns)
+    PendingConflict --> PendingConflict : internal evaluation\n(relevance check, no user prompt)
     PendingConflict --> Dismissed : non-actionable\n(kind policy + transient statement filter)
     PendingConflict --> ResolvedKeepExisting : clarification resolver\n+ applyConflictResolution
     PendingConflict --> ResolvedKeepCandidate : clarification resolver\n+ applyConflictResolution
@@ -224,6 +222,10 @@ stateDiagram-v2
     SupersededItems --> CleanupItems : cleanup_stale_superseded_items
 ```
+### Internal-Only Conflict Handling
+Memory conflict resolution is entirely internal and non-interruptive. The conflict gate evaluates pending conflicts on each turn, dismisses non-actionable ones (based on kind policy, statement eligibility, coherence, and provenance), and attempts resolution when user input looks like a natural clarification. At no point does the conflict system produce user-facing clarification prompts, inject conflict instructions into the assistant's response, or block the user's request. The user is never aware that a conflict exists; the runtime response path always continues answering the user's actual request. This invariant is enforced across the conflict gate (`session-conflict-gate.ts`), session memory (`session-memory.ts`), session agent loop (`session-agent-loop.ts`), and runtime assembly (`session-runtime-assembly.ts`).
 Runtime profile flow (per turn):
 1. `ProfileCompiler` builds a trusted profile block from active `profile` / `preference` / `constraint` / `instruction` items under strict token cap.
@@ -238,7 +240,7 @@ Two trust gates enforce trust-class-based access control over the memory pipelin
 - **Write gate** (`indexer.ts`): The `extract_items` and `resolve_conflicts` jobs only run for messages from trusted actors (guardian or undefined provenance). Messages from untrusted actors (`trusted_contact`, `unknown`) are still segmented and embedded — so they appear in conversation context — but no profile extraction or conflict resolution is triggered. This prevents untrusted channels from injecting or mutating long-term memory items.
-- **Read gate** (`session-memory.ts`): When the current session's actor is untrusted, the memory recall pipeline returns a no-op context — no recall injection, no dynamic profile, no conflict clarification prompts. This ensures untrusted actors cannot surface or exploit previously extracted memory.
+- **Read gate** (`session-memory.ts`): When the current session's actor is untrusted, the memory recall pipeline returns a no-op context — no recall injection, no dynamic profile, no conflict resolution. This ensures untrusted actors cannot surface or exploit previously extracted memory.
 Trust policy is **cross-channel and trust-class-based**: decisions use `trustContext.trustClass`, not the channel string. Desktop/IPC sessions default to `trustClass: 'guardian'`. External channels (Telegram, SMS, WhatsApp, voice) provide explicit trust context via the resolver. Messages without provenance metadata are treated as trusted (guardian); all new messages carry provenance.
@@ -381,7 +383,7 @@ graph TB
 - **Prepend, not append**: The workspace block is prepended to the user message content so that Anthropic cache breakpoints continue to land on the trailing user text block, preserving prompt cache efficiency.
 - **Runtime-only**: The injected `<workspace_top_level>` block is stripped from `this.messages` after the agent loop completes. It never persists in conversation history or the database.
 - **Dirty-refresh**: The scanner runs once on the first turn, then only re-runs after a successful mutation tool (`file_edit`, `file_write`, `bash`). Failed tool results do not trigger a refresh.
-- **Injection ordering**: Workspace context is injected after other runtime injections (soft conflict instruction, active surface) via `applyRuntimeInjections`, but because it is **prepended** to content blocks, it appears first in the final message.
+- **Injection ordering**: Workspace context is injected after other runtime injections (active surface, etc.) via `applyRuntimeInjections`, but because it is **prepended** to content blocks, it appears first in the final message.
 ### Cache compatibility
@@ -506,7 +508,6 @@ graph TB
 10. **Provider-aware commit message generation (optional)**: When `workspaceGit.commitMessageLLM.enabled` is `true`, turn-boundary commits attempt to generate a descriptive commit message using the configured LLM provider before falling back to deterministic messages. The feature ships disabled by default and is designed to never degrade turn completion guarantees.
     **Commit message LLM fallback chain**: The generator runs a sequence of pre-flight checks before calling the LLM. Each check that fails produces a machine-readable `llmFallbackReason` in the structured log output and immediately returns a deterministic message. The checks, in order:
     1. `disabled` — `commitMessageLLM.enabled` is `false` or `useConfiguredProvider` is `false`
     2. `missing_provider_api_key` — the configured provider's API key is not set in `config.apiKeys` (skipped for keyless providers like Ollama that run without an API key)
     3. `breaker_open` — the generator's internal circuit breaker is open after consecutive LLM failures (exponential backoff)
@@ -516,11 +517,9 @@ graph TB
     7. `timeout` — the LLM call exceeded `timeoutMs` (AbortController fires)
     8. `provider_error` — the provider threw an exception during the LLM call
     9. `invalid_output` — the LLM returned empty text, the literal string "FALLBACK", or total output > 500 chars
     - **Subject line capping**: If the LLM subject line exceeds 72 chars, it is deterministically truncated to 72 chars. This is NOT treated as a failure (no breaker penalty, no deterministic fallback).
     **Fast model resolution**: The LLM call uses a small/fast model to minimize latency and cost. The model is resolved **before** any provider call as a pre-flight check:
     - If `commitMessageLLM.providerFastModelOverrides[provider]` is set, that model is used.
     - Otherwise, a built-in default is used: `anthropic` -> `claude-haiku-4-5-20251001`, `openai` -> `gpt-4o-mini`, `gemini` -> `gemini-2.0-flash`.
     - If the configured provider has no override and no built-in default (e.g., `ollama`, `fireworks`, `openrouter`), the generator returns a deterministic fallback with reason `missing_fast_model` and the provider is never called. To enable LLM commit messages for such providers, set `providerFastModelOverrides[provider]` to the desired model.

package/docs/runbook-trusted-contacts.md CHANGED Viewed

@@ -62,10 +62,7 @@ Response shape:
     {
       "id": "uuid",
       "displayName": "Alice",
-      "relationship": "friend",
-      "importance": 0.5,
-      "responseExpectation": null,
-      "preferredTone": null,
+      "notes": null,
       "lastInteraction": 1700000000000,
       "interactionCount": 12,
       "createdAt": 1699000000000,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@vellumai/assistant",
-  "version": "0.4.30",
+  "version": "0.4.32",
   "type": "module",
   "bin": {
     "vellum": "./src/index.ts"

package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap CHANGED Viewed

@@ -145,13 +145,6 @@ exports[`IPC message snapshots ClientMessage types usage_request serializes to e
 }
 `;
-exports[`IPC message snapshots ClientMessage types sandbox_set serializes to expected JSON 1`] = `
-{
-  "enabled": true,
-  "type": "sandbox_set",
-}
-`;
 exports[`IPC message snapshots ClientMessage types cu_session_create serializes to expected JSON 1`] = `
 {
   "screenHeight": 1080,

package/src/__tests__/anthropic-provider.test.ts CHANGED Viewed

@@ -8,6 +8,7 @@ import type { Message, ToolDefinition } from "../providers/types.js";
 let lastStreamParams: Record<string, unknown> | null = null;
 let _lastStreamOptions: Record<string, unknown> | null = null;
+let lastConstructorArgs: Record<string, unknown> | null = null;
 const fakeResponse = {
   content: [{ type: "text", text: "Hello" }],
@@ -33,7 +34,9 @@ class FakeAPIError extends Error {
 mock.module("@anthropic-ai/sdk", () => ({
   default: class MockAnthropic {
     static APIError = FakeAPIError;
-    constructor() {}
+    constructor(args: Record<string, unknown>) {
+      lastConstructorArgs = { ...args };
+    }
     messages = {
       stream: (
         params: Record<string, unknown>,
@@ -127,6 +130,7 @@ describe("AnthropicProvider — Cache-Control Characterization", () => {
   beforeEach(() => {
     lastStreamParams = null;
     _lastStreamOptions = null;
+    lastConstructorArgs = null;
     provider = new AnthropicProvider("sk-ant-test", "claude-sonnet-4-6");
   });
@@ -935,3 +939,84 @@ describe("AnthropicProvider — Cache-Control Characterization", () => {
     expect(userMsgs[2].content[1].cache_control).toEqual({ type: "ephemeral" });
   });
 });
+// ---------------------------------------------------------------------------
+// Tests — Managed Proxy Fallback
+// ---------------------------------------------------------------------------
+describe("AnthropicProvider — Managed Proxy Fallback", () => {
+  beforeEach(() => {
+    lastStreamParams = null;
+    _lastStreamOptions = null;
+    lastConstructorArgs = null;
+  });
+  test("constructor passes baseURL to Anthropic SDK when provided", () => {
+    new AnthropicProvider("managed-key", "claude-sonnet-4-6", {
+      baseURL: "https://platform.example.com/v1/runtime-proxy/anthropic",
+    });
+    expect(lastConstructorArgs).not.toBeNull();
+    expect(lastConstructorArgs!.apiKey).toBe("managed-key");
+    expect(lastConstructorArgs!.baseURL).toBe(
+      "https://platform.example.com/v1/runtime-proxy/anthropic",
+    );
+  });
+  test("constructor does not set baseURL when option is omitted", () => {
+    new AnthropicProvider("sk-ant-user-key", "claude-sonnet-4-6");
+    expect(lastConstructorArgs).not.toBeNull();
+    expect(lastConstructorArgs!.apiKey).toBe("sk-ant-user-key");
+    expect(lastConstructorArgs!.baseURL).toBeUndefined();
+  });
+  test("managed mode provider preserves tool-pairing behavior", async () => {
+    const provider = new AnthropicProvider("managed-key", "claude-sonnet-4-6", {
+      baseURL: "https://platform.example.com/v1/runtime-proxy/anthropic",
+    });
+    const messages: Message[] = [
+      userMsg("Read file"),
+      toolUseMsg("tu_1", "file_read"),
+      toolResultMsg("tu_1", "file contents"),
+    ];
+    await provider.sendMessage(messages);
+    const sent = lastStreamParams!.messages as Array<{
+      role: string;
+      content: Array<{ type: string; tool_use_id?: string }>;
+    }>;
+    expect(sent).toHaveLength(3);
+    const toolResults = sent[2].content.filter((b) => b.type === "tool_result");
+    expect(toolResults).toHaveLength(1);
+    expect(toolResults[0].tool_use_id).toBe("tu_1");
+  });
+  test("managed mode provider preserves cache-control behavior", async () => {
+    const provider = new AnthropicProvider("managed-key", "claude-sonnet-4-6", {
+      baseURL: "https://platform.example.com/v1/runtime-proxy/anthropic",
+    });
+    await provider.sendMessage(
+      [userMsg("Hi")],
+      sampleTools,
+      "You are helpful.",
+    );
+    // System prompt cache control
+    const system = lastStreamParams!.system as Array<{
+      cache_control?: { type: string };
+    }>;
+    expect(system[0].cache_control).toEqual({ type: "ephemeral" });
+    // Last tool cache control
+    const tools = lastStreamParams!.tools as Array<{
+      cache_control?: { type: string };
+    }>;
+    expect(tools[tools.length - 1].cache_control).toEqual({
+      type: "ephemeral",
+    });
+  });
+});

package/src/__tests__/assistant-feature-flags-integration.test.ts CHANGED Viewed

@@ -241,8 +241,8 @@ describe("buildSystemPrompt assistant feature flag filtering", () => {
     const result = buildSystemPrompt();
-    // browser is declared in the registry with defaultEnabled: false
-    expect(result).not.toContain('id="browser"');
+    // browser is declared in the registry with defaultEnabled: true
+    expect(result).toContain('id="browser"');
   });
 });

package/src/__tests__/checker.test.ts CHANGED Viewed

@@ -55,16 +55,16 @@ mock.module("../util/logger.js", () => ({
 }));
 // Mutable config object so tests can switch permissions.mode between
-// 'legacy', 'strict', and 'workspace' without re-registering the mock.
+// 'strict' and 'workspace' without re-registering the mock.
 interface TestConfig {
-  permissions: { mode: "legacy" | "strict" | "workspace" };
+  permissions: { mode: "strict" | "workspace" };
   skills: { load: { extraDirs: string[] } };
   sandbox: { enabled: boolean };
   [key: string]: unknown;
 }
 const testConfig: TestConfig = {
-  permissions: { mode: "legacy" },
+  permissions: { mode: "workspace" },
   skills: { load: { extraDirs: [] } },
   sandbox: { enabled: true },
 };
@@ -81,7 +81,6 @@ mock.module("../config/loader.js", () => ({
 }));
 import {
-  _resetLegacyDeprecationWarning,
   check,
   classifyRisk,
   generateAllowlistOptions,
@@ -169,11 +168,9 @@ describe("Permission Checker", () => {
   beforeEach(() => {
     // Reset trust-store state between tests
     clearCache();
-    // Reset permissions mode to legacy so existing tests are not affected
-    testConfig.permissions = { mode: "legacy" };
+    // Reset permissions mode to workspace (default) so existing tests are not affected
+    testConfig.permissions = { mode: "workspace" };
     testConfig.skills = { load: { extraDirs: [] } };
-    // Reset the one-time legacy deprecation warning flag and captured log calls
-    _resetLegacyDeprecationWarning();
     loggerWarnCalls.length = 0;
     try {
       rmSync(join(checkerTestDir, "protected", "trust.json"));
@@ -684,12 +681,22 @@ describe("Permission Checker", () => {
       expect(result.decision).toBe("allow");
     });
-    test("file_write with no rule → prompt", async () => {
+    test("file_write within workspace with no rule → auto-allowed in workspace mode", async () => {
       const result = await check(
         "file_write",
         { path: "/tmp/file.txt" },
         "/tmp",
       );
+      expect(result.decision).toBe("allow");
+      expect(result.reason).toContain("workspace-scoped");
+    });
+    test("file_write outside workspace with no rule → prompt", async () => {
+      const result = await check(
+        "file_write",
+        { path: "/etc/some-file.txt" },
+        "/tmp",
+      );
       expect(result.decision).toBe("prompt");
     });
@@ -1354,12 +1361,10 @@ describe("Permission Checker", () => {
     });
     test("core tool (no origin) still follows risk-based fallback", async () => {
-      // file_read is a core tool with Low risk → should auto-allow as before
-      const result = await check(
-        "file_read",
-        { path: "/tmp/test.txt" },
-        "/tmp",
-      );
+      // file_read is a core tool with Low risk — in workspace mode,
+      // workspace-scoped invocations are auto-allowed before risk fallback.
+      // Use a path outside the workspace to test the risk-based fallback.
+      const result = await check("file_read", { path: "/etc/hosts" }, "/tmp");
       expect(result.decision).toBe("allow");
       expect(result.reason).toContain("Low risk");
     });
@@ -1488,7 +1493,8 @@ describe("Permission Checker", () => {
     test("file_write of non-workspace file is not auto-allowed", async () => {
       const otherPath = join(checkerTestDir, "workspace", "OTHER.md");
-      const result = await check("file_write", { path: otherPath }, "/tmp");
+      // Use a workingDir that doesn't contain the path so it's not workspace-scoped
+      const result = await check("file_write", { path: otherPath }, "/home");
       // Medium risk with no matching allow rule → prompt
       expect(result.decision).toBe("prompt");
     });
@@ -2565,7 +2571,7 @@ describe("Permission Checker", () => {
       });
       test("legacy mode: file_write to skill source still prompts as High risk", async () => {
-        testConfig.permissions.mode = "legacy";
+        testConfig.permissions.mode = "workspace";
         ensureSkillsDir();
         const skillPath = join(
           checkerTestDir,
@@ -3327,7 +3333,7 @@ describe("Permission Checker", () => {
     });
     test("skill_load auto-allows in legacy mode (backward compat)", async () => {
-      testConfig.permissions.mode = "legacy";
+      testConfig.permissions.mode = "workspace";
       const result = await check("skill_load", { skill: "any-skill" }, "/tmp");
       expect(result.decision).toBe("allow");
       // The default allow rule matches before the Low risk fallback
@@ -3850,7 +3856,7 @@ describe("Permission Checker", () => {
     describe("Invariant 6: user can set broad rules if they choose", () => {
       test("wildcard allow rule matches any command in legacy mode", async () => {
-        testConfig.permissions.mode = "legacy";
+        testConfig.permissions.mode = "workspace";
         addRule("bash", "*", "everywhere");
         const result = await check(
           "bash",
@@ -4203,7 +4209,7 @@ describe("Permission Checker", () => {
     }
     test("browser tools are auto-allowed in legacy mode", async () => {
-      testConfig.permissions = { mode: "legacy" };
+      testConfig.permissions = { mode: "workspace" };
       for (const toolName of browserToolNames) {
         const result = await check(toolName, {}, "/tmp");
         expect(result.decision).toBe("allow");
@@ -4218,7 +4224,7 @@ describe("Permission Checker", () => {
           expect(result.decision).toBe("allow");
         }
       } finally {
-        testConfig.permissions = { mode: "legacy" };
+        testConfig.permissions = { mode: "workspace" };
       }
     });
   });
@@ -4295,7 +4301,7 @@ describe("Permission Checker", () => {
 describe("bash network_mode=proxied — no special-casing", () => {
   beforeEach(() => {
     clearCache();
-    testConfig.permissions = { mode: "legacy" };
+    testConfig.permissions = { mode: "workspace" };
     testConfig.skills = { load: { extraDirs: [] } };
   });
@@ -4416,7 +4422,7 @@ describe("computer-use tool permission defaults", () => {
 describe("scope matching behavior", () => {
   beforeEach(() => {
     clearCache();
-    testConfig.permissions = { mode: "legacy" };
+    testConfig.permissions = { mode: "workspace" };
     try {
       rmSync(join(checkerTestDir, "protected", "trust.json"));
     } catch {
@@ -4456,6 +4462,8 @@ describe("scope matching behavior", () => {
   });
   test("project-scoped rule does NOT match invocations from sibling directory", async () => {
+    // Use strict mode to test rule-matching isolation without workspace auto-allow
+    testConfig.permissions.mode = "strict";
     const projectDir = "/home/user/my-project";
     // Use a broad pattern that matches any file, scoped to the project
     addRule("file_write", "file_write:*", projectDir);
@@ -4470,6 +4478,8 @@ describe("scope matching behavior", () => {
   });
   test("project-scoped rule does NOT match invocations from parent directory", async () => {
+    // Use strict mode to test rule-matching isolation without workspace auto-allow
+    testConfig.permissions.mode = "strict";
     const projectDir = "/home/user/my-project";
     addRule("file_write", "file_write:*", projectDir);
@@ -4483,6 +4493,8 @@ describe("scope matching behavior", () => {
   });
   test("project-scoped rule does NOT match directory with shared prefix", async () => {
+    // Use strict mode to test rule-matching isolation without workspace auto-allow
+    testConfig.permissions.mode = "strict";
     // A rule for /home/user/project should NOT match /home/user/project-evil
     // (directory-boundary enforcement in matchesScope)
     const projectDir = "/home/user/project";
@@ -4562,7 +4574,7 @@ describe("workspace mode — auto-allow workspace-scoped operations", () => {
   });
   afterEach(() => {
-    testConfig.permissions = { mode: "legacy" };
+    testConfig.permissions = { mode: "workspace" };
   });
   // ── workspace-scoped file operations auto-allow ──────────────────
@@ -4771,79 +4783,6 @@ describe("workspace mode — auto-allow workspace-scoped operations", () => {
   });
 });
-// ── legacy mode deprecation warning ─────────────────────────────────────
-describe("legacy mode — deprecation warning", () => {
-  beforeEach(() => {
-    clearCache();
-    _resetLegacyDeprecationWarning();
-    loggerWarnCalls.length = 0;
-    testConfig.permissions = { mode: "legacy" };
-    testConfig.skills = { load: { extraDirs: [] } };
-    try {
-      rmSync(join(checkerTestDir, "protected", "trust.json"));
-    } catch {
-      /* may not exist */
-    }
-  });
-  afterEach(() => {
-    testConfig.permissions = { mode: "legacy" };
-  });
-  test("emits deprecation warning on first check() call in legacy mode", async () => {
-    await check("file_read", { file_path: "/tmp/test.txt" }, "/tmp");
-    expect(loggerWarnCalls.some((m) => m.includes("deprecated"))).toBe(true);
-    expect(loggerWarnCalls.some((m) => m.includes("legacy"))).toBe(true);
-  });
-  test("deprecation warning fires only once per process", async () => {
-    await check("file_read", { file_path: "/tmp/a.txt" }, "/tmp");
-    const firstCount = loggerWarnCalls.filter((m) =>
-      m.includes("deprecated"),
-    ).length;
-    expect(firstCount).toBe(1);
-    await check("file_read", { file_path: "/tmp/b.txt" }, "/tmp");
-    const secondCount = loggerWarnCalls.filter((m) =>
-      m.includes("deprecated"),
-    ).length;
-    expect(secondCount).toBe(1);
-  });
-  test("no deprecation warning in workspace mode", async () => {
-    testConfig.permissions = { mode: "workspace" };
-    await check("file_read", { file_path: "/tmp/test.txt" }, "/tmp");
-    expect(loggerWarnCalls.some((m) => m.includes("deprecated"))).toBe(false);
-  });
-  test("no deprecation warning in strict mode", async () => {
-    testConfig.permissions = { mode: "strict" };
-    await check("file_read", { file_path: "/tmp/test.txt" }, "/tmp");
-    expect(loggerWarnCalls.some((m) => m.includes("deprecated"))).toBe(false);
-  });
-  test("legacy mode still produces correct decisions (low risk auto-allowed)", async () => {
-    const result = await check(
-      "file_read",
-      { file_path: "/tmp/test.txt" },
-      "/tmp",
-    );
-    expect(result.decision).toBe("allow");
-    expect(result.reason).toContain("Low risk");
-  });
-  test("legacy mode still prompts for medium risk", async () => {
-    const result = await check(
-      "file_write",
-      { file_path: "/tmp/test.txt" },
-      "/tmp",
-    );
-    expect(result.decision).toBe("prompt");
-    expect(result.reason).toContain("risk");
-  });
-});
 describe("shell command candidates wiring (PR 04)", () => {
   test("existing raw shell rule still matches", async () => {
     clearCache();
@@ -4896,7 +4835,7 @@ describe("integration regressions (PR 11)", () => {
       /* may not exist */
     }
     clearCache();
-    testConfig.permissions = { mode: "legacy" };
+    testConfig.permissions = { mode: "workspace" };
     testConfig.sandbox = { enabled: true };
   });