npm - @vellumai/assistant - Versions diffs - 0.7.2 → 0.8.0 - Mend

@vellumai/assistant 0.7.2 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (424) hide show

package/ARCHITECTURE.md +45 -29
package/Dockerfile +1 -0
package/__tests__/permissions/gateway-threshold-reader.test.ts +236 -9
package/bun.lock +3 -0
package/docs/architecture/memory.md +5 -2
package/knip.json +1 -0
package/node_modules/@vellumai/gateway-client/src/ipc-client.ts +13 -4
package/node_modules/@vellumai/ipc-server-utils/bun.lock +24 -0
package/node_modules/@vellumai/ipc-server-utils/package.json +18 -0
package/node_modules/@vellumai/ipc-server-utils/src/index.ts +6 -0
package/node_modules/@vellumai/ipc-server-utils/src/socket-watchdog.test.ts +430 -0
package/node_modules/@vellumai/ipc-server-utils/src/socket-watchdog.ts +221 -0
package/node_modules/@vellumai/ipc-server-utils/tsconfig.json +20 -0
package/node_modules/@vellumai/skill-host-contracts/src/assistant-event.ts +0 -9
package/node_modules/@vellumai/slack-text/src/index.test.ts +18 -35
package/node_modules/@vellumai/slack-text/src/index.ts +2 -48
package/openapi.yaml +470 -25
package/package.json +3 -1
package/src/__tests__/annotate-risk-options.test.ts +291 -0
package/src/__tests__/app-control-flow.test.ts +21 -11
package/src/__tests__/approval-cascade.test.ts +8 -16
package/src/__tests__/approval-routes-http.test.ts +6 -0
package/src/__tests__/assistant-event-hub.test.ts +48 -0
package/src/__tests__/assistant-event.test.ts +0 -10
package/src/__tests__/assistant-events-sse-hardening.test.ts +2 -7
package/src/__tests__/assistant-feature-flags-integration.test.ts +18 -0
package/src/__tests__/auto-analysis-end-to-end.test.ts +48 -0
package/src/__tests__/background-workers-disk-pressure.test.ts +268 -0
package/src/__tests__/call-constants.test.ts +10 -1
package/src/__tests__/call-controller.test.ts +127 -0
package/src/__tests__/call-conversation-messages.test.ts +8 -2
package/src/__tests__/channel-inbound-disk-pressure.test.ts +537 -0
package/src/__tests__/channel-readiness-service.test.ts +4 -2
package/src/__tests__/cli-memory-v2-reembed-skills.test.ts +58 -28
package/src/__tests__/config-loader-backfill.test.ts +379 -0
package/src/__tests__/config-loader-platform-defaults.test.ts +284 -1
package/src/__tests__/config-schema.test.ts +1 -0
package/src/__tests__/config-watcher-cleanup-throttle.test.ts +18 -9
package/src/__tests__/config-watcher.test.ts +140 -69
package/src/__tests__/context-search-agent-runner.test.ts +61 -3
package/src/__tests__/context-search-conversations-source.test.ts +0 -24
package/src/__tests__/context-search-fanout.test.ts +0 -1
package/src/__tests__/context-search-memory-source.test.ts +6 -33
package/src/__tests__/context-search-memory-v2-source.test.ts +0 -2
package/src/__tests__/context-search-pkb-source.test.ts +12 -7
package/src/__tests__/context-search-workspace-source.test.ts +0 -1
package/src/__tests__/conversation-abort-tool-results.test.ts +1 -0
package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +223 -0
package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
package/src/__tests__/conversation-agent-loop-overflow.test.ts +1 -1
package/src/__tests__/conversation-agent-loop.test.ts +457 -8
package/src/__tests__/conversation-confirmation-signals.test.ts +5 -13
package/src/__tests__/conversation-error.test.ts +150 -3
package/src/__tests__/conversation-init.benchmark.test.ts +1 -1
package/src/__tests__/conversation-process-callsite.test.ts +38 -0
package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
package/src/__tests__/conversation-runtime-assembly.test.ts +74 -0
package/src/__tests__/conversation-slash-unknown.test.ts +1 -0
package/src/__tests__/conversation-speed-override.test.ts +0 -3
package/src/__tests__/conversation-store.test.ts +0 -18
package/src/__tests__/conversation-surfaces-action-delivery.test.ts +170 -9
package/src/__tests__/conversation-surfaces-app-control.test.ts +15 -4
package/src/__tests__/conversation-surfaces-data-persist.test.ts +476 -0
package/src/__tests__/conversation-tool-setup-app-refresh.test.ts +61 -5
package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
package/src/__tests__/credentials-cli.test.ts +7 -0
package/src/__tests__/cu-unified-flow.test.ts +176 -10
package/src/__tests__/date-context.test.ts +164 -2
package/src/__tests__/disk-pressure-guard.test.ts +262 -0
package/src/__tests__/disk-pressure-lifecycle.test.ts +168 -0
package/src/__tests__/disk-pressure-policy.test.ts +241 -0
package/src/__tests__/disk-pressure-routes.test.ts +379 -0
package/src/__tests__/disk-pressure-tools.test.ts +277 -0
package/src/__tests__/disk-usage.test.ts +150 -0
package/src/__tests__/events-client-registration.test.ts +52 -0
package/src/__tests__/events-dev-bypass-actor.test.ts +162 -0
package/src/__tests__/file-write-tool.test.ts +4 -10
package/src/__tests__/filing-service.test.ts +2 -20
package/src/__tests__/handlers-skills-memory-v2-reseed.test.ts +10 -26
package/src/__tests__/heartbeat-disk-pressure.test.ts +183 -0
package/src/__tests__/heartbeat-service.test.ts +260 -11
package/src/__tests__/host-app-control-proxy.test.ts +195 -25
package/src/__tests__/host-bash-proxy.test.ts +227 -34
package/src/__tests__/host-bash-routes.test.ts +178 -13
package/src/__tests__/host-cu-proxy.test.ts +210 -3
package/src/__tests__/host-cu-routes-targeted.test.ts +141 -12
package/src/__tests__/host-file-proxy-targeted.test.ts +48 -9
package/src/__tests__/host-file-proxy.test.ts +268 -6
package/src/__tests__/host-file-routes-targeted.test.ts +175 -17
package/src/__tests__/host-transfer-proxy-targeted.test.ts +408 -59
package/src/__tests__/host-transfer-routes-targeted.test.ts +232 -17
package/src/__tests__/http-user-message-parity.test.ts +107 -1
package/src/__tests__/injector-chain.test.ts +36 -16
package/src/__tests__/injector-disk-pressure.test.ts +224 -0
package/src/__tests__/injector-pkb-v2-silenced.test.ts +10 -7
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +154 -67
package/src/__tests__/managed-profile-guard.test.ts +18 -0
package/src/__tests__/mcp-abort-signal.test.ts +130 -0
package/src/__tests__/memory-admin-recall.test.ts +3 -11
package/src/__tests__/memory-retrieval-pipeline.test.ts +22 -1
package/src/__tests__/normalize-onboarding.test.ts +180 -0
package/src/__tests__/notification-decision-fallback.test.ts +91 -0
package/src/__tests__/notification-decision-strategy.test.ts +22 -0
package/src/__tests__/oauth-cli.test.ts +121 -0
package/src/__tests__/oauth-connect-routes.test.ts +316 -0
package/src/__tests__/oauth-provider-seed-logos.test.ts +24 -2
package/src/__tests__/onboarding-persona-write.test.ts +308 -0
package/src/__tests__/openai-provider.test.ts +45 -8
package/src/__tests__/persist-onboarding-artifacts.test.ts +44 -64
package/src/__tests__/platform-callback-registration.test.ts +21 -4
package/src/__tests__/platform.test.ts +2 -1
package/src/__tests__/playbook-execution.test.ts +0 -43
package/src/__tests__/plugin-tool-contribution.test.ts +47 -0
package/src/__tests__/prechat-onboarding-contract.test.ts +214 -27
package/src/__tests__/provider-tool-name.test.ts +23 -0
package/src/__tests__/relay-server.test.ts +60 -5
package/src/__tests__/runtime-events-sse.test.ts +4 -8
package/src/__tests__/scheduler-disk-pressure.test.ts +148 -0
package/src/__tests__/secret-ingress-http.test.ts +0 -1
package/src/__tests__/secret-prompt-log-hygiene.test.ts +7 -5
package/src/__tests__/secret-prompter-channel-fallback.test.ts +7 -5
package/src/__tests__/secret-response-routing.test.ts +7 -5
package/src/__tests__/server-history-render.test.ts +82 -0
package/src/__tests__/skill-include-graph.test.ts +31 -0
package/src/__tests__/skill-load-tool.test.ts +44 -16
package/src/__tests__/skills.test.ts +39 -0
package/src/__tests__/suggestion-routes.test.ts +46 -0
package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +0 -42
package/src/__tests__/tool-executor.test.ts +155 -0
package/src/__tests__/twilio-validation.test.ts +2 -2
package/src/__tests__/voice-session-bridge.test.ts +3 -0
package/src/__tests__/workspace-migration-065-bump-stale-heartbeat-interval.test.ts +122 -0
package/src/__tests__/workspace-migration-066-seed-heartbeat-callsite-cost-default.test.ts +285 -0
package/src/__tests__/workspace-migration-068-release-notes-local-timezone.test.ts +90 -0
package/src/__tests__/workspace-migration-069-seed-onboarding-threads.test.ts +120 -0
package/src/__tests__/workspace-migration-071-remove-safe-storage-release-note.test.ts +206 -0
package/src/__tests__/workspace-migration-safe-storage-limits-release.test.ts +78 -0
package/src/agent/loop.ts +11 -0
package/src/approvals/guardian-request-resolvers.ts +3 -32
package/src/backup/snapshot-lock.ts +2 -27
package/src/bundler/compiler-tools.ts +3 -2
package/src/calls/call-constants.ts +5 -8
package/src/calls/call-controller.ts +130 -67
package/src/calls/call-conversation-messages.ts +46 -10
package/src/calls/relay-server.ts +7 -1
package/src/calls/voice-session-bridge.ts +1 -1
package/src/cli/commands/__tests__/webhooks.test.ts +0 -4
package/src/cli/commands/bash.ts +35 -108
package/src/cli/commands/contacts.ts +64 -25
package/src/cli/commands/credentials.ts +56 -0
package/src/cli/commands/memory-v2.ts +11 -10
package/src/cli/commands/oauth/__tests__/connect.test.ts +401 -219
package/src/cli/commands/oauth/connect.ts +124 -40
package/src/cli/commands/platform/__tests__/callback-routes-list.test.ts +0 -3
package/src/cli/commands/platform/__tests__/connect.test.ts +7 -1
package/src/cli/commands/platform/__tests__/disconnect.test.ts +7 -1
package/src/cli/commands/platform/__tests__/status.test.ts +103 -6
package/src/cli/commands/platform/index.ts +16 -7
package/src/cli/commands/status.ts +57 -0
package/src/cli/program.ts +4 -2
package/src/config/assistant-feature-flags.ts +13 -3
package/src/config/bundled-skills/app-builder/SKILL.md +1 -3
package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +4 -3
package/src/config/bundled-skills/phone-calls/references/TROUBLESHOOTING.md +13 -7
package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +2 -2
package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +2 -2
package/src/config/env.ts +0 -8
package/src/config/feature-flag-registry.json +13 -5
package/src/config/loader.ts +199 -27
package/src/config/schemas/__tests__/memory-v2.test.ts +10 -5
package/src/config/schemas/call-site-catalog.ts +14 -0
package/src/config/schemas/channels.ts +0 -5
package/src/config/schemas/heartbeat.ts +1 -1
package/src/config/schemas/llm.ts +2 -0
package/src/config/schemas/memory-lifecycle.ts +13 -0
package/src/config/schemas/memory-v2.ts +76 -12
package/src/config/schemas/platform.ts +43 -3
package/src/config/schemas/services.ts +28 -0
package/src/config/seed-inference-profiles.ts +230 -33
package/src/contacts/contact-store.ts +0 -25
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +32 -0
package/src/daemon/__tests__/conversation-tool-setup.test.ts +86 -25
package/src/daemon/assistant-attachments.ts +4 -4
package/src/daemon/config-watcher.ts +85 -57
package/src/daemon/conversation-agent-loop-handlers.ts +38 -0
package/src/daemon/conversation-agent-loop.ts +183 -43
package/src/daemon/conversation-error.ts +87 -15
package/src/daemon/conversation-lifecycle.ts +22 -10
package/src/daemon/conversation-process.ts +8 -0
package/src/daemon/conversation-runtime-assembly.ts +26 -0
package/src/daemon/conversation-store.ts +2 -2
package/src/daemon/conversation-surfaces.ts +211 -29
package/src/daemon/conversation-tool-setup.ts +66 -19
package/src/daemon/conversation.ts +18 -23
package/src/daemon/date-context.ts +71 -22
package/src/daemon/disk-pressure-background-gate.ts +73 -0
package/src/daemon/disk-pressure-guard.ts +343 -0
package/src/daemon/disk-pressure-policy.ts +163 -0
package/src/daemon/handlers/shared.ts +26 -1
package/src/daemon/handlers/skills.ts +3 -4
package/src/daemon/host-app-control-proxy.ts +137 -41
package/src/daemon/host-bash-proxy.ts +47 -22
package/src/daemon/host-browser-proxy.ts +1 -1
package/src/daemon/host-cu-proxy.ts +50 -4
package/src/daemon/host-file-proxy.ts +44 -8
package/src/daemon/host-transfer-proxy.ts +97 -6
package/src/daemon/lifecycle.ts +167 -101
package/src/daemon/meet-host-supervisor.ts +4 -4
package/src/daemon/meet-manifest-loader.ts +0 -1
package/src/daemon/memory-v2-startup.ts +66 -15
package/src/daemon/message-protocol.ts +3 -0
package/src/daemon/message-types/conversations.ts +4 -0
package/src/daemon/message-types/disk-pressure.ts +9 -0
package/src/daemon/message-types/messages.ts +22 -1
package/src/daemon/profiler-run-store.ts +5 -5
package/src/daemon/tool-setup-types.ts +2 -2
package/src/documents/document-store.ts +119 -0
package/src/filing/filing-service.ts +29 -5
package/src/heartbeat/__tests__/heartbeat-feed-event.test.ts +9 -16
package/src/heartbeat/__tests__/heartbeat-run-store.test.ts +36 -0
package/src/heartbeat/heartbeat-run-store.ts +13 -0
package/src/heartbeat/heartbeat-service.ts +205 -31
package/src/home/feed-scheduler.ts +18 -0
package/src/inbound/platform-callback-registration.ts +8 -15
package/src/ipc/__tests__/clients-list-ipc.test.ts +169 -0
package/src/ipc/assistant-server.ts +149 -38
package/src/ipc/gateway-client.ts +37 -3
package/src/ipc/skill-server.ts +99 -42
package/src/live-voice/live-voice-archive.ts +4 -4
package/src/live-voice/protocol.ts +5 -7
package/src/media/image-service.ts +1 -7
package/src/memory/__tests__/fixtures/memory-v2-activation-fixtures.ts +21 -13
package/src/memory/__tests__/jobs-worker-v2-schedule.test.ts +34 -51
package/src/memory/__tests__/memory-v2-activation-log-store.test.ts +0 -6
package/src/memory/__tests__/memory-v2-concept-frequency.test.ts +272 -0
package/src/memory/admin.ts +5 -9
package/src/memory/context-search/agent-runner.ts +19 -2
package/src/memory/context-search/sources/conversations.ts +2 -11
package/src/memory/context-search/sources/memory-v2.ts +1 -16
package/src/memory/context-search/sources/memory.ts +2 -3
package/src/memory/context-search/sources/pkb.ts +2 -3
package/src/memory/context-search/types.ts +0 -1
package/src/memory/conversation-crud.ts +4 -12
package/src/memory/db-init.ts +2 -0
package/src/memory/embedding-runtime-manager.ts +119 -5
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +136 -82
package/src/memory/graph/__tests__/handle-remember-v2.test.ts +11 -26
package/src/memory/graph/conversation-graph-memory.ts +72 -61
package/src/memory/graph/extraction.ts +1 -3
package/src/memory/graph/graph-search.test.ts +11 -67
package/src/memory/graph/graph-search.ts +4 -24
package/src/memory/graph/retriever.test.ts +12 -1
package/src/memory/graph/retriever.ts +10 -15
package/src/memory/graph/tool-handlers.ts +3 -4
package/src/memory/graph/tools.ts +4 -4
package/src/memory/indexer.ts +53 -45
package/src/memory/job-handlers/backfill.ts +2 -11
package/src/memory/job-handlers/cleanup.ts +43 -0
package/src/memory/job-handlers/embedding.ts +6 -8
package/src/memory/job-handlers/summarization.ts +2 -7
package/src/memory/jobs/__tests__/embed-concept-page.test.ts +116 -0
package/src/memory/jobs/embed-concept-page.ts +223 -87
package/src/memory/jobs-store.ts +48 -0
package/src/memory/jobs-worker.ts +85 -43
package/src/memory/memory-v2-activation-log-store.ts +32 -14
package/src/memory/memory-v2-concept-frequency.ts +169 -0
package/src/memory/migrations/239-trace-events-created-at-index.ts +18 -0
package/src/memory/migrations/index.ts +1 -0
package/src/memory/pkb/pkb-search.test.ts +7 -0
package/src/memory/pkb/pkb-search.ts +4 -5
package/src/memory/qdrant-client.ts +3 -13
package/src/memory/rerank-local.ts +374 -0
package/src/memory/search/semantic.ts +10 -72
package/src/memory/trace-event-store.ts +1 -17
package/src/memory/v2/__tests__/activation.test.ts +346 -255
package/src/memory/v2/__tests__/consolidation-job.test.ts +61 -40
package/src/memory/v2/__tests__/injection.test.ts +297 -190
package/src/memory/v2/__tests__/prompts-consolidation.test.ts +61 -2
package/src/memory/v2/__tests__/qdrant.test.ts +326 -9
package/src/memory/v2/__tests__/reranker.test.ts +338 -0
package/src/memory/v2/__tests__/sim.test.ts +113 -196
package/src/memory/v2/__tests__/skill-store.test.ts +71 -65
package/src/memory/v2/__tests__/static-context.test.ts +77 -14
package/src/memory/v2/__tests__/sweep-job.test.ts +19 -33
package/src/memory/v2/activation.ts +149 -156
package/src/memory/v2/consolidation-job.ts +69 -20
package/src/memory/v2/injection.ts +75 -68
package/src/memory/v2/page-store.ts +39 -0
package/src/memory/v2/prompts/consolidation.ts +41 -1
package/src/memory/v2/qdrant.ts +306 -46
package/src/memory/v2/reranker.ts +177 -0
package/src/memory/v2/sim.ts +77 -110
package/src/memory/v2/skill-content.ts +4 -3
package/src/memory/v2/skill-store.ts +82 -59
package/src/memory/v2/static-context.ts +26 -8
package/src/memory/v2/sweep-job.ts +5 -6
package/src/memory/v2/types.ts +17 -10
package/src/notifications/copy-composer.ts +47 -0
package/src/notifications/decision-engine.ts +46 -0
package/src/notifications/signal.ts +4 -0
package/src/oauth/AGENTS.md +3 -1
package/src/oauth/__tests__/oauth-connect-state.test.ts +137 -0
package/src/oauth/connect-orchestrator.ts +2 -0
package/src/oauth/connection-resolver.test.ts +66 -1
package/src/oauth/connection-resolver.ts +55 -1
package/src/oauth/oauth-connect-state.ts +77 -0
package/src/oauth/seed-providers.ts +58 -1
package/src/permissions/gateway-threshold-reader.ts +116 -8
package/src/permissions/prompter.ts +86 -96
package/src/permissions/secret-prompter.ts +31 -31
package/src/plugins/defaults/injectors.ts +36 -4
package/src/plugins/defaults/memory-retrieval.ts +5 -6
package/src/plugins/types.ts +7 -0
package/src/proactive-artifact/aux-message-injector.ts +74 -0
package/src/proactive-artifact/decision.test.ts +226 -0
package/src/proactive-artifact/decision.ts +165 -0
package/src/proactive-artifact/index.ts +7 -0
package/src/proactive-artifact/job.test.ts +914 -0
package/src/proactive-artifact/job.ts +366 -0
package/src/proactive-artifact/message-copy.ts +58 -0
package/src/proactive-artifact/trigger-state.test.ts +277 -0
package/src/proactive-artifact/trigger-state.ts +119 -0
package/src/prompts/normalize-onboarding.ts +80 -0
package/src/prompts/persona-resolver.ts +101 -9
package/src/prompts/system-prompt.ts +21 -7
package/src/prompts/templates/BOOTSTRAP.md +13 -5
package/src/prompts/templates/SOUL.md +13 -28
package/src/providers/__tests__/retry-callsite.test.ts +222 -1
package/src/providers/model-intents.ts +7 -0
package/src/providers/openrouter/client.ts +8 -0
package/src/providers/retry.ts +50 -0
package/src/providers/types.ts +1 -0
package/src/runtime/__tests__/agent-wake.test.ts +456 -3
package/src/runtime/agent-wake.ts +238 -100
package/src/runtime/assistant-event-hub.ts +36 -6
package/src/runtime/assistant-event.ts +0 -1
package/src/runtime/auth/__tests__/route-policy.test.ts +64 -0
package/src/runtime/auth/route-policy.ts +15 -1
package/src/runtime/auth/same-actor.ts +216 -0
package/src/runtime/channel-approvals.ts +3 -2
package/src/runtime/channel-retry-sweep.ts +65 -1
package/src/runtime/local-actor-identity.ts +52 -11
package/src/runtime/pending-interactions.ts +27 -15
package/src/runtime/routes/__tests__/client-routes.test.ts +155 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +0 -5
package/src/runtime/routes/__tests__/heartbeat-routes.test.ts +1 -1
package/src/runtime/routes/__tests__/memory-v2-routes.test.ts +147 -0
package/src/runtime/routes/approval-routes.ts +7 -3
package/src/runtime/routes/client-routes.ts +20 -2
package/src/runtime/routes/consolidation-routes.ts +8 -9
package/src/runtime/routes/contact-routes.ts +0 -25
package/src/runtime/routes/conversation-query-routes.ts +44 -1
package/src/runtime/routes/conversation-routes.ts +35 -26
package/src/runtime/routes/debug-bash-routes.ts +165 -0
package/src/runtime/routes/disk-pressure-routes.ts +121 -0
package/src/runtime/routes/document-pdf-renderer.ts +6 -2
package/src/runtime/routes/documents-routes.ts +2 -75
package/src/runtime/routes/events-routes.ts +41 -9
package/src/runtime/routes/filing-routes.ts +2 -3
package/src/runtime/routes/host-bash-routes.ts +23 -3
package/src/runtime/routes/host-cu-routes.ts +33 -6
package/src/runtime/routes/host-file-routes.ts +32 -6
package/src/runtime/routes/host-transfer-routes.ts +79 -16
package/src/runtime/routes/identity-routes.ts +7 -138
package/src/runtime/routes/inbound-message-handler.ts +77 -12
package/src/runtime/routes/index.ts +6 -0
package/src/runtime/routes/memory-item-routes.test.ts +37 -17
package/src/runtime/routes/memory-item-routes.ts +5 -6
package/src/runtime/routes/memory-v2-routes.ts +136 -17
package/src/runtime/routes/oauth-connect-routes.ts +153 -0
package/src/runtime/verification-outbound-actions.ts +4 -4
package/src/schedule/run-script.ts +37 -5
package/src/schedule/scheduler.ts +20 -1
package/src/security/encrypted-store.ts +2 -0
package/src/security/secure-keys.ts +55 -0
package/src/skills/include-graph.ts +35 -13
package/src/skills/remote-skill-policy.ts +4 -10
package/src/subagent/index.ts +1 -7
package/src/subagent/manager.ts +1 -15
package/src/tasks/task-runner.ts +0 -1
package/src/tasks/task-store.ts +0 -3
package/src/tools/background-tool-registry.ts +17 -3
package/src/tools/document/document-tool.ts +20 -0
package/src/tools/executor.ts +18 -2
package/src/tools/host-filesystem/edit.test.ts +151 -0
package/src/tools/host-filesystem/edit.ts +43 -1
package/src/tools/host-filesystem/read.test.ts +129 -0
package/src/tools/host-filesystem/read.ts +43 -1
package/src/tools/host-filesystem/transfer.test.ts +127 -2
package/src/tools/host-filesystem/transfer.ts +56 -11
package/src/tools/host-filesystem/write.test.ts +134 -0
package/src/tools/host-filesystem/write.ts +43 -1
package/src/tools/host-terminal/host-shell.ts +13 -6
package/src/tools/mcp/mcp-tool-factory.ts +2 -1
package/src/tools/memory/register.test.ts +14 -9
package/src/tools/memory/register.ts +1 -2
package/src/tools/permission-checker.ts +15 -0
package/src/tools/provider-tool-name.ts +28 -0
package/src/tools/registry.ts +30 -9
package/src/tools/skills/load.ts +24 -20
package/src/tools/terminal/shell.ts +9 -1
package/src/tools/tool-approval-handler.ts +31 -6
package/src/tools/tool-name-aliases.ts +19 -0
package/src/tools/types.ts +43 -3
package/src/tts/provider-catalog.ts +3 -5
package/src/util/disk-usage.ts +138 -0
package/src/util/platform.ts +21 -11
package/src/util/process-liveness.ts +26 -0
package/src/workspace/heartbeat-service.ts +19 -0
package/src/workspace/migrations/065-bump-stale-heartbeat-interval.ts +60 -0
package/src/workspace/migrations/066-seed-heartbeat-callsite-cost-default.ts +146 -0
package/src/workspace/migrations/067-release-notes-safe-storage-limits.ts +14 -0
package/src/workspace/migrations/068-release-notes-local-timezone.ts +65 -0
package/src/workspace/migrations/069-seed-onboarding-threads.ts +28 -0
package/src/workspace/migrations/070-memory-v2-summary-schema-rebuild.ts +31 -0
package/src/workspace/migrations/071-remove-safe-storage-release-note.ts +111 -0
package/src/workspace/migrations/registry.ts +14 -0
package/src/__tests__/conversation-tool-setup-memory-scope.test.ts +0 -167
package/src/memory/v2/__tests__/skill-qdrant.test.ts +0 -657
package/src/memory/v2/skill-qdrant.ts +0 -404
package/src/signals/bash.ts +0 -198

package/src/memory/v2/__tests__/sim.test.ts CHANGED Viewed

@@ -70,16 +70,6 @@ const state = {
       points: Array<{ score?: number; payload: Record<string, unknown> }>;
     }>,
   },
-  // Separate response queue for the dedicated skills collection so a test
-  // querying both concept pages and skills doesn't have to interleave.
-  skillQueryResponses: {
-    dense: [] as Array<{
-      points: Array<{ score?: number; payload: Record<string, unknown> }>;
-    }>,
-    sparse: [] as Array<{
-      points: Array<{ score?: number; payload: Record<string, unknown> }>;
-    }>,
-  },
   queryCalls: [] as Array<{
     collection: string;
     using: string;
@@ -146,12 +136,12 @@ class MockQdrantClient {
       limit: params.limit,
       filter: params.filter,
     });
-    const channel = params.using as "dense" | "sparse";
-    const queue =
-      name === "memory_v2_skills"
-        ? state.skillQueryResponses[channel]
-        : state.queryResponses[channel];
-    return queue.shift() ?? { points: [] };
+    // Both `dense` and `summary_dense` consume from the dense queue (and
+    // similarly for sparse). The four-channel hybrid query fires them in
+    // order: body-dense, body-sparse, summary-dense, summary-sparse — so
+    // the queue order matches the call order.
+    const channel = params.using.endsWith("sparse") ? "sparse" : "dense";
+    return state.queryResponses[channel].shift() ?? { points: [] };
   }
 }
@@ -159,10 +149,7 @@ mock.module("@qdrant/js-client-rest", () => ({
   QdrantClient: MockQdrantClient,
 }));
-const { simBatch, simSkillBatch, clamp01, effectiveWeights } =
-  await import("../sim.js");
-const { _resetMemoryV2SkillQdrantForTests } =
-  await import("../skill-qdrant.js");
+const { simBatch, clamp01, effectiveWeights } = await import("../sim.js");
 const { _resetMemoryV2QdrantForTests } = await import("../qdrant.js");
 // ---------------------------------------------------------------------------
@@ -175,15 +162,12 @@ function resetState(): void {
   state.embedReturn = [[0.1, 0.2, 0.3]];
   state.queryResponses.dense.length = 0;
   state.queryResponses.sparse.length = 0;
-  state.skillQueryResponses.dense.length = 0;
-  state.skillQueryResponses.sparse.length = 0;
   state.queryCalls.length = 0;
   // Bun's `mock.module` persists across files in the same process, so the
-  // qdrant modules' singletons may already hold a MockQdrantClient instance
-  // from a sibling test file. Reset both readiness caches so each test in
-  // this file gets a fresh `new QdrantClient()` resolved against our mock.
+  // qdrant module's singleton may already hold a MockQdrantClient instance
+  // from a sibling test file. Reset readiness so each test in this file
+  // gets a fresh `new QdrantClient()` resolved against our mock.
   _resetMemoryV2QdrantForTests();
-  _resetMemoryV2SkillQdrantForTests();
 }
 function configWithWeights(
@@ -205,10 +189,18 @@ function configWithWeights(
 /**
  * Stage a single Qdrant response that maps each (slug, denseScore?, sparseScore?)
  * tuple onto the dense or sparse channel, mirroring how `hybridQueryConceptPages`
- * merges per-channel hits.
+ * merges per-channel hits. Optional `summaryDenseScore` / `summarySparseScore`
+ * stage the summary-side channels — pages without those entries fall through
+ * to body-only scoring at fusion time.
  */
 function stageHybridResponse(
-  hits: Array<{ slug: string; denseScore?: number; sparseScore?: number }>,
+  hits: Array<{
+    slug: string;
+    denseScore?: number;
+    sparseScore?: number;
+    summaryDenseScore?: number;
+    summarySparseScore?: number;
+  }>,
 ): void {
   state.queryResponses.dense.push({
     points: hits
@@ -220,6 +212,20 @@ function stageHybridResponse(
       .filter((h) => h.sparseScore !== undefined)
       .map((h) => ({ score: h.sparseScore, payload: { slug: h.slug } })),
   });
+  // The four-channel hybrid query also fires `summary_dense` and
+  // `summary_sparse` queries against the same collection. Tests that don't
+  // care about summary scores leave those channels empty so the fallback
+  // (body-only) path runs.
+  state.queryResponses.dense.push({
+    points: hits
+      .filter((h) => h.summaryDenseScore !== undefined)
+      .map((h) => ({ score: h.summaryDenseScore, payload: { slug: h.slug } })),
+  });
+  state.queryResponses.sparse.push({
+    points: hits
+      .filter((h) => h.summarySparseScore !== undefined)
+      .map((h) => ({ score: h.summarySparseScore, payload: { slug: h.slug } })),
+  });
 }
 beforeEach(resetState);
@@ -488,15 +494,16 @@ describe("simBatch", () => {
     expect(out.get("loud-page")).toBe(1);
   });
-  test("forwards the candidate slugs as a Qdrant slug-IN filter", async () => {
+  test("forwards the candidate slugs as a Qdrant slug-IN filter on every channel", async () => {
     const config = configWithWeights(0.7, 0.3);
     stageHybridResponse([]);
     await simBatch("query", ["alice", "bob", "carol"], config);
-    // Both channels (dense + sparse) ran with the same slug-restriction
-    // filter and the same per-channel limit equal to the candidate count.
-    expect(state.queryCalls).toHaveLength(2);
+    // All four channels (body dense + sparse, summary dense + sparse) ran
+    // with the same slug-restriction filter and the same per-channel limit
+    // equal to the candidate count.
+    expect(state.queryCalls).toHaveLength(4);
     for (const call of state.queryCalls) {
       expect(call.limit).toBe(3);
       expect(call.filter).toEqual({
@@ -516,194 +523,104 @@ describe("simBatch", () => {
     expect(state.sparseCalls).toEqual(["hello world"]);
   });
-  test("returned scores are always in [0, 1] for arbitrary inputs", async () => {
-    const config = configWithWeights(0.7, 0.3);
+  test("takes max(body, summary) per slug — summary higher than body wins", async () => {
+    // Body channels return a modest score; summary channels return a much
+    // higher score. The max collapses to the summary score.
+    const config = configWithWeights(1.0, 0.0);
     stageHybridResponse([
-      { slug: "a", denseScore: 0.99, sparseScore: 100 },
-      { slug: "b", denseScore: 0.5, sparseScore: 50 },
-      { slug: "c", denseScore: 0.0, sparseScore: 1 },
-      { slug: "d", denseScore: 0.123, sparseScore: 0 }, // explicit zero
+      {
+        slug: "alice",
+        denseScore: 0.3,
+        summaryDenseScore: 0.7,
+      },
     ]);
-    const out = await simBatch("query", ["a", "b", "c", "d"], config);
-    for (const [, score] of out) {
-      expect(score).toBeGreaterThanOrEqual(0);
-      expect(score).toBeLessThanOrEqual(1);
-    }
-  });
-});
-// ---------------------------------------------------------------------------
-// simSkillBatch
-// ---------------------------------------------------------------------------
+    const out = await simBatch("query", ["alice"], config);
-/**
- * Stage a single hybrid response on the dedicated skills queues. Mirrors
- * `stageHybridResponse` but uses `payload.id` (skills' Qdrant payload key)
- * instead of `payload.slug`.
- */
-function stageSkillHybridResponse(
-  hits: Array<{ id: string; denseScore?: number; sparseScore?: number }>,
-): void {
-  state.skillQueryResponses.dense.push({
-    points: hits
-      .filter((h) => h.denseScore !== undefined)
-      .map((h) => ({ score: h.denseScore, payload: { id: h.id } })),
+    expect(out.get("alice")).toBeCloseTo(0.7, 6);
   });
-  state.skillQueryResponses.sparse.push({
-    points: hits
-      .filter((h) => h.sparseScore !== undefined)
-      .map((h) => ({ score: h.sparseScore, payload: { id: h.id } })),
-  });
-}
-describe("simSkillBatch", () => {
-  test("empty id list returns empty map without touching backends", async () => {
-    const config = configWithWeights(0.7, 0.3);
-    const out = await simSkillBatch("anything", [], config);
-    expect(out.size).toBe(0);
-    expect(state.embedCalls).toHaveLength(0);
-    expect(state.sparseCalls).toHaveLength(0);
-    expect(state.queryCalls).toHaveLength(0);
-  });
-  test("empty text returns empty map without touching backends", async () => {
-    const config = configWithWeights(0.7, 0.3);
-    for (const text of ["", "   ", "\n\n"]) {
-      state.embedCalls.length = 0;
-      state.sparseCalls.length = 0;
-      state.queryCalls.length = 0;
-      const out = await simSkillBatch(text, ["example-skill-a"], config);
-      expect(out.size).toBe(0);
-      expect(state.embedCalls).toHaveLength(0);
-      expect(state.sparseCalls).toHaveLength(0);
-      expect(state.queryCalls).toHaveLength(0);
-    }
-  });
-  test("queries the dedicated skills collection and forwards an id-IN filter", async () => {
-    const config = configWithWeights(0.7, 0.3);
-    stageSkillHybridResponse([]);
+  test("takes max(body, summary) per slug — body higher than summary wins", async () => {
+    // Inverse case: body dominates, max stays at body.
+    const config = configWithWeights(1.0, 0.0);
+    stageHybridResponse([
+      {
+        slug: "alice",
+        denseScore: 0.9,
+        summaryDenseScore: 0.4,
+      },
+    ]);
-    await simSkillBatch(
-      "query",
-      ["example-skill-a", "example-skill-b"],
-      config,
-    );
+    const out = await simBatch("query", ["alice"], config);
-    expect(state.queryCalls).toHaveLength(2);
-    for (const call of state.queryCalls) {
-      expect(call.collection).toBe("memory_v2_skills");
-      // The candidate ids are forwarded as a Qdrant filter so Qdrant scores
-      // exactly the candidate set, not its global top-K. Without this,
-      // candidate ids absent from the global top-K silently score 0.
-      expect(call.filter).toEqual({
-        must: [
-          { key: "id", match: { any: ["example-skill-a", "example-skill-b"] } },
-        ],
-      });
-      // Limit equals the candidate count.
-      expect(call.limit).toBe(2);
-    }
+    expect(out.get("alice")).toBeCloseTo(0.9, 6);
   });
-  test("fuses dense + sparse with the configured weight blend", async () => {
-    const config = configWithWeights(0.4, 0.6);
-    stageSkillHybridResponse([
-      { id: "example-skill-a", denseScore: 0.5, sparseScore: 4 }, // sparse-norm 1.0
-      { id: "example-skill-b", denseScore: 0.25, sparseScore: 2 }, // sparse-norm 0.5
+  test("falls back to body-only when the page has no summary embedding", async () => {
+    // Pages predating the summary field have no summary_dense/sparse vectors.
+    // Their summary channels return no hits — the max collapses to body.
+    const config = configWithWeights(1.0, 0.0);
+    stageHybridResponse([
+      {
+        slug: "legacy-page",
+        denseScore: 0.6,
+        // summaryDenseScore / summarySparseScore omitted
+      },
     ]);
-    const out = await simSkillBatch(
-      "query",
-      ["example-skill-a", "example-skill-b"],
-      config,
-    );
+    const out = await simBatch("query", ["legacy-page"], config);
-    // example-skill-a: 0.4 * 0.5 + 0.6 * 1.0 = 0.8
-    // example-skill-b: 0.4 * 0.25 + 0.6 * 0.5 = 0.4
-    expect(out.get("example-skill-a")).toBeCloseTo(0.8, 6);
-    expect(out.get("example-skill-b")).toBeCloseTo(0.4, 6);
+    expect(out.get("legacy-page")).toBeCloseTo(0.6, 6);
   });
-  test("dense-only and sparse-only hits are handled symmetrically", async () => {
-    const config = configWithWeights(0.7, 0.3);
-    stageSkillHybridResponse([
-      { id: "example-skill-a", denseScore: 0.5 /* sparse omitted */ },
-      { id: "example-skill-b", sparseScore: 8 /* dense omitted */ },
+  test("normalizes body and summary sparse channels independently", async () => {
+    // Summary sparse scores live on a different scale than body sparse —
+    // a small absolute summary-sparse value (1.5) on the only page that
+    // has summary signal still normalizes to 1.0 within the summary
+    // channel, so the summary-only fused score should win out.
+    const config = configWithWeights(0.0, 1.0);
+    stageHybridResponse([
+      {
+        slug: "alice",
+        denseScore: 0.0,
+        sparseScore: 100, // body sparse max in this batch
+      },
+      {
+        slug: "bob",
+        denseScore: 0.0,
+        sparseScore: 0.5, // body sparse normalized = 0.005
+        summaryDenseScore: 0.0,
+        summarySparseScore: 1.5, // summary sparse max in this batch
+      },
     ]);
-    const out = await simSkillBatch(
-      "query",
-      ["example-skill-a", "example-skill-b"],
-      config,
-    );
+    const out = await simBatch("query", ["alice", "bob"], config);
-    // example-skill-a: 0.7 * 0.5 + 0.3 * 0   = 0.35
-    // example-skill-b: 0.7 * 0   + 0.3 * 1.0 = 0.30 (sparse-norm = 8/8)
-    expect(out.get("example-skill-a")).toBeCloseTo(0.35, 6);
-    expect(out.get("example-skill-b")).toBeCloseTo(0.3, 6);
+    // Alice has only body. Body sparse normalized to 1.0; sparse_weight=1.0 → 1.0.
+    expect(out.get("alice")).toBeCloseTo(1.0, 6);
+    // Bob's summary side normalizes its 1.5 (only sparse-bearing summary
+    // hit) — a single sparse-bearing hit is below the adaptive-spread
+    // floor, so the channel collapses to base weights and the lone
+    // sparseNormalized=1.0 hit yields a fused summary score of 1.0.
+    // Body side has only bob's tiny sparse=0.5 against the body batch max
+    // of 100 → ~0.005. The max picks the summary side.
+    expect(out.get("bob")).toBeCloseTo(1.0, 6);
   });
-  test("forwards candidate ids as the Qdrant restriction; only candidates in result", async () => {
-    // The bug we're guarding against: when the skills collection has more
-    // skills than `ids.length`, calling `hybridQuerySkills` without a filter
-    // returns Qdrant's global top-K. Candidate ids absent from that top-K
-    // would silently score 0. The fix is to forward the candidate ids as a
-    // server-side restriction so Qdrant scores exactly the candidate set.
+  test("returned scores are always in [0, 1] for arbitrary inputs", async () => {
     const config = configWithWeights(0.7, 0.3);
-    stageSkillHybridResponse([
-      { id: "example-skill-a", denseScore: 0.5, sparseScore: 1 },
-      // `example-skill-c` would never be returned in production once the
-      // filter is applied; the post-filter in simSkillBatch defensively
-      // drops it even if a stale payload slips through.
-      { id: "example-skill-c", denseScore: 0.9, sparseScore: 1 },
+    stageHybridResponse([
+      { slug: "a", denseScore: 0.99, sparseScore: 100 },
+      { slug: "b", denseScore: 0.5, sparseScore: 50 },
+      { slug: "c", denseScore: 0.0, sparseScore: 1 },
+      { slug: "d", denseScore: 0.123, sparseScore: 0 }, // explicit zero
     ]);
-    const out = await simSkillBatch(
-      "query",
-      ["example-skill-a", "example-skill-b"],
-      config,
-    );
+    const out = await simBatch("query", ["a", "b", "c", "d"], config);
-    // The Qdrant filter was forwarded — both channels carry the id-IN
-    // restriction matching the caller's candidate set.
-    expect(state.queryCalls).toHaveLength(2);
-    for (const call of state.queryCalls) {
-      expect(call.filter).toEqual({
-        must: [
-          { key: "id", match: { any: ["example-skill-a", "example-skill-b"] } },
-        ],
-      });
+    for (const [, score] of out) {
+      expect(score).toBeGreaterThanOrEqual(0);
+      expect(score).toBeLessThanOrEqual(1);
     }
-    // Only candidate ids appear in the result map.
-    expect(out.has("example-skill-a")).toBe(true);
-    expect(out.has("example-skill-c")).toBe(false);
-  });
-  test("returned scores are clamped into [0, 1]", async () => {
-    const config = configWithWeights(0.8, 0.5); // intentionally sums to > 1
-    stageSkillHybridResponse([
-      { id: "example-skill-a", denseScore: 1.0, sparseScore: 1 },
-    ]);
-    const out = await simSkillBatch("query", ["example-skill-a"], config);
-    expect(out.get("example-skill-a")).toBe(1);
-  });
-  test("embeds the query text exactly once via dense + sparse backends", async () => {
-    const config = configWithWeights(0.7, 0.3);
-    stageSkillHybridResponse([]);
-    await simSkillBatch("hello skill", ["example-skill-a"], config);
-    expect(state.embedCalls).toHaveLength(1);
-    expect(state.embedCalls[0].inputs).toEqual(["hello skill"]);
-    expect(state.sparseCalls).toEqual(["hello skill"]);
   });
 });

package/src/memory/v2/__tests__/skill-store.test.ts CHANGED Viewed

@@ -1,12 +1,17 @@
 /**
  * Tests for `assistant/src/memory/v2/skill-store.ts`.
  *
- * Coverage matrix from PR 5 acceptance criteria:
+ * Coverage matrix:
  *   - `seedV2SkillEntries` enumerates the catalog and calls
- *     `upsertSkillEmbedding` for each enabled skill.
+ *     `upsertConceptPageEmbedding` with `slug: "skills/<id>"` for each
+ *     enabled skill in the unified `memory_v2_concept_pages` collection.
  *   - It skips skills whose declared feature flag is disabled.
- *   - It calls `pruneSkillsExcept` with the active id list.
- *   - It populates the `entries` cache so `getSkillCapability` returns each entry.
+ *   - It calls `pruneSlugsWithPrefixExcept("skills/", ...)` with the active
+ *     id list as suffixes, so stale skill slugs in the unified collection
+ *     get pruned without touching concept-page slugs.
+ *   - It populates the `entries` cache so `getSkillCapability` returns each
+ *     entry — accepting both bare ids (`"example-skill"`) and unified-collection
+ *     slugs (`"skills/example-skill"`).
  *   - It swallows errors from the embedding backend — the function resolves
  *     and the cache is unchanged from prior state.
  *
@@ -29,6 +34,18 @@ mock.module("../../../util/logger.js", () => ({
 // Programmable test state — drives every mocked dependency below.
 // ---------------------------------------------------------------------------
+interface UpsertCall {
+  slug: string;
+  dense: number[];
+  sparse: { indices: number[]; values: number[] };
+  updatedAt: number;
+}
+interface PruneCall {
+  prefix: string;
+  activeSuffixes: readonly string[];
+}
 interface TestState {
   catalog: SkillSummary[];
   resolved: ResolvedSkill[];
@@ -38,14 +55,8 @@ interface TestState {
   embedThrows: Error | null;
   embedReturn: number[][];
   sparseReturn: { indices: number[]; values: number[] };
-  upsertCalls: Array<{
-    id: string;
-    content: string;
-    dense: number[];
-    sparse: { indices: number[]; values: number[] };
-    updatedAt: number;
-  }>;
-  pruneCalls: Array<readonly string[]>;
+  upsertCalls: UpsertCall[];
+  pruneCalls: PruneCall[];
   upsertThrows: Error | null;
 }
@@ -99,13 +110,16 @@ mock.module("../../embedding-backend.js", () => ({
   generateSparseEmbedding: () => state.sparseReturn,
 }));
-mock.module("../skill-qdrant.js", () => ({
-  upsertSkillEmbedding: async (params: TestState["upsertCalls"][number]) => {
+mock.module("../qdrant.js", () => ({
+  upsertConceptPageEmbedding: async (params: UpsertCall) => {
     if (state.upsertThrows) throw state.upsertThrows;
     state.upsertCalls.push(params);
   },
-  pruneSkillsExcept: async (ids: readonly string[]) => {
-    state.pruneCalls.push(ids);
+  pruneSlugsWithPrefixExcept: async (
+    prefix: string,
+    activeSuffixes: readonly string[],
+  ) => {
+    state.pruneCalls.push({ prefix, activeSuffixes });
   },
 }));
@@ -160,7 +174,7 @@ afterEach(resetState);
 // ---------------------------------------------------------------------------
 describe("seedV2SkillEntries", () => {
-  test("enumerates the catalog and upserts one point per enabled skill", async () => {
+  test("upserts each enabled skill into the unified collection under skills/<id>", async () => {
     const skillA = makeSummary({
       id: "example-skill-a",
       displayName: "Skill A",
@@ -182,15 +196,16 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.upsertCalls).toHaveLength(2);
-    const ids = state.upsertCalls.map((c) => c.id).sort();
-    expect(ids).toEqual(["example-skill-a", "example-skill-b"]);
-    // Each upsert carries the per-skill dense + sparse + content payload.
-    const callA = state.upsertCalls.find((c) => c.id === "example-skill-a")!;
+    const slugs = state.upsertCalls.map((c) => c.slug).sort();
+    expect(slugs).toEqual(["skills/example-skill-a", "skills/example-skill-b"]);
+    // Each upsert carries the per-skill dense + sparse + updatedAt payload,
+    // keyed under the unified `skills/<id>` slug.
+    const callA = state.upsertCalls.find(
+      (c) => c.slug === "skills/example-skill-a",
+    )!;
     expect(callA.dense).toEqual([0.1, 0.2, 0.3]);
     expect(callA.sparse).toEqual(state.sparseReturn);
-    expect(callA.content).toContain("Skill A");
-    expect(callA.content).toContain("(example-skill-a)");
     expect(callA.updatedAt).toBeGreaterThan(0);
   });
@@ -207,12 +222,11 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.upsertCalls).toHaveLength(1);
-    expect(state.upsertCalls[0].id).toBe("example-skill-a");
+    expect(state.upsertCalls[0].slug).toBe("skills/example-skill-a");
   });
   test("does not re-seed an installed-but-disabled skill from the remote catalog", async () => {
-    // Regression for https://github.com/vellum-ai/vellum-assistant/pull/28635
-    // (Codex P1): if `seenIds` is built only from enabled skills, a locally
+    // Regression: if `seenIds` is built only from enabled skills, a locally
     // installed-but-disabled skill falls through to the catalog loop and gets
     // embedded as if it were a discoverable uninstalled skill — contradicting
     // the user's explicit disablement.
@@ -223,8 +237,6 @@ describe("seedV2SkillEntries", () => {
       { summary: enabledSkill, state: "enabled" },
       { summary: disabledSkill, state: "disabled" },
     ];
-    // The remote catalog also contains the disabled skill (same id) — the
-    // seed function must NOT pull it back in via `getCatalog()`.
     state.fullCatalog = [
       {
         id: "example-skill-b",
@@ -237,7 +249,7 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.upsertCalls).toHaveLength(1);
-    expect(state.upsertCalls[0].id).toBe("example-skill-a");
+    expect(state.upsertCalls[0].slug).toBe("skills/example-skill-a");
   });
   test("seeds genuinely uninstalled catalog skills alongside enabled installed skills", async () => {
@@ -263,8 +275,11 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
-    const ids = state.upsertCalls.map((c) => c.id).sort();
-    expect(ids).toEqual(["example-skill-a", "uninstalled-skill"]);
+    const slugs = state.upsertCalls.map((c) => c.slug).sort();
+    expect(slugs).toEqual([
+      "skills/example-skill-a",
+      "skills/uninstalled-skill",
+    ]);
   });
   test("skips skills whose declared feature flag is disabled", async () => {
@@ -284,10 +299,10 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.upsertCalls).toHaveLength(1);
-    expect(state.upsertCalls[0].id).toBe("example-skill-b");
+    expect(state.upsertCalls[0].slug).toBe("skills/example-skill-b");
   });
-  test("calls pruneSkillsExcept with the active id list", async () => {
+  test("calls pruneSlugsWithPrefixExcept with the active id list and the skills/ prefix", async () => {
     const skillA = makeSummary({ id: "example-skill-a" });
     const skillB = makeSummary({ id: "example-skill-b" });
     state.catalog = [skillA, skillB];
@@ -309,13 +324,14 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.pruneCalls).toHaveLength(1);
-    expect([...state.pruneCalls[0]].sort()).toEqual([
+    expect(state.pruneCalls[0].prefix).toBe("skills/");
+    expect([...state.pruneCalls[0].activeSuffixes].sort()).toEqual([
       "example-skill-a",
       "example-skill-b",
     ]);
   });
-  test("passes only the active (post-flag-filter) ids to pruneSkillsExcept", async () => {
+  test("passes only the active (post-flag-filter) ids to pruneSlugsWithPrefixExcept", async () => {
     const flagged = makeSummary({
       id: "example-skill-a",
       featureFlag: "off-flag",
@@ -327,8 +343,6 @@ describe("seedV2SkillEntries", () => {
       { summary: unflagged, state: "enabled" },
     ];
     state.flagsEnabled = { "off-flag": false };
-    // Remote catalog must be non-empty so catalogAvailable is true and
-    // pruning is not skipped.
     state.fullCatalog = [
       { id: "example-skill-a", name: "example-skill-a", description: "A" },
       { id: "example-skill-b", name: "example-skill-b", description: "B" },
@@ -338,44 +352,35 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.pruneCalls).toHaveLength(1);
-    expect([...state.pruneCalls[0]]).toEqual(["example-skill-b"]);
+    expect(state.pruneCalls[0].prefix).toBe("skills/");
+    expect([...state.pruneCalls[0].activeSuffixes]).toEqual([
+      "example-skill-b",
+    ]);
   });
-  test("populates the entries cache so getSkillCapability returns each entry", async () => {
+  test("populates the entries cache so getSkillCapability resolves both bare id and unified slug", async () => {
     const skillA = makeSummary({
       id: "example-skill-a",
       displayName: "Skill A",
     });
-    const skillB = makeSummary({
-      id: "example-skill-b",
-      displayName: "Skill B",
-    });
-    state.catalog = [skillA, skillB];
-    state.resolved = [
-      { summary: skillA, state: "enabled" },
-      { summary: skillB, state: "enabled" },
-    ];
-    state.embedReturn = [
-      [0.1, 0.2, 0.3],
-      [0.4, 0.5, 0.6],
-    ];
+    state.catalog = [skillA];
+    state.resolved = [{ summary: skillA, state: "enabled" }];
+    state.embedReturn = [[0.1, 0.2, 0.3]];
     expect(getSkillCapability("example-skill-a")).toBeNull();
     await seedV2SkillEntries();
-    const entryA = getSkillCapability("example-skill-a");
-    const entryB = getSkillCapability("example-skill-b");
-    expect(entryA).not.toBeNull();
-    expect(entryA?.id).toBe("example-skill-a");
-    expect(entryA?.content).toContain("Skill A");
-    expect(entryB).not.toBeNull();
-    expect(entryB?.id).toBe("example-skill-b");
-    expect(entryB?.content).toContain("Skill B");
+    // Bare id and unified-slug forms both resolve to the same entry.
+    const byId = getSkillCapability("example-skill-a");
+    const bySlug = getSkillCapability("skills/example-skill-a");
+    expect(byId).not.toBeNull();
+    expect(byId?.id).toBe("example-skill-a");
+    expect(byId?.content).toContain("Skill A");
+    expect(bySlug).toEqual(byId);
-    // Unknown ids return null even when the cache is populated.
     expect(getSkillCapability("unknown-skill")).toBeNull();
+    expect(getSkillCapability("skills/unknown-skill")).toBeNull();
   });
   test("swallows errors from embedWithBackend and leaves prior cache intact", async () => {
@@ -426,9 +431,10 @@ describe("seedV2SkillEntries", () => {
     await seedV2SkillEntries();
     expect(state.upsertCalls).toHaveLength(1);
-    expect(state.upsertCalls[0].id).toBe("remote-only");
+    expect(state.upsertCalls[0].slug).toBe("skills/remote-only");
     expect(state.pruneCalls).toHaveLength(1);
-    expect([...state.pruneCalls[0]]).toEqual(["remote-only"]);
+    expect(state.pruneCalls[0].prefix).toBe("skills/");
+    expect([...state.pruneCalls[0].activeSuffixes]).toEqual(["remote-only"]);
   });
   test("skips pruning when catalog fetch returns empty (network failure guard)", async () => {