@vellumai/assistant 0.5.15 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (503) hide show
  1. package/ARCHITECTURE.md +3 -3
  2. package/Dockerfile +0 -3
  3. package/docs/architecture/integrations.md +15 -14
  4. package/knip.json +4 -1
  5. package/openapi.yaml +670 -122
  6. package/package.json +1 -1
  7. package/src/__tests__/actor-token-service.test.ts +68 -0
  8. package/src/__tests__/agent-loop.test.ts +0 -32
  9. package/src/__tests__/always-loaded-tools-guard.test.ts +2 -2
  10. package/src/__tests__/anthropic-provider.test.ts +57 -3
  11. package/src/__tests__/app-compiler.test.ts +120 -0
  12. package/src/__tests__/assistant-feature-flags-integration.test.ts +5 -377
  13. package/src/__tests__/call-conversation-messages.test.ts +2 -6
  14. package/src/__tests__/call-domain.test.ts +2 -6
  15. package/src/__tests__/call-pointer-messages.test.ts +2 -14
  16. package/src/__tests__/call-recovery.test.ts +2 -6
  17. package/src/__tests__/call-routes-http.test.ts +2 -6
  18. package/src/__tests__/call-store.test.ts +2 -6
  19. package/src/__tests__/cancel-resolves-conversation-key.test.ts +2 -6
  20. package/src/__tests__/canonical-guardian-store.test.ts +2 -6
  21. package/src/__tests__/ces-rpc-credential-backend.test.ts +4 -1
  22. package/src/__tests__/channel-delivery-store.test.ts +2 -6
  23. package/src/__tests__/channel-retry-sweep.test.ts +2 -6
  24. package/src/__tests__/checker.test.ts +84 -3
  25. package/src/__tests__/clawhub.test.ts +54 -24
  26. package/src/__tests__/cli-command-risk-guard.test.ts +108 -6
  27. package/src/__tests__/cli-memory.test.ts +377 -0
  28. package/src/__tests__/computer-use-skill-manifest-regression.test.ts +12 -2
  29. package/src/__tests__/config-schema.test.ts +1 -3
  30. package/src/__tests__/config-set-platform-guard.test.ts +302 -0
  31. package/src/__tests__/config-watcher-feature-flags.test.ts +211 -0
  32. package/src/__tests__/confirmation-request-guardian-bridge.test.ts +2 -6
  33. package/src/__tests__/contacts-tools.test.ts +31 -0
  34. package/src/__tests__/context-overflow-reducer.test.ts +86 -0
  35. package/src/__tests__/context-token-estimator.test.ts +175 -10
  36. package/src/__tests__/conversation-agent-loop-overflow.test.ts +9 -0
  37. package/src/__tests__/conversation-agent-loop.test.ts +9 -0
  38. package/src/__tests__/conversation-attachments.test.ts +2 -6
  39. package/src/__tests__/conversation-attention-store.test.ts +2 -6
  40. package/src/__tests__/conversation-clear-safety.test.ts +2 -6
  41. package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +4 -10
  42. package/src/__tests__/conversation-disk-view-integration.test.ts +2 -6
  43. package/src/__tests__/conversation-disk-view.test.ts +2 -6
  44. package/src/__tests__/conversation-error.test.ts +33 -2
  45. package/src/__tests__/conversation-fork-crud.test.ts +2 -6
  46. package/src/__tests__/conversation-history-web-search.test.ts +5 -0
  47. package/src/__tests__/conversation-load-history-repair.test.ts +5 -1
  48. package/src/__tests__/conversation-media-retry.test.ts +91 -0
  49. package/src/__tests__/conversation-runtime-assembly.test.ts +7 -4
  50. package/src/__tests__/conversation-slash-commands.test.ts +2 -6
  51. package/src/__tests__/conversation-starter-routes.test.ts +20 -11
  52. package/src/__tests__/conversation-store.test.ts +2 -6
  53. package/src/__tests__/conversation-usage.test.ts +3 -6
  54. package/src/__tests__/conversation-wipe.test.ts +11 -408
  55. package/src/__tests__/credential-execution-feature-gates.test.ts +3 -3
  56. package/src/__tests__/credential-execution-shell-lockdown.test.ts +2 -2
  57. package/src/__tests__/credential-security-e2e.test.ts +6 -1
  58. package/src/__tests__/docker-signing-key-bootstrap.test.ts +7 -73
  59. package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +6 -7
  60. package/src/__tests__/followup-tools.test.ts +2 -6
  61. package/src/__tests__/graph-extraction-event-date.test.ts +186 -0
  62. package/src/__tests__/guardian-action-conversation-turn.test.ts +2 -6
  63. package/src/__tests__/guardian-action-followup-executor.test.ts +2 -6
  64. package/src/__tests__/guardian-action-followup-store.test.ts +2 -6
  65. package/src/__tests__/guardian-action-grant-mint-consume.test.ts +2 -6
  66. package/src/__tests__/guardian-action-late-reply.test.ts +2 -6
  67. package/src/__tests__/guardian-action-store.test.ts +2 -6
  68. package/src/__tests__/guardian-binding-drift-heal.test.ts +2 -6
  69. package/src/__tests__/guardian-decision-primitive-canonical.test.ts +8 -8
  70. package/src/__tests__/guardian-dispatch.test.ts +2 -6
  71. package/src/__tests__/guardian-grant-minting.test.ts +2 -14
  72. package/src/__tests__/guardian-principal-id-roundtrip.test.ts +2 -6
  73. package/src/__tests__/guardian-routing-invariants.test.ts +343 -6
  74. package/src/__tests__/guardian-routing-state.test.ts +2 -6
  75. package/src/__tests__/guardian-verification-voice-binding.test.ts +2 -6
  76. package/src/__tests__/heartbeat-service.test.ts +1 -3
  77. package/src/__tests__/inbound-invite-redemption.test.ts +2 -6
  78. package/src/__tests__/injection-block.test.ts +154 -0
  79. package/src/__tests__/install-meta.test.ts +506 -0
  80. package/src/__tests__/install-skill-routing.test.ts +292 -0
  81. package/src/__tests__/intent-routing.test.ts +6 -18
  82. package/src/__tests__/invite-redemption-service.test.ts +2 -6
  83. package/src/__tests__/invite-routes-http.test.ts +2 -6
  84. package/src/__tests__/jobs-store-qdrant-breaker.test.ts +2 -14
  85. package/src/__tests__/list-messages-attachments.test.ts +2 -6
  86. package/src/__tests__/llm-context-route-provider.test.ts +2 -6
  87. package/src/__tests__/llm-request-log-turn-query.test.ts +2 -6
  88. package/src/__tests__/llm-usage-store.test.ts +2 -6
  89. package/src/__tests__/log-export-workspace.test.ts +4 -34
  90. package/src/__tests__/managed-skill-lifecycle.test.ts +7 -37
  91. package/src/__tests__/managed-store.test.ts +40 -21
  92. package/src/__tests__/memory-jobs-worker-backoff.test.ts +2 -8
  93. package/src/__tests__/memory-recall-log-store.test.ts +2 -6
  94. package/src/__tests__/memory-upsert-concurrency.test.ts +4 -112
  95. package/src/__tests__/messaging-send-tool.test.ts +6 -6
  96. package/src/__tests__/migration-cross-version-compatibility.test.ts +1 -29
  97. package/src/__tests__/migration-export-http.test.ts +3 -34
  98. package/src/__tests__/migration-import-commit-http.test.ts +1 -29
  99. package/src/__tests__/migration-import-preflight-http.test.ts +3 -34
  100. package/src/__tests__/no-domain-routing-in-prompt-guard.test.ts +2 -1
  101. package/src/__tests__/non-member-access-request.test.ts +2 -6
  102. package/src/__tests__/notification-guardian-path.test.ts +2 -6
  103. package/src/__tests__/oauth-apps-routes.test.ts +120 -10
  104. package/src/__tests__/oauth-cli.test.ts +364 -2
  105. package/src/__tests__/oauth-connect-orchestrator.test.ts +709 -0
  106. package/src/__tests__/oauth-provider-serializer.test.ts +2 -1
  107. package/src/__tests__/oauth-provider-visibility.test.ts +149 -0
  108. package/src/__tests__/oauth-providers-routes.test.ts +5 -2
  109. package/src/__tests__/oauth-store.test.ts +0 -5
  110. package/src/__tests__/oauth2-gateway-transport.test.ts +18 -3
  111. package/src/__tests__/outlook-attachments.test.ts +301 -0
  112. package/src/__tests__/outlook-automation-tools.test.ts +425 -0
  113. package/src/__tests__/outlook-categories.test.ts +212 -0
  114. package/src/__tests__/outlook-client-automation.test.ts +246 -0
  115. package/src/__tests__/outlook-compose-tools.test.ts +325 -0
  116. package/src/__tests__/outlook-declutter-tools.test.ts +585 -0
  117. package/src/__tests__/outlook-email-watcher.test.ts +322 -0
  118. package/src/__tests__/outlook-follow-up.test.ts +196 -0
  119. package/src/__tests__/outlook-messaging-provider.test.ts +1071 -0
  120. package/src/__tests__/outlook-trash.test.ts +77 -0
  121. package/src/__tests__/outlook-unsubscribe.test.ts +250 -0
  122. package/src/__tests__/path-policy.test.ts +2 -17
  123. package/src/__tests__/permission-types.test.ts +0 -1
  124. package/src/__tests__/platform-callback-registration.test.ts +7 -11
  125. package/src/__tests__/playbook-execution.test.ts +76 -80
  126. package/src/__tests__/playbook-tools.test.ts +5 -7
  127. package/src/__tests__/provider-commit-message-generator.test.ts +0 -1
  128. package/src/__tests__/provider-error-scenarios.test.ts +21 -2
  129. package/src/__tests__/qdrant-manager.test.ts +68 -21
  130. package/src/__tests__/rebuild-index-graph-nodes.test.ts +273 -0
  131. package/src/__tests__/registry.test.ts +2 -2
  132. package/src/__tests__/require-fresh-approval.test.ts +64 -3
  133. package/src/__tests__/runtime-events-sse-parity.test.ts +2 -6
  134. package/src/__tests__/runtime-events-sse.test.ts +2 -6
  135. package/src/__tests__/sandbox-diagnostics.test.ts +20 -29
  136. package/src/__tests__/scaffold-managed-skill-tool.test.ts +2 -10
  137. package/src/__tests__/schedule-store.test.ts +2 -6
  138. package/src/__tests__/schedule-tools.test.ts +2 -6
  139. package/src/__tests__/scheduler-recurrence.test.ts +1 -5
  140. package/src/__tests__/scoped-approval-grants.test.ts +2 -6
  141. package/src/__tests__/scoped-grant-security-matrix.test.ts +2 -6
  142. package/src/__tests__/search-skills-unified.test.ts +421 -0
  143. package/src/__tests__/secret-allowlist.test.ts +20 -35
  144. package/src/__tests__/secret-onetime-send.test.ts +2 -0
  145. package/src/__tests__/send-endpoint-busy.test.ts +2 -6
  146. package/src/__tests__/sequence-store.test.ts +2 -6
  147. package/src/__tests__/server-history-render.test.ts +2 -6
  148. package/src/__tests__/shell-credential-ref.test.ts +0 -5
  149. package/src/__tests__/skill-feature-flags-integration.test.ts +38 -31
  150. package/src/__tests__/skill-feature-flags.test.ts +6 -6
  151. package/src/__tests__/skill-load-feature-flag.test.ts +13 -54
  152. package/src/__tests__/skill-load-inline-command.test.ts +3 -65
  153. package/src/__tests__/skill-load-inline-includes.test.ts +3 -65
  154. package/src/__tests__/skill-load-tool.test.ts +3 -67
  155. package/src/__tests__/skill-memory.test.ts +480 -195
  156. package/src/__tests__/skills-uninstall.test.ts +2 -2
  157. package/src/__tests__/skills.test.ts +23 -50
  158. package/src/__tests__/slack-channel-config.test.ts +2 -21
  159. package/src/__tests__/slack-inbound-verification.test.ts +2 -6
  160. package/src/__tests__/starter-bundle.test.ts +2 -8
  161. package/src/__tests__/stt-hints.test.ts +7 -2
  162. package/src/__tests__/system-prompt.test.ts +25 -45
  163. package/src/__tests__/task-compiler.test.ts +2 -27
  164. package/src/__tests__/task-management-tools.test.ts +2 -27
  165. package/src/__tests__/task-memory-cleanup.test.ts +173 -250
  166. package/src/__tests__/task-runner.test.ts +2 -27
  167. package/src/__tests__/task-scheduler.test.ts +2 -27
  168. package/src/__tests__/terminal-tools.test.ts +1 -17
  169. package/src/__tests__/test-preload.ts +3 -0
  170. package/src/__tests__/token-estimator-accuracy.benchmark.test.ts +0 -79
  171. package/src/__tests__/tool-approval-handler.test.ts +4 -27
  172. package/src/__tests__/tool-execution-abort-cleanup.test.ts +2 -11
  173. package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +1 -25
  174. package/src/__tests__/tool-executor-lifecycle-events.test.ts +0 -1
  175. package/src/__tests__/tool-executor.test.ts +0 -1
  176. package/src/__tests__/tool-grant-request-escalation.test.ts +4 -27
  177. package/src/__tests__/tool-preview-lifecycle.test.ts +0 -20
  178. package/src/__tests__/tool-side-effects-slack-dm.test.ts +276 -0
  179. package/src/__tests__/trust-store.test.ts +10 -42
  180. package/src/__tests__/trusted-contact-approval-notifier.test.ts +1 -30
  181. package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +3 -27
  182. package/src/__tests__/trusted-contact-lifecycle-notifications.test.ts +2 -28
  183. package/src/__tests__/trusted-contact-multichannel.test.ts +2 -28
  184. package/src/__tests__/trusted-contact-verification.test.ts +2 -28
  185. package/src/__tests__/turn-boundary-resolution.test.ts +2 -34
  186. package/src/__tests__/twilio-provider.test.ts +0 -16
  187. package/src/__tests__/twilio-routes-twiml.test.ts +7 -12
  188. package/src/__tests__/twilio-routes.test.ts +0 -24
  189. package/src/__tests__/update-bulletin.test.ts +17 -89
  190. package/src/__tests__/usage-cache-backfill-migration.test.ts +1 -26
  191. package/src/__tests__/usage-routes.test.ts +2 -27
  192. package/src/__tests__/user-reference.test.ts +1 -5
  193. package/src/__tests__/vbundle-pax-and-symlink.test.ts +4 -34
  194. package/src/__tests__/vellum-self-knowledge-inline-command.test.ts +2 -53
  195. package/src/__tests__/verification-control-plane-policy.test.ts +0 -2
  196. package/src/__tests__/voice-invite-redemption.test.ts +2 -27
  197. package/src/__tests__/voice-scoped-grant-consumer.test.ts +2 -30
  198. package/src/__tests__/voice-session-bridge.test.ts +2 -27
  199. package/src/__tests__/volume-security-guard.test.ts +2 -0
  200. package/src/__tests__/workspace-lifecycle.test.ts +29 -1
  201. package/src/__tests__/workspace-migration-009-backfill-conversation-disk-view.test.ts +4 -29
  202. package/src/__tests__/workspace-migration-012-rename-conversation-disk-view-dirs.test.ts +2 -2
  203. package/src/__tests__/workspace-migration-013-repair-conversation-disk-view.test.ts +4 -29
  204. package/src/__tests__/workspace-migration-026-backfill-install-meta.test.ts +558 -0
  205. package/src/__tests__/workspace-migration-down-functions.test.ts +0 -6
  206. package/src/__tests__/workspace-policy.test.ts +1 -1
  207. package/src/acp/client-handler.ts +1 -2
  208. package/src/agent/attachments.ts +7 -2
  209. package/src/agent/image-optimize.ts +165 -0
  210. package/src/agent/loop.ts +1 -15
  211. package/src/bundler/app-compiler.ts +179 -2
  212. package/src/bundler/package-resolver.ts +3 -5
  213. package/src/cli/__tests__/notifications.test.ts +1 -24
  214. package/src/cli/cli-memory.ts +179 -0
  215. package/src/cli/commands/avatar.ts +3 -3
  216. package/src/cli/commands/config.ts +26 -13
  217. package/src/cli/commands/doctor.ts +2 -2
  218. package/src/cli/commands/memory.ts +41 -55
  219. package/src/cli/commands/oauth/__tests__/connect.test.ts +2 -2
  220. package/src/cli/commands/oauth/__tests__/disconnect.test.ts +2 -2
  221. package/src/cli/commands/oauth/__tests__/mode.test.ts +8 -1
  222. package/src/cli/commands/oauth/__tests__/providers-update.test.ts +1 -1
  223. package/src/cli/commands/oauth/__tests__/status.test.ts +2 -2
  224. package/src/cli/commands/oauth/connect.ts +26 -6
  225. package/src/cli/commands/oauth/mode.ts +7 -0
  226. package/src/cli/commands/oauth/providers.ts +49 -42
  227. package/src/cli/commands/oauth/shared.ts +39 -3
  228. package/src/cli/commands/platform/__tests__/connect.test.ts +3 -49
  229. package/src/cli/commands/platform/__tests__/disconnect.test.ts +3 -49
  230. package/src/cli/commands/platform/__tests__/status.test.ts +5 -55
  231. package/src/cli/commands/platform/index.ts +16 -16
  232. package/src/cli/commands/skills.ts +88 -16
  233. package/src/cli/commands/trust.ts +2 -2
  234. package/src/cli/lib/daemon-credential-client.ts +2 -3
  235. package/src/config/bundled-skills/acp/TOOLS.json +1 -1
  236. package/src/config/bundled-skills/computer-use/TOOLS.json +7 -7
  237. package/src/config/bundled-skills/contacts/SKILL.md +0 -1
  238. package/src/config/bundled-skills/contacts/TOOLS.json +0 -8
  239. package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +0 -4
  240. package/src/config/bundled-skills/gmail/SKILL.md +2 -10
  241. package/src/config/bundled-skills/google-calendar/SKILL.md +1 -9
  242. package/src/config/bundled-skills/messaging/SKILL.md +26 -19
  243. package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +40 -33
  244. package/src/config/bundled-skills/outlook/SKILL.md +189 -0
  245. package/src/config/bundled-skills/outlook/TOOLS.json +530 -0
  246. package/src/config/bundled-skills/outlook/tools/outlook-attachments.ts +85 -0
  247. package/src/config/bundled-skills/outlook/tools/outlook-categories.ts +77 -0
  248. package/src/config/bundled-skills/outlook/tools/outlook-draft.ts +84 -0
  249. package/src/config/bundled-skills/outlook/tools/outlook-follow-up.ts +94 -0
  250. package/src/config/bundled-skills/outlook/tools/outlook-forward.ts +49 -0
  251. package/src/config/bundled-skills/outlook/tools/outlook-outreach-scan.ts +237 -0
  252. package/src/config/bundled-skills/outlook/tools/outlook-rules.ts +161 -0
  253. package/src/config/bundled-skills/outlook/tools/outlook-send-draft.ts +32 -0
  254. package/src/config/bundled-skills/outlook/tools/outlook-sender-digest.ts +272 -0
  255. package/src/config/bundled-skills/outlook/tools/outlook-trash.ts +29 -0
  256. package/src/config/bundled-skills/outlook/tools/outlook-unsubscribe.ts +129 -0
  257. package/src/config/bundled-skills/outlook/tools/outlook-vacation.ts +87 -0
  258. package/src/config/bundled-skills/outlook/tools/shared.ts +20 -0
  259. package/src/config/bundled-skills/outlook-calendar/SKILL.md +51 -0
  260. package/src/config/bundled-skills/outlook-calendar/TOOLS.json +221 -0
  261. package/src/config/bundled-skills/outlook-calendar/calendar-client.ts +252 -0
  262. package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-check-availability.ts +53 -0
  263. package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-create-event.ts +74 -0
  264. package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-get-event.ts +18 -0
  265. package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-list-events.ts +46 -0
  266. package/src/config/bundled-skills/outlook-calendar/tools/outlook-calendar-rsvp.ts +36 -0
  267. package/src/config/bundled-skills/outlook-calendar/tools/shared.ts +17 -0
  268. package/src/config/bundled-skills/outlook-calendar/types.ts +120 -0
  269. package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +47 -40
  270. package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +16 -29
  271. package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +16 -18
  272. package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +39 -47
  273. package/src/config/bundled-skills/settings/TOOLS.json +3 -3
  274. package/src/config/bundled-skills/slack/SKILL.md +1 -7
  275. package/src/config/bundled-tool-registry.ts +56 -4
  276. package/src/config/env-registry.ts +15 -8
  277. package/src/config/feature-flag-registry.json +29 -116
  278. package/src/config/loader.ts +4 -0
  279. package/src/config/schemas/platform.ts +8 -0
  280. package/src/config/schemas/security.ts +0 -6
  281. package/src/config/schemas/services.ts +8 -0
  282. package/src/config/schemas/timeouts.ts +1 -1
  283. package/src/config/skills.ts +18 -7
  284. package/src/context/token-estimator.ts +25 -18
  285. package/src/context/window-manager.ts +32 -9
  286. package/src/credential-execution/approval-bridge.ts +0 -1
  287. package/src/credential-execution/process-manager.ts +3 -1
  288. package/src/daemon/config-watcher.ts +51 -0
  289. package/src/daemon/context-overflow-reducer.ts +46 -2
  290. package/src/daemon/conversation-agent-loop-handlers.ts +123 -82
  291. package/src/daemon/conversation-agent-loop.ts +99 -63
  292. package/src/daemon/conversation-error.ts +31 -8
  293. package/src/daemon/conversation-lifecycle.ts +33 -0
  294. package/src/daemon/conversation-media-retry.ts +85 -7
  295. package/src/daemon/conversation-notifiers.ts +4 -1
  296. package/src/daemon/conversation-process.ts +1 -0
  297. package/src/daemon/conversation-runtime-assembly.ts +5 -0
  298. package/src/daemon/conversation-usage.ts +1 -0
  299. package/src/daemon/conversation.ts +41 -2
  300. package/src/daemon/daemon-control.ts +8 -2
  301. package/src/daemon/handlers/shared.ts +22 -12
  302. package/src/daemon/handlers/skills.ts +423 -201
  303. package/src/daemon/lifecycle.ts +52 -4
  304. package/src/daemon/main.ts +5 -1
  305. package/src/daemon/message-types/conversations.ts +5 -1
  306. package/src/daemon/message-types/messages.ts +3 -1
  307. package/src/daemon/message-types/skills.ts +97 -36
  308. package/src/daemon/providers-setup.ts +7 -0
  309. package/src/daemon/server.ts +35 -22
  310. package/src/daemon/tool-side-effects.ts +27 -5
  311. package/src/events/domain-events.ts +1 -2
  312. package/src/heartbeat/heartbeat-service.ts +1 -0
  313. package/src/hooks/cli.ts +2 -2
  314. package/src/hooks/runner.ts +15 -38
  315. package/src/inbound/platform-callback-registration.ts +14 -14
  316. package/src/memory/admin.ts +11 -45
  317. package/src/memory/conversation-bootstrap.ts +2 -0
  318. package/src/memory/conversation-crud.ts +242 -348
  319. package/src/memory/conversation-group-migration.ts +157 -0
  320. package/src/memory/conversation-queries.ts +4 -2
  321. package/src/memory/db-init.ts +39 -3
  322. package/src/memory/embed.ts +73 -0
  323. package/src/memory/embedding-backend.ts +8 -14
  324. package/src/memory/embedding-runtime-manager.ts +12 -114
  325. package/src/memory/fingerprint.ts +2 -2
  326. package/src/memory/graph/bootstrap.ts +512 -0
  327. package/src/memory/graph/capability-seed.ts +297 -0
  328. package/src/memory/graph/consolidation.ts +691 -0
  329. package/src/memory/graph/conversation-graph-memory.ts +630 -0
  330. package/src/memory/graph/decay.test.ts +208 -0
  331. package/src/memory/graph/decay.ts +195 -0
  332. package/src/memory/graph/extraction-job.ts +69 -0
  333. package/src/memory/graph/extraction.test.ts +936 -0
  334. package/src/memory/graph/extraction.ts +1254 -0
  335. package/src/memory/graph/graph-search.ts +266 -0
  336. package/src/memory/graph/image-ref-utils.ts +29 -0
  337. package/src/memory/graph/injection.test.ts +513 -0
  338. package/src/memory/graph/injection.ts +439 -0
  339. package/src/memory/graph/inspect.ts +534 -0
  340. package/src/memory/graph/narrative.ts +267 -0
  341. package/src/memory/graph/pattern-scan.ts +269 -0
  342. package/src/memory/graph/retriever.ts +1008 -0
  343. package/src/memory/graph/scoring.test.ts +548 -0
  344. package/src/memory/graph/scoring.ts +232 -0
  345. package/src/memory/graph/serendipity.ts +65 -0
  346. package/src/memory/graph/store.test.ts +1050 -0
  347. package/src/memory/graph/store.ts +699 -0
  348. package/src/memory/graph/tool-handlers.ts +426 -0
  349. package/src/memory/graph/tools.ts +141 -0
  350. package/src/memory/graph/triggers.test.ts +487 -0
  351. package/src/memory/graph/triggers.ts +223 -0
  352. package/src/memory/graph/types.ts +271 -0
  353. package/src/memory/group-crud.ts +191 -0
  354. package/src/memory/indexer.ts +37 -19
  355. package/src/memory/job-handlers/cleanup.ts +0 -53
  356. package/src/memory/job-handlers/conversation-starters.ts +91 -53
  357. package/src/memory/job-handlers/embedding.test.ts +3 -27
  358. package/src/memory/job-handlers/embedding.ts +5 -31
  359. package/src/memory/job-handlers/index-maintenance.ts +23 -11
  360. package/src/memory/job-handlers/summarization.ts +32 -17
  361. package/src/memory/job-utils.ts +1 -1
  362. package/src/memory/jobs-store.ts +50 -70
  363. package/src/memory/jobs-worker.ts +147 -112
  364. package/src/memory/llm-usage-store.ts +35 -2
  365. package/src/memory/message-content.ts +1 -0
  366. package/src/memory/migrations/201-oauth-providers-feature-flag.ts +11 -0
  367. package/src/memory/migrations/202-drop-callback-transport-column.ts +13 -0
  368. package/src/memory/migrations/202-memory-graph-tables.ts +130 -0
  369. package/src/memory/migrations/203-drop-memory-items-tables.ts +23 -0
  370. package/src/memory/migrations/204-rename-memory-graph-type-values.ts +46 -0
  371. package/src/memory/migrations/205-memory-graph-image-refs.ts +11 -0
  372. package/src/memory/migrations/index.ts +6 -0
  373. package/src/memory/migrations/registry.ts +8 -0
  374. package/src/memory/qdrant-client.ts +44 -17
  375. package/src/memory/qdrant-manager.ts +26 -5
  376. package/src/memory/schema/index.ts +1 -0
  377. package/src/memory/schema/memory-graph.ts +139 -0
  378. package/src/memory/schema/oauth.ts +1 -1
  379. package/src/memory/search/semantic.ts +47 -91
  380. package/src/memory/slack-thread-store.ts +17 -0
  381. package/src/memory/task-memory-cleanup.ts +28 -50
  382. package/src/messaging/providers/outlook/adapter.ts +200 -0
  383. package/src/messaging/providers/outlook/client.ts +610 -0
  384. package/src/messaging/providers/outlook/types.ts +201 -0
  385. package/src/notifications/adapters/macos.ts +1 -0
  386. package/src/notifications/adapters/slack.ts +1 -1
  387. package/src/notifications/copy-composer.ts +9 -0
  388. package/src/notifications/signal.ts +16 -0
  389. package/src/oauth/__tests__/identity-verifier.test.ts +1 -1
  390. package/src/oauth/connect-orchestrator.ts +10 -3
  391. package/src/oauth/oauth-store.ts +10 -11
  392. package/src/oauth/provider-serializer.ts +3 -0
  393. package/src/oauth/provider-visibility.ts +16 -0
  394. package/src/oauth/seed-providers.ts +50 -17
  395. package/src/permissions/checker.ts +62 -9
  396. package/src/permissions/defaults.ts +4 -4
  397. package/src/permissions/types.ts +2 -4
  398. package/src/permissions/workspace-policy.ts +1 -1
  399. package/src/playbooks/playbook-compiler.ts +19 -18
  400. package/src/playbooks/types.ts +4 -3
  401. package/src/prompts/system-prompt.ts +6 -93
  402. package/src/prompts/templates/UPDATES.md +6 -0
  403. package/src/providers/anthropic/client.ts +47 -19
  404. package/src/providers/gemini/client.ts +1 -1
  405. package/src/providers/openai/client.ts +1 -1
  406. package/src/providers/registry.ts +1 -1
  407. package/src/providers/retry.ts +19 -3
  408. package/src/runtime/actor-trust-resolver.ts +5 -1
  409. package/src/runtime/auth/__tests__/credential-service.test.ts +1 -27
  410. package/src/runtime/auth/__tests__/token-service.test.ts +1 -25
  411. package/src/runtime/auth/route-policy.ts +7 -4
  412. package/src/runtime/guardian-reply-router.ts +10 -2
  413. package/src/runtime/http-server.ts +23 -3
  414. package/src/runtime/middleware/auth.ts +20 -0
  415. package/src/runtime/routes/attachment-routes.test.ts +106 -0
  416. package/src/runtime/routes/attachment-routes.ts +106 -16
  417. package/src/runtime/routes/brain-graph-routes.ts +21 -22
  418. package/src/runtime/routes/btw-routes.ts +8 -0
  419. package/src/runtime/routes/conversation-management-routes.ts +2 -0
  420. package/src/runtime/routes/conversation-query-routes.ts +2 -58
  421. package/src/runtime/routes/conversation-starter-routes.ts +2 -2
  422. package/src/runtime/routes/debug-routes.ts +1 -1
  423. package/src/runtime/routes/global-search-routes.ts +21 -19
  424. package/src/runtime/routes/group-routes.ts +207 -0
  425. package/src/runtime/routes/guardian-action-routes.ts +21 -10
  426. package/src/runtime/routes/guardian-bootstrap-routes.ts +23 -19
  427. package/src/runtime/routes/inbound-message-handler.ts +19 -0
  428. package/src/runtime/routes/inbound-stages/background-dispatch.ts +43 -2
  429. package/src/runtime/routes/inbound-stages/guardian-activation-intercept.test.ts +292 -0
  430. package/src/runtime/routes/inbound-stages/guardian-activation-intercept.ts +207 -0
  431. package/src/runtime/routes/memory-item-routes.test.ts +2 -31
  432. package/src/runtime/routes/memory-item-routes.ts +385 -341
  433. package/src/runtime/routes/oauth-apps.ts +18 -1
  434. package/src/runtime/routes/oauth-providers.ts +13 -1
  435. package/src/runtime/routes/schedule-routes.ts +2 -0
  436. package/src/runtime/routes/settings-routes.ts +1 -0
  437. package/src/runtime/routes/skills-routes.ts +103 -37
  438. package/src/runtime/routes/usage-routes.ts +19 -2
  439. package/src/runtime/routes/work-items-routes.test.ts +2 -27
  440. package/src/runtime/routes/workspace-routes.test.ts +3 -27
  441. package/src/schedule/scheduler.ts +8 -1
  442. package/src/security/oauth2.ts +1 -1
  443. package/src/security/secret-allowlist.ts +4 -4
  444. package/src/security/secure-keys.ts +4 -8
  445. package/src/shared/provider-env-vars.ts +19 -0
  446. package/src/skills/catalog-cache.ts +5 -0
  447. package/src/skills/catalog-install.ts +15 -14
  448. package/src/skills/clawhub.ts +134 -154
  449. package/src/skills/install-meta.ts +208 -0
  450. package/src/skills/managed-store.ts +27 -16
  451. package/src/skills/skill-memory.ts +210 -96
  452. package/src/skills/skillssh-registry.ts +19 -17
  453. package/src/tasks/task-runner.ts +3 -1
  454. package/src/telemetry/usage-telemetry-reporter.test.ts +3 -5
  455. package/src/tools/browser/runtime-check.ts +3 -1
  456. package/src/tools/memory/register.ts +63 -46
  457. package/src/tools/permission-checker.ts +7 -19
  458. package/src/tools/shared/filesystem/image-read.ts +22 -85
  459. package/src/tools/skills/skill-script-runner.ts +1 -1
  460. package/src/tools/terminal/safe-env.ts +1 -0
  461. package/src/tools/tool-manifest.ts +3 -3
  462. package/src/util/browser.ts +25 -10
  463. package/src/util/bun-runtime.ts +172 -0
  464. package/src/util/device-id.ts +3 -65
  465. package/src/watcher/providers/outlook-calendar.ts +343 -0
  466. package/src/watcher/providers/outlook.ts +198 -0
  467. package/src/workspace/git-service.ts +27 -6
  468. package/src/workspace/migrations/025-remove-oauth-app-setup-skills.ts +76 -0
  469. package/src/workspace/migrations/026-backfill-install-meta.ts +325 -0
  470. package/src/workspace/migrations/027-remove-orphaned-optimized-images-cache.ts +42 -0
  471. package/src/workspace/migrations/registry.ts +6 -0
  472. package/src/__tests__/context-memory-e2e.test.ts +0 -415
  473. package/src/__tests__/journal-context.test.ts +0 -268
  474. package/src/__tests__/memory-context-benchmark.benchmark.test.ts +0 -297
  475. package/src/__tests__/memory-lifecycle-e2e.test.ts +0 -459
  476. package/src/__tests__/memory-query-builder.test.ts +0 -59
  477. package/src/__tests__/memory-recall-quality.test.ts +0 -1046
  478. package/src/__tests__/memory-regressions.experimental.test.ts +0 -629
  479. package/src/__tests__/memory-regressions.test.ts +0 -3696
  480. package/src/__tests__/memory-retrieval.benchmark.test.ts +0 -295
  481. package/src/daemon/conversation-memory.ts +0 -207
  482. package/src/memory/conversation-starters-cadence.ts +0 -74
  483. package/src/memory/items-extractor.ts +0 -860
  484. package/src/memory/job-handlers/batch-extraction.ts +0 -741
  485. package/src/memory/job-handlers/extraction.ts +0 -40
  486. package/src/memory/job-handlers/journal-carry-forward.test.ts +0 -383
  487. package/src/memory/job-handlers/journal-carry-forward.ts +0 -255
  488. package/src/memory/journal-memory.ts +0 -224
  489. package/src/memory/query-builder.ts +0 -47
  490. package/src/memory/query-expansion.ts +0 -83
  491. package/src/memory/retriever.test.ts +0 -1590
  492. package/src/memory/retriever.ts +0 -1323
  493. package/src/memory/search/formatting.test.ts +0 -140
  494. package/src/memory/search/formatting.ts +0 -262
  495. package/src/memory/search/mmr.ts +0 -136
  496. package/src/memory/search/ranking.ts +0 -15
  497. package/src/memory/search/staleness.ts +0 -40
  498. package/src/memory/search/tier-classifier.ts +0 -18
  499. package/src/memory/search/types.ts +0 -121
  500. package/src/prompts/journal-context.ts +0 -156
  501. package/src/tools/memory/definitions.ts +0 -69
  502. package/src/tools/memory/handlers.test.ts +0 -590
  503. package/src/tools/memory/handlers.ts +0 -434
@@ -1,20 +1,4 @@
1
- import { mkdtempSync, rmSync } from "node:fs";
2
- import { tmpdir } from "node:os";
3
- import { join } from "node:path";
4
- import { afterAll, beforeEach, describe, expect, mock, test } from "bun:test";
5
-
6
- const testDir = mkdtempSync(join(tmpdir(), "task-scheduler-test-"));
7
-
8
- mock.module("../util/platform.js", () => ({
9
- getDataDir: () => testDir,
10
- isMacOS: () => process.platform === "darwin",
11
- isLinux: () => process.platform === "linux",
12
- isWindows: () => process.platform === "win32",
13
- getPidPath: () => join(testDir, "test.pid"),
14
- getDbPath: () => join(testDir, "test.db"),
15
- getLogPath: () => join(testDir, "test.log"),
16
- ensureDataDir: () => {},
17
- }));
1
+ import { beforeEach, describe, expect, mock, test } from "bun:test";
18
2
 
19
3
  mock.module("../util/logger.js", () => ({
20
4
  getLogger: () =>
@@ -23,7 +7,7 @@ mock.module("../util/logger.js", () => ({
23
7
  }),
24
8
  }));
25
9
 
26
- import { getDb, initializeDb, resetDb } from "../memory/db.js";
10
+ import { getDb, initializeDb } from "../memory/db.js";
27
11
  import {
28
12
  createSchedule,
29
13
  getSchedule,
@@ -49,15 +33,6 @@ function forceScheduleDue(scheduleId: string): void {
49
33
  ]);
50
34
  }
51
35
 
52
- afterAll(() => {
53
- resetDb();
54
- try {
55
- rmSync(testDir, { recursive: true });
56
- } catch {
57
- /* best effort */
58
- }
59
- });
60
-
61
36
  // ── scheduleTask helper ─────────────────────────────────────────────
62
37
 
63
38
  describe("scheduleTask", () => {
@@ -1,6 +1,3 @@
1
- import { mkdtempSync } from "node:fs";
2
- import { tmpdir } from "node:os";
3
- import { join } from "node:path";
4
1
  import { afterEach, beforeEach, describe, expect, mock, test } from "bun:test";
5
2
 
6
3
  import type { ShellOutputResult } from "../tools/shared/shell-output.js";
@@ -16,20 +13,7 @@ mock.module("../util/logger.js", () => ({
16
13
  }),
17
14
  }));
18
15
 
19
- const testTmpDir = mkdtempSync(join(tmpdir(), "terminal-test-"));
20
-
21
- mock.module("../util/platform.js", () => ({
22
- getProtectedDir: () => join(testTmpDir, "protected"),
23
- getDataDir: () => join(testTmpDir, "data"),
24
- getSandboxWorkingDir: () => join(testTmpDir, "sandbox"),
25
- isMacOS: () => process.platform === "darwin",
26
- isLinux: () => process.platform === "linux",
27
- isWindows: () => process.platform === "win32",
28
- getPidPath: () => join(testTmpDir, "test.pid"),
29
- getDbPath: () => join(testTmpDir, "test.db"),
30
- getLogPath: () => join(testTmpDir, "test.log"),
31
- ensureDataDir: () => {},
32
- }));
16
+ const testTmpDir = process.env.VELLUM_WORKSPACE_DIR!;
33
17
 
34
18
  mock.module("../config/loader.js", () => ({
35
19
  getConfig: () => ({
@@ -16,12 +16,15 @@ import { tmpdir } from "node:os";
16
16
  import { join } from "node:path";
17
17
  import { afterAll } from "bun:test";
18
18
 
19
+ import { resetDb } from "../memory/db-connection.js";
20
+
19
21
  const testDir = realpathSync(
20
22
  mkdtempSync(join(tmpdir(), "vellum-test-workspace-")),
21
23
  );
22
24
  process.env.VELLUM_WORKSPACE_DIR = testDir;
23
25
 
24
26
  afterAll(() => {
27
+ resetDb();
25
28
  delete process.env.VELLUM_WORKSPACE_DIR;
26
29
  try {
27
30
  rmSync(testDir, { recursive: true, force: true });
@@ -216,85 +216,6 @@ function makeSystemPrompt(size: "small" | "production" = "small"): string {
216
216
  "Each MCP server entry requires: name, command, args, and optional env.",
217
217
  );
218
218
 
219
- // Dynamic skills catalog (~5K chars)
220
- sections.push("", "## Available Skills", "<available_skills>");
221
- const skillCategories = [
222
- {
223
- id: "gmail",
224
- name: "Gmail",
225
- desc: "Send, search, draft, and manage Gmail messages",
226
- },
227
- {
228
- id: "calendar",
229
- name: "Google Calendar",
230
- desc: "Create, list, update, and delete calendar events",
231
- },
232
- {
233
- id: "slack",
234
- name: "Slack",
235
- desc: "Send messages, search channels, manage threads",
236
- },
237
- { id: "contacts", name: "Contacts", desc: "Search and manage contacts" },
238
- {
239
- id: "tasks",
240
- name: "Tasks",
241
- desc: "Create, list, update, and complete tasks",
242
- },
243
- {
244
- id: "browser",
245
- name: "Browser",
246
- desc: "Navigate web pages, take screenshots, interact with web content",
247
- },
248
- {
249
- id: "schedule",
250
- name: "Schedule",
251
- desc: "Set reminders and schedule recurring tasks",
252
- },
253
- {
254
- id: "messaging",
255
- name: "Messaging",
256
- desc: "Send iMessage and SMS messages",
257
- },
258
- {
259
- id: "sequences",
260
- name: "Sequences",
261
- desc: "Create and manage multi-step automation workflows",
262
- },
263
- {
264
- id: "playbooks",
265
- name: "Playbooks",
266
- desc: "Execute pre-defined operational playbooks",
267
- },
268
- {
269
- id: "notes",
270
- name: "Notes",
271
- desc: "Create and manage notes in Apple Notes",
272
- },
273
- { id: "music", name: "Music", desc: "Control Apple Music playback" },
274
- {
275
- id: "photos",
276
- name: "Photos",
277
- desc: "Search and manage photos in Apple Photos",
278
- },
279
- {
280
- id: "maps",
281
- name: "Maps",
282
- desc: "Search locations, get directions, find nearby places",
283
- },
284
- {
285
- id: "weather",
286
- name: "Weather",
287
- desc: "Get current weather and forecasts",
288
- },
289
- ];
290
- for (const skill of skillCategories) {
291
- sections.push(
292
- ` <skill id="${skill.id}" name="${skill.name}" description="${skill.desc}" ` +
293
- `credential_setup="oauth" enabled="true" />`,
294
- );
295
- }
296
- sections.push("</available_skills>");
297
-
298
219
  // Attachment handling (~1K chars)
299
220
  sections.push(
300
221
  "",
@@ -1,20 +1,6 @@
1
- import { mkdtempSync, rmSync } from "node:fs";
2
- import { tmpdir } from "node:os";
3
- import { join } from "node:path";
4
- import { afterAll, beforeEach, describe, expect, mock, test } from "bun:test";
5
-
6
- const testDir = mkdtempSync(join(tmpdir(), "tool-approval-handler-test-"));
7
-
8
- mock.module("../util/platform.js", () => ({
9
- getDataDir: () => testDir,
10
- isMacOS: () => process.platform === "darwin",
11
- isLinux: () => process.platform === "linux",
12
- isWindows: () => process.platform === "win32",
13
- getPidPath: () => join(testDir, "test.pid"),
14
- getDbPath: () => join(testDir, "test.db"),
15
- getLogPath: () => join(testDir, "test.log"),
16
- ensureDataDir: () => {},
17
- }));
1
+ import { beforeEach, describe, expect, mock, test } from "bun:test";
2
+
3
+ const testDir = process.env.VELLUM_WORKSPACE_DIR!;
18
4
 
19
5
  mock.module("../util/logger.js", () => ({
20
6
  getLogger: () =>
@@ -57,7 +43,7 @@ import {
57
43
  mintGrantFromDecision,
58
44
  type MintGrantParams,
59
45
  } from "../approvals/approval-primitive.js";
60
- import { getDb, initializeDb, resetDb } from "../memory/db.js";
46
+ import { getDb, initializeDb } from "../memory/db.js";
61
47
  import { scopedApprovalGrants } from "../memory/schema.js";
62
48
  import { computeToolApprovalDigest } from "../security/tool-approval-digest.js";
63
49
  import { ToolApprovalHandler } from "../tools/tool-approval-handler.js";
@@ -70,15 +56,6 @@ function clearTables(): void {
70
56
  db.delete(scopedApprovalGrants).run();
71
57
  }
72
58
 
73
- afterAll(() => {
74
- resetDb();
75
- try {
76
- rmSync(testDir, { recursive: true });
77
- } catch {
78
- /* best effort */
79
- }
80
- });
81
-
82
59
  // ---------------------------------------------------------------------------
83
60
  // Helpers
84
61
  // ---------------------------------------------------------------------------
@@ -13,11 +13,11 @@ import {
13
13
  } from "node:fs";
14
14
  import { tmpdir } from "node:os";
15
15
  import { join } from "node:path";
16
- import { afterEach, beforeEach, describe, expect, test } from "bun:test";
16
+ import { afterEach, beforeEach, describe, expect, mock, test } from "bun:test";
17
+
17
18
  // ── Shared mock setup ────────────────────────────────────────────────────────
18
19
  // Config mock must be declared before importing tool modules so that the
19
20
  // mock.module calls are hoisted above the dynamic imports.
20
- import { mock } from "bun:test";
21
21
 
22
22
  mock.module("../config/loader.js", () => ({
23
23
  getConfig: () => ({
@@ -75,15 +75,6 @@ mock.module("../tools/network/script-proxy/index.js", () => ({
75
75
  getSessionEnv: () => ({}),
76
76
  }));
77
77
 
78
- mock.module("../util/platform.js", () => ({
79
- getProtectedDir: () => "/tmp/protected",
80
- getDataDir: () => "/tmp",
81
- getWorkspaceDir: () => "/tmp/workspace",
82
- getConversationsDir: () => "/tmp/workspace/conversations",
83
- getDbPath: () => "/tmp/assistant.db",
84
- ensureDataDir: () => {},
85
- }));
86
-
87
78
  mock.module("../tools/credentials/resolve.js", () => ({
88
79
  resolveCredentialRef: () => null,
89
80
  }));
@@ -15,30 +15,14 @@
15
15
  * - Secret scanning < 50ms for large outputs (100KB)
16
16
  * - ToolExecutor overhead < 20ms regardless of tool execution time
17
17
  */
18
- import { mkdtempSync, rmSync } from "node:fs";
19
- import { tmpdir } from "node:os";
20
- import { join } from "node:path";
21
- import { afterAll, beforeAll, describe, expect, mock, test } from "bun:test";
22
18
 
23
- const testDir = mkdtempSync(join(tmpdir(), "tool-pipeline-bench-"));
19
+ import { beforeAll, describe, expect, mock, test } from "bun:test";
24
20
 
25
21
  // Local registry for ToolExecutor tests — the mock delegates to this map
26
22
  // so that registerTool/getTool/getAllTools work for our benchmark tools.
27
23
  const localRegistry = new Map<string, import("../tools/types.js").Tool>();
28
24
 
29
25
  // Mocks must precede imports of modules under test.
30
- mock.module("../util/platform.js", () => ({
31
- getDataDir: () => testDir,
32
- isMacOS: () => process.platform === "darwin",
33
- isLinux: () => process.platform === "linux",
34
- isWindows: () => process.platform === "win32",
35
- getPidPath: () => join(testDir, "test.pid"),
36
- getDbPath: () => join(testDir, "test.db"),
37
- getLogPath: () => join(testDir, "test.log"),
38
- ensureDataDir: () => {},
39
- getHooksDir: () => join(testDir, "hooks"),
40
- }));
41
-
42
26
  mock.module("../util/logger.js", () => ({
43
27
  getLogger: () =>
44
28
  new Proxy({} as Record<string, unknown>, {
@@ -192,14 +176,6 @@ describe("Tool execution pipeline benchmark", () => {
192
176
  }
193
177
  });
194
178
 
195
- afterAll(() => {
196
- try {
197
- rmSync(testDir, { recursive: true });
198
- } catch {
199
- // best effort cleanup
200
- }
201
- });
202
-
203
179
  test("classifyRisk: low-risk tool (file_read) is fast", async () => {
204
180
  const { timings } = await benchmarkAsync(
205
181
  () => classifyRisk("file_read", { path: "/tmp/test.ts" }, "/tmp"),
@@ -34,7 +34,6 @@ const mockConfig = {
34
34
  },
35
35
  permissions: {
36
36
  mode: "workspace" as const,
37
- dangerouslySkipPermissions: false,
38
37
  },
39
38
  };
40
39
 
@@ -52,7 +52,6 @@ const mockConfig = {
52
52
  },
53
53
  permissions: {
54
54
  mode: "workspace" as const,
55
- dangerouslySkipPermissions: false,
56
55
  },
57
56
  };
58
57
 
@@ -8,23 +8,9 @@
8
8
  * 5. Inline wait-and-resume for trusted-contact grant-gated tools
9
9
  */
10
10
 
11
- import { mkdtempSync, rmSync } from "node:fs";
12
- import { tmpdir } from "node:os";
13
- import { join } from "node:path";
14
- import { afterAll, beforeEach, describe, expect, mock, test } from "bun:test";
15
-
16
- const testDir = mkdtempSync(join(tmpdir(), "tool-grant-escalation-test-"));
17
-
18
- mock.module("../util/platform.js", () => ({
19
- getDataDir: () => testDir,
20
- isMacOS: () => process.platform === "darwin",
21
- isLinux: () => process.platform === "linux",
22
- isWindows: () => process.platform === "win32",
23
- getPidPath: () => join(testDir, "test.pid"),
24
- getDbPath: () => join(testDir, "test.db"),
25
- getLogPath: () => join(testDir, "test.log"),
26
- ensureDataDir: () => {},
27
- }));
11
+ import { beforeEach, describe, expect, mock, test } from "bun:test";
12
+
13
+ const testDir = process.env.VELLUM_WORKSPACE_DIR!;
28
14
 
29
15
  mock.module("../util/logger.js", () => ({
30
16
  getLogger: () =>
@@ -123,7 +109,7 @@ import {
123
109
  getCanonicalGuardianRequest,
124
110
  listCanonicalGuardianRequests,
125
111
  } from "../memory/canonical-guardian-store.js";
126
- import { getDb, initializeDb, resetDb } from "../memory/db.js";
112
+ import { getDb, initializeDb } from "../memory/db.js";
127
113
  import { scopedApprovalGrants } from "../memory/schema.js";
128
114
  import { computeToolApprovalDigest } from "../security/tool-approval-digest.js";
129
115
  import {
@@ -144,15 +130,6 @@ function resetTables(): void {
144
130
  db.run("DELETE FROM canonical_guardian_requests");
145
131
  }
146
132
 
147
- afterAll(() => {
148
- resetDb();
149
- try {
150
- rmSync(testDir, { recursive: true });
151
- } catch {
152
- /* best effort */
153
- }
154
- });
155
-
156
133
  // ---------------------------------------------------------------------------
157
134
  // Helpers
158
135
  // ---------------------------------------------------------------------------
@@ -8,29 +8,9 @@
8
8
  * - handleToolResult includes toolUseId in emitted tool_result
9
9
  * - Event ordering: tool_use_preview_start → input_json_delta → tool_use
10
10
  */
11
- import { join } from "node:path";
12
11
  import { beforeEach, describe, expect, mock, test } from "bun:test";
13
12
 
14
13
  // ── Mock platform (must precede imports that read it) ─────────────────────────
15
- mock.module("../util/platform.js", () => ({
16
- getSessionTokenPath: () => "/tmp/test-token",
17
- getProtectedDir: () => join("/tmp/test", "protected"),
18
- getDataDir: () => "/tmp/test",
19
- getWorkspaceDir: () => "/tmp/test/workspace",
20
- getWorkspaceSkillsDir: () => "/tmp/test/skills",
21
- getSandboxWorkingDir: () => "/tmp/test/sandbox",
22
- getTCPPort: () => undefined,
23
- getTCPHost: () => "127.0.0.1",
24
- isTCPEnabled: () => false,
25
- isMacOS: () => false,
26
- isLinux: () => true,
27
- isWindows: () => false,
28
- getPidPath: () => "/tmp/test.pid",
29
- getLogPath: () => "/tmp/test.log",
30
- getDbPath: () => "/tmp/test.db",
31
- ensureDataDir: () => {},
32
- }));
33
-
34
14
  mock.module("../util/logger.js", () => ({
35
15
  getLogger: () =>
36
16
  new Proxy({} as Record<string, unknown>, {
@@ -0,0 +1,276 @@
1
+ /**
2
+ * Tests for the bash post-execution hook that dispatches Slack DMs
3
+ * for channel verification sessions. Validates that the hook only
4
+ * delivers when an active session exists with a matching destination.
5
+ */
6
+
7
+ import { beforeEach, describe, expect, mock, test } from "bun:test";
8
+
9
+ // ---------------------------------------------------------------------------
10
+ // Mocks — must be set up before importing the module under test
11
+ // ---------------------------------------------------------------------------
12
+
13
+ const mockFindActiveSession = mock(() => null as unknown);
14
+ mock.module("../runtime/channel-verification-service.js", () => ({
15
+ findActiveSession: mockFindActiveSession,
16
+ }));
17
+
18
+ const mockDeliverVerificationSlack = mock(() => {});
19
+ mock.module("../runtime/verification-outbound-actions.js", () => ({
20
+ deliverVerificationSlack: mockDeliverVerificationSlack,
21
+ }));
22
+
23
+ // Stub out transitive dependencies to prevent import errors
24
+ mock.module("../bundler/app-compiler.js", () => ({
25
+ compileApp: mock(() => Promise.resolve({ ok: true })),
26
+ }));
27
+ mock.module("../media/app-icon-generator.js", () => ({
28
+ generateAppIcon: mock(() => Promise.resolve()),
29
+ }));
30
+ mock.module("../memory/app-store.js", () => ({
31
+ getApp: mock(() => null),
32
+ getAppDirPath: mock(() => ""),
33
+ isMultifileApp: mock(() => false),
34
+ }));
35
+ mock.module("../services/published-app-updater.js", () => ({
36
+ updatePublishedAppDeployment: mock(() => Promise.resolve()),
37
+ }));
38
+ mock.module("../daemon/conversation-surfaces.js", () => ({
39
+ refreshSurfacesForApp: mock(() => {}),
40
+ }));
41
+ mock.module("../daemon/doordash-steps.js", () => ({
42
+ isDoordashCommand: mock(() => false),
43
+ updateDoordashProgress: mock(() => {}),
44
+ }));
45
+
46
+ const mockLogWarn = mock((_obj: unknown, _msg: string) => {});
47
+ const mockLogInfo = mock((_obj: unknown, _msg: string) => {});
48
+ const mockLogError = mock((_obj: unknown, _msg: string) => {});
49
+ mock.module("../util/logger.js", () => ({
50
+ getLogger: () => ({
51
+ warn: mockLogWarn,
52
+ info: mockLogInfo,
53
+ error: mockLogError,
54
+ debug: () => {},
55
+ trace: () => {},
56
+ }),
57
+ }));
58
+
59
+ // ---------------------------------------------------------------------------
60
+ // Import after mocks — dynamic import ensures mock.module() calls above
61
+ // are registered before tool-side-effects.ts evaluates its top-level
62
+ // `const log = getLogger(...)`.
63
+ // ---------------------------------------------------------------------------
64
+
65
+ import type { SideEffectContext } from "../daemon/tool-side-effects.js";
66
+
67
+ const { runPostExecutionSideEffects } =
68
+ await import("../daemon/tool-side-effects.js");
69
+
70
+ // ---------------------------------------------------------------------------
71
+ // Helpers
72
+ // ---------------------------------------------------------------------------
73
+
74
+ const dummySideEffectCtx = {
75
+ ctx: {} as SideEffectContext["ctx"],
76
+ } satisfies SideEffectContext;
77
+
78
+ function callWithBashHook(
79
+ command: string,
80
+ content: string,
81
+ isError = false,
82
+ ): void {
83
+ runPostExecutionSideEffects(
84
+ "bash",
85
+ { command },
86
+ { content, isError },
87
+ dummySideEffectCtx,
88
+ );
89
+ }
90
+
91
+ // ---------------------------------------------------------------------------
92
+ // Tests
93
+ // ---------------------------------------------------------------------------
94
+
95
+ describe("bash hook — Slack DM dispatch with session validation", () => {
96
+ beforeEach(() => {
97
+ mockFindActiveSession.mockReset();
98
+ mockDeliverVerificationSlack.mockReset();
99
+ mockLogWarn.mockReset();
100
+ mockLogInfo.mockReset();
101
+ mockLogError.mockReset();
102
+ });
103
+
104
+ test("legitimate verification dispatches DM", () => {
105
+ mockFindActiveSession.mockReturnValue({
106
+ destinationAddress: "U123",
107
+ status: "awaiting_response",
108
+ });
109
+
110
+ const output = JSON.stringify({
111
+ _pendingSlackDm: {
112
+ userId: "U123",
113
+ text: "code",
114
+ assistantId: "aid",
115
+ },
116
+ });
117
+
118
+ callWithBashHook(
119
+ "assistant channel-verification-sessions create ...",
120
+ output,
121
+ );
122
+
123
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledTimes(1);
124
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledWith(
125
+ "U123",
126
+ "code",
127
+ "aid",
128
+ );
129
+ });
130
+
131
+ test("no active session — DM not dispatched", () => {
132
+ mockFindActiveSession.mockReturnValue(null);
133
+
134
+ const output = JSON.stringify({
135
+ _pendingSlackDm: {
136
+ userId: "U123",
137
+ text: "code",
138
+ assistantId: "aid",
139
+ },
140
+ });
141
+
142
+ callWithBashHook(
143
+ "assistant channel-verification-sessions create ...",
144
+ output,
145
+ );
146
+
147
+ expect(mockDeliverVerificationSlack).not.toHaveBeenCalled();
148
+ expect(mockLogWarn).toHaveBeenCalledWith(
149
+ expect.objectContaining({ userId: "U123" }),
150
+ expect.stringContaining("no active Slack verification session"),
151
+ );
152
+ });
153
+
154
+ test("userId mismatch — DM not dispatched", () => {
155
+ mockFindActiveSession.mockReturnValue({
156
+ destinationAddress: "U999",
157
+ status: "awaiting_response",
158
+ });
159
+
160
+ const output = JSON.stringify({
161
+ _pendingSlackDm: {
162
+ userId: "U_ATTACKER",
163
+ text: "code",
164
+ assistantId: "aid",
165
+ },
166
+ });
167
+
168
+ callWithBashHook(
169
+ "assistant channel-verification-sessions create ...",
170
+ output,
171
+ );
172
+
173
+ expect(mockDeliverVerificationSlack).not.toHaveBeenCalled();
174
+ expect(mockLogWarn).toHaveBeenCalledWith(
175
+ expect.objectContaining({ userId: "U_ATTACKER", expected: "U999" }),
176
+ expect.stringContaining("does not match active session destination"),
177
+ );
178
+ });
179
+
180
+ test("command without verification substring — hook is no-op", () => {
181
+ mockFindActiveSession.mockReturnValue({
182
+ destinationAddress: "U123",
183
+ status: "awaiting_response",
184
+ });
185
+
186
+ const output = JSON.stringify({
187
+ _pendingSlackDm: {
188
+ userId: "U123",
189
+ text: "code",
190
+ assistantId: "aid",
191
+ },
192
+ });
193
+
194
+ callWithBashHook("echo hello", output);
195
+
196
+ expect(mockDeliverVerificationSlack).not.toHaveBeenCalled();
197
+ });
198
+
199
+ test("output without _pendingSlackDm — hook is no-op", () => {
200
+ mockFindActiveSession.mockReturnValue({
201
+ destinationAddress: "U123",
202
+ status: "awaiting_response",
203
+ });
204
+
205
+ callWithBashHook(
206
+ "assistant channel-verification-sessions create ...",
207
+ JSON.stringify({ success: true, sessionId: "s1" }),
208
+ );
209
+
210
+ expect(mockDeliverVerificationSlack).not.toHaveBeenCalled();
211
+ });
212
+
213
+ test("multi-line JSON output — dispatches from correct line", () => {
214
+ mockFindActiveSession.mockReturnValue({
215
+ destinationAddress: "U123",
216
+ status: "awaiting_response",
217
+ });
218
+
219
+ const cancelResult = JSON.stringify({ success: true, cancelled: true });
220
+ const createResult = JSON.stringify({
221
+ _pendingSlackDm: {
222
+ userId: "U123",
223
+ text: "verify-code",
224
+ assistantId: "aid2",
225
+ },
226
+ });
227
+ const multiLineOutput = `${cancelResult}\n${createResult}`;
228
+
229
+ callWithBashHook(
230
+ "assistant channel-verification-sessions create ...",
231
+ multiLineOutput,
232
+ );
233
+
234
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledTimes(1);
235
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledWith(
236
+ "U123",
237
+ "verify-code",
238
+ "aid2",
239
+ );
240
+ });
241
+
242
+ test("multi-line — rejected first line does not block valid second line", () => {
243
+ mockFindActiveSession.mockReturnValue({
244
+ destinationAddress: "U200",
245
+ status: "awaiting_response",
246
+ });
247
+
248
+ const staleResult = JSON.stringify({
249
+ _pendingSlackDm: {
250
+ userId: "U100",
251
+ text: "stale-code",
252
+ assistantId: "aid",
253
+ },
254
+ });
255
+ const validResult = JSON.stringify({
256
+ _pendingSlackDm: {
257
+ userId: "U200",
258
+ text: "valid-code",
259
+ assistantId: "aid2",
260
+ },
261
+ });
262
+ const multiLineOutput = `${staleResult}\n${validResult}`;
263
+
264
+ callWithBashHook(
265
+ "assistant channel-verification-sessions create ...",
266
+ multiLineOutput,
267
+ );
268
+
269
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledTimes(1);
270
+ expect(mockDeliverVerificationSlack).toHaveBeenCalledWith(
271
+ "U200",
272
+ "valid-code",
273
+ "aid2",
274
+ );
275
+ });
276
+ });