@vellumai/assistant 0.9.0 → 0.10.0-staging.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (572) hide show
  1. package/ARCHITECTURE.md +18 -34
  2. package/bun.lock +7 -8
  3. package/docs/activation-funnel-telemetry.md +28 -22
  4. package/docs/architecture/security.md +29 -28
  5. package/docs/stt-provider-onboarding.md +3 -5
  6. package/docs/workflows-testing.md +13 -44
  7. package/docs/workflows.md +3 -5
  8. package/node_modules/@vellumai/ces-client/src/__tests__/ces-client.test.ts +47 -0
  9. package/node_modules/@vellumai/ces-client/src/rpc-client.ts +28 -5
  10. package/node_modules/@vellumai/environments/src/seeds.ts +2 -5
  11. package/node_modules/@vellumai/gateway-client/src/admission-policy-contract.ts +97 -0
  12. package/node_modules/@vellumai/gateway-client/src/inbound-contract.ts +10 -0
  13. package/node_modules/@vellumai/gateway-client/src/index.ts +32 -6
  14. package/node_modules/@vellumai/gateway-client/src/outbound-contract.ts +119 -0
  15. package/node_modules/@vellumai/gateway-client/src/types.ts +15 -84
  16. package/openapi.yaml +976 -63
  17. package/package.json +2 -1
  18. package/scripts/sync-llm-catalog.ts +6 -15
  19. package/scripts/sync-web-search-catalog.ts +3 -11
  20. package/src/__tests__/access-request-card-view.test.ts +98 -0
  21. package/src/__tests__/access-request-seed-content-blocks.test.ts +2 -4
  22. package/src/__tests__/actor-trust-resolver-address-fallback.test.ts +72 -32
  23. package/src/__tests__/agent-loop-compaction-strip.test.ts +241 -0
  24. package/src/__tests__/agent-loop-mutable-latest-user-message.test.ts +16 -13
  25. package/src/__tests__/agent-loop-output-hooks.test.ts +69 -0
  26. package/src/__tests__/agent-loop-override-profile.test.ts +25 -0
  27. package/src/__tests__/always-loaded-tools-guard.test.ts +2 -3
  28. package/src/__tests__/app-compiler.test.ts +15 -1
  29. package/src/__tests__/app-dir-path-guard.test.ts +0 -1
  30. package/src/__tests__/assistant-feature-flag-guard.test.ts +1 -4
  31. package/src/__tests__/assistant-feature-flag-guardrails.test.ts +0 -2
  32. package/src/__tests__/auth-fallback-events-store.test.ts +6 -14
  33. package/src/__tests__/avatar-identity-sync.test.ts +2 -27
  34. package/src/__tests__/btw-routes.test.ts +6 -8
  35. package/src/__tests__/call-pointer-messages.test.ts +28 -0
  36. package/src/__tests__/cancel-clears-processing.test.ts +89 -0
  37. package/src/__tests__/channel-approval-routes.test.ts +0 -4
  38. package/src/__tests__/channel-inbound-disk-pressure.test.ts +5 -15
  39. package/src/__tests__/checker.test.ts +0 -3
  40. package/src/__tests__/cli-memory-v2-reembed-skills.test.ts +3 -4
  41. package/src/__tests__/compactor-image-manifest-trust.test.ts +21 -1
  42. package/src/__tests__/compactor-summary-call-truncation.test.ts +223 -0
  43. package/src/__tests__/config-loader-backfill.test.ts +268 -27
  44. package/src/__tests__/config-schema.test.ts +35 -0
  45. package/src/__tests__/config-watcher.test.ts +0 -18
  46. package/src/__tests__/confirmation-request-guardian-bridge.test.ts +2 -2
  47. package/src/__tests__/contact-store-user-file.test.ts +0 -6
  48. package/src/__tests__/contacts-tools.test.ts +29 -0
  49. package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +22 -0
  50. package/src/__tests__/conversation-agent-loop-overflow.test.ts +1 -0
  51. package/src/__tests__/conversation-agent-loop.test.ts +58 -0
  52. package/src/__tests__/conversation-attention-telegram.test.ts +0 -1
  53. package/src/__tests__/conversation-lifecycle.test.ts +7 -9
  54. package/src/__tests__/conversation-load-history-repair.test.ts +101 -0
  55. package/src/__tests__/conversation-routes-guardian-reply.test.ts +15 -12
  56. package/src/__tests__/conversation-surfaces-activation-emit.test.ts +6 -3
  57. package/src/__tests__/conversation-title-service.test.ts +62 -0
  58. package/src/__tests__/credential-broker.test.ts +449 -1
  59. package/src/__tests__/credential-execution-shell-lockdown.test.ts +18 -11
  60. package/src/__tests__/credential-execution-tools.test.ts +0 -1
  61. package/src/__tests__/credential-prompt-route.test.ts +4 -4
  62. package/src/__tests__/credential-routes.test.ts +360 -0
  63. package/src/__tests__/credential-security-invariants.test.ts +4 -13
  64. package/src/__tests__/disk-pressure-policy.test.ts +12 -0
  65. package/src/__tests__/disk-usage.test.ts +65 -0
  66. package/src/__tests__/dynamic-page-surface.test.ts +152 -1
  67. package/src/__tests__/fixtures/credential-security-fixtures.ts +2 -33
  68. package/src/__tests__/gateway-flag-listener.test.ts +110 -1
  69. package/src/__tests__/gateway-only-guard.test.ts +3 -7
  70. package/src/__tests__/guardian-binding-drift-heal.test.ts +1 -1
  71. package/src/__tests__/guardian-card-withdrawal.test.ts +403 -0
  72. package/src/__tests__/guardian-decision-primitive-canonical.test.ts +5 -3
  73. package/src/__tests__/guardian-grant-minting.test.ts +3 -35
  74. package/src/__tests__/guardian-routing-invariants.test.ts +64 -26
  75. package/src/__tests__/guardian-routing-state.test.ts +0 -1
  76. package/src/__tests__/headless-browser-mode.test.ts +10 -0
  77. package/src/__tests__/headless-browser-navigate.test.ts +8 -3
  78. package/src/__tests__/helpers/create-guardian-binding.ts +0 -1
  79. package/src/__tests__/host-browser-proxy.test.ts +87 -0
  80. package/src/__tests__/identity-routes.test.ts +0 -189
  81. package/src/__tests__/inbound-invite-redemption.test.ts +4 -4
  82. package/src/__tests__/injector-v3-suppression.test.ts +27 -20
  83. package/src/__tests__/internal-telemetry-routes.test.ts +6 -14
  84. package/src/__tests__/invite-redemption-service.test.ts +4 -7
  85. package/src/__tests__/llm-callsite-catalog.test.ts +5 -6
  86. package/src/__tests__/llm-catalog-parity.test.ts +30 -23
  87. package/src/__tests__/llm-resolver.test.ts +70 -24
  88. package/src/__tests__/llm-schema.test.ts +1 -0
  89. package/src/__tests__/managed-profile-guard.test.ts +163 -4
  90. package/src/__tests__/mcp-health-check.test.ts +6 -7
  91. package/src/__tests__/media-stream-server-integration.test.ts +317 -13
  92. package/src/__tests__/oauth-provider-seed-logos.test.ts +4 -6
  93. package/src/__tests__/onboarding-persona-write.test.ts +1 -1
  94. package/src/__tests__/path-policy.test.ts +34 -0
  95. package/src/__tests__/persona-resolver.test.ts +49 -14
  96. package/src/__tests__/plugin-api-model-profiles.test.ts +178 -0
  97. package/src/__tests__/plugin-api-provider.test.ts +24 -0
  98. package/src/__tests__/plugin-tool-contribution.test.ts +6 -3
  99. package/src/__tests__/post-compaction-reinjection-idempotency.test.ts +214 -0
  100. package/src/__tests__/provider-send-message-override-profile.test.ts +76 -0
  101. package/src/__tests__/reaction-persistence.test.ts +150 -29
  102. package/src/__tests__/registry.test.ts +2 -7
  103. package/src/__tests__/relay-server.test.ts +285 -0
  104. package/src/__tests__/runtime-attachment-metadata.test.ts +0 -1
  105. package/src/__tests__/schedule-routes-workflow-validation.test.ts +1 -10
  106. package/src/__tests__/schedule-routes.test.ts +0 -30
  107. package/src/__tests__/schedule-tools.test.ts +2 -18
  108. package/src/__tests__/scheduler-reuse-conversation.test.ts +8 -5
  109. package/src/__tests__/skill-execute-input.test.ts +51 -1
  110. package/src/__tests__/skill-runtime-path.test.ts +2 -3
  111. package/src/__tests__/skills.test.ts +51 -0
  112. package/src/__tests__/slack-notification-approval-card.test.ts +176 -0
  113. package/src/__tests__/slack-reaction-canonical-approval.test.ts +285 -0
  114. package/src/__tests__/subagent-tools.test.ts +266 -0
  115. package/src/__tests__/surface-completion-nudge-hook.test.ts +367 -0
  116. package/src/__tests__/task-progress-nudge-hook.test.ts +1 -1
  117. package/src/__tests__/title-generate-hook.test.ts +100 -3
  118. package/src/__tests__/token-estimator-accuracy.benchmark.test.ts +1 -29
  119. package/src/__tests__/token-manager.test.ts +519 -0
  120. package/src/__tests__/tool-approval-seed-content-blocks.test.ts +1 -1
  121. package/src/__tests__/tool-audit-listener.test.ts +7 -7
  122. package/src/__tests__/tool-executor-lifecycle-events.test.ts +6 -3
  123. package/src/__tests__/tool-executor.test.ts +0 -79
  124. package/src/__tests__/trusted-contact-approval-notifier.test.ts +4 -2
  125. package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +220 -3
  126. package/src/__tests__/trusted-contact-multichannel.test.ts +3 -3
  127. package/src/__tests__/trusted-contact-verification.test.ts +8 -10
  128. package/src/__tests__/twilio-routes.test.ts +81 -1
  129. package/src/__tests__/voice-invite-redemption.test.ts +2 -3
  130. package/src/__tests__/weak-open-model.test.ts +30 -0
  131. package/src/__tests__/web-search-catalog-parity.test.ts +6 -25
  132. package/src/__tests__/workspace-greetings.test.ts +152 -0
  133. package/src/__tests__/workspace-migration-105-enable-memory-v3-live-for-new-workspaces.test.ts +149 -0
  134. package/src/__tests__/workspace-migration-108-drop-balanced-economy-profile.test.ts +285 -0
  135. package/src/__tests__/workspace-migration-add-send-diagnostics.test.ts +1 -1
  136. package/src/__tests__/workspace-migration-drop-collect-usage-data.test.ts +118 -0
  137. package/src/__tests__/workspace-migration-drop-send-diagnostics.test.ts +118 -0
  138. package/src/a2a/__tests__/e2e-a2a-channel.test.ts +0 -4
  139. package/src/agent/loop.ts +49 -29
  140. package/src/api/README.md +6 -6
  141. package/src/api/events/tool-result.ts +6 -0
  142. package/src/api/events/workflow-completed.ts +53 -0
  143. package/src/api/events/workflow-leaf-finished.ts +38 -0
  144. package/src/api/events/workflow-leaf-started.ts +35 -0
  145. package/src/api/events/workflow-progress.ts +32 -0
  146. package/src/api/events/workflow-started.ts +31 -0
  147. package/src/api/index.ts +40 -0
  148. package/src/api/responses/conversation-message.ts +28 -4
  149. package/src/api/responses/home.ts +26 -4
  150. package/src/api/responses/workflow-journal.ts +53 -0
  151. package/src/approvals/guardian-card-withdrawal.ts +145 -0
  152. package/src/approvals/guardian-decision-primitive.ts +26 -3
  153. package/src/approvals/guardian-request-resolvers.ts +183 -80
  154. package/src/calls/__tests__/channel-admission-reader.test.ts +132 -0
  155. package/src/calls/__tests__/relay-setup-router.test.ts +350 -0
  156. package/src/calls/call-pointer-messages.ts +10 -4
  157. package/src/calls/channel-admission-reader.ts +104 -0
  158. package/src/calls/guardian-dispatch.ts +17 -45
  159. package/src/calls/media-stream-server.ts +84 -2
  160. package/src/calls/relay-access-wait.ts +1 -1
  161. package/src/calls/relay-server.ts +66 -0
  162. package/src/calls/relay-setup-router.ts +82 -1
  163. package/src/calls/twilio-routes.ts +17 -8
  164. package/src/calls/voice-session-bridge.ts +2 -2
  165. package/src/cli/commands/clients.ts +3 -0
  166. package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v2-compare-render.test.ts +1 -1
  167. package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v2.test.ts +8 -7
  168. package/src/cli/commands/{__tests__ → memory/__tests__}/memory-v3.test.ts +5 -4
  169. package/src/cli/commands/memory/index.ts +30 -0
  170. package/src/cli/commands/{memory-v2-compare-render.ts → memory/memory-v2-compare-render.ts} +1 -1
  171. package/src/cli/commands/{memory-v2.ts → memory/memory-v2.ts} +6 -15
  172. package/src/cli/commands/{memory-v3.ts → memory/memory-v3.ts} +97 -11
  173. package/src/cli/commands/oauth/status.test.ts +36 -0
  174. package/src/cli/commands/oauth/status.ts +23 -3
  175. package/src/cli/commands/plugins.ts +197 -4
  176. package/src/cli/lib/__tests__/diff-plugin.test.ts +443 -0
  177. package/src/cli/lib/__tests__/inspect-plugin.test.ts +54 -0
  178. package/src/cli/lib/__tests__/merge-plugin-tree.test.ts +443 -0
  179. package/src/cli/lib/__tests__/plugin-surfaces.test.ts +111 -0
  180. package/src/cli/lib/__tests__/upgrade-plugin.test.ts +295 -2
  181. package/src/cli/lib/diff-plugin.ts +346 -0
  182. package/src/cli/lib/inspect-plugin.ts +12 -1
  183. package/src/cli/lib/install-from-github.ts +105 -17
  184. package/src/cli/lib/merge-plugin-tree.ts +328 -0
  185. package/src/cli/lib/plugin-fingerprint.ts +14 -0
  186. package/src/cli/lib/plugin-surfaces.ts +104 -0
  187. package/src/cli/lib/upgrade-plugin.ts +298 -10
  188. package/src/cli/program.ts +2 -6
  189. package/src/config/__tests__/sync-gated-profiles.test.ts +368 -0
  190. package/src/config/assistant-feature-flags.ts +22 -7
  191. package/src/config/bundled-skills/contacts/tools/contact-search.ts +0 -1
  192. package/src/config/bundled-skills/messaging/SKILL.md +6 -4
  193. package/src/config/bundled-skills/messaging/tools/messaging-archive-by-sender.ts +9 -8
  194. package/src/config/bundled-skills/subagent/SKILL.md +4 -0
  195. package/src/config/bundled-skills/subagent/TOOLS.json +4 -0
  196. package/src/config/bundled-skills/workflows/SKILL.md +14 -8
  197. package/src/config/bundled-tool-registry.ts +2 -7
  198. package/src/config/call-site-defaults.ts +15 -2
  199. package/src/config/feature-flag-registry.json +46 -31
  200. package/src/config/inference-profile-validation.ts +26 -0
  201. package/src/config/llm-resolver.ts +3 -0
  202. package/src/config/loader.ts +4 -0
  203. package/src/config/memory-v3-gate.ts +11 -0
  204. package/src/config/profile-order.ts +28 -0
  205. package/src/config/schema.ts +8 -6
  206. package/src/config/schemas/__tests__/memory-v3.test.ts +1 -0
  207. package/src/config/schemas/call-site-catalog.ts +7 -0
  208. package/src/config/schemas/channels.ts +11 -0
  209. package/src/config/schemas/elevenlabs.ts +0 -1
  210. package/src/config/schemas/llm.ts +31 -0
  211. package/src/config/schemas/memory-lifecycle.ts +3 -7
  212. package/src/config/schemas/memory-v3.ts +6 -0
  213. package/src/config/schemas/platform.ts +0 -8
  214. package/src/config/schemas/services.ts +18 -0
  215. package/src/config/seed-inference-profiles.ts +109 -44
  216. package/src/config/skills.ts +21 -0
  217. package/src/config/sync-gated-profiles.ts +220 -0
  218. package/src/contacts/contact-store.ts +89 -106
  219. package/src/contacts/contacts-write.ts +5 -22
  220. package/src/contacts/types.ts +0 -1
  221. package/src/context/compactor.ts +88 -54
  222. package/src/context/strip-injections.ts +58 -10
  223. package/src/context/token-estimator.ts +1 -1
  224. package/src/credential-execution/process-manager.ts +55 -14
  225. package/src/credential-execution/prompted-credential.ts +2 -3
  226. package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -2
  227. package/src/daemon/config-watcher.ts +0 -4
  228. package/src/daemon/conversation-agent-loop-handlers.ts +2 -0
  229. package/src/daemon/conversation-agent-loop.ts +114 -22
  230. package/src/daemon/conversation-history.ts +1 -1
  231. package/src/daemon/conversation-lifecycle.ts +3 -5
  232. package/src/daemon/conversation-process.ts +13 -5
  233. package/src/daemon/conversation-runtime-assembly.ts +13 -15
  234. package/src/daemon/conversation-slash.ts +2 -23
  235. package/src/daemon/conversation-surfaces.ts +26 -0
  236. package/src/daemon/conversation-tool-setup.ts +27 -14
  237. package/src/daemon/conversation.ts +66 -14
  238. package/src/daemon/disk-pressure-policy.ts +5 -3
  239. package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +0 -1
  240. package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +0 -1
  241. package/src/daemon/handlers/config-a2a.ts +0 -2
  242. package/src/daemon/handlers/config-channels.ts +15 -16
  243. package/src/daemon/handlers/config-slack-channel.ts +22 -3
  244. package/src/daemon/handlers/conversations.ts +107 -0
  245. package/src/daemon/host-browser-proxy.ts +41 -0
  246. package/src/daemon/lifecycle.ts +55 -27
  247. package/src/daemon/message-provenance.ts +2 -0
  248. package/src/daemon/message-types/contacts.ts +0 -1
  249. package/src/daemon/message-types/conversations.ts +3 -3
  250. package/src/daemon/message-types/sync.ts +0 -1
  251. package/src/daemon/message-types/web-activity.ts +7 -1
  252. package/src/daemon/message-types/workflows.ts +83 -1
  253. package/src/daemon/orphan-reaper.test.ts +0 -19
  254. package/src/daemon/orphan-reaper.ts +2 -24
  255. package/src/daemon/server.ts +0 -10
  256. package/src/daemon/tool-setup-types.ts +4 -0
  257. package/src/daemon/trust-context.ts +1 -1
  258. package/src/events/tool-audit-listener.ts +2 -2
  259. package/src/home/feed-source-enrichment.test.ts +151 -0
  260. package/src/home/feed-source-enrichment.ts +176 -0
  261. package/src/home/relationship-state.ts +2 -4
  262. package/src/instrument.ts +18 -6
  263. package/src/ipc/__tests__/binary-result-ipc.test.ts +81 -0
  264. package/src/ipc/__tests__/clients-list-ipc.test.ts +20 -0
  265. package/src/ipc/assistant-server.ts +37 -4
  266. package/src/ipc/gateway-flag-listener.ts +18 -2
  267. package/src/memory/__tests__/auto-analysis-enqueue.test.ts +5 -16
  268. package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +7 -11
  269. package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +37 -7
  270. package/src/memory/__tests__/memory-retrospective-job.test.ts +229 -401
  271. package/src/memory/__tests__/onboarding-events-store.test.ts +7 -7
  272. package/src/memory/auth-fallback-events-store.ts +2 -2
  273. package/src/memory/auto-analysis-enqueue.ts +3 -5
  274. package/src/memory/bookmark-crud.ts +1 -2
  275. package/src/memory/canonical-guardian-store.ts +39 -1
  276. package/src/memory/conversation-crud.ts +9 -4
  277. package/src/memory/conversation-key-store.ts +17 -2
  278. package/src/memory/conversation-title-service.ts +64 -7
  279. package/src/memory/db-init.ts +17 -17
  280. package/src/memory/embedding-backend.ts +38 -1
  281. package/src/memory/embedding-billing-breaker.ts +96 -0
  282. package/src/memory/jobs-store.ts +25 -13
  283. package/src/memory/jobs-worker.ts +54 -1
  284. package/src/memory/lifecycle-events-store.ts +2 -2
  285. package/src/memory/memory-retrospective-constants.ts +4 -4
  286. package/src/memory/memory-retrospective-enqueue.ts +31 -6
  287. package/src/memory/memory-retrospective-job.ts +28 -227
  288. package/src/memory/migrations/129-contact-channels-access-fields.ts +18 -9
  289. package/src/memory/migrations/131-drop-legacy-member-guardian-tables.ts +14 -2
  290. package/src/memory/migrations/289-contact-channels-unique-ext-user.ts +10 -0
  291. package/src/memory/migrations/291-contact-channels-renormalize-addresses.ts +72 -0
  292. package/src/memory/migrations/292-schedule-default-no-reuse-conversation.test.ts +67 -0
  293. package/src/memory/migrations/292-schedule-default-no-reuse-conversation.ts +25 -0
  294. package/src/memory/migrations/293-workflow-journal-leaf-tokens.ts +32 -0
  295. package/src/memory/migrations/294-drop-external-user-id.ts +31 -0
  296. package/src/memory/migrations/295-drop-approval-prompt-ts-tracker.ts +20 -0
  297. package/src/memory/migrations/296-rewrite-balanced-economy-profile-pins.test.ts +110 -0
  298. package/src/memory/migrations/296-rewrite-balanced-economy-profile-pins.ts +68 -0
  299. package/src/memory/migrations/__tests__/131-drop-legacy-member-guardian-tables.test.ts +154 -0
  300. package/src/memory/migrations/__tests__/289-contact-channels-unique-ext-user.test.ts +31 -0
  301. package/src/memory/migrations/__tests__/291-contact-channels-renormalize-addresses.test.ts +341 -0
  302. package/src/memory/migrations/__tests__/run-migrations.test.ts +52 -0
  303. package/src/memory/migrations/index.ts +6 -0
  304. package/src/memory/migrations/run-migrations.ts +41 -0
  305. package/src/memory/migrations/validate-migration-state.ts +1 -1
  306. package/src/memory/onboarding-events-store.ts +3 -3
  307. package/src/memory/schema/contacts.ts +0 -5
  308. package/src/memory/skill-loaded-events-store.test.ts +7 -15
  309. package/src/memory/skill-loaded-events-store.ts +2 -2
  310. package/src/memory/tool-executed-events-store.test.ts +7 -7
  311. package/src/memory/turn-trace-store.test.ts +736 -0
  312. package/src/memory/turn-trace-store.ts +364 -0
  313. package/src/memory/v2/__tests__/consolidation-job.test.ts +8 -0
  314. package/src/memory/v2/__tests__/skill-content.test.ts +30 -0
  315. package/src/memory/v2/consolidation-job.ts +2 -2
  316. package/src/memory/v2/skill-content.ts +25 -7
  317. package/src/memory/v2/skill-store.ts +7 -1
  318. package/src/memory/v3-eval/__tests__/eval-packets.test.ts +248 -0
  319. package/src/memory/v3-eval/eval-packets.ts +546 -0
  320. package/src/messaging/providers/slack/adapter.ts +1 -1
  321. package/src/messaging/providers/slack/api.ts +31 -0
  322. package/src/messaging/providers/slack/send.test.ts +114 -2
  323. package/src/messaging/providers/slack/send.ts +30 -7
  324. package/src/messaging/providers/slack/withdraw.test.ts +200 -0
  325. package/src/messaging/providers/slack/withdraw.ts +161 -0
  326. package/src/notifications/AGENTS.md +2 -0
  327. package/src/notifications/access-request-copy.ts +72 -59
  328. package/src/notifications/adapters/shared.ts +29 -0
  329. package/src/notifications/adapters/slack.ts +58 -103
  330. package/src/notifications/adapters/telegram.ts +2 -20
  331. package/src/notifications/approval-card-data.ts +333 -0
  332. package/src/notifications/broadcaster.ts +16 -3
  333. package/src/notifications/canonical-delivery-recorder.ts +139 -0
  334. package/src/notifications/copy-composer.ts +3 -3
  335. package/src/notifications/decision-engine.ts +4 -2
  336. package/src/notifications/destination-resolver.ts +4 -6
  337. package/src/notifications/guardian-question-mode.ts +10 -0
  338. package/src/notifications/home-feed-side-effect.ts +7 -16
  339. package/src/notifications/notification-utils.ts +19 -20
  340. package/src/notifications/signal.ts +79 -43
  341. package/src/notifications/types.ts +98 -121
  342. package/src/oauth/AGENTS.md +5 -24
  343. package/src/permissions/checker.test.ts +51 -0
  344. package/src/permissions/checker.ts +185 -26
  345. package/src/permissions/ipc-risk-types.ts +24 -0
  346. package/src/permissions/question-prompter.test.ts +27 -0
  347. package/src/permissions/question-prompter.ts +4 -0
  348. package/src/platform/client.test.ts +119 -0
  349. package/src/platform/client.ts +66 -0
  350. package/src/platform/consent-cache.test.ts +267 -0
  351. package/src/platform/consent-cache.ts +174 -0
  352. package/src/plugin-api/constants.ts +1 -1
  353. package/src/plugin-api/index.ts +33 -1
  354. package/src/plugin-api/model-profiles.ts +33 -0
  355. package/src/plugin-api/types.ts +50 -2
  356. package/src/plugins/defaults/advisor/__tests__/advisor-gate.test.ts +56 -0
  357. package/src/plugins/defaults/advisor/__tests__/advisor-state-store.test.ts +43 -0
  358. package/src/plugins/defaults/advisor/__tests__/agent-loop-integration.test.ts +137 -0
  359. package/src/plugins/defaults/advisor/__tests__/consult.test.ts +153 -0
  360. package/src/plugins/defaults/advisor/__tests__/hooks.test.ts +138 -0
  361. package/src/plugins/defaults/advisor/__tests__/transcript.test.ts +147 -0
  362. package/src/plugins/defaults/advisor/advisor-gate.ts +29 -0
  363. package/src/plugins/defaults/advisor/advisor-state-store.ts +94 -0
  364. package/src/plugins/defaults/advisor/config.ts +21 -0
  365. package/src/plugins/defaults/advisor/consult.ts +93 -0
  366. package/src/plugins/defaults/advisor/hooks/post-model-call.ts +34 -0
  367. package/src/plugins/defaults/advisor/hooks/pre-model-call.ts +30 -0
  368. package/src/plugins/defaults/advisor/hooks/user-prompt-submit.ts +19 -0
  369. package/src/plugins/defaults/advisor/package.json +14 -0
  370. package/src/plugins/defaults/advisor/steering.ts +67 -0
  371. package/src/plugins/defaults/advisor/tools/advisor.ts +65 -0
  372. package/src/plugins/defaults/advisor/transcript.ts +76 -0
  373. package/src/plugins/defaults/index.ts +60 -0
  374. package/src/plugins/defaults/memory-retrieval/hooks/post-compact.ts +22 -9
  375. package/src/plugins/defaults/memory-retrieval/hooks/user-prompt-submit.ts +2 -2
  376. package/src/plugins/defaults/memory-retrieval/tail-reinjection-strip.ts +64 -0
  377. package/src/plugins/defaults/memory-retrieval/unified-turn-context.ts +29 -21
  378. package/src/plugins/defaults/memory-v3-shadow/__tests__/carry-integration.test.ts +1 -0
  379. package/src/plugins/defaults/memory-v3-shadow/__tests__/injection.test.ts +1 -0
  380. package/src/plugins/defaults/memory-v3-shadow/__tests__/maintain-job.test.ts +129 -9
  381. package/src/plugins/defaults/memory-v3-shadow/__tests__/orchestrate.test.ts +31 -4
  382. package/src/plugins/defaults/memory-v3-shadow/__tests__/selection-log-store.test.ts +77 -2
  383. package/src/plugins/defaults/memory-v3-shadow/__tests__/shadow-plugin.test.ts +1 -0
  384. package/src/plugins/defaults/memory-v3-shadow/injector.ts +7 -10
  385. package/src/plugins/defaults/memory-v3-shadow/maintain-job.ts +144 -11
  386. package/src/plugins/defaults/memory-v3-shadow/orchestrate.ts +32 -20
  387. package/src/plugins/defaults/memory-v3-shadow/selection-log-store.ts +56 -3
  388. package/src/plugins/defaults/memory-v3-shadow/shadow-plugin.ts +23 -2
  389. package/src/plugins/defaults/surface-completion-nudge/hooks/post-model-call.ts +276 -0
  390. package/src/plugins/defaults/surface-completion-nudge/hooks/stop.ts +22 -0
  391. package/src/plugins/defaults/surface-completion-nudge/nudge-state-store.ts +46 -0
  392. package/src/plugins/defaults/surface-completion-nudge/package.json +14 -0
  393. package/src/plugins/defaults/task-progress-nudge/hooks/post-tool-use.ts +3 -13
  394. package/src/plugins/defaults/title-generate/hooks/stop.ts +56 -21
  395. package/src/prompts/persona-resolver.ts +14 -4
  396. package/src/prompts/templates/system-sections.ts +7 -2
  397. package/src/providers/__tests__/provider-env-vars.test.ts +6 -0
  398. package/src/providers/__tests__/provider-secret-catalog.test.ts +1 -0
  399. package/src/providers/__tests__/retry-callsite.test.ts +176 -0
  400. package/src/providers/atlascloud/client.ts +85 -0
  401. package/src/providers/fetch-provider-catalog.ts +85 -0
  402. package/src/providers/inference/adapter-factory.ts +3 -0
  403. package/src/providers/model-catalog.ts +58 -0
  404. package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +33 -0
  405. package/src/providers/openai/chat-completions-provider.ts +7 -0
  406. package/src/providers/openai/responses-provider.ts +10 -0
  407. package/src/providers/provider-send-message.ts +11 -3
  408. package/src/providers/retry.ts +53 -12
  409. package/src/providers/search-provider-catalog.ts +10 -0
  410. package/src/providers/weak-open-model.ts +22 -0
  411. package/src/runtime/AGENTS.md +0 -1
  412. package/src/runtime/__tests__/agent-wake.test.ts +181 -0
  413. package/src/runtime/__tests__/client-health.test.ts +44 -0
  414. package/src/runtime/access-request-helper.ts +21 -53
  415. package/src/runtime/actor-trust-resolver.ts +59 -63
  416. package/src/runtime/agent-wake.ts +52 -0
  417. package/src/runtime/assistant-event-hub.ts +18 -4
  418. package/src/runtime/auth/__tests__/route-policy.test.ts +12 -0
  419. package/src/runtime/auth/require-bound-guardian.ts +1 -4
  420. package/src/runtime/btw-sidechain.ts +3 -6
  421. package/src/runtime/capabilities.test.ts +120 -0
  422. package/src/runtime/capabilities.ts +197 -0
  423. package/src/runtime/channel-approval-types.ts +22 -45
  424. package/src/runtime/channel-invite-transports/telegram.ts +4 -4
  425. package/src/runtime/channel-retry-sweep.ts +1 -0
  426. package/src/runtime/channel-verification-service.ts +3 -3
  427. package/src/runtime/client-health.ts +26 -0
  428. package/src/runtime/confirmation-request-guardian-bridge.ts +38 -29
  429. package/src/runtime/effective-capabilities.test.ts +128 -0
  430. package/src/runtime/effective-capabilities.ts +84 -0
  431. package/src/runtime/guardian-reply-router.ts +106 -21
  432. package/src/runtime/invite-redemption-service.ts +9 -25
  433. package/src/runtime/migrations/__tests__/vbundle-builder-fd-leak.test.ts +123 -0
  434. package/src/runtime/migrations/vbundle-builder.ts +49 -20
  435. package/src/runtime/pending-interactions.ts +15 -0
  436. package/src/runtime/routes/__tests__/client-routes.test.ts +13 -0
  437. package/src/runtime/routes/__tests__/conversation-management-routes.test.ts +67 -0
  438. package/src/runtime/routes/__tests__/plugins-routes.test.ts +240 -1
  439. package/src/runtime/routes/app-routes.ts +1 -1
  440. package/src/runtime/routes/approval-strategies/guardian-callback-strategy.ts +2 -2
  441. package/src/runtime/routes/assets/vellum-design-system.css +1959 -0
  442. package/src/runtime/routes/browser-tabs-routes.ts +9 -0
  443. package/src/runtime/routes/btw-routes.ts +1 -27
  444. package/src/runtime/routes/canonical-guardian-expiry-sweep.ts +17 -8
  445. package/src/runtime/routes/client-routes.ts +10 -0
  446. package/src/runtime/routes/contact-routes.ts +31 -8
  447. package/src/runtime/routes/conversation-compaction-routes.ts +1 -1
  448. package/src/runtime/routes/conversation-management-routes.ts +80 -1
  449. package/src/runtime/routes/conversation-query-routes.ts +68 -22
  450. package/src/runtime/routes/conversation-routes.ts +39 -14
  451. package/src/runtime/routes/credential-routes.ts +40 -16
  452. package/src/runtime/routes/empty-state-greeting-cache.ts +1 -2
  453. package/src/runtime/routes/events-routes.ts +1 -3
  454. package/src/runtime/routes/guardian-approval-interception.ts +14 -73
  455. package/src/runtime/routes/guardian-approval-prompt.ts +22 -4
  456. package/src/runtime/routes/home-feed-routes.ts +8 -3
  457. package/src/runtime/routes/identity-routes.ts +1 -296
  458. package/src/runtime/routes/inbound-message-handler.ts +214 -228
  459. package/src/runtime/routes/inbound-stages/acl-enforcement.ts +89 -7
  460. package/src/runtime/routes/inbound-stages/admission-policy.test.ts +154 -0
  461. package/src/runtime/routes/inbound-stages/admission-policy.ts +140 -0
  462. package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +3 -3
  463. package/src/runtime/routes/inbound-stages/background-dispatch.ts +11 -6
  464. package/src/runtime/routes/inbound-stages/escalation-intercept.ts +1 -2
  465. package/src/runtime/routes/inbound-stages/guardian-activation-intercept.ts +1 -2
  466. package/src/runtime/routes/inbound-stages/guardian-reply-intercept.test.ts +7 -7
  467. package/src/runtime/routes/inbound-stages/guardian-reply-intercept.ts +47 -28
  468. package/src/runtime/routes/inbound-stages/reaction-intercept.ts +358 -0
  469. package/src/runtime/routes/index.ts +2 -0
  470. package/src/runtime/routes/integrations/slack/__tests__/channel.test.ts +8 -0
  471. package/src/runtime/routes/integrations/slack/channel.ts +36 -0
  472. package/src/runtime/routes/internal-telemetry-routes.ts +1 -1
  473. package/src/runtime/routes/mcp-auth-routes.ts +233 -41
  474. package/src/runtime/routes/memory-eval-routes.ts +87 -0
  475. package/src/runtime/routes/notification-routes.ts +122 -133
  476. package/src/runtime/routes/platform-routes.ts +2 -2
  477. package/src/runtime/routes/plugins-routes.ts +202 -3
  478. package/src/runtime/routes/schedule-routes.ts +0 -22
  479. package/src/runtime/routes/secret-routes.ts +10 -0
  480. package/src/runtime/routes/surface-action-routes.ts +2 -1
  481. package/src/runtime/routes/tool-call-question-enrichment.test.ts +146 -0
  482. package/src/runtime/routes/tool-call-question-enrichment.ts +66 -0
  483. package/src/runtime/routes/workflow-routes.test.ts +229 -44
  484. package/src/runtime/routes/workflow-routes.ts +131 -29
  485. package/src/runtime/routes/workspace-greetings.ts +55 -0
  486. package/src/runtime/sync/resource-sync-events.ts +1 -11
  487. package/src/runtime/tool-grant-request-helper.ts +18 -16
  488. package/src/runtime/trust-context-resolver.ts +8 -5
  489. package/src/schedule/inference-profile.ts +2 -14
  490. package/src/schedule/schedule-store.ts +1 -1
  491. package/src/schedule/scheduler-types.ts +5 -1
  492. package/src/security/__tests__/provider-key-env-fallback.test.ts +6 -0
  493. package/src/security/secret-patterns.ts +3 -0
  494. package/src/subagent/manager.ts +17 -4
  495. package/src/subagent/types.ts +6 -0
  496. package/src/telemetry/trace-collection-policy.test.ts +28 -0
  497. package/src/telemetry/trace-collection-policy.ts +30 -0
  498. package/src/telemetry/types.ts +89 -0
  499. package/src/telemetry/usage-telemetry-reporter.test.ts +586 -36
  500. package/src/telemetry/usage-telemetry-reporter.ts +148 -41
  501. package/src/tools/AGENTS.md +3 -3
  502. package/src/tools/browser/__tests__/browser-execution-acquire.test.ts +31 -0
  503. package/src/tools/browser/browser-execution.ts +30 -19
  504. package/src/tools/document/document-tool.ts +2 -3
  505. package/src/tools/executor.ts +5 -3
  506. package/src/tools/host-terminal/host-shell.ts +5 -4
  507. package/src/tools/memory/register.ts +2 -2
  508. package/src/tools/network/__tests__/web-fetch-firecrawl.test.ts +360 -0
  509. package/src/tools/network/__tests__/web-search.test.ts +143 -0
  510. package/src/tools/network/web-fetch.ts +372 -1
  511. package/src/tools/network/web-search-error.ts +1 -1
  512. package/src/tools/network/web-search.ts +213 -10
  513. package/src/tools/permission-checker.ts +4 -3
  514. package/src/tools/registry.ts +20 -0
  515. package/src/tools/schedule/create.ts +7 -12
  516. package/src/tools/schedule/update.ts +4 -11
  517. package/src/tools/shared/filesystem/path-policy.ts +39 -13
  518. package/src/tools/side-effects.ts +2 -17
  519. package/src/tools/skills/execute.ts +33 -0
  520. package/src/tools/subagent/spawn.ts +61 -12
  521. package/src/tools/terminal/shell.ts +10 -4
  522. package/src/tools/tool-approval-handler.ts +18 -13
  523. package/src/tools/tool-manifest.ts +0 -2
  524. package/src/tools/types.ts +9 -0
  525. package/src/tools/ui-surface/definitions.ts +64 -3
  526. package/src/tools/verification-control-plane-policy.ts +3 -1
  527. package/src/tools/workflows/run-workflow.test.ts +8 -18
  528. package/src/tools/workflows/run-workflow.ts +1 -0
  529. package/src/util/disk-usage.ts +78 -23
  530. package/src/util/platform.ts +10 -3
  531. package/src/watcher/telemetry.ts +2 -2
  532. package/src/workflows/capabilities.ts +2 -3
  533. package/src/workflows/engine.test.ts +175 -1
  534. package/src/workflows/engine.ts +82 -0
  535. package/src/workflows/journal-store.test.ts +70 -0
  536. package/src/workflows/journal-store.ts +18 -3
  537. package/src/workflows/run-manager.test.ts +171 -28
  538. package/src/workflows/run-manager.ts +66 -24
  539. package/src/workspace/migrations/105-enable-memory-v3-live-for-new-workspaces.ts +63 -0
  540. package/src/workspace/migrations/106-drop-collect-usage-data.ts +47 -0
  541. package/src/workspace/migrations/107-drop-send-diagnostics.ts +47 -0
  542. package/src/workspace/migrations/108-drop-balanced-economy-profile.ts +129 -0
  543. package/src/workspace/migrations/registry.ts +8 -0
  544. package/src/__tests__/app-control-no-global-cgevent.test.ts +0 -98
  545. package/src/__tests__/credential-security-e2e.test.ts +0 -362
  546. package/src/__tests__/credential-vault-unit.test.ts +0 -1528
  547. package/src/__tests__/credential-vault.test.ts +0 -1706
  548. package/src/__tests__/identity-intro-cache.test.ts +0 -315
  549. package/src/__tests__/secret-onetime-send.test.ts +0 -182
  550. package/src/cli/commands/__tests__/task.test.ts +0 -914
  551. package/src/cli/commands/task.ts +0 -771
  552. package/src/config/bundled-skills/personal-page/SKILL.md +0 -57
  553. package/src/config/bundled-skills/personal-page/TOOLS.json +0 -27
  554. package/src/config/bundled-skills/personal-page/tools/app-refresh.ts +0 -17
  555. package/src/config/preloaded-apps/personal-page/src/components/About.tsx +0 -22
  556. package/src/config/preloaded-apps/personal-page/src/components/App.tsx +0 -16
  557. package/src/config/preloaded-apps/personal-page/src/components/Features.tsx +0 -77
  558. package/src/config/preloaded-apps/personal-page/src/components/Hero.tsx +0 -57
  559. package/src/config/preloaded-apps/personal-page/src/components/Pending.tsx +0 -28
  560. package/src/config/preloaded-apps/personal-page/src/components/animations.tsx +0 -234
  561. package/src/config/preloaded-apps/personal-page/src/components/icons.tsx +0 -48
  562. package/src/config/preloaded-apps/personal-page/src/components/media.ts +0 -16
  563. package/src/config/preloaded-apps/personal-page/src/index.html +0 -20
  564. package/src/config/preloaded-apps/personal-page/src/main.tsx +0 -7
  565. package/src/config/preloaded-apps/personal-page/src/profile-data.ts +0 -82
  566. package/src/config/preloaded-apps/personal-page/src/styles.css +0 -759
  567. package/src/memory/__tests__/preloaded-apps.test.ts +0 -85
  568. package/src/memory/preloaded-apps.ts +0 -116
  569. package/src/notifications/tool-approval-copy.ts +0 -142
  570. package/src/runtime/routes/approval-prompt-ts-tracker.ts +0 -78
  571. package/src/runtime/routes/identity-intro-cache.ts +0 -172
  572. package/src/tools/credentials/vault.ts +0 -712
@@ -0,0 +1,736 @@
1
+ /**
2
+ * Tests for the turn-trace assembler.
3
+ *
4
+ * Verifies that a turn's transcript (user message, assistant responses, and
5
+ * tool_result rows) plus its tool invocations are gathered into a faithful,
6
+ * window-bounded trace, that the window stops at the next REAL user turn (and
7
+ * never at the turn's own tool-result rows), that tool inputs/results are
8
+ * captured verbatim (no field-level redaction), that coalesced-batch turns
9
+ * trace their natural windows (head user-only, shared response on the final
10
+ * batched turn — no batch inference), and that the size cap omits oversized
11
+ * traces fail-closed.
12
+ */
13
+
14
+ import { beforeEach, describe, expect, mock, test } from "bun:test";
15
+
16
+ import { makeMockLogger } from "../__tests__/helpers/mock-logger.js";
17
+
18
+ mock.module("../util/logger.js", () => ({
19
+ getLogger: () => makeMockLogger(),
20
+ }));
21
+
22
+ // Control the live-conversation lookup so `isTurnSettled` can be exercised
23
+ // without a running agent loop. Returns `undefined` (no live conversation) by
24
+ // default; tests set a fake with a chosen `isProcessing()`.
25
+ let mockLiveConversation: { isProcessing: () => boolean } | undefined;
26
+ mock.module("../daemon/conversation-registry.js", () => ({
27
+ findConversation: () => mockLiveConversation,
28
+ }));
29
+
30
+ import { createConversation } from "./conversation-crud.js";
31
+ import { getDb } from "./db-connection.js";
32
+ import { initializeDb } from "./db-init.js";
33
+ import { messages, toolInvocations } from "./schema.js";
34
+ import {
35
+ assembleBoundedTurnTrace,
36
+ assembleTurnTrace,
37
+ isTurnSettled,
38
+ MAX_TRACE_SERIALIZED_BYTES,
39
+ type TurnTraceBoundary,
40
+ } from "./turn-trace-store.js";
41
+
42
+ initializeDb();
43
+
44
+ function purge(): void {
45
+ const db = getDb();
46
+ db.run("DELETE FROM tool_invocations");
47
+ db.run("DELETE FROM messages");
48
+ db.run("DELETE FROM conversations");
49
+ }
50
+
51
+ beforeEach(() => {
52
+ purge();
53
+ mockLiveConversation = undefined;
54
+ });
55
+
56
+ interface MessageSeed {
57
+ id: string;
58
+ role: "user" | "assistant" | "system";
59
+ content: unknown;
60
+ createdAt: number;
61
+ }
62
+
63
+ function insertMessage(conversationId: string, seed: MessageSeed): void {
64
+ getDb()
65
+ .insert(messages)
66
+ .values({
67
+ id: seed.id,
68
+ conversationId,
69
+ role: seed.role,
70
+ content:
71
+ typeof seed.content === "string"
72
+ ? seed.content
73
+ : JSON.stringify(seed.content),
74
+ createdAt: seed.createdAt,
75
+ })
76
+ .run();
77
+ }
78
+
79
+ interface ToolSeed {
80
+ id: string;
81
+ toolName: string;
82
+ input: string;
83
+ result: string;
84
+ decision?: string;
85
+ durationMs?: number;
86
+ createdAt: number;
87
+ }
88
+
89
+ function insertTool(conversationId: string, seed: ToolSeed): void {
90
+ getDb()
91
+ .insert(toolInvocations)
92
+ .values({
93
+ id: seed.id,
94
+ conversationId,
95
+ toolName: seed.toolName,
96
+ input: seed.input,
97
+ result: seed.result,
98
+ decision: seed.decision ?? "allow",
99
+ riskLevel: "low",
100
+ durationMs: seed.durationMs ?? 5,
101
+ createdAt: seed.createdAt,
102
+ })
103
+ .run();
104
+ }
105
+
106
+ function boundary(
107
+ conversationId: string,
108
+ userMessageId: string,
109
+ createdAt: number,
110
+ ): TurnTraceBoundary {
111
+ return { conversationId, userMessageId, userMessageCreatedAt: createdAt };
112
+ }
113
+
114
+ describe("assembleTurnTrace", () => {
115
+ test("gathers user message, assistant responses, tool-result rows, and tool calls for a multi-message turn", () => {
116
+ const conv = createConversation({ conversationType: "standard" });
117
+
118
+ // Turn 1: user asks, assistant calls a tool, tool result lands as a
119
+ // role="user" row, assistant replies.
120
+ insertMessage(conv.id, {
121
+ id: "m-user-1",
122
+ role: "user",
123
+ content: [{ type: "text", text: "what's on my calendar?" }],
124
+ createdAt: 1000,
125
+ });
126
+ insertMessage(conv.id, {
127
+ id: "m-asst-1a",
128
+ role: "assistant",
129
+ content: [
130
+ {
131
+ type: "tool_use",
132
+ id: "tu-1",
133
+ name: "calendar_list_events",
134
+ input: { range: "today" },
135
+ },
136
+ ],
137
+ createdAt: 1100,
138
+ });
139
+ insertMessage(conv.id, {
140
+ id: "m-toolresult-1",
141
+ role: "user",
142
+ content: [
143
+ { type: "tool_result", tool_use_id: "tu-1", content: "2 events" },
144
+ ],
145
+ createdAt: 1200,
146
+ });
147
+ insertMessage(conv.id, {
148
+ id: "m-asst-1b",
149
+ role: "assistant",
150
+ content: [{ type: "text", text: "You have 2 events today." }],
151
+ createdAt: 1300,
152
+ });
153
+ insertTool(conv.id, {
154
+ id: "ti-1",
155
+ toolName: "calendar_list_events",
156
+ input: JSON.stringify({ range: "today" }),
157
+ result: JSON.stringify({ events: 2 }),
158
+ createdAt: 1150,
159
+ });
160
+
161
+ // Turn 2: next real user turn — must NOT be in turn 1's trace.
162
+ insertMessage(conv.id, {
163
+ id: "m-user-2",
164
+ role: "user",
165
+ content: [{ type: "text", text: "thanks" }],
166
+ createdAt: 2000,
167
+ });
168
+ insertTool(conv.id, {
169
+ id: "ti-2",
170
+ toolName: "noop",
171
+ input: "{}",
172
+ result: "{}",
173
+ createdAt: 2100,
174
+ });
175
+
176
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
177
+
178
+ expect(trace.schema_version).toBe(1);
179
+ // Window stops before turn 2: only turn-1 message rows, oldest-first.
180
+ expect(trace.messages.map((m) => m.id)).toEqual([
181
+ "m-user-1",
182
+ "m-asst-1a",
183
+ "m-toolresult-1",
184
+ "m-asst-1b",
185
+ ]);
186
+ // The tool-result row keeps role="user" (faithful to what the model saw).
187
+ const toolResultMsg = trace.messages.find((m) => m.id === "m-toolresult-1");
188
+ expect(toolResultMsg?.role).toBe("user");
189
+ // Content is parsed JSON (ContentBlock[]), not a string.
190
+ expect(Array.isArray(toolResultMsg?.content)).toBe(true);
191
+
192
+ // Only turn-1's tool invocation is in scope.
193
+ expect(trace.tool_calls.map((t) => t.id)).toEqual(["ti-1"]);
194
+ expect(trace.tool_calls[0]).toMatchObject({
195
+ tool_name: "calendar_list_events",
196
+ decision: "allow",
197
+ duration_ms: 5,
198
+ created_at: 1150,
199
+ });
200
+ // Result is forwarded verbatim.
201
+ expect(trace.tool_calls[0].result).toBe(JSON.stringify({ events: 2 }));
202
+ });
203
+
204
+ test("the final turn's window runs to the end of the conversation", () => {
205
+ const conv = createConversation({ conversationType: "standard" });
206
+ insertMessage(conv.id, {
207
+ id: "m-user-1",
208
+ role: "user",
209
+ content: [{ type: "text", text: "first" }],
210
+ createdAt: 1000,
211
+ });
212
+ insertMessage(conv.id, {
213
+ id: "m-user-2",
214
+ role: "user",
215
+ content: [{ type: "text", text: "second (latest)" }],
216
+ createdAt: 2000,
217
+ });
218
+ insertMessage(conv.id, {
219
+ id: "m-asst-2",
220
+ role: "assistant",
221
+ content: [{ type: "text", text: "reply to second" }],
222
+ createdAt: 2100,
223
+ });
224
+ insertTool(conv.id, {
225
+ id: "ti-late",
226
+ toolName: "noop",
227
+ input: "{}",
228
+ result: "ok",
229
+ createdAt: 2200,
230
+ });
231
+
232
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-2", 2000));
233
+ expect(trace.messages.map((m) => m.id)).toEqual(["m-user-2", "m-asst-2"]);
234
+ expect(trace.tool_calls.map((t) => t.id)).toEqual(["ti-late"]);
235
+ });
236
+
237
+ test("two real user turns sharing created_at: the first turn's trace is not truncated and excludes the second turn", () => {
238
+ // Forked conversations preserve the source `created_at` with fresh ids, so
239
+ // two real user messages can share a millisecond. A timestamp-only upper
240
+ // bound would equal the current turn's own `created_at` and empty the
241
+ // window — the compound `(created_at, id)` bound must keep this turn's rows
242
+ // (which sort by id at the shared millisecond) while excluding the next.
243
+ const conv = createConversation({ conversationType: "standard" });
244
+
245
+ // Turn 1 (id "m-user-1") and turn 2 (id "m-user-2") share created_at=1000.
246
+ // Turn 1's assistant reply, tool-result row, and tool call also land at
247
+ // 1000 — the worst case for a timestamp-only bound.
248
+ insertMessage(conv.id, {
249
+ id: "m-user-1",
250
+ role: "user",
251
+ content: [{ type: "text", text: "first (same ms)" }],
252
+ createdAt: 1000,
253
+ });
254
+ insertMessage(conv.id, {
255
+ id: "m-user-1-asst",
256
+ role: "assistant",
257
+ content: [{ type: "text", text: "reply to first" }],
258
+ createdAt: 1000,
259
+ });
260
+ insertMessage(conv.id, {
261
+ id: "m-user-1-toolresult",
262
+ role: "user",
263
+ content: [{ type: "tool_result", tool_use_id: "tu-1", content: "ok" }],
264
+ createdAt: 1000,
265
+ });
266
+ insertTool(conv.id, {
267
+ id: "ti-turn1",
268
+ toolName: "noop",
269
+ input: "{}",
270
+ result: "r1",
271
+ createdAt: 1000,
272
+ });
273
+
274
+ // Turn 2 user message + its content, same created_at=1000 (higher id).
275
+ insertMessage(conv.id, {
276
+ id: "m-user-2",
277
+ role: "user",
278
+ content: [{ type: "text", text: "second (same ms)" }],
279
+ createdAt: 1000,
280
+ });
281
+ insertMessage(conv.id, {
282
+ id: "m-user-2-asst",
283
+ role: "assistant",
284
+ content: [{ type: "text", text: "reply to second" }],
285
+ createdAt: 1000,
286
+ });
287
+
288
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
289
+
290
+ // Turn 1's rows (ids < "m-user-2" at ms 1000) are present; the trace is
291
+ // NOT truncated/emptied. The second user turn and its reply are excluded.
292
+ expect(trace.messages.map((m) => m.id)).toEqual([
293
+ "m-user-1",
294
+ "m-user-1-asst",
295
+ "m-user-1-toolresult",
296
+ ]);
297
+ // Turn 1's same-millisecond tool call is retained (degenerate `<=` window).
298
+ expect(trace.tool_calls.map((t) => t.id)).toEqual(["ti-turn1"]);
299
+ });
300
+
301
+ test("the SECOND of two same-created_at turns captures its own trace to end of conversation", () => {
302
+ // Complement of the previous test: assembling the trace for the later of
303
+ // two same-millisecond user turns must include only that turn's rows.
304
+ const conv = createConversation({ conversationType: "standard" });
305
+ insertMessage(conv.id, {
306
+ id: "m-user-1",
307
+ role: "user",
308
+ content: [{ type: "text", text: "first (same ms)" }],
309
+ createdAt: 1000,
310
+ });
311
+ insertMessage(conv.id, {
312
+ id: "m-user-1-asst",
313
+ role: "assistant",
314
+ content: [{ type: "text", text: "reply to first" }],
315
+ createdAt: 1000,
316
+ });
317
+ insertMessage(conv.id, {
318
+ id: "m-user-2",
319
+ role: "user",
320
+ content: [{ type: "text", text: "second (same ms, latest)" }],
321
+ createdAt: 1000,
322
+ });
323
+ insertMessage(conv.id, {
324
+ id: "m-user-2-asst",
325
+ role: "assistant",
326
+ content: [{ type: "text", text: "reply to second" }],
327
+ createdAt: 1100,
328
+ });
329
+
330
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-2", 1000));
331
+ expect(trace.messages.map((m) => m.id)).toEqual([
332
+ "m-user-2",
333
+ "m-user-2-asst",
334
+ ]);
335
+ });
336
+
337
+ test("a tool-result role=user row does NOT truncate the turn it belongs to", () => {
338
+ const conv = createConversation({ conversationType: "standard" });
339
+ insertMessage(conv.id, {
340
+ id: "m-user-1",
341
+ role: "user",
342
+ content: [{ type: "text", text: "do a thing" }],
343
+ createdAt: 1000,
344
+ });
345
+ // Tool-result row persisted as role="user" — must be treated as part of
346
+ // the turn, not as the next user turn.
347
+ insertMessage(conv.id, {
348
+ id: "m-toolresult",
349
+ role: "user",
350
+ content: [{ type: "tool_result", tool_use_id: "tu-x", content: "done" }],
351
+ createdAt: 1100,
352
+ });
353
+ insertMessage(conv.id, {
354
+ id: "m-asst-after-result",
355
+ role: "assistant",
356
+ content: [{ type: "text", text: "all done" }],
357
+ createdAt: 1200,
358
+ });
359
+
360
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
361
+ // All three rows belong to the single turn — the tool-result row did not
362
+ // close the window early.
363
+ expect(trace.messages.map((m) => m.id)).toEqual([
364
+ "m-user-1",
365
+ "m-toolresult",
366
+ "m-asst-after-result",
367
+ ]);
368
+ });
369
+
370
+ test("captures tool inputs verbatim — no field-level redaction, even for credential-shaped keys", () => {
371
+ // The consented trace is full-fidelity. Keys that look sensitive
372
+ // (access_token, api_key) are NOT redacted — the protections are the
373
+ // consent gate, the PII-segregated table, and its TTL, not redaction.
374
+ const conv = createConversation({ conversationType: "standard" });
375
+ insertMessage(conv.id, {
376
+ id: "m-user-1",
377
+ role: "user",
378
+ content: [{ type: "text", text: "use my token" }],
379
+ createdAt: 1000,
380
+ });
381
+ const rawInput = {
382
+ url: "https://api.example.com",
383
+ access_token: "super-secret-value",
384
+ nested: { api_key: "also-secret" },
385
+ };
386
+ insertTool(conv.id, {
387
+ id: "ti-secret",
388
+ toolName: "http_request",
389
+ input: JSON.stringify(rawInput),
390
+ result: JSON.stringify({ status: 200 }),
391
+ createdAt: 1100,
392
+ });
393
+
394
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
395
+ const call = trace.tool_calls[0];
396
+ // Parsed input matches the raw stored input exactly — including the
397
+ // credential-shaped values, which are present verbatim (not redacted).
398
+ expect(call.input).toEqual(rawInput);
399
+ const input = call.input as Record<string, unknown>;
400
+ expect(input.access_token).toBe("super-secret-value");
401
+ expect((input.nested as Record<string, unknown>).api_key).toBe(
402
+ "also-secret",
403
+ );
404
+ expect(JSON.stringify(call.input)).not.toContain("<redacted />");
405
+ // Result is also forwarded verbatim.
406
+ expect(call.result).toBe(JSON.stringify({ status: 200 }));
407
+ });
408
+
409
+ test("non-JSON tool input is forwarded as a raw string", () => {
410
+ const conv = createConversation({ conversationType: "standard" });
411
+ insertMessage(conv.id, {
412
+ id: "m-user-1",
413
+ role: "user",
414
+ content: [{ type: "text", text: "hi" }],
415
+ createdAt: 1000,
416
+ });
417
+ insertTool(conv.id, {
418
+ id: "ti-raw",
419
+ toolName: "bash",
420
+ input: "ls -la /tmp",
421
+ result: "ok",
422
+ createdAt: 1100,
423
+ });
424
+
425
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
426
+ expect(trace.tool_calls[0].input).toBe("ls -la /tmp");
427
+ });
428
+
429
+ test("legacy plain-string message content is forwarded as a string", () => {
430
+ const conv = createConversation({ conversationType: "standard" });
431
+ // A legacy row stored the content as a bare (JSON) string, not a block
432
+ // array. JSON.parse of a quoted string yields a string; an unquoted
433
+ // legacy value falls back to the raw string.
434
+ insertMessage(conv.id, {
435
+ id: "m-user-1",
436
+ role: "user",
437
+ content: "plain legacy text",
438
+ createdAt: 1000,
439
+ });
440
+ const trace = assembleTurnTrace(boundary(conv.id, "m-user-1", 1000));
441
+ expect(trace.messages[0].content).toBe("plain legacy text");
442
+ });
443
+
444
+ test("scopes the trace to a single conversation", () => {
445
+ const a = createConversation({ conversationType: "standard" });
446
+ const b = createConversation({ conversationType: "standard" });
447
+ insertMessage(a.id, {
448
+ id: "m-a-user",
449
+ role: "user",
450
+ content: [{ type: "text", text: "in A" }],
451
+ createdAt: 1000,
452
+ });
453
+ insertMessage(b.id, {
454
+ id: "m-b-user",
455
+ role: "user",
456
+ content: [{ type: "text", text: "in B" }],
457
+ createdAt: 1050,
458
+ });
459
+ insertTool(b.id, {
460
+ id: "ti-b",
461
+ toolName: "noop",
462
+ input: "{}",
463
+ result: "ok",
464
+ createdAt: 1060,
465
+ });
466
+
467
+ const trace = assembleTurnTrace(boundary(a.id, "m-a-user", 1000));
468
+ expect(trace.messages.map((m) => m.id)).toEqual(["m-a-user"]);
469
+ // Tool calls from conversation B never leak into A's trace.
470
+ expect(trace.tool_calls).toEqual([]);
471
+ });
472
+ });
473
+
474
+ describe("assembleTurnTrace — coalesced-batch natural windows", () => {
475
+ // The daemon coalesces queued user messages: drainBatch persists every
476
+ // batched user row, then runs ONE shared response attributed to the LAST
477
+ // batched user row. On disk: [u1][u2][u3][assistant + tools][u4][assistant2].
478
+ // No batch inference is attempted (there is no durable batch signal in the
479
+ // stored messages, and a batch head is indistinguishable from a turn that
480
+ // failed/cancelled before responding). Each turn just traces its natural
481
+ // window, which is faithful.
482
+ function seedThreeMessageBatch(convId: string): void {
483
+ insertMessage(convId, {
484
+ id: "u1",
485
+ role: "user",
486
+ content: [{ type: "text", text: "first batched" }],
487
+ createdAt: 1000,
488
+ });
489
+ insertMessage(convId, {
490
+ id: "u2",
491
+ role: "user",
492
+ content: [{ type: "text", text: "second batched" }],
493
+ createdAt: 1010,
494
+ });
495
+ insertMessage(convId, {
496
+ id: "u3",
497
+ role: "user",
498
+ content: [{ type: "text", text: "third batched (final)" }],
499
+ createdAt: 1020,
500
+ });
501
+ // Shared response written AFTER the last batched user row, with a tool call.
502
+ insertMessage(convId, {
503
+ id: "a-shared",
504
+ role: "assistant",
505
+ content: [
506
+ { type: "tool_use", id: "tu-1", name: "calendar", input: {} },
507
+ { type: "text", text: "shared reply to all three" },
508
+ ],
509
+ createdAt: 1030,
510
+ });
511
+ insertMessage(convId, {
512
+ id: "a-shared-toolresult",
513
+ role: "user",
514
+ content: [{ type: "tool_result", tool_use_id: "tu-1", content: "ok" }],
515
+ createdAt: 1040,
516
+ });
517
+ insertTool(convId, {
518
+ id: "ti-shared",
519
+ toolName: "calendar",
520
+ input: "{}",
521
+ result: "ok",
522
+ createdAt: 1035,
523
+ });
524
+ }
525
+
526
+ test("a batched HEAD turn's trace contains only its own user row (faithful, no batch field)", () => {
527
+ const conv = createConversation({ conversationType: "standard" });
528
+ seedThreeMessageBatch(conv.id);
529
+
530
+ const trace = assembleTurnTrace(boundary(conv.id, "u1", 1000));
531
+ // Natural window: just the head's own user row. Its window genuinely has no
532
+ // assistant response (the shared response is on the final batched turn).
533
+ expect(trace.messages.map((m) => m.id)).toEqual(["u1"]);
534
+ expect(trace.tool_calls).toEqual([]);
535
+ // No batch inference: the response is not duplicated onto the head, and the
536
+ // trace carries no `batch` field.
537
+ expect(JSON.stringify(trace)).not.toContain("shared reply to all three");
538
+ expect("batch" in trace).toBe(false);
539
+ });
540
+
541
+ test("a batched MIDDLE turn's trace also contains only its own user row", () => {
542
+ const conv = createConversation({ conversationType: "standard" });
543
+ seedThreeMessageBatch(conv.id);
544
+
545
+ const trace = assembleTurnTrace(boundary(conv.id, "u2", 1010));
546
+ expect(trace.messages.map((m) => m.id)).toEqual(["u2"]);
547
+ expect(trace.tool_calls).toEqual([]);
548
+ expect("batch" in trace).toBe(false);
549
+ });
550
+
551
+ test("the FINAL batched turn's trace contains the shared assistant response + tools", () => {
552
+ const conv = createConversation({ conversationType: "standard" });
553
+ seedThreeMessageBatch(conv.id);
554
+
555
+ // The shared response is attributed by the daemon to the last batched user
556
+ // row (lastUserMessageId == u3); u3's natural window includes it.
557
+ const trace = assembleTurnTrace(boundary(conv.id, "u3", 1020));
558
+ expect(trace.messages.map((m) => m.id)).toEqual([
559
+ "u3",
560
+ "a-shared",
561
+ "a-shared-toolresult",
562
+ ]);
563
+ expect(trace.tool_calls.map((t) => t.id)).toEqual(["ti-shared"]);
564
+ expect("batch" in trace).toBe(false);
565
+ });
566
+ });
567
+
568
+ describe("assembleBoundedTurnTrace", () => {
569
+ test("returns the trace when under the size cap", () => {
570
+ const conv = createConversation({ conversationType: "standard" });
571
+ insertMessage(conv.id, {
572
+ id: "m-user-1",
573
+ role: "user",
574
+ content: [{ type: "text", text: "small" }],
575
+ createdAt: 1000,
576
+ });
577
+ const trace = assembleBoundedTurnTrace(boundary(conv.id, "m-user-1", 1000));
578
+ expect(trace).not.toBeNull();
579
+ expect(trace?.messages.map((m) => m.id)).toEqual(["m-user-1"]);
580
+ });
581
+
582
+ test("omits (returns null) when the serialized trace exceeds the cap", () => {
583
+ const conv = createConversation({ conversationType: "standard" });
584
+ insertMessage(conv.id, {
585
+ id: "m-user-1",
586
+ role: "user",
587
+ content: [{ type: "text", text: "huge" }],
588
+ createdAt: 1000,
589
+ });
590
+ // A single oversized tool result pushes the trace past the cap.
591
+ insertTool(conv.id, {
592
+ id: "ti-huge",
593
+ toolName: "dump",
594
+ input: "{}",
595
+ result: "x".repeat(MAX_TRACE_SERIALIZED_BYTES + 1024),
596
+ createdAt: 1100,
597
+ });
598
+
599
+ const trace = assembleBoundedTurnTrace(boundary(conv.id, "m-user-1", 1000));
600
+ expect(trace).toBeNull();
601
+ });
602
+ });
603
+
604
+ describe("isTurnSettled", () => {
605
+ test("batched head with a later real user row is NOT settled while the conversation is processing", () => {
606
+ // Batched-message path: drainBatch persists the head user row AND the tail
607
+ // user row(s) up front, then runs ONE shared response. So the head has a
608
+ // later real user turn while the shared response is still in flight — it
609
+ // must NOT be treated as settled (the old "successor exists" shortcut would
610
+ // have shipped a partial trace for the head).
611
+ const conv = createConversation({ conversationType: "standard" });
612
+ insertMessage(conv.id, {
613
+ id: "m-user-1",
614
+ role: "user",
615
+ content: [{ type: "text", text: "head of batch" }],
616
+ createdAt: 1000,
617
+ });
618
+ insertMessage(conv.id, {
619
+ id: "m-user-2",
620
+ role: "user",
621
+ content: [{ type: "text", text: "tail of batch" }],
622
+ createdAt: 2000,
623
+ });
624
+ // Shared response still generating.
625
+ mockLiveConversation = { isProcessing: () => true };
626
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(false);
627
+ // The tail (latest turn) is likewise deferred while processing.
628
+ expect(isTurnSettled(boundary(conv.id, "m-user-2", 2000))).toBe(false);
629
+ });
630
+
631
+ test("the batched head settles once the shared response completes (conversation idle)", () => {
632
+ const conv = createConversation({ conversationType: "standard" });
633
+ insertMessage(conv.id, {
634
+ id: "m-user-1",
635
+ role: "user",
636
+ content: [{ type: "text", text: "head of batch" }],
637
+ createdAt: 1000,
638
+ });
639
+ insertMessage(conv.id, {
640
+ id: "m-user-2",
641
+ role: "user",
642
+ content: [{ type: "text", text: "tail of batch" }],
643
+ createdAt: 2000,
644
+ });
645
+ // Shared response finished -> conversation idle -> both turns settle.
646
+ mockLiveConversation = { isProcessing: () => false };
647
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(true);
648
+ expect(isTurnSettled(boundary(conv.id, "m-user-2", 2000))).toBe(true);
649
+ });
650
+
651
+ test("a completed earlier turn defers while a later turn's response is in flight, then settles when idle", () => {
652
+ // Serialized (non-batch) path: T1 finished, T2 now generating. Gating on
653
+ // isProcessing() defers T1 until the conversation goes idle. This is a
654
+ // latency cost, not data loss — T1 traces completely once T2 finishes.
655
+ const conv = createConversation({ conversationType: "standard" });
656
+ insertMessage(conv.id, {
657
+ id: "m-user-1",
658
+ role: "user",
659
+ content: [{ type: "text", text: "first (done)" }],
660
+ createdAt: 1000,
661
+ });
662
+ insertMessage(conv.id, {
663
+ id: "m-user-2",
664
+ role: "user",
665
+ content: [{ type: "text", text: "second (generating)" }],
666
+ createdAt: 2000,
667
+ });
668
+ mockLiveConversation = { isProcessing: () => true };
669
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(false);
670
+
671
+ // Conversation goes idle -> the earlier turn settles promptly.
672
+ mockLiveConversation = { isProcessing: () => false };
673
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(true);
674
+ });
675
+
676
+ test("settledness follows the conversation's processing state regardless of intervening tool-result rows", () => {
677
+ const conv = createConversation({ conversationType: "standard" });
678
+ insertMessage(conv.id, {
679
+ id: "m-user-1",
680
+ role: "user",
681
+ content: [{ type: "text", text: "do a thing" }],
682
+ createdAt: 1000,
683
+ });
684
+ // Tool-result row persisted as role="user" — part of this turn's response.
685
+ insertMessage(conv.id, {
686
+ id: "m-toolresult",
687
+ role: "user",
688
+ content: [{ type: "tool_result", tool_use_id: "tu-x", content: "done" }],
689
+ createdAt: 1100,
690
+ });
691
+ // Still generating -> not settled.
692
+ mockLiveConversation = { isProcessing: () => true };
693
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(false);
694
+ // Response finished -> settled.
695
+ mockLiveConversation = { isProcessing: () => false };
696
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(true);
697
+ });
698
+
699
+ test("NOT settled when this is the latest real user turn and the conversation is processing", () => {
700
+ const conv = createConversation({ conversationType: "standard" });
701
+ insertMessage(conv.id, {
702
+ id: "m-user-1",
703
+ role: "user",
704
+ content: [{ type: "text", text: "still generating" }],
705
+ createdAt: 1000,
706
+ });
707
+ // Latest real turn + live conversation actively processing -> in-flight.
708
+ mockLiveConversation = { isProcessing: () => true };
709
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(false);
710
+ });
711
+
712
+ test("settled when this is the latest real user turn but the conversation is idle (final turn)", () => {
713
+ const conv = createConversation({ conversationType: "standard" });
714
+ insertMessage(conv.id, {
715
+ id: "m-user-1",
716
+ role: "user",
717
+ content: [{ type: "text", text: "final turn" }],
718
+ createdAt: 1000,
719
+ });
720
+ mockLiveConversation = { isProcessing: () => false };
721
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(true);
722
+ });
723
+
724
+ test("settled when the conversation is not in the live registry (evicted / not loaded)", () => {
725
+ const conv = createConversation({ conversationType: "standard" });
726
+ insertMessage(conv.id, {
727
+ id: "m-user-1",
728
+ role: "user",
729
+ content: [{ type: "text", text: "from an evicted conversation" }],
730
+ createdAt: 1000,
731
+ });
732
+ // No live conversation -> no in-flight turn -> settled.
733
+ mockLiveConversation = undefined;
734
+ expect(isTurnSettled(boundary(conv.id, "m-user-1", 1000))).toBe(true);
735
+ });
736
+ });