@vellumai/assistant 0.8.4 → 0.8.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (438) hide show
  1. package/ARCHITECTURE.md +2 -2
  2. package/docs/browser-use-architecture-phase2.md +1 -1
  3. package/knip.json +2 -1
  4. package/openapi.yaml +809 -11
  5. package/package.json +1 -1
  6. package/src/__tests__/anthropic-provider.test.ts +34 -37
  7. package/src/__tests__/assistant-event-hub-self-exclusion.test.ts +293 -0
  8. package/src/__tests__/assistant-feature-flags-integration.test.ts +3 -3
  9. package/src/__tests__/audit-log-rotation.test.ts +70 -16
  10. package/src/__tests__/background-workers-disk-pressure.test.ts +3 -3
  11. package/src/__tests__/btw-routes.test.ts +2 -3
  12. package/src/__tests__/call-controller.test.ts +0 -1
  13. package/src/__tests__/cancel-resolves-conversation-key.test.ts +1 -1
  14. package/src/__tests__/channel-guardian.test.ts +3 -3
  15. package/src/__tests__/checker.test.ts +6 -15
  16. package/src/__tests__/compaction-events.test.ts +1 -0
  17. package/src/__tests__/compactor-call-site-logging.test.ts +214 -0
  18. package/src/__tests__/computer-use-skill-manifest-regression.test.ts +5 -11
  19. package/src/__tests__/computer-use-tools.test.ts +2 -4
  20. package/src/__tests__/confirmation-request-guardian-bridge.test.ts +0 -1
  21. package/src/__tests__/conversation-agent-loop-disk-pressure.test.ts +1 -1
  22. package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -1
  23. package/src/__tests__/conversation-agent-loop-overflow.test.ts +197 -2
  24. package/src/__tests__/conversation-agent-loop.test.ts +163 -122
  25. package/src/__tests__/conversation-app-control-instantiation.test.ts +2 -5
  26. package/src/__tests__/conversation-clear-safety.test.ts +25 -25
  27. package/src/__tests__/conversation-delete-schedule-cleanup.test.ts +1 -1
  28. package/src/__tests__/conversation-disk-view-integration.test.ts +2 -2
  29. package/src/__tests__/conversation-error.test.ts +31 -0
  30. package/src/__tests__/conversation-fork-crud.test.ts +178 -15
  31. package/src/__tests__/conversation-lifecycle.test.ts +52 -11
  32. package/src/__tests__/{conversation-load-cleaned-at.test.ts → conversation-load-history-stripped.test.ts} +13 -13
  33. package/src/__tests__/conversation-provider-retry-repair.test.ts +1 -0
  34. package/src/__tests__/conversation-routes-disk-view.test.ts +109 -0
  35. package/src/__tests__/conversation-routes-slash-commands.test.ts +35 -0
  36. package/src/__tests__/conversation-skill-tools.test.ts +2 -5
  37. package/src/__tests__/conversation-store.test.ts +1 -1
  38. package/src/__tests__/conversation-sync-tags.test.ts +99 -32
  39. package/src/__tests__/conversation-workspace-cache-state.test.ts +1 -0
  40. package/src/__tests__/conversation-workspace-injection.test.ts +1 -1
  41. package/src/__tests__/conversation-workspace-tool-tracking.test.ts +1 -1
  42. package/src/__tests__/credential-execution-feature-gates.test.ts +9 -7
  43. package/src/__tests__/credential-execution-tools.test.ts +6 -6
  44. package/src/__tests__/credential-security-invariants.test.ts +1 -0
  45. package/src/__tests__/credential-vault-unit.test.ts +2 -2
  46. package/src/__tests__/dynamic-page-surface.test.ts +2 -2
  47. package/src/__tests__/email-html-renderer.test.ts +12 -0
  48. package/src/__tests__/gateway-flag-listener.test.ts +237 -0
  49. package/src/__tests__/gemini-provider.test.ts +78 -0
  50. package/src/__tests__/guardian-dispatch.test.ts +0 -1
  51. package/src/__tests__/guardian-outbound-http.test.ts +7 -5
  52. package/src/__tests__/handlers-user-message-approval-consumption.test.ts +1 -1
  53. package/src/__tests__/heartbeat-disk-pressure.test.ts +4 -0
  54. package/src/__tests__/heartbeat-service.test.ts +4 -0
  55. package/src/__tests__/host-shell-tool.test.ts +1 -1
  56. package/src/__tests__/init-feature-flag-overrides.test.ts +5 -6
  57. package/src/__tests__/list-messages-tool-merge.test.ts +70 -11
  58. package/src/__tests__/llm-request-log-call-site.test.ts +136 -0
  59. package/src/__tests__/llm-request-log-source-clickhouse.test.ts +26 -0
  60. package/src/__tests__/llm-resolver.test.ts +77 -9
  61. package/src/__tests__/llm-usage-store.test.ts +66 -0
  62. package/src/__tests__/logger.test.ts +89 -0
  63. package/src/__tests__/mcp-abort-signal.test.ts +2 -2
  64. package/src/__tests__/media-generate-image.test.ts +31 -0
  65. package/src/__tests__/memory-v2-static-injector.test.ts +7 -7
  66. package/src/__tests__/model-intents.test.ts +2 -4
  67. package/src/__tests__/notification-guardian-path.test.ts +0 -1
  68. package/src/__tests__/onboarding-template-contract.test.ts +1 -1
  69. package/src/__tests__/openai-provider.test.ts +46 -0
  70. package/src/__tests__/openai-responses-provider.test.ts +114 -12
  71. package/src/__tests__/pending-interactions-resolved-event.test.ts +0 -1
  72. package/src/__tests__/platform-bash-auto-approve.test.ts +2 -2
  73. package/src/__tests__/platform.test.ts +2 -2
  74. package/src/__tests__/plugin-api-tool-definition.test.ts +92 -0
  75. package/src/__tests__/plugin-bootstrap.test.ts +2 -2
  76. package/src/__tests__/plugin-tool-contribution.test.ts +13 -6
  77. package/src/__tests__/plugin-types.test.ts +3 -2
  78. package/src/__tests__/prechat-onboarding-contract.test.ts +131 -98
  79. package/src/__tests__/pricing.test.ts +12 -0
  80. package/src/__tests__/prune-jobs-changes-parser.test.ts +61 -0
  81. package/src/__tests__/registry.test.ts +2 -8
  82. package/src/__tests__/require-fresh-approval.test.ts +2 -2
  83. package/src/__tests__/runtime-events-sse-bilingual.test.ts +154 -0
  84. package/src/__tests__/shell-tool-proxy-mode.test.ts +1 -1
  85. package/src/__tests__/skill-feature-flags.test.ts +2 -2
  86. package/src/__tests__/skill-projection-feature-flag.test.ts +4 -7
  87. package/src/__tests__/skill-projection.benchmark.test.ts +2 -6
  88. package/src/__tests__/skill-tool-factory.test.ts +1 -1
  89. package/src/__tests__/subagent-notify-parent.test.ts +1 -1
  90. package/src/__tests__/suggestion-routes.test.ts +1 -0
  91. package/src/__tests__/sync-message-contract.test.ts +59 -0
  92. package/src/__tests__/system-prompt.test.ts +145 -131
  93. package/src/__tests__/terminal-tools.test.ts +1 -1
  94. package/src/__tests__/tool-approval-handler.test.ts +1 -5
  95. package/src/__tests__/tool-execute-pipeline.test.ts +2 -2
  96. package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +2 -5
  97. package/src/__tests__/tool-executor-lifecycle-events.test.ts +15 -5
  98. package/src/__tests__/tool-executor.test.ts +9 -62
  99. package/src/__tests__/tool-grant-request-escalation.test.ts +1 -6
  100. package/src/__tests__/trusted-contact-approval-notifier.test.ts +0 -1
  101. package/src/__tests__/trusted-contact-inline-approval-integration.test.ts +1 -6
  102. package/src/__tests__/trusted-contact-multichannel.test.ts +0 -1
  103. package/src/__tests__/ui-file-upload-surface.test.ts +2 -2
  104. package/src/__tests__/usage-routes.test.ts +3 -0
  105. package/src/__tests__/verification-control-plane-policy.test.ts +2 -2
  106. package/src/__tests__/workspace-git-service.test.ts +6 -5
  107. package/src/__tests__/workspace-migration-089-move-memory-tree-out-of-v3.test.ts +86 -0
  108. package/src/acp/__tests__/prepare-agent-env.test.ts +146 -0
  109. package/src/acp/prepare-agent-env.ts +78 -0
  110. package/src/acp/session-manager.ts +1 -1
  111. package/src/agent/loop.ts +8 -0
  112. package/src/api/README.md +5 -0
  113. package/src/api/index.ts +4 -0
  114. package/src/api/package.json +10 -0
  115. package/src/background-wake/background-wake-routes.test.ts +233 -0
  116. package/src/background-wake/runtime-registry.ts +24 -0
  117. package/src/cli/commands/__tests__/browser.test.ts +23 -5
  118. package/src/cli/commands/__tests__/domain-register.test.ts +110 -0
  119. package/src/cli/commands/__tests__/domain-status.test.ts +33 -33
  120. package/src/cli/commands/__tests__/inference-send.test.ts +108 -5
  121. package/src/cli/commands/__tests__/memory-v2-compare-render.test.ts +98 -0
  122. package/src/cli/commands/__tests__/memory-v2.test.ts +1 -0
  123. package/src/cli/commands/__tests__/memory-v3-render.test.ts +340 -0
  124. package/src/cli/commands/browser.ts +247 -0
  125. package/src/cli/commands/domain.ts +91 -41
  126. package/src/cli/commands/inference.ts +93 -40
  127. package/src/cli/commands/memory-v2-compare-render.ts +115 -0
  128. package/src/cli/commands/memory-v2.ts +176 -1
  129. package/src/cli/commands/memory-v3-render.ts +344 -0
  130. package/src/cli/commands/memory-v3.ts +316 -0
  131. package/src/cli/program.ts +2 -0
  132. package/src/config/assistant-feature-flags.ts +21 -9
  133. package/src/config/bundled-skills/document-editor/SKILL.md +11 -2
  134. package/src/config/bundled-skills/document-editor/TOOLS.json +18 -0
  135. package/src/config/bundled-skills/document-editor/tools/document-open.ts +12 -0
  136. package/src/config/bundled-skills/image-studio/SKILL.md +4 -0
  137. package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +2 -2
  138. package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +13 -8
  139. package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +10 -3
  140. package/src/config/bundled-skills/phone-calls/references/TRANSCRIPTS.md +16 -14
  141. package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +7 -2
  142. package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +7 -2
  143. package/src/config/bundled-tool-registry.ts +2 -0
  144. package/src/config/call-site-defaults.ts +7 -6
  145. package/src/config/feature-flag-registry.json +16 -0
  146. package/src/config/schemas/__tests__/memory-v2.test.ts +213 -1
  147. package/src/config/schemas/call-site-catalog.ts +21 -7
  148. package/src/config/schemas/llm.ts +12 -1
  149. package/src/config/schemas/memory-v2.ts +246 -0
  150. package/src/config/schemas/memory.ts +2 -1
  151. package/src/context/compactor.ts +52 -0
  152. package/src/conversations/__tests__/message-consolidation.test.ts +350 -0
  153. package/src/conversations/message-consolidation.ts +404 -0
  154. package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +1 -1
  155. package/src/daemon/__tests__/meet-manifest-loader.test.ts +1 -1
  156. package/src/daemon/conversation-agent-loop-handlers.ts +2 -13
  157. package/src/daemon/conversation-agent-loop.ts +126 -76
  158. package/src/daemon/conversation-error.ts +31 -1
  159. package/src/daemon/conversation-lifecycle.ts +27 -22
  160. package/src/daemon/conversation-runtime-assembly.ts +10 -9
  161. package/src/daemon/conversation-tool-setup.ts +63 -3
  162. package/src/daemon/conversation-usage.ts +2 -0
  163. package/src/daemon/conversation.ts +14 -29
  164. package/src/daemon/disk-pressure-guard.ts +14 -2
  165. package/src/daemon/handlers/config-model.test.ts +1 -0
  166. package/src/daemon/handlers/conversations.ts +11 -3
  167. package/src/daemon/host-browser-proxy.ts +5 -5
  168. package/src/daemon/host-cu-proxy.ts +4 -4
  169. package/src/daemon/host-file-proxy.ts +4 -4
  170. package/src/daemon/host-proxy-base.ts +4 -4
  171. package/src/daemon/host-transfer-proxy.ts +10 -10
  172. package/src/daemon/lifecycle.ts +23 -20
  173. package/src/daemon/meet-manifest-loader.ts +1 -7
  174. package/src/daemon/message-types/conversations.ts +6 -9
  175. package/src/daemon/message-types/home.ts +1 -13
  176. package/src/daemon/message-types/messages.ts +6 -14
  177. package/src/daemon/message-types/sync.ts +14 -0
  178. package/src/daemon/shutdown-handlers.ts +24 -5
  179. package/src/daemon/switch-inference-profile-tool.ts +52 -0
  180. package/src/daemon/tool-setup-types.ts +13 -0
  181. package/src/events/relationship-state-updated.ts +25 -0
  182. package/src/heartbeat/__tests__/heartbeat-service.test.ts +1 -1
  183. package/src/home/home-greeting.ts +0 -9
  184. package/src/home/suggested-prompts.ts +0 -9
  185. package/src/ipc/gateway-flag-listener.ts +123 -0
  186. package/src/ipc/skill-routes/registries.ts +8 -12
  187. package/src/memory/__tests__/db-async-query.test.ts +165 -0
  188. package/src/memory/__tests__/db-maintenance.test.ts +115 -0
  189. package/src/memory/__tests__/jobs-store-enqueue-gate.test.ts +241 -0
  190. package/src/memory/__tests__/jobs-store-job-classes.test.ts +28 -1
  191. package/src/memory/__tests__/memory-retrospective-job.test.ts +7 -0
  192. package/src/memory/auto-analysis-enqueue.ts +5 -1
  193. package/src/memory/conversation-crud.ts +71 -70
  194. package/src/memory/conversation-starters-cadence.ts +3 -1
  195. package/src/memory/conversation-title-service.ts +19 -3
  196. package/src/memory/db-async-query.ts +214 -0
  197. package/src/memory/db-init.ts +10 -0
  198. package/src/memory/db-maintenance.ts +30 -21
  199. package/src/memory/graph/bootstrap.ts +8 -1
  200. package/src/memory/graph/capability-seed.ts +7 -3
  201. package/src/memory/graph/conversation-graph-memory.ts +100 -17
  202. package/src/memory/graph/extraction.ts +1 -5
  203. package/src/memory/graph/graph-search.ts +7 -1
  204. package/src/memory/indexer.ts +28 -18
  205. package/src/memory/job-handlers/cleanup.ts +76 -18
  206. package/src/memory/job-handlers/conversation-starters.ts +1 -4
  207. package/src/memory/jobs/embed-pkb-file.ts +6 -1
  208. package/src/memory/jobs-store.ts +14 -0
  209. package/src/memory/jobs-worker.ts +55 -22
  210. package/src/memory/llm-request-log-source-clickhouse.ts +42 -2
  211. package/src/memory/llm-request-log-source-local.ts +7 -0
  212. package/src/memory/llm-request-log-source.ts +9 -2
  213. package/src/memory/llm-request-log-store.ts +43 -1
  214. package/src/memory/llm-usage-store.ts +24 -0
  215. package/src/memory/memory-retrospective-enqueue.ts +8 -1
  216. package/src/memory/memory-retrospective-job.ts +5 -0
  217. package/src/memory/memory-v2-activation-log-store.ts +15 -6
  218. package/src/memory/migrations/260-rename-cleaned-at.ts +44 -0
  219. package/src/memory/migrations/261-llm-usage-add-raw-usage.ts +36 -0
  220. package/src/memory/migrations/262-memory-v3-coactivation.ts +57 -0
  221. package/src/memory/migrations/263-memory-v3-auto-edges.ts +50 -0
  222. package/src/memory/migrations/264-llm-request-log-call-site.ts +29 -0
  223. package/src/memory/migrations/index.ts +17 -0
  224. package/src/memory/migrations/registry.ts +33 -0
  225. package/src/memory/schema/conversations.ts +1 -1
  226. package/src/memory/schema/infrastructure.ts +21 -0
  227. package/src/memory/tool-usage-store.ts +36 -8
  228. package/src/memory/v2/__tests__/consolidation-job.test.ts +1 -0
  229. package/src/memory/v2/__tests__/harness-compare.test.ts +186 -0
  230. package/src/memory/v2/__tests__/harness-metrics.test.ts +74 -0
  231. package/src/memory/v2/__tests__/harness-oracle.test.ts +257 -0
  232. package/src/memory/v2/__tests__/harness-replay-input.test.ts +225 -0
  233. package/src/memory/v2/__tests__/harness-runner.test.ts +109 -0
  234. package/src/memory/v2/__tests__/injection.test.ts +127 -98
  235. package/src/memory/v2/__tests__/qdrant.test.ts +36 -0
  236. package/src/memory/v2/__tests__/router.test.ts +171 -3
  237. package/src/memory/v2/harness/compare.ts +57 -0
  238. package/src/memory/v2/harness/metrics.ts +124 -0
  239. package/src/memory/v2/harness/oracle.ts +145 -0
  240. package/src/memory/v2/harness/replay-input.ts +224 -0
  241. package/src/memory/v2/harness/retriever.ts +74 -0
  242. package/src/memory/v2/harness/router-retriever.ts +43 -0
  243. package/src/memory/v2/harness/runner.ts +106 -0
  244. package/src/memory/v2/harness/trace.ts +58 -0
  245. package/src/memory/v2/injection.ts +21 -15
  246. package/src/memory/v2/prompts/router.ts +26 -1
  247. package/src/memory/v2/qdrant.ts +14 -2
  248. package/src/memory/v2/router.ts +171 -18
  249. package/src/memory/v3/__tests__/coactivation-store.test.ts +422 -0
  250. package/src/memory/v3/__tests__/consolidation-job.test.ts +468 -0
  251. package/src/memory/v3/__tests__/edge-learning-job.test.ts +324 -0
  252. package/src/memory/v3/__tests__/edges.test.ts +563 -0
  253. package/src/memory/v3/__tests__/filter.test.ts +512 -0
  254. package/src/memory/v3/__tests__/gate.test.ts +574 -0
  255. package/src/memory/v3/__tests__/index-composition.test.ts +233 -0
  256. package/src/memory/v3/__tests__/loop.test.ts +530 -0
  257. package/src/memory/v3/__tests__/retriever.test.ts +226 -0
  258. package/src/memory/v3/__tests__/scouts.test.ts +440 -0
  259. package/src/memory/v3/__tests__/shadow-middleware.test.ts +312 -0
  260. package/src/memory/v3/__tests__/system-prompts.test.ts +154 -0
  261. package/src/memory/v3/__tests__/traversal.test.ts +469 -0
  262. package/src/memory/v3/__tests__/tree-index.test.ts +280 -0
  263. package/src/memory/v3/__tests__/tree-store.test.ts +529 -0
  264. package/src/memory/v3/__tests__/tree-walk.test.ts +707 -0
  265. package/src/memory/v3/__tests__/validate.test.ts +245 -0
  266. package/src/memory/v3/auto-edges.ts +223 -0
  267. package/src/memory/v3/coactivation-store.ts +124 -0
  268. package/src/memory/v3/consolidation-job.ts +323 -0
  269. package/src/memory/v3/edge-learning-job.ts +160 -0
  270. package/src/memory/v3/edges.ts +249 -0
  271. package/src/memory/v3/filter.ts +281 -0
  272. package/src/memory/v3/gate.ts +334 -0
  273. package/src/memory/v3/index-composition.ts +113 -0
  274. package/src/memory/v3/llm-capture.ts +46 -0
  275. package/src/memory/v3/loop.ts +382 -0
  276. package/src/memory/v3/maintenance.ts +144 -0
  277. package/src/memory/v3/prompt-context.ts +33 -0
  278. package/src/memory/v3/prompts/consolidation.ts +458 -0
  279. package/src/memory/v3/prompts/system-prompts.ts +196 -0
  280. package/src/memory/v3/retriever.ts +33 -0
  281. package/src/memory/v3/scouts.ts +420 -0
  282. package/src/memory/v3/shadow-middleware.ts +305 -0
  283. package/src/memory/v3/traversal.ts +206 -0
  284. package/src/memory/v3/tree-index.ts +237 -0
  285. package/src/memory/v3/tree-store.ts +394 -0
  286. package/src/memory/v3/tree-walk.ts +351 -0
  287. package/src/memory/v3/types.ts +65 -0
  288. package/src/memory/v3/validate.ts +300 -0
  289. package/src/notifications/adapters/macos.ts +18 -1
  290. package/src/notifications/adapters/platform.ts +1 -1
  291. package/src/notifications/decision-engine.ts +1 -4
  292. package/src/notifications/emit-signal.ts +29 -49
  293. package/src/permissions/prompter.ts +3 -3
  294. package/src/permissions/question-prompter.ts +5 -2
  295. package/src/permissions/secret-prompter.ts +2 -2
  296. package/src/plugin-api/index.ts +4 -0
  297. package/src/plugin-api/types.ts +7 -33
  298. package/src/plugins/defaults/index.ts +6 -0
  299. package/src/plugins/defaults/injectors.ts +18 -11
  300. package/src/plugins/external-plugin-loader.ts +5 -68
  301. package/src/plugins/types.ts +11 -16
  302. package/src/proactive-artifact/aux-message-injector.ts +17 -4
  303. package/src/prompts/__tests__/task-progress-hint-section.test.ts +3 -9
  304. package/src/prompts/persona-resolver.ts +36 -21
  305. package/src/prompts/sections.ts +39 -7
  306. package/src/prompts/system-prompt.ts +50 -185
  307. package/src/prompts/templates/BOOTSTRAP.md +2 -2
  308. package/src/prompts/templates/system-sections.ts +230 -8
  309. package/src/providers/__tests__/connection-model-compat.test.ts +234 -0
  310. package/src/providers/__tests__/retry-callsite.test.ts +85 -5
  311. package/src/providers/anthropic/client.ts +32 -66
  312. package/src/providers/call-site-routing.ts +14 -2
  313. package/src/providers/connection-model-compat.ts +38 -0
  314. package/src/providers/connection-resolution.ts +16 -2
  315. package/src/providers/gemini/client.ts +49 -6
  316. package/src/providers/inference/adapter-factory.ts +3 -0
  317. package/src/providers/minimax/client.ts +106 -0
  318. package/src/providers/model-catalog.ts +43 -0
  319. package/src/providers/model-intents.ts +1 -1
  320. package/src/providers/openai/chat-completions-provider.ts +6 -3
  321. package/src/providers/openai/codex-models.ts +18 -0
  322. package/src/providers/openai/responses-provider.ts +78 -21
  323. package/src/providers/provider-send-message.ts +7 -1
  324. package/src/providers/retry.ts +34 -3
  325. package/src/providers/thinking-config.ts +26 -1
  326. package/src/providers/usage-tracking.ts +2 -0
  327. package/src/runtime/AGENTS.md +2 -2
  328. package/src/runtime/agent-wake.ts +1 -0
  329. package/src/runtime/assistant-event-hub.ts +76 -6
  330. package/src/runtime/auth/route-policy.ts +36 -0
  331. package/src/runtime/btw-sidechain.ts +0 -6
  332. package/src/runtime/http-types.ts +0 -2
  333. package/src/runtime/migrations/vbundle-builder.ts +10 -3
  334. package/src/runtime/pending-interactions.ts +0 -1
  335. package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +106 -0
  336. package/src/runtime/routes/__tests__/memory-v2-simulate-route.test.ts +25 -6
  337. package/src/runtime/routes/__tests__/plugins-routes.test.ts +512 -0
  338. package/src/runtime/routes/acp-routes.test.ts +255 -6
  339. package/src/runtime/routes/acp-routes.ts +8 -1
  340. package/src/runtime/routes/avatar-routes.ts +10 -10
  341. package/src/runtime/routes/background-wake-routes.ts +188 -0
  342. package/src/runtime/routes/browser-tabs-routes.ts +200 -0
  343. package/src/runtime/routes/btw-routes.ts +0 -6
  344. package/src/runtime/routes/conversation-cli-routes.ts +1 -1
  345. package/src/runtime/routes/conversation-list-routes.ts +12 -4
  346. package/src/runtime/routes/conversation-management-routes.ts +77 -20
  347. package/src/runtime/routes/conversation-query-routes.ts +142 -36
  348. package/src/runtime/routes/conversation-routes.ts +252 -410
  349. package/src/runtime/routes/conversation-starter-routes.ts +6 -3
  350. package/src/runtime/routes/disk-pressure-routes.ts +1 -1
  351. package/src/runtime/routes/domain-routes.ts +60 -10
  352. package/src/runtime/routes/email-routes.ts +5 -2
  353. package/src/runtime/routes/events-routes.ts +54 -10
  354. package/src/runtime/routes/group-routes.ts +24 -8
  355. package/src/runtime/routes/host-browser-routes.ts +10 -2
  356. package/src/runtime/routes/host-cu-routes.ts +2 -2
  357. package/src/runtime/routes/inbound-stages/acl-enforcement.ts +96 -3
  358. package/src/runtime/routes/index.ts +8 -0
  359. package/src/runtime/routes/inference-profile-session-handler.ts +22 -12
  360. package/src/runtime/routes/inference-profile-session-routes.ts +7 -1
  361. package/src/runtime/routes/llm-call-sites-routes.ts +32 -5
  362. package/src/runtime/routes/memory-item-routes.ts +8 -3
  363. package/src/runtime/routes/memory-v2-routes.ts +215 -5
  364. package/src/runtime/routes/memory-v3-routes.ts +316 -0
  365. package/src/runtime/routes/migration-routes.ts +21 -24
  366. package/src/runtime/routes/plugins-routes.ts +337 -0
  367. package/src/runtime/routes/rename-conversation-routes.ts +6 -2
  368. package/src/runtime/routes/secret-routes.ts +25 -5
  369. package/src/runtime/routes/settings-routes.ts +12 -11
  370. package/src/runtime/routes/slack-channel-routes.ts +5 -4
  371. package/src/runtime/routes/workspace-routes.ts +25 -10
  372. package/src/runtime/sync/resource-sync-events.ts +106 -38
  373. package/src/runtime/sync/sync-publisher.test.ts +49 -0
  374. package/src/runtime/sync/sync-publisher.ts +2 -1
  375. package/src/runtime/verification-outbound-actions.ts +73 -1
  376. package/src/telemetry/types.ts +12 -0
  377. package/src/telemetry/usage-telemetry-reporter.test.ts +48 -0
  378. package/src/telemetry/usage-telemetry-reporter.ts +1 -0
  379. package/src/tools/acp/spawn.test.ts +119 -0
  380. package/src/tools/acp/spawn.ts +15 -2
  381. package/src/tools/apps/definitions.ts +2 -8
  382. package/src/tools/ask-question/ask-question-tool.test.ts +3 -3
  383. package/src/tools/ask-question/ask-question-tool.ts +38 -45
  384. package/src/tools/browser/__tests__/pinned-tabs.test.ts +70 -0
  385. package/src/tools/browser/browser-execution.ts +16 -3
  386. package/src/tools/browser/cdp-client/__tests__/browser-tabs-factory.test.ts +402 -0
  387. package/src/tools/browser/cdp-client/__tests__/types.test.ts +3 -0
  388. package/src/tools/browser/cdp-client/cdp-inspect-client.ts +12 -0
  389. package/src/tools/browser/cdp-client/extension-cdp-client.ts +27 -1
  390. package/src/tools/browser/cdp-client/factory.ts +100 -17
  391. package/src/tools/browser/cdp-client/local-cdp-client.ts +12 -0
  392. package/src/tools/browser/cdp-client/types.ts +65 -0
  393. package/src/tools/browser/pinned-tabs.ts +96 -40
  394. package/src/tools/computer-use/definitions.ts +22 -78
  395. package/src/tools/credential-execution/make-authenticated-request.ts +3 -9
  396. package/src/tools/credential-execution/manage-secure-command-tool.ts +3 -9
  397. package/src/tools/credential-execution/run-authenticated-command.ts +3 -9
  398. package/src/tools/credentials/vault.ts +3 -9
  399. package/src/tools/document/document-tool.ts +59 -0
  400. package/src/tools/execution-target.ts +21 -23
  401. package/src/tools/executor.ts +6 -1
  402. package/src/tools/filesystem/edit.ts +3 -9
  403. package/src/tools/filesystem/list.ts +3 -9
  404. package/src/tools/filesystem/read.ts +3 -9
  405. package/src/tools/filesystem/write.ts +3 -9
  406. package/src/tools/host-filesystem/edit.ts +3 -9
  407. package/src/tools/host-filesystem/read.ts +3 -9
  408. package/src/tools/host-filesystem/transfer.ts +3 -9
  409. package/src/tools/host-filesystem/write.ts +3 -9
  410. package/src/tools/host-terminal/host-shell.ts +3 -9
  411. package/src/tools/mcp/mcp-tool-factory.ts +1 -8
  412. package/src/tools/memory/register.test.ts +1 -1
  413. package/src/tools/memory/register.ts +4 -9
  414. package/src/tools/network/web-fetch.ts +3 -9
  415. package/src/tools/network/web-search.ts +25 -32
  416. package/src/tools/registry.ts +7 -23
  417. package/src/tools/schema-transforms.ts +1 -1
  418. package/src/tools/skills/execute.ts +3 -9
  419. package/src/tools/skills/load.ts +3 -9
  420. package/src/tools/skills/skill-tool-factory.ts +1 -8
  421. package/src/tools/subagent/notify-parent.ts +3 -9
  422. package/src/tools/system/request-permission.ts +3 -9
  423. package/src/tools/terminal/shell.ts +3 -9
  424. package/src/tools/tool-defaults.ts +94 -0
  425. package/src/tools/types.ts +27 -98
  426. package/src/tools/ui-surface/definitions.ts +6 -22
  427. package/src/usage/pricing.ts +23 -0
  428. package/src/usage/types.ts +12 -0
  429. package/src/util/logger.ts +16 -7
  430. package/src/util/platform.ts +7 -2
  431. package/src/util/sqlite3-runtime.ts +65 -0
  432. package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +1 -0
  433. package/src/workspace/migrations/089-move-memory-tree-out-of-v3.ts +86 -0
  434. package/src/workspace/migrations/registry.ts +2 -0
  435. package/src/__tests__/compaction-strip-metadata-clear.test.ts +0 -206
  436. package/src/__tests__/message-complete-display-id.test.ts +0 -175
  437. package/src/daemon/query-complexity-router.ts +0 -75
  438. package/src/prompts/cache-boundary.ts +0 -8
@@ -6,8 +6,8 @@
6
6
  * rendering, argument validation, and the no-message guard. They run
7
7
  * entirely inside the CLI process and need no daemon stub.
8
8
  *
9
- * Follow-up opportunity: mock `../../../ipc/cli-client.js` with canned
10
- * responses to cover the deeper send-message paths against the IPC contract.
9
+ * The IPC client is mocked with canned responses so tests can assert the
10
+ * request contract without opening an assistant socket.
11
11
  */
12
12
 
13
13
  import {
@@ -23,6 +23,34 @@ import { Command } from "commander";
23
23
  // ---------------------------------------------------------------------------
24
24
 
25
25
  let mockStdinContent: string | null = null;
26
+ let lastIpcCall: {
27
+ method: string;
28
+ params?: Record<string, unknown>;
29
+ options?: { timeoutMs?: number };
30
+ } | null = null;
31
+ let mockIpcResult: {
32
+ ok: boolean;
33
+ result?: unknown;
34
+ error?: string;
35
+ } = {
36
+ ok: true,
37
+ result: {
38
+ response: "Hello from the model.",
39
+ model: "test-model",
40
+ usage: { inputTokens: 3, outputTokens: 4 },
41
+ },
42
+ };
43
+
44
+ mock.module("../../../ipc/cli-client.js", () => ({
45
+ cliIpcCall: async (
46
+ method: string,
47
+ params?: Record<string, unknown>,
48
+ options?: { timeoutMs?: number },
49
+ ) => {
50
+ lastIpcCall = { method, params, options };
51
+ return mockIpcResult;
52
+ },
53
+ }));
26
54
 
27
55
  mock.module("../../../providers/provider-send-message.js", () => ({
28
56
  // The handler under test calls getConfiguredProvider before any of the
@@ -30,7 +58,10 @@ mock.module("../../../providers/provider-send-message.js", () => ({
30
58
  // loads cleanly even though no test actually drives a request.
31
59
  getConfiguredProvider: async () => null,
32
60
  extractAllText: () => "",
33
- userMessage: (text: string) => ({ role: "user", content: [{ type: "text", text }] }),
61
+ userMessage: (text: string) => ({
62
+ role: "user",
63
+ content: [{ type: "text", text }],
64
+ }),
34
65
  }));
35
66
 
36
67
  mock.module("../../../config/loader.js", () => ({
@@ -44,8 +75,18 @@ mock.module("../../../config/loader.js", () => ({
44
75
  }));
45
76
 
46
77
  mock.module("../../../util/logger.js", () => ({
47
- getLogger: () => ({ info: () => {}, warn: () => {}, error: () => {}, debug: () => {} }),
48
- getCliLogger: () => ({ info: () => {}, warn: () => {}, error: () => {}, debug: () => {} }),
78
+ getLogger: () => ({
79
+ info: () => {},
80
+ warn: () => {},
81
+ error: () => {},
82
+ debug: () => {},
83
+ }),
84
+ getCliLogger: () => ({
85
+ info: () => {},
86
+ warn: () => {},
87
+ error: () => {},
88
+ debug: () => {},
89
+ }),
49
90
  }));
50
91
 
51
92
  mock.module("node:fs", () => ({
@@ -127,6 +168,15 @@ async function runCommand(
127
168
 
128
169
  beforeEach(() => {
129
170
  mockStdinContent = null;
171
+ lastIpcCall = null;
172
+ mockIpcResult = {
173
+ ok: true,
174
+ result: {
175
+ response: "Hello from the model.",
176
+ model: "test-model",
177
+ usage: { inputTokens: 3, outputTokens: 4 },
178
+ },
179
+ };
130
180
  process.exitCode = 0;
131
181
  });
132
182
 
@@ -142,6 +192,7 @@ describe("help text", () => {
142
192
  expect(stdout).toContain("--model");
143
193
  expect(stdout).toContain("--profile");
144
194
  expect(stdout).toContain("--max-tokens");
195
+ expect(stdout).toContain("--timeout-seconds");
145
196
  expect(stdout).toContain("--json");
146
197
  expect(stdout).toContain("[message...]");
147
198
  });
@@ -153,6 +204,7 @@ describe("help text", () => {
153
204
  expect(stdout).toContain("--model");
154
205
  expect(stdout).toContain("--profile");
155
206
  expect(stdout).toContain("--max-tokens");
207
+ expect(stdout).toContain("--timeout-seconds");
156
208
  expect(stdout).toContain("--json");
157
209
  expect(stdout).toContain("[message...]");
158
210
  });
@@ -225,3 +277,54 @@ describe("--max-tokens", () => {
225
277
  expect(parsed.error).toContain("Invalid --max-tokens");
226
278
  });
227
279
  });
280
+
281
+ // ---------------------------------------------------------------------------
282
+ // IPC timeout
283
+ // ---------------------------------------------------------------------------
284
+
285
+ describe("--timeout-seconds", () => {
286
+ test("uses a long default IPC timeout for inference calls", async () => {
287
+ const { exitCode, stdout } = await runCommand([
288
+ "inference",
289
+ "send",
290
+ "--json",
291
+ "Hello",
292
+ ]);
293
+
294
+ expect(exitCode).toBe(0);
295
+ expect(JSON.parse(stdout).ok).toBe(true);
296
+ expect(lastIpcCall!.method).toBe("inference_send");
297
+ expect(lastIpcCall!.options!.timeoutMs).toBe(32 * 60 * 1000);
298
+ });
299
+
300
+ test("passes custom timeout to IPC call", async () => {
301
+ const { exitCode } = await runCommand([
302
+ "llm",
303
+ "send",
304
+ "--timeout-seconds",
305
+ "300",
306
+ "Hello",
307
+ ]);
308
+
309
+ expect(exitCode).toBe(0);
310
+ expect(lastIpcCall!.method).toBe("inference_send");
311
+ expect(lastIpcCall!.options!.timeoutMs).toBe(300_000);
312
+ });
313
+
314
+ test("errors on invalid timeout value", async () => {
315
+ const { exitCode, stdout } = await runCommand([
316
+ "inference",
317
+ "send",
318
+ "--timeout-seconds",
319
+ "0",
320
+ "--json",
321
+ "Hello",
322
+ ]);
323
+
324
+ expect(exitCode).toBe(1);
325
+ expect(lastIpcCall).toBeNull();
326
+ const parsed = JSON.parse(stdout);
327
+ expect(parsed.ok).toBe(false);
328
+ expect(parsed.error).toContain("Invalid --timeout-seconds");
329
+ });
330
+ });
@@ -0,0 +1,98 @@
1
+ import { describe, expect, test } from "bun:test";
2
+
3
+ import type { ComparisonReport } from "../../../memory/v2/harness/runner.js";
4
+ import {
5
+ renderComparisonReport,
6
+ renderTurnTrace,
7
+ } from "../memory-v2-compare-render.js";
8
+
9
+ function sampleReport(): ComparisonReport {
10
+ return {
11
+ ks: [5, 10],
12
+ turnsConsidered: 3,
13
+ turnsScored: 1,
14
+ turnsSkipped: 2,
15
+ perTurn: [
16
+ {
17
+ conversationId: "c1",
18
+ turn: 7,
19
+ byRetriever: {
20
+ router: {
21
+ groundTruth: ["a", "b"],
22
+ selected: ["a", "x"],
23
+ hits: ["a"],
24
+ misses: ["b"],
25
+ extras: ["x"],
26
+ recallAtK: { 5: 0.5, 10: 0.5 },
27
+ hitsByLane: { tier1: 1 },
28
+ failureReason: null,
29
+ },
30
+ },
31
+ },
32
+ ],
33
+ retrievers: [
34
+ {
35
+ name: "router",
36
+ aggregate: {
37
+ turns: 1,
38
+ meanRecallAtK: { 5: 0.5, 10: 0.5 },
39
+ failureRate: 0,
40
+ },
41
+ },
42
+ ],
43
+ };
44
+ }
45
+
46
+ describe("memory v2 compare — renderComparisonReport", () => {
47
+ test("renders turn counts, recall@k, and per-lane attribution", () => {
48
+ const out = renderComparisonReport(sampleReport());
49
+ expect(out).toContain("considered 3, scored 1, skipped 2");
50
+ expect(out).toContain("Retriever: router");
51
+ expect(out).toContain("recall@5: 0.500");
52
+ expect(out).toContain("recall@10: 0.500");
53
+ expect(out).toContain("failures: 0.0%");
54
+ expect(out).toContain("hits by lane: tier1=1");
55
+ });
56
+
57
+ test("renders mean cost when present", () => {
58
+ const report = sampleReport();
59
+ report.retrievers[0]!.aggregate.meanCostUsd = 0.0123;
60
+ expect(renderComparisonReport(report)).toContain("mean cost: $0.0123");
61
+ });
62
+
63
+ test("handles a report with no scored turns", () => {
64
+ const out = renderComparisonReport({
65
+ ks: [5],
66
+ turnsConsidered: 4,
67
+ turnsScored: 0,
68
+ turnsSkipped: 4,
69
+ perTurn: [],
70
+ retrievers: [
71
+ {
72
+ name: "router",
73
+ aggregate: { turns: 0, meanRecallAtK: { 5: 0 }, failureRate: 0 },
74
+ },
75
+ ],
76
+ });
77
+ expect(out).toContain("No turns scored");
78
+ });
79
+ });
80
+
81
+ describe("memory v2 compare — renderTurnTrace", () => {
82
+ test("renders the per-retriever breakdown for a scored turn", () => {
83
+ const out = renderTurnTrace(sampleReport(), "c1", 7);
84
+ expect(out).toContain("Turn c1:7");
85
+ expect(out).toContain("Retriever: router");
86
+ expect(out).toContain("selected (2): a, x");
87
+ expect(out).toContain("hits (1): a");
88
+ expect(out).toContain("misses (1): b");
89
+ expect(out).toContain("extras (1): x");
90
+ expect(out).toContain("(no descent trace — tier-based retriever)");
91
+ });
92
+
93
+ test("explains when the requested turn was not scored", () => {
94
+ const out = renderTurnTrace(sampleReport(), "c1", 999);
95
+ expect(out).toContain("not found");
96
+ expect(out).toContain("turnsSkipped=2");
97
+ });
98
+ });
@@ -143,6 +143,7 @@ describe("subcommand registration", () => {
143
143
  const subcommandNames = v2!.commands.map((c) => c.name()).sort();
144
144
  expect(subcommandNames).toEqual([
145
145
  "activation",
146
+ "compare",
146
147
  "ema",
147
148
  "reembed",
148
149
  "reembed-skills",
@@ -0,0 +1,340 @@
1
+ import { describe, expect, test } from "bun:test";
2
+
3
+ import type {
4
+ LlmCallRecord,
5
+ MemoryV3SimulateResult,
6
+ MemoryV3TreeResult,
7
+ MemoryV3ValidateResult,
8
+ } from "../../../runtime/routes/memory-v3-routes.js";
9
+ import {
10
+ renderLlmCalls,
11
+ renderSimulation,
12
+ renderTree,
13
+ renderValidationReport,
14
+ reportHasDefects,
15
+ } from "../memory-v3-render.js";
16
+
17
+ function cleanReport(): MemoryV3ValidateResult {
18
+ return {
19
+ danglingChildRefs: [],
20
+ danglingChildRefCount: 0,
21
+ orphanPages: [],
22
+ orphanPageCount: 0,
23
+ cycles: [],
24
+ cycleCount: 0,
25
+ staleIndex: [],
26
+ staleIndexCount: 0,
27
+ unknownEdgeTargets: [],
28
+ unknownEdgeTargetCount: 0,
29
+ };
30
+ }
31
+
32
+ describe("memory v3 — renderValidationReport", () => {
33
+ test("renders 'none' for every empty category", () => {
34
+ const out = renderValidationReport(cleanReport());
35
+ expect(out).toContain("Memory v3 Tree Validation");
36
+ expect(out).toContain("Dangling child refs: none");
37
+ expect(out).toContain("Orphan pages: none");
38
+ expect(out).toContain("Cycles: none");
39
+ expect(out).toContain("Stale index: none");
40
+ expect(out).toContain("Unknown edge targets: none");
41
+ });
42
+
43
+ test("renders counts and offending ids for each defect category", () => {
44
+ const report: MemoryV3ValidateResult = {
45
+ danglingChildRefs: [{ node: "people", ref: "ghost", kind: "node" }],
46
+ danglingChildRefCount: 1,
47
+ orphanPages: ["stray-page"],
48
+ orphanPageCount: 1,
49
+ cycles: [{ from: "a", to: "b" }],
50
+ cycleCount: 1,
51
+ staleIndex: [
52
+ { node: "root", child: "people", nodeMtimeMs: 1, childMtimeMs: 2 },
53
+ ],
54
+ staleIndexCount: 1,
55
+ unknownEdgeTargets: [{ from: "p1", to: "missing" }],
56
+ unknownEdgeTargetCount: 1,
57
+ };
58
+ const out = renderValidationReport(report);
59
+ expect(out).toContain("Dangling child refs: 1");
60
+ expect(out).toContain("people → node:ghost");
61
+ expect(out).toContain("Orphan pages: 1");
62
+ expect(out).toContain("- stray-page");
63
+ expect(out).toContain("Cycles: 1");
64
+ expect(out).toContain("a → b");
65
+ expect(out).toContain("Stale index: 1");
66
+ expect(out).toContain("root (older than child people)");
67
+ expect(out).toContain("Unknown edge targets: 1");
68
+ expect(out).toContain("p1 → missing");
69
+ });
70
+ });
71
+
72
+ describe("memory v3 — reportHasDefects", () => {
73
+ test("false for a clean report", () => {
74
+ expect(reportHasDefects(cleanReport())).toBe(false);
75
+ });
76
+
77
+ test("true when any single category is non-empty", () => {
78
+ const report = cleanReport();
79
+ report.orphanPageCount = 1;
80
+ report.orphanPages = ["x"];
81
+ expect(reportHasDefects(report)).toBe(true);
82
+ });
83
+ });
84
+
85
+ describe("memory v3 — renderTree", () => {
86
+ test("renders an indented tree descending node and page children", () => {
87
+ const view: MemoryV3TreeResult = {
88
+ root: "_root",
89
+ nodes: [
90
+ {
91
+ id: "_root",
92
+ children: [
93
+ { kind: "node", ref: "people" },
94
+ { kind: "page", ref: "overview" },
95
+ ],
96
+ },
97
+ {
98
+ id: "people",
99
+ children: [{ kind: "page", ref: "alice" }],
100
+ },
101
+ ],
102
+ };
103
+ const out = renderTree(view);
104
+ expect(out).toBe(
105
+ ["node:_root", " node:people", " page:alice", " page:overview"].join(
106
+ "\n",
107
+ ),
108
+ );
109
+ });
110
+
111
+ test("marks a shared DAG sub-node as a re-entry rather than re-expanding", () => {
112
+ const view: MemoryV3TreeResult = {
113
+ root: "_root",
114
+ nodes: [
115
+ {
116
+ id: "_root",
117
+ children: [
118
+ { kind: "node", ref: "a" },
119
+ { kind: "node", ref: "b" },
120
+ ],
121
+ },
122
+ { id: "a", children: [{ kind: "node", ref: "shared" }] },
123
+ { id: "b", children: [{ kind: "node", ref: "shared" }] },
124
+ { id: "shared", children: [{ kind: "page", ref: "leaf" }] },
125
+ ],
126
+ };
127
+ const out = renderTree(view);
128
+ // First reach under `a` expands; second reach under `b` is a marked re-entry.
129
+ expect(out).toContain(" node:a\n node:shared\n page:leaf");
130
+ expect(out).toContain("node:shared (↑ already shown)");
131
+ // The leaf page is expanded exactly once.
132
+ expect(out.match(/page:leaf/g)?.length).toBe(1);
133
+ });
134
+
135
+ test("bounds output on a cycle instead of looping forever", () => {
136
+ const view: MemoryV3TreeResult = {
137
+ root: "_root",
138
+ nodes: [
139
+ { id: "_root", children: [{ kind: "node", ref: "a" }] },
140
+ { id: "a", children: [{ kind: "node", ref: "_root" }] },
141
+ ],
142
+ };
143
+ const out = renderTree(view);
144
+ expect(out).toContain("node:_root (↑ already shown)");
145
+ });
146
+
147
+ test("flags a child ref whose target node is missing", () => {
148
+ const view: MemoryV3TreeResult = {
149
+ root: "_root",
150
+ nodes: [{ id: "_root", children: [{ kind: "node", ref: "ghost" }] }],
151
+ };
152
+ const out = renderTree(view);
153
+ expect(out).toContain("node:ghost (missing)");
154
+ });
155
+
156
+ test("lists nodes unreachable from the root", () => {
157
+ const view: MemoryV3TreeResult = {
158
+ root: "_root",
159
+ nodes: [
160
+ { id: "_root", children: [] },
161
+ { id: "floating", children: [] },
162
+ ],
163
+ };
164
+ const out = renderTree(view);
165
+ expect(out).toContain("Unreachable nodes (1):");
166
+ expect(out).toContain("- node:floating");
167
+ });
168
+ });
169
+
170
+ function simResult(): MemoryV3SimulateResult {
171
+ return {
172
+ query: "what should we ship next",
173
+ selectedSlugs: ["page-tree", "page-hot", "page-edge"],
174
+ sourceBySlug: {
175
+ "page-hot": "hot",
176
+ "page-tree": "tree",
177
+ "page-edge": "edge",
178
+ },
179
+ trace: {
180
+ passes: [
181
+ {
182
+ passNumber: 1,
183
+ scouts: [
184
+ { lane: "hot", slugs: ["page-hot"] },
185
+ { lane: "sparse", slugs: [] },
186
+ { lane: "dense", slugs: ["d1", "d2"] },
187
+ ],
188
+ treeLevels: [
189
+ {
190
+ node: "",
191
+ considered: ["people", "frames", "objects"],
192
+ descended: ["people", "frames"],
193
+ skipped: ["objects"],
194
+ reasoning: "query is about planning",
195
+ },
196
+ ],
197
+ edgeExpansions: [{ from: "page-tree", pulled: ["page-edge"] }],
198
+ gate: { decision: "more", questions: ["narrow to roadmap?"] },
199
+ },
200
+ {
201
+ passNumber: 2,
202
+ scouts: [{ lane: "hot", slugs: [] }],
203
+ gate: { decision: "ready" },
204
+ },
205
+ ],
206
+ },
207
+ cost: { ms: 1234 },
208
+ failureReason: null,
209
+ llmCalls: [],
210
+ effectiveConfig: {
211
+ passCap: 3,
212
+ lanes: { hot: true, sparse: true, dense: true, tree: true, edges: false },
213
+ },
214
+ };
215
+ }
216
+
217
+ describe("memory v3 — renderSimulation", () => {
218
+ test("renders query, effective config, per-pass trace, and grouped selection", () => {
219
+ const out = renderSimulation(simResult());
220
+ expect(out).toContain("Memory v3 Retrieval Simulation");
221
+ expect(out).toContain('Query: "what should we ship next"');
222
+ expect(out).toContain("passCap: 3");
223
+ // A disabled lane is surfaced in an `(off: …)` suffix.
224
+ expect(out).toContain("lanes: hot, sparse, dense, tree (off: edges)");
225
+
226
+ expect(out).toContain("Passes: 2");
227
+ expect(out).toContain("Pass 1");
228
+ expect(out).toContain("scouts: hot=1 sparse=0 dense=2");
229
+ // The root tree level ("" node) prints as [root] with branch counts.
230
+ expect(out).toContain("[root]: considered 3, descended 2, skipped 1");
231
+ expect(out).toContain("→ people, frames");
232
+ expect(out).toContain("reason: query is about planning");
233
+ expect(out).toContain("edges: 1 seed(s) expanded, 1 pulled");
234
+ expect(out).toContain("gate: more");
235
+ expect(out).toContain("? narrow to roadmap?");
236
+ expect(out).toContain("gate: ready");
237
+
238
+ expect(out).toContain("Selected: 3 page(s)");
239
+ expect(out).toContain("Cost: 1234 ms");
240
+ });
241
+
242
+ test("groups selected slugs by provenance lane in fanout order", () => {
243
+ const out = renderSimulation(simResult());
244
+ const hotAt = out.indexOf("hot (1)");
245
+ const treeAt = out.indexOf("tree (1)");
246
+ const edgeAt = out.indexOf("edge (1)");
247
+ expect(hotAt).toBeGreaterThan(-1);
248
+ expect(treeAt).toBeGreaterThan(-1);
249
+ expect(edgeAt).toBeGreaterThan(-1);
250
+ // hot precedes tree precedes edge in SIMULATE_LANE_ORDER.
251
+ expect(hotAt).toBeLessThan(treeAt);
252
+ expect(treeAt).toBeLessThan(edgeAt);
253
+ });
254
+
255
+ test("renders all lanes inline when none are disabled", () => {
256
+ const result = simResult();
257
+ result.effectiveConfig.lanes.edges = true;
258
+ const out = renderSimulation(result);
259
+ expect(out).toContain("lanes: hot, sparse, dense, tree, edges");
260
+ expect(out).not.toContain("(off:");
261
+ });
262
+
263
+ test("surfaces a failure reason when the loop degraded", () => {
264
+ const result = simResult();
265
+ result.failureReason = "dense filter failed open";
266
+ const out = renderSimulation(result);
267
+ expect(out).toContain("Failure: dense filter failed open");
268
+ });
269
+ });
270
+
271
+ function llmCall(over: Partial<LlmCallRecord> = {}): LlmCallRecord {
272
+ return {
273
+ pass: 1,
274
+ lane: "gate",
275
+ callSite: "memoryV3Gate",
276
+ request: {
277
+ systemPrompt: "SYS-PROMPT",
278
+ messages: [
279
+ { role: "user", content: [{ type: "text", text: "USER-MSG" }] },
280
+ ],
281
+ tools: [
282
+ {
283
+ name: "decide_selection",
284
+ description: "decide",
285
+ input_schema: { type: "object", properties: {} },
286
+ },
287
+ ],
288
+ },
289
+ response: {
290
+ model: "stub-model",
291
+ stopReason: "tool_use",
292
+ usage: { inputTokens: 0, outputTokens: 0 },
293
+ content: [
294
+ {
295
+ type: "tool_use",
296
+ id: "tu-1",
297
+ name: "decide_selection",
298
+ input: { decision: "ready", selected_slugs: ["a"] },
299
+ },
300
+ ],
301
+ },
302
+ ms: 42,
303
+ ...over,
304
+ };
305
+ }
306
+
307
+ describe("memory v3 — renderLlmCalls", () => {
308
+ test("compact: one line per call with lane, node, and tool summary", () => {
309
+ const out = renderLlmCalls(
310
+ [
311
+ llmCall(),
312
+ llmCall({
313
+ lane: "descent",
314
+ callSite: "memoryV3Descent",
315
+ node: "people",
316
+ }),
317
+ ],
318
+ { full: false },
319
+ );
320
+ expect(out).toContain("LLM calls (2):");
321
+ expect(out).toContain("pass1 · gate");
322
+ expect(out).toContain("pass1 · descent · node=people");
323
+ expect(out).toContain("decide_selection");
324
+ expect(out).toContain("42ms");
325
+ // Compact mode must not dump the full system prompt.
326
+ expect(out).not.toContain("SYS-PROMPT");
327
+ });
328
+
329
+ test("full: includes system prompt, messages, tools, and tool_use input", () => {
330
+ const out = renderLlmCalls([llmCall()], { full: true });
331
+ expect(out).toContain("SYS-PROMPT");
332
+ expect(out).toContain("USER-MSG");
333
+ expect(out).toContain("decide_selection");
334
+ expect(out).toContain('"decision"');
335
+ });
336
+
337
+ test("renders 'none' when there are no calls", () => {
338
+ expect(renderLlmCalls([], { full: false })).toBe("LLM calls: none");
339
+ });
340
+ });