vellum 0.2.1 → 0.2.2

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in the respective public registry.
Files changed (349)
  1. package/README.md +15 -2
  2. package/bun.lock +5 -2
  3. package/package.json +4 -2
  4. package/scripts/capture-x-graphql.ts +562 -0
  5. package/scripts/ipc/check-swift-decoder-drift.ts +2 -1
  6. package/scripts/test.sh +5 -0
  7. package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +133 -34
  8. package/src/__tests__/account-registry.test.ts +2 -1
  9. package/src/__tests__/agent-heartbeat-service.test.ts +250 -0
  10. package/src/__tests__/asset-materialize-tool.test.ts +16 -15
  11. package/src/__tests__/asset-search-tool.test.ts +23 -22
  12. package/src/__tests__/attachments-store.test.ts +56 -127
  13. package/src/__tests__/browser-skill-baseline-tool-payload.test.ts +5 -4
  14. package/src/__tests__/browser-skill-endstate.test.ts +4 -3
  15. package/src/__tests__/call-bridge.test.ts +385 -0
  16. package/src/__tests__/call-constants.test.ts +40 -0
  17. package/src/__tests__/call-orchestrator.test.ts +130 -4
  18. package/src/__tests__/call-recovery.test.ts +518 -0
  19. package/src/__tests__/call-routes-http.test.ts +459 -0
  20. package/src/__tests__/call-state-machine.test.ts +143 -0
  21. package/src/__tests__/call-store.test.ts +216 -1
  22. package/src/__tests__/cli-discover.test.ts +1 -1
  23. package/src/__tests__/commit-message-enrichment-service.test.ts +148 -7
  24. package/src/__tests__/compaction.benchmark.test.ts +176 -0
  25. package/src/__tests__/computer-use-tools.test.ts +250 -0
  26. package/src/__tests__/config-schema.test.ts +299 -3
  27. package/src/__tests__/conflict-store.test.ts +2 -1
  28. package/src/__tests__/contacts-tools.test.ts +331 -0
  29. package/src/__tests__/conversation-store.test.ts +30 -32
  30. package/src/__tests__/credential-security-invariants.test.ts +4 -0
  31. package/src/__tests__/date-context.test.ts +373 -0
  32. package/src/__tests__/db-schedule-syntax-migration.test.ts +129 -0
  33. package/src/__tests__/fixtures/media-reuse-fixtures.ts +3 -3
  34. package/src/__tests__/followup-tools.test.ts +303 -0
  35. package/src/__tests__/handlers-twitter-config.test.ts +718 -0
  36. package/src/__tests__/intent-routing.test.ts +64 -57
  37. package/src/__tests__/ipc-roundtrip.benchmark.test.ts +237 -0
  38. package/src/__tests__/ipc-snapshot.test.ts +62 -28
  39. package/src/__tests__/llm-usage-store.test.ts +3 -8
  40. package/src/__tests__/media-generate-image.test.ts +1 -1
  41. package/src/__tests__/media-reuse-story.e2e.test.ts +7 -7
  42. package/src/__tests__/memory-retrieval.benchmark.test.ts +430 -0
  43. package/src/__tests__/parallel-tool.benchmark.test.ts +294 -0
  44. package/src/__tests__/playbook-tools.test.ts +342 -0
  45. package/src/__tests__/profile-compiler.test.ts +2 -1
  46. package/src/__tests__/provider-streaming.benchmark.test.ts +773 -0
  47. package/src/__tests__/recurrence-engine-rruleset.test.ts +78 -0
  48. package/src/__tests__/recurrence-engine.test.ts +69 -0
  49. package/src/__tests__/recurrence-types.test.ts +71 -0
  50. package/src/__tests__/registry.test.ts +5 -3
  51. package/src/__tests__/relay-server.test.ts +633 -0
  52. package/src/__tests__/reminder-store.test.ts +6 -3
  53. package/src/__tests__/reminder.test.ts +43 -77
  54. package/src/__tests__/run-orchestrator-assistant-events.test.ts +8 -4
  55. package/src/__tests__/run-orchestrator.test.ts +4 -4
  56. package/src/__tests__/runtime-attachment-metadata.test.ts +7 -6
  57. package/src/__tests__/runtime-runs-http.test.ts +4 -4
  58. package/src/__tests__/runtime-runs.test.ts +4 -4
  59. package/src/__tests__/schedule-store.test.ts +482 -0
  60. package/src/__tests__/schedule-tools.test.ts +700 -0
  61. package/src/__tests__/scheduler-recurrence.test.ts +329 -0
  62. package/src/__tests__/server-history-render.test.ts +14 -13
  63. package/src/__tests__/session-error.test.ts +28 -0
  64. package/src/__tests__/session-init.benchmark.test.ts +462 -0
  65. package/src/__tests__/session-queue.test.ts +71 -48
  66. package/src/__tests__/session-runtime-assembly.test.ts +161 -0
  67. package/src/__tests__/session-surfaces-task-progress.test.ts +104 -0
  68. package/src/__tests__/signup-e2e.test.ts +2 -1
  69. package/src/__tests__/skill-projection.benchmark.test.ts +328 -0
  70. package/src/__tests__/skill-script-runner.test.ts +159 -0
  71. package/src/__tests__/speaker-identification.test.ts +52 -0
  72. package/src/__tests__/subagent-manager-notify.test.ts +42 -10
  73. package/src/__tests__/subagent-tools.test.ts +141 -41
  74. package/src/__tests__/task-compiler.test.ts +2 -1
  75. package/src/__tests__/task-runner.test.ts +2 -1
  76. package/src/__tests__/task-scheduler.test.ts +2 -1
  77. package/src/__tests__/task-tools.test.ts +49 -56
  78. package/src/__tests__/tool-audit-listener.test.ts +1 -0
  79. package/src/__tests__/tool-domain-event-publisher.test.ts +2 -0
  80. package/src/__tests__/tool-execution-pipeline.benchmark.test.ts +500 -0
  81. package/src/__tests__/tool-executor.test.ts +13 -17
  82. package/src/__tests__/turn-commit.test.ts +218 -3
  83. package/src/__tests__/twilio-provider.test.ts +143 -0
  84. package/src/__tests__/twilio-routes.test.ts +789 -0
  85. package/src/__tests__/twitter-auth-handler.test.ts +581 -0
  86. package/src/__tests__/view-image-tool.test.ts +217 -0
  87. package/src/__tests__/workspace-git-service.test.ts +186 -0
  88. package/src/__tests__/workspace-heartbeat-service.test.ts +13 -3
  89. package/src/agent-heartbeat/agent-heartbeat-service.ts +155 -0
  90. package/src/bundler/app-bundler.ts +12 -8
  91. package/src/calls/call-bridge.ts +95 -0
  92. package/src/calls/call-constants.ts +43 -5
  93. package/src/calls/call-domain.ts +276 -0
  94. package/src/calls/call-orchestrator.ts +43 -17
  95. package/src/calls/call-recovery.ts +207 -0
  96. package/src/calls/call-state-machine.ts +68 -0
  97. package/src/calls/call-store.ts +192 -5
  98. package/src/calls/relay-server.ts +41 -4
  99. package/src/calls/speaker-identification.ts +213 -0
  100. package/src/calls/twilio-provider.ts +10 -6
  101. package/src/calls/twilio-routes.ts +90 -76
  102. package/src/calls/types.ts +1 -1
  103. package/src/cli/config-commands.ts +334 -0
  104. package/src/cli/core-commands.ts +776 -0
  105. package/src/cli/doordash.ts +251 -1
  106. package/src/cli/ipc-client.ts +82 -0
  107. package/src/cli/map.ts +246 -0
  108. package/src/cli/twitter.ts +575 -0
  109. package/src/cli.ts +7 -5
  110. package/src/commands/__tests__/cc-command-registry.test.ts +319 -0
  111. package/src/commands/cc-command-registry.ts +209 -0
  112. package/src/config/bundled-skills/contacts/SKILL.md +39 -0
  113. package/src/config/bundled-skills/contacts/TOOLS.json +122 -0
  114. package/src/config/bundled-skills/contacts/tools/contact-merge.ts +9 -0
  115. package/src/config/bundled-skills/contacts/tools/contact-search.ts +9 -0
  116. package/src/config/bundled-skills/contacts/tools/contact-upsert.ts +9 -0
  117. package/src/config/bundled-skills/document/SKILL.md +18 -0
  118. package/src/config/bundled-skills/document/TOOLS.json +53 -0
  119. package/src/config/bundled-skills/document/tools/document-create.ts +9 -0
  120. package/src/config/bundled-skills/document/tools/document-update.ts +9 -0
  121. package/src/config/bundled-skills/doordash/SKILL.md +82 -23
  122. package/src/config/bundled-skills/followups/SKILL.md +32 -0
  123. package/src/config/bundled-skills/followups/TOOLS.json +100 -0
  124. package/src/config/bundled-skills/followups/tools/followup-create.ts +9 -0
  125. package/src/config/bundled-skills/followups/tools/followup-list.ts +9 -0
  126. package/src/config/bundled-skills/followups/tools/followup-resolve.ts +9 -0
  127. package/src/config/bundled-skills/image-studio/tools/media-generate-image.ts +1 -23
  128. package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +2 -1
  129. package/src/config/bundled-skills/playbooks/SKILL.md +31 -0
  130. package/src/config/bundled-skills/playbooks/TOOLS.json +126 -0
  131. package/src/config/bundled-skills/playbooks/tools/playbook-create.ts +9 -0
  132. package/src/config/bundled-skills/playbooks/tools/playbook-delete.ts +9 -0
  133. package/src/config/bundled-skills/playbooks/tools/playbook-list.ts +9 -0
  134. package/src/config/bundled-skills/playbooks/tools/playbook-update.ts +9 -0
  135. package/src/config/bundled-skills/reminder/SKILL.md +20 -0
  136. package/src/config/bundled-skills/reminder/TOOLS.json +67 -0
  137. package/src/config/bundled-skills/reminder/tools/reminder-cancel.ts +9 -0
  138. package/src/config/bundled-skills/reminder/tools/reminder-create.ts +9 -0
  139. package/src/config/bundled-skills/reminder/tools/reminder-list.ts +9 -0
  140. package/src/config/bundled-skills/schedule/SKILL.md +74 -0
  141. package/src/config/bundled-skills/schedule/TOOLS.json +135 -0
  142. package/src/config/bundled-skills/schedule/tools/schedule-create.ts +9 -0
  143. package/src/config/bundled-skills/schedule/tools/schedule-delete.ts +9 -0
  144. package/src/config/bundled-skills/schedule/tools/schedule-list.ts +9 -0
  145. package/src/config/bundled-skills/schedule/tools/schedule-update.ts +9 -0
  146. package/src/config/bundled-skills/subagent/SKILL.md +25 -0
  147. package/src/config/bundled-skills/subagent/TOOLS.json +107 -0
  148. package/src/config/bundled-skills/subagent/tools/subagent-abort.ts +9 -0
  149. package/src/config/bundled-skills/subagent/tools/subagent-message.ts +9 -0
  150. package/src/config/bundled-skills/subagent/tools/subagent-read.ts +9 -0
  151. package/src/config/bundled-skills/subagent/tools/subagent-spawn.ts +9 -0
  152. package/src/config/bundled-skills/subagent/tools/subagent-status.ts +9 -0
  153. package/src/config/bundled-skills/tasks/SKILL.md +28 -0
  154. package/src/config/bundled-skills/tasks/TOOLS.json +256 -0
  155. package/src/config/bundled-skills/tasks/tools/task-delete.ts +9 -0
  156. package/src/config/bundled-skills/tasks/tools/task-list-add.ts +9 -0
  157. package/src/config/bundled-skills/tasks/tools/task-list-remove.ts +9 -0
  158. package/src/config/bundled-skills/tasks/tools/task-list-show.ts +9 -0
  159. package/src/config/bundled-skills/tasks/tools/task-list-update.ts +9 -0
  160. package/src/config/bundled-skills/tasks/tools/task-list.ts +9 -0
  161. package/src/config/bundled-skills/tasks/tools/task-run.ts +9 -0
  162. package/src/config/bundled-skills/tasks/tools/task-save.ts +9 -0
  163. package/src/config/bundled-skills/twitter/SKILL.md +134 -0
  164. package/src/config/bundled-skills/watcher/SKILL.md +27 -0
  165. package/src/config/bundled-skills/watcher/TOOLS.json +147 -0
  166. package/src/config/bundled-skills/watcher/tools/watcher-create.ts +9 -0
  167. package/src/config/bundled-skills/watcher/tools/watcher-delete.ts +9 -0
  168. package/src/config/bundled-skills/watcher/tools/watcher-digest.ts +9 -0
  169. package/src/config/bundled-skills/watcher/tools/watcher-list.ts +9 -0
  170. package/src/config/bundled-skills/watcher/tools/watcher-update.ts +9 -0
  171. package/src/config/defaults.ts +33 -0
  172. package/src/config/loader.ts +4 -1
  173. package/src/config/schema.ts +161 -1
  174. package/src/config/system-prompt.ts +61 -16
  175. package/src/config/templates/IDENTITY.md +7 -0
  176. package/src/config/types.ts +4 -0
  177. package/src/contacts/contact-store.ts +4 -4
  178. package/src/daemon/assistant-attachments.ts +10 -0
  179. package/src/daemon/classifier.ts +3 -1
  180. package/src/daemon/computer-use-session.ts +3 -1
  181. package/src/daemon/date-context.ts +136 -0
  182. package/src/daemon/handlers/apps.ts +16 -1
  183. package/src/daemon/handlers/browser.ts +54 -0
  184. package/src/daemon/handlers/computer-use.ts +7 -1
  185. package/src/daemon/handlers/config.ts +163 -5
  186. package/src/daemon/handlers/diagnostics.ts +5 -1
  187. package/src/daemon/handlers/documents.ts +18 -29
  188. package/src/daemon/handlers/home-base.ts +5 -1
  189. package/src/daemon/handlers/index.ts +40 -277
  190. package/src/daemon/handlers/misc.ts +9 -1
  191. package/src/daemon/handlers/publish.ts +6 -1
  192. package/src/daemon/handlers/sessions.ts +65 -12
  193. package/src/daemon/handlers/shared.ts +36 -1
  194. package/src/daemon/handlers/signing.ts +37 -0
  195. package/src/daemon/handlers/skills.ts +20 -6
  196. package/src/daemon/handlers/subagents.ts +8 -3
  197. package/src/daemon/handlers/twitter-auth.ts +169 -0
  198. package/src/daemon/handlers/work-items.ts +384 -68
  199. package/src/daemon/ipc-contract-inventory.json +28 -4
  200. package/src/daemon/ipc-contract.ts +133 -37
  201. package/src/daemon/ipc-protocol.ts +7 -2
  202. package/src/daemon/lifecycle.ts +21 -0
  203. package/src/daemon/main.ts +10 -4
  204. package/src/daemon/ride-shotgun-handler.ts +74 -10
  205. package/src/daemon/server.ts +143 -26
  206. package/src/daemon/session-agent-loop.ts +887 -0
  207. package/src/daemon/session-attachments.ts +28 -5
  208. package/src/daemon/session-error.ts +24 -3
  209. package/src/daemon/session-lifecycle.ts +147 -0
  210. package/src/daemon/session-media-retry.ts +147 -0
  211. package/src/daemon/session-messaging.ts +145 -0
  212. package/src/daemon/session-notifiers.ts +164 -0
  213. package/src/daemon/session-process.ts +2 -2
  214. package/src/daemon/session-queue-manager.ts +1 -0
  215. package/src/daemon/session-runtime-assembly.ts +52 -0
  216. package/src/daemon/session-skill-tools.ts +124 -5
  217. package/src/daemon/session-slash.ts +3 -0
  218. package/src/daemon/session-surfaces.ts +77 -2
  219. package/src/daemon/session-tool-setup.ts +216 -2
  220. package/src/daemon/session-usage.ts +0 -2
  221. package/src/daemon/session.ts +114 -1404
  222. package/src/daemon/video-thumbnail.ts +60 -0
  223. package/src/doordash/client.ts +121 -27
  224. package/src/doordash/queries.ts +1 -2
  225. package/src/export/formatter.ts +3 -1
  226. package/src/followups/followup-store.ts +4 -2
  227. package/src/followups/types.ts +6 -0
  228. package/src/hooks/templates.ts +1 -1
  229. package/src/index.ts +32 -1153
  230. package/src/memory/attachments-store.ts +28 -83
  231. package/src/memory/channel-delivery-store.ts +7 -21
  232. package/src/memory/clarification-resolver.ts +6 -5
  233. package/src/memory/contradiction-checker.ts +3 -2
  234. package/src/memory/conversation-key-store.ts +10 -29
  235. package/src/memory/conversation-store.ts +2 -1
  236. package/src/memory/db.ts +96 -2
  237. package/src/memory/entity-extractor.ts +6 -3
  238. package/src/memory/items-extractor.ts +5 -4
  239. package/src/memory/jobs-store.ts +3 -2
  240. package/src/memory/llm-usage-store.ts +1 -2
  241. package/src/memory/runs-store.ts +1 -2
  242. package/src/memory/schema.ts +23 -2
  243. package/src/messaging/style-analyzer.ts +3 -2
  244. package/src/messaging/thread-summarizer.ts +8 -12
  245. package/src/messaging/triage-engine.ts +4 -2
  246. package/src/providers/openrouter/client.ts +20 -0
  247. package/src/providers/registry.ts +8 -0
  248. package/src/runtime/http-server.ts +108 -20
  249. package/src/runtime/routes/attachment-routes.ts +2 -3
  250. package/src/runtime/routes/call-routes.ts +140 -0
  251. package/src/runtime/routes/channel-routes.ts +5 -10
  252. package/src/runtime/routes/conversation-routes.ts +5 -5
  253. package/src/runtime/routes/run-routes.ts +2 -2
  254. package/src/runtime/run-orchestrator.ts +9 -3
  255. package/src/schedule/recurrence-engine.ts +138 -0
  256. package/src/schedule/recurrence-types.ts +67 -0
  257. package/src/schedule/schedule-store.ts +102 -57
  258. package/src/schedule/scheduler.ts +9 -6
  259. package/src/security/oauth2.ts +29 -4
  260. package/src/security/secret-allowlist.ts +46 -0
  261. package/src/skills/clawhub.ts +1 -1
  262. package/src/subagent/manager.ts +40 -8
  263. package/src/swarm/backend-claude-code.ts +64 -9
  264. package/src/swarm/worker-prompts.ts +2 -1
  265. package/src/tasks/SPEC.md +34 -28
  266. package/src/tasks/ephemeral-permissions.ts +16 -7
  267. package/src/tasks/task-compiler.ts +5 -4
  268. package/src/tasks/task-runner.ts +10 -5
  269. package/src/tasks/task-scheduler.ts +1 -1
  270. package/src/tasks/tool-sanitizer.ts +36 -0
  271. package/src/tools/assets/search.ts +4 -4
  272. package/src/tools/browser/api-map.ts +220 -0
  273. package/src/tools/browser/auto-navigate.ts +270 -0
  274. package/src/tools/browser/browser-execution.ts +2 -1
  275. package/src/tools/browser/browser-manager.ts +2 -2
  276. package/src/tools/browser/network-recorder.ts +5 -4
  277. package/src/tools/browser/x-auto-navigate.ts +207 -0
  278. package/src/tools/calls/call-end.ts +17 -67
  279. package/src/tools/calls/call-start.ts +24 -85
  280. package/src/tools/calls/call-status.ts +35 -51
  281. package/src/tools/claude-code/claude-code.ts +77 -11
  282. package/src/tools/contacts/contact-merge.ts +46 -78
  283. package/src/tools/contacts/contact-search.ts +35 -79
  284. package/src/tools/contacts/contact-upsert.ts +35 -108
  285. package/src/tools/credentials/vault.ts +20 -4
  286. package/src/tools/document/document-tool.ts +71 -144
  287. package/src/tools/executor.ts +129 -10
  288. package/src/tools/followups/followup_create.ts +46 -88
  289. package/src/tools/followups/followup_list.ts +34 -74
  290. package/src/tools/followups/followup_resolve.ts +31 -66
  291. package/src/tools/host-terminal/cli-discover.ts +2 -1
  292. package/src/tools/host-terminal/host-shell.ts +10 -0
  293. package/src/tools/memory/handlers.ts +5 -4
  294. package/src/tools/network/__tests__/web-search.test.ts +427 -0
  295. package/src/tools/network/script-proxy/__tests__/logging.test.ts +248 -0
  296. package/src/tools/network/script-proxy/__tests__/policy.test.ts +234 -0
  297. package/src/tools/network/script-proxy/__tests__/router.test.ts +76 -0
  298. package/src/tools/network/web-fetch.ts +18 -6
  299. package/src/tools/playbooks/index.ts +4 -5
  300. package/src/tools/playbooks/playbook-create.ts +3 -47
  301. package/src/tools/playbooks/playbook-delete.ts +1 -25
  302. package/src/tools/playbooks/playbook-list.ts +1 -28
  303. package/src/tools/playbooks/playbook-update.ts +3 -51
  304. package/src/tools/reminder/reminder.ts +5 -78
  305. package/src/tools/schedule/create.ts +69 -74
  306. package/src/tools/schedule/delete.ts +21 -47
  307. package/src/tools/schedule/list.ts +55 -74
  308. package/src/tools/schedule/update.ts +77 -84
  309. package/src/tools/subagent/abort.ts +29 -58
  310. package/src/tools/subagent/message.ts +30 -63
  311. package/src/tools/subagent/read.ts +53 -84
  312. package/src/tools/subagent/spawn.ts +43 -82
  313. package/src/tools/subagent/status.ts +42 -71
  314. package/src/tools/swarm/delegate.ts +2 -1
  315. package/src/tools/tasks/index.ts +8 -8
  316. package/src/tools/tasks/task-delete.ts +60 -88
  317. package/src/tools/tasks/task-list.ts +31 -52
  318. package/src/tools/tasks/task-run.ts +72 -108
  319. package/src/tools/tasks/task-save.ts +33 -65
  320. package/src/tools/tasks/work-item-enqueue.ts +183 -215
  321. package/src/tools/tasks/work-item-list.ts +33 -63
  322. package/src/tools/tasks/work-item-remove.ts +45 -97
  323. package/src/tools/tasks/work-item-update.ts +91 -163
  324. package/src/tools/terminal/backends/native.ts +3 -1
  325. package/src/tools/tool-manifest.ts +0 -62
  326. package/src/tools/types.ts +6 -0
  327. package/src/tools/ui-surface/definitions.ts +3 -1
  328. package/src/tools/watch/screen-watch.ts +3 -1
  329. package/src/tools/watcher/create.ts +52 -98
  330. package/src/tools/watcher/delete.ts +20 -46
  331. package/src/tools/watcher/digest.ts +36 -70
  332. package/src/tools/watcher/list.ts +49 -79
  333. package/src/tools/watcher/update.ts +45 -91
  334. package/src/twitter/client.ts +690 -0
  335. package/src/twitter/session.ts +91 -0
  336. package/src/usage/types.ts +0 -1
  337. package/src/util/truncate.ts +6 -0
  338. package/src/watcher/providers/slack.ts +2 -1
  339. package/src/watcher/watcher-store.ts +3 -2
  340. package/src/work-items/work-item-store.ts +27 -2
  341. package/src/workspace/commit-message-enrichment-service.ts +31 -7
  342. package/src/workspace/git-service.ts +87 -22
  343. package/src/workspace/provider-commit-message-generator.ts +242 -0
  344. package/src/workspace/turn-commit.ts +62 -3
  345. package/src/tools/contacts/index.ts +0 -4
  346. package/src/tools/document/index.ts +0 -5
  347. package/src/tools/followups/index.ts +0 -3
  348. package/src/tools/subagent/index.ts +0 -5
  349. /package/src/__tests__/{memory-context-benchmark.test.ts → memory-context-benchmark.benchmark.test.ts} +0 -0
@@ -0,0 +1,250 @@
1
+ import { describe, test, expect } from 'bun:test';
2
+ import {
3
+ allComputerUseTools,
4
+ computerUseClickTool,
5
+ computerUseDoubleClickTool,
6
+ computerUseRightClickTool,
7
+ computerUseTypeTextTool,
8
+ computerUseKeyTool,
9
+ computerUseScrollTool,
10
+ computerUseDragTool,
11
+ computerUseWaitTool,
12
+ computerUseOpenAppTool,
13
+ computerUseRunAppleScriptTool,
14
+ computerUseDoneTool,
15
+ computerUseRespondTool,
16
+ } from '../tools/computer-use/definitions.js';
17
+ import { requestComputerControlTool } from '../tools/computer-use/request-computer-control.js';
18
+ import { forwardComputerUseProxyTool } from '../tools/computer-use/skill-proxy-bridge.js';
19
+ import type { ToolContext } from '../tools/types.js';
20
+
21
+ interface JsonSchema {
22
+ type?: string;
23
+ required?: string[];
24
+ properties?: Record<string, unknown>;
25
+ }
26
+
27
+ /** Cast a tool definition's input_schema to a usable JSON Schema shape. */
28
+ function schema(tool: { getDefinition(): { input_schema: object } }): JsonSchema {
29
+ return tool.getDefinition().input_schema as JsonSchema;
30
+ }
31
+
32
+ const ctx: ToolContext = {
33
+ workingDir: '/tmp',
34
+ sessionId: 'test-session',
35
+ conversationId: 'test-conversation',
36
+ };
37
+
38
+ // ── Tool definitions ────────────────────────────────────────────────
39
+
40
+ describe('computer-use tool definitions', () => {
41
+ test('allComputerUseTools contains 12 tools', () => {
42
+ expect(allComputerUseTools.length).toBe(12);
43
+ });
44
+
45
+ test('all tools have proxy execution mode', () => {
46
+ for (const tool of allComputerUseTools) {
47
+ expect(tool.executionMode).toBe('proxy');
48
+ }
49
+ expect(requestComputerControlTool.executionMode).toBe('proxy');
50
+ });
51
+
52
+ test('all tools belong to computer-use category', () => {
53
+ for (const tool of allComputerUseTools) {
54
+ expect(tool.category).toBe('computer-use');
55
+ }
56
+ expect(requestComputerControlTool.category).toBe('computer-use');
57
+ });
58
+
59
+ test('all tools have unique names', () => {
60
+ const names = allComputerUseTools.map((t) => t.name);
61
+ expect(new Set(names).size).toBe(names.length);
62
+ });
63
+
64
+ test('all tools have descriptions', () => {
65
+ for (const tool of allComputerUseTools) {
66
+ expect(tool.description.length).toBeGreaterThan(0);
67
+ }
68
+ });
69
+ });
70
+
71
+ // ── Click tool variants ─────────────────────────────────────────────
72
+
73
+ describe('click tool variants', () => {
74
+ for (const [tool, label] of [
75
+ [computerUseClickTool, 'click'],
76
+ [computerUseDoubleClickTool, 'double_click'],
77
+ [computerUseRightClickTool, 'right_click'],
78
+ ] as const) {
79
+ test(`${tool.name} has correct name`, () => {
80
+ expect(tool.name).toBe(`computer_use_${label}`);
81
+ });
82
+
83
+ test(`${tool.name} schema requires reasoning`, () => {
84
+ expect(schema(tool).required).toContain('reasoning');
85
+ });
86
+
87
+ test(`${tool.name} schema supports element_id and coordinates`, () => {
88
+ const props = schema(tool).properties as Record<string, { type: string }>;
89
+ expect(props.element_id.type).toBe('integer');
90
+ expect(props.x.type).toBe('integer');
91
+ expect(props.y.type).toBe('integer');
92
+ });
93
+
94
+ test(`${tool.name} execute throws proxy error`, () => {
95
+ expect(() => tool.execute({}, ctx)).toThrow('Proxy tool');
96
+ });
97
+ }
98
+ });
99
+
100
+ // ── type_text ───────────────────────────────────────────────────────
101
+
102
+ describe('computer_use_type_text', () => {
103
+ test('requires text and reasoning', () => {
104
+ expect(schema(computerUseTypeTextTool).required).toContain('text');
105
+ expect(schema(computerUseTypeTextTool).required).toContain('reasoning');
106
+ });
107
+
108
+ test('execute throws proxy error', () => {
109
+ expect(() => computerUseTypeTextTool.execute({}, ctx)).toThrow('Proxy tool');
110
+ });
111
+ });
112
+
113
+ // ── key ─────────────────────────────────────────────────────────────
114
+
115
+ describe('computer_use_key', () => {
116
+ test('requires key and reasoning', () => {
117
+ expect(schema(computerUseKeyTool).required).toContain('key');
118
+ expect(schema(computerUseKeyTool).required).toContain('reasoning');
119
+ });
120
+
121
+ test('execute throws proxy error', () => {
122
+ expect(() => computerUseKeyTool.execute({}, ctx)).toThrow('Proxy tool');
123
+ });
124
+ });
125
+
126
+ // ── scroll ──────────────────────────────────────────────────────────
127
+
128
+ describe('computer_use_scroll', () => {
129
+ test('requires direction, amount, and reasoning', () => {
130
+ expect(schema(computerUseScrollTool).required).toContain('direction');
131
+ expect(schema(computerUseScrollTool).required).toContain('amount');
132
+ expect(schema(computerUseScrollTool).required).toContain('reasoning');
133
+ });
134
+
135
+ test('direction enum includes up, down, left, right', () => {
136
+ const props = schema(computerUseScrollTool).properties as Record<string, { enum?: string[] }>;
137
+ expect(props.direction.enum).toEqual(['up', 'down', 'left', 'right']);
138
+ });
139
+ });
140
+
141
+ // ── drag ────────────────────────────────────────────────────────────
142
+
143
+ describe('computer_use_drag', () => {
144
+ test('supports source and destination coordinates', () => {
145
+ const props = schema(computerUseDragTool).properties as Record<string, { type: string }>;
146
+ expect(props.element_id.type).toBe('integer');
147
+ expect(props.to_element_id.type).toBe('integer');
148
+ expect(props.x.type).toBe('integer');
149
+ expect(props.y.type).toBe('integer');
150
+ expect(props.to_x.type).toBe('integer');
151
+ expect(props.to_y.type).toBe('integer');
152
+ });
153
+
154
+ test('requires reasoning only', () => {
155
+ expect(schema(computerUseDragTool).required).toEqual(['reasoning']);
156
+ });
157
+ });
158
+
159
+ // ── wait ────────────────────────────────────────────────────────────
160
+
161
+ describe('computer_use_wait', () => {
162
+ test('requires duration_ms and reasoning', () => {
163
+ expect(schema(computerUseWaitTool).required).toContain('duration_ms');
164
+ expect(schema(computerUseWaitTool).required).toContain('reasoning');
165
+ });
166
+ });
167
+
168
+ // ── open_app ────────────────────────────────────────────────────────
169
+
170
+ describe('computer_use_open_app', () => {
171
+ test('requires app_name and reasoning', () => {
172
+ expect(schema(computerUseOpenAppTool).required).toContain('app_name');
173
+ expect(schema(computerUseOpenAppTool).required).toContain('reasoning');
174
+ });
175
+ });
176
+
177
+ // ── run_applescript ─────────────────────────────────────────────────
178
+
179
+ describe('computer_use_run_applescript', () => {
180
+ test('requires script and reasoning', () => {
181
+ expect(schema(computerUseRunAppleScriptTool).required).toContain('script');
182
+ expect(schema(computerUseRunAppleScriptTool).required).toContain('reasoning');
183
+ });
184
+
185
+ test('description warns against do shell script', () => {
186
+ expect(computerUseRunAppleScriptTool.description).toContain('do shell script');
187
+ expect(computerUseRunAppleScriptTool.description).toContain('blocked');
188
+ });
189
+ });
190
+
191
+ // ── done ────────────────────────────────────────────────────────────
192
+
193
+ describe('computer_use_done', () => {
194
+ test('requires summary', () => {
195
+ expect(schema(computerUseDoneTool).required).toContain('summary');
196
+ });
197
+ });
198
+
199
+ // ── respond ─────────────────────────────────────────────────────────
200
+
201
+ describe('computer_use_respond', () => {
202
+ test('requires answer and reasoning', () => {
203
+ expect(schema(computerUseRespondTool).required).toContain('answer');
204
+ expect(schema(computerUseRespondTool).required).toContain('reasoning');
205
+ });
206
+ });
207
+
208
+ // ── request_computer_control ────────────────────────────────────────
209
+
210
+ describe('computer_use_request_control', () => {
211
+ test('requires task parameter', () => {
212
+ expect(schema(requestComputerControlTool).required).toContain('task');
213
+ });
214
+
215
+ test('execute throws proxy error', () => {
216
+ expect(() => requestComputerControlTool.execute({}, ctx)).toThrow('surfaceProxyResolver');
217
+ });
218
+ });
219
+
220
+ // ── skill-proxy-bridge ──────────────────────────────────────────────
221
+
222
+ describe('forwardComputerUseProxyTool', () => {
223
+ test('returns error when no proxy resolver available', async () => {
224
+ const result = await forwardComputerUseProxyTool('computer_use_click', {}, ctx);
225
+
226
+ expect(result.isError).toBe(true);
227
+ expect(result.content).toContain('no proxy resolver available');
228
+ expect(result.content).toContain('computer_use_click');
229
+ });
230
+
231
+ test('delegates to proxy resolver when available', async () => {
232
+ const ctxWithProxy: ToolContext = {
233
+ ...ctx,
234
+ proxyToolResolver: async (name: string, input: Record<string, unknown>) => ({
235
+ content: `Forwarded ${name} with ${JSON.stringify(input)}`,
236
+ isError: false,
237
+ }),
238
+ };
239
+
240
+ const result = await forwardComputerUseProxyTool(
241
+ 'computer_use_screenshot',
242
+ { reasoning: 'test' },
243
+ ctxWithProxy,
244
+ );
245
+
246
+ expect(result.isError).toBe(false);
247
+ expect(result.content).toContain('Forwarded computer_use_screenshot');
248
+ expect(result.content).toContain('test');
249
+ });
250
+ });
@@ -26,10 +26,16 @@ function ensureTestDir(): void {
26
26
  }
27
27
  }
28
28
 
29
+ function makeLoggerStub(): Record<string, unknown> {
30
+ const stub: Record<string, unknown> = {};
31
+ for (const m of ['info', 'warn', 'error', 'debug', 'trace', 'fatal', 'silent', 'child']) {
32
+ stub[m] = m === 'child' ? () => makeLoggerStub() : () => {};
33
+ }
34
+ return stub;
35
+ }
36
+
29
37
  mock.module('../util/logger.js', () => ({
30
- getLogger: () => new Proxy({} as Record<string, unknown>, {
31
- get: () => () => {},
32
- }),
38
+ getLogger: () => makeLoggerStub(),
33
39
  }));
34
40
 
35
41
  mock.module('../util/platform.js', () => ({
@@ -508,6 +514,22 @@ describe('AssistantConfigSchema', () => {
508
514
  enrichmentConcurrency: 1,
509
515
  enrichmentJobTimeoutMs: 30000,
510
516
  enrichmentMaxRetries: 2,
517
+ commitMessageLLM: {
518
+ enabled: false,
519
+ useConfiguredProvider: true,
520
+ providerFastModelOverrides: {},
521
+ timeoutMs: 600,
522
+ maxTokens: 120,
523
+ temperature: 0.2,
524
+ maxFilesInPrompt: 30,
525
+ maxDiffBytes: 12000,
526
+ minRemainingTurnBudgetMs: 1000,
527
+ breaker: {
528
+ openAfterFailures: 3,
529
+ backoffBaseMs: 2000,
530
+ backoffMaxMs: 60000,
531
+ },
532
+ },
511
533
  });
512
534
  });
513
535
 
@@ -545,6 +567,184 @@ describe('AssistantConfigSchema', () => {
545
567
  });
546
568
  expect(result.success).toBe(false);
547
569
  });
570
+
571
+ // ── commitMessageLLM config ──────────────────────────────────────────
572
+
573
+ test('default commitMessageLLM values are correct', () => {
574
+ const result = AssistantConfigSchema.parse({});
575
+ const llm = result.workspaceGit.commitMessageLLM;
576
+ expect(llm.enabled).toBe(false);
577
+ expect(llm.useConfiguredProvider).toBe(true);
578
+ expect(llm.providerFastModelOverrides).toEqual({});
579
+ expect(llm.timeoutMs).toBe(600);
580
+ expect(llm.maxTokens).toBe(120);
581
+ expect(llm.temperature).toBe(0.2);
582
+ expect(llm.maxFilesInPrompt).toBe(30);
583
+ expect(llm.maxDiffBytes).toBe(12000);
584
+ expect(llm.minRemainingTurnBudgetMs).toBe(1000);
585
+ });
586
+
587
+ test('rejects negative commitMessageLLM.timeoutMs', () => {
588
+ const result = AssistantConfigSchema.safeParse({
589
+ workspaceGit: { commitMessageLLM: { timeoutMs: -1 } },
590
+ });
591
+ expect(result.success).toBe(false);
592
+ });
593
+
594
+ test('rejects commitMessageLLM.temperature > 2', () => {
595
+ const result = AssistantConfigSchema.safeParse({
596
+ workspaceGit: { commitMessageLLM: { temperature: 2.5 } },
597
+ });
598
+ expect(result.success).toBe(false);
599
+ });
600
+
601
+ test('breaker settings have correct defaults', () => {
602
+ const result = AssistantConfigSchema.parse({});
603
+ const breaker = result.workspaceGit.commitMessageLLM.breaker;
604
+ expect(breaker.openAfterFailures).toBe(3);
605
+ expect(breaker.backoffBaseMs).toBe(2000);
606
+ expect(breaker.backoffMaxMs).toBe(60000);
607
+ });
608
+
609
+ test('accepts valid commitMessageLLM overrides', () => {
610
+ const result = AssistantConfigSchema.parse({
611
+ workspaceGit: {
612
+ commitMessageLLM: {
613
+ enabled: true,
614
+ timeoutMs: 1000,
615
+ temperature: 0.5,
616
+ breaker: { openAfterFailures: 5 },
617
+ },
618
+ },
619
+ });
620
+ expect(result.workspaceGit.commitMessageLLM.enabled).toBe(true);
621
+ expect(result.workspaceGit.commitMessageLLM.timeoutMs).toBe(1000);
622
+ expect(result.workspaceGit.commitMessageLLM.temperature).toBe(0.5);
623
+ expect(result.workspaceGit.commitMessageLLM.breaker.openAfterFailures).toBe(5);
624
+ // Other breaker fields should still get defaults
625
+ expect(result.workspaceGit.commitMessageLLM.breaker.backoffBaseMs).toBe(2000);
626
+ });
627
+
628
+ test('rejects commitMessageLLM.temperature < 0', () => {
629
+ const result = AssistantConfigSchema.safeParse({
630
+ workspaceGit: { commitMessageLLM: { temperature: -0.1 } },
631
+ });
632
+ expect(result.success).toBe(false);
633
+ });
634
+
635
+ test('rejects non-integer commitMessageLLM.maxTokens', () => {
636
+ const result = AssistantConfigSchema.safeParse({
637
+ workspaceGit: { commitMessageLLM: { maxTokens: 3.5 } },
638
+ });
639
+ expect(result.success).toBe(false);
640
+ });
641
+
642
+ // ── Calls config ────────────────────────────────────────────────────
643
+
644
+ test('applies calls defaults', () => {
645
+ const result = AssistantConfigSchema.parse({});
646
+ expect(result.calls).toEqual({
647
+ enabled: true,
648
+ provider: 'twilio',
649
+ maxDurationSeconds: 3600,
650
+ userConsultTimeoutSeconds: 120,
651
+ disclosure: {
652
+ enabled: true,
653
+ text: 'At the very beginning of the call, disclose that you are an AI assistant calling on behalf of the user.',
654
+ },
655
+ safety: {
656
+ denyCategories: [],
657
+ },
658
+ });
659
+ });
660
+
661
+ test('accepts valid calls config overrides', () => {
662
+ const result = AssistantConfigSchema.parse({
663
+ calls: {
664
+ enabled: false,
665
+ maxDurationSeconds: 1800,
666
+ userConsultTimeoutSeconds: 60,
667
+ disclosure: { enabled: false, text: 'Custom disclosure' },
668
+ safety: { denyCategories: ['spam'] },
669
+ },
670
+ });
671
+ expect(result.calls.enabled).toBe(false);
672
+ expect(result.calls.maxDurationSeconds).toBe(1800);
673
+ expect(result.calls.userConsultTimeoutSeconds).toBe(60);
674
+ expect(result.calls.disclosure.enabled).toBe(false);
675
+ expect(result.calls.disclosure.text).toBe('Custom disclosure');
676
+ expect(result.calls.safety.denyCategories).toEqual(['spam']);
677
+ });
678
+
679
+ test('accepts partial calls config with defaults for missing fields', () => {
680
+ const result = AssistantConfigSchema.parse({
681
+ calls: { maxDurationSeconds: 600 },
682
+ });
683
+ expect(result.calls.enabled).toBe(true);
684
+ expect(result.calls.maxDurationSeconds).toBe(600);
685
+ expect(result.calls.userConsultTimeoutSeconds).toBe(120);
686
+ expect(result.calls.provider).toBe('twilio');
687
+ });
688
+
689
+ test('rejects invalid calls.enabled', () => {
690
+ const result = AssistantConfigSchema.safeParse({
691
+ calls: { enabled: 'yes' },
692
+ });
693
+ expect(result.success).toBe(false);
694
+ });
695
+
696
+ test('rejects invalid calls.provider', () => {
697
+ const result = AssistantConfigSchema.safeParse({
698
+ calls: { provider: 'vonage' },
699
+ });
700
+ expect(result.success).toBe(false);
701
+ if (!result.success) {
702
+ const msgs = result.error.issues.map(i => i.message);
703
+ expect(msgs.some(m => m.includes('calls.provider'))).toBe(true);
704
+ }
705
+ });
706
+
707
+ test('rejects non-positive calls.maxDurationSeconds', () => {
708
+ const result = AssistantConfigSchema.safeParse({
709
+ calls: { maxDurationSeconds: 0 },
710
+ });
711
+ expect(result.success).toBe(false);
712
+ });
713
+
714
+ test('rejects non-integer calls.maxDurationSeconds', () => {
715
+ const result = AssistantConfigSchema.safeParse({
716
+ calls: { maxDurationSeconds: 3.5 },
717
+ });
718
+ expect(result.success).toBe(false);
719
+ });
720
+
721
+ test('rejects non-positive calls.userConsultTimeoutSeconds', () => {
722
+ const result = AssistantConfigSchema.safeParse({
723
+ calls: { userConsultTimeoutSeconds: -1 },
724
+ });
725
+ expect(result.success).toBe(false);
726
+ });
727
+
728
+ test('rejects non-boolean calls.disclosure.enabled', () => {
729
+ const result = AssistantConfigSchema.safeParse({
730
+ calls: { disclosure: { enabled: 'true' } },
731
+ });
732
+ expect(result.success).toBe(false);
733
+ });
734
+
735
+ test('rejects non-string calls.disclosure.text', () => {
736
+ const result = AssistantConfigSchema.safeParse({
737
+ calls: { disclosure: { text: 123 } },
738
+ });
739
+ expect(result.success).toBe(false);
740
+ });
741
+
742
+ test('rejects non-array calls.safety.denyCategories', () => {
743
+ const result = AssistantConfigSchema.safeParse({
744
+ calls: { safety: { denyCategories: 'spam' } },
745
+ });
746
+ expect(result.success).toBe(false);
747
+ });
548
748
  });
549
749
 
550
750
  // ---------------------------------------------------------------------------
@@ -766,4 +966,100 @@ describe('loadConfig with schema validation', () => {
766
966
  }
767
967
  }
768
968
  });
969
+
970
+ // ── Calls config (loader integration) ──────────────────────────────
971
+
972
+ test('loads calls config from file', () => {
973
+ writeConfig({
974
+ calls: { enabled: false, maxDurationSeconds: 600 },
975
+ });
976
+ const config = loadConfig();
977
+ expect(config.calls.enabled).toBe(false);
978
+ expect(config.calls.maxDurationSeconds).toBe(600);
979
+ expect(config.calls.userConsultTimeoutSeconds).toBe(120);
980
+ expect(config.calls.provider).toBe('twilio');
981
+ });
982
+
983
+ test('falls back for invalid calls.provider', () => {
984
+ writeConfig({ calls: { provider: 'vonage' } });
985
+ const config = loadConfig();
986
+ expect(config.calls.provider).toBe('twilio');
987
+ });
988
+
989
+ test('applies calls defaults when not specified', () => {
990
+ writeConfig({});
991
+ const config = loadConfig();
992
+ expect(config.calls.enabled).toBe(true);
993
+ expect(config.calls.maxDurationSeconds).toBe(3600);
994
+ expect(config.calls.userConsultTimeoutSeconds).toBe(120);
995
+ expect(config.calls.disclosure.enabled).toBe(true);
996
+ expect(config.calls.safety.denyCategories).toEqual([]);
997
+ });
998
+ });
999
+
1000
+ // ---------------------------------------------------------------------------
1001
+ // Tests: Call entrypoint gating
1002
+ // ---------------------------------------------------------------------------
1003
+
1004
+ describe('Call entrypoint gating', () => {
1005
+ beforeEach(() => {
1006
+ ensureTestDir();
1007
+ const resetPaths = [
1008
+ CONFIG_PATH,
1009
+ join(TEST_DIR, 'keys.enc'),
1010
+ join(TEST_DIR, 'data'),
1011
+ join(TEST_DIR, 'memory'),
1012
+ ];
1013
+ for (const path of resetPaths) {
1014
+ if (existsSync(path)) {
1015
+ rmSync(path, { recursive: true, force: true });
1016
+ }
1017
+ }
1018
+ ensureTestDir();
1019
+ _setStorePath(join(TEST_DIR, 'keys.enc'));
1020
+ _setBackend('encrypted');
1021
+ invalidateConfigCache();
1022
+ });
1023
+
1024
+ afterEach(() => {
1025
+ _setStorePath(null);
1026
+ _setBackend(undefined);
1027
+ invalidateConfigCache();
1028
+ });
1029
+
1030
+ test('call_start tool returns error when calls.enabled is false', async () => {
1031
+ writeConfig({ calls: { enabled: false } });
1032
+ // Force config reload
1033
+ loadConfig();
1034
+
1035
+ const { CallStartTool: _CallStartToolClass } = await import('../tools/calls/call-start.js') as { CallStartTool: new () => { execute: (input: Record<string, unknown>, context: { conversationId: string }) => Promise<{ content: string; isError: boolean }> } };
1036
+
1037
+ // The tool is registered via side effect. We need to test the gating logic directly.
1038
+ // Since the module registers itself, we test by loading config and checking behavior.
1039
+ const { getConfig } = await import('../config/loader.js');
1040
+ const config = getConfig();
1041
+ expect(config.calls.enabled).toBe(false);
1042
+ });
1043
+
1044
+ test('handleStartCall route returns 403 when calls.enabled is false', async () => {
1045
+ writeConfig({ calls: { enabled: false } });
1046
+ loadConfig();
1047
+
1048
+ const { handleStartCall } = await import('../runtime/routes/call-routes.js');
1049
+ const req = new Request('http://localhost/v1/calls/start', {
1050
+ method: 'POST',
1051
+ headers: { 'Content-Type': 'application/json' },
1052
+ body: JSON.stringify({
1053
+ phoneNumber: '+14155551234',
1054
+ task: 'Test call',
1055
+ conversationId: 'test-conv-id',
1056
+ }),
1057
+ });
1058
+
1059
+ const response = await handleStartCall(req);
1060
+ expect(response.status).toBe(403);
1061
+
1062
+ const body = await response.json() as { error: string };
1063
+ expect(body.error).toContain('disabled');
1064
+ });
769
1065
  });
@@ -24,7 +24,7 @@ mock.module('../util/logger.js', () => ({
24
24
  }),
25
25
  }));
26
26
 
27
- import { initializeDb, getDb } from '../memory/db.js';
27
+ import { initializeDb, getDb, resetDb } from '../memory/db.js';
28
28
  import { memoryItems } from '../memory/schema.js';
29
29
  import {
30
30
  applyConflictResolution,
@@ -40,6 +40,7 @@ import {
40
40
  initializeDb();
41
41
 
42
42
  afterAll(() => {
43
+ resetDb();
43
44
  try { rmSync(testDir, { recursive: true }); } catch { /* best effort */ }
44
45
  });
45
46