@vellumai/assistant 0.8.1 → 0.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (506)
  1. package/ARCHITECTURE.md +2 -7
  2. package/Dockerfile +75 -1
  3. package/bun.lock +11 -1
  4. package/docker-entrypoint.sh +5 -0
  5. package/docker-init-apt-root.sh +94 -0
  6. package/docker-kata-apt-env.sh +39 -0
  7. package/docs/plugins.md +88 -47
  8. package/docs/skills.md +9 -7
  9. package/examples/plugins/echo/README.md +27 -27
  10. package/examples/plugins/echo/package.json +3 -0
  11. package/examples/plugins/echo/register.ts +31 -31
  12. package/node_modules/@vellumai/slack-text/src/index.test.ts +114 -14
  13. package/node_modules/@vellumai/slack-text/src/index.ts +82 -18
  14. package/openapi.yaml +325 -3
  15. package/package.json +3 -1
  16. package/scripts/generate-openapi.ts +83 -10
  17. package/scripts/sync-llm-catalog.ts +2 -2
  18. package/scripts/sync-web-search-catalog.ts +47 -25
  19. package/src/__tests__/agent-image-optimize.test.ts +11 -3
  20. package/src/__tests__/agent-wake-disk-pressure-callsite.test.ts +131 -0
  21. package/src/__tests__/anthropic-provider.test.ts +45 -0
  22. package/src/__tests__/app-builder-tool-scripts.test.ts +9 -3
  23. package/src/__tests__/app-executors.test.ts +220 -4
  24. package/src/__tests__/auto-analysis-end-to-end.test.ts +35 -0
  25. package/src/__tests__/bundled-asset.test.ts +6 -6
  26. package/src/__tests__/channel-availability-routes.test.ts +206 -0
  27. package/src/__tests__/channel-delivery-store.test.ts +289 -1
  28. package/src/__tests__/circuit-breaker-pipeline.test.ts +0 -1
  29. package/src/__tests__/clawhub.test.ts +75 -16
  30. package/src/__tests__/compactor-tail-resolution.test.ts +41 -0
  31. package/src/__tests__/config-schema.test.ts +21 -0
  32. package/src/__tests__/config-set-route.test.ts +80 -0
  33. package/src/__tests__/config-sounds-sync.test.ts +97 -0
  34. package/src/__tests__/config-watcher-skill-reseed.test.ts +453 -0
  35. package/src/__tests__/context-search-conversations-source.test.ts +117 -2
  36. package/src/__tests__/context-search-memory-v2-source.test.ts +0 -1
  37. package/src/__tests__/context-search-workspace-source.test.ts +7 -0
  38. package/src/__tests__/context-token-estimator.test.ts +1 -0
  39. package/src/__tests__/conversation-abort-tool-results.test.ts +4 -1
  40. package/src/__tests__/conversation-agent-loop-inference-profile.test.ts +1 -0
  41. package/src/__tests__/conversation-agent-loop-overflow.test.ts +92 -92
  42. package/src/__tests__/conversation-agent-loop.test.ts +2 -0
  43. package/src/__tests__/conversation-error.test.ts +42 -3
  44. package/src/__tests__/conversation-fork-crud.test.ts +82 -0
  45. package/src/__tests__/conversation-inference-profile-route.test.ts +40 -4
  46. package/src/__tests__/conversation-lifecycle.test.ts +173 -0
  47. package/src/__tests__/conversation-message-sync-tags.test.ts +97 -0
  48. package/src/__tests__/conversation-pairing.test.ts +54 -0
  49. package/src/__tests__/conversation-process-callsite.test.ts +4 -1
  50. package/src/__tests__/conversation-provider-retry-repair.test.ts +5 -1
  51. package/src/__tests__/conversation-queue.test.ts +4 -1
  52. package/src/__tests__/conversation-runtime-assembly.test.ts +76 -9
  53. package/src/__tests__/conversation-slash-queue.test.ts +59 -1
  54. package/src/__tests__/conversation-slash-unknown.test.ts +4 -1
  55. package/src/__tests__/conversation-surfaces-table-action.test.ts +360 -0
  56. package/src/__tests__/conversation-sync-tags.test.ts +235 -0
  57. package/src/__tests__/conversation-workspace-injection.test.ts +5 -1
  58. package/src/__tests__/conversation-workspace-tool-tracking.test.ts +5 -1
  59. package/src/__tests__/credential-security-invariants.test.ts +3 -2
  60. package/src/__tests__/db-slack-external-content-normalization.test.ts +301 -0
  61. package/src/__tests__/delete-managed-skill-tool.test.ts +55 -13
  62. package/src/__tests__/disk-pressure-tools.test.ts +1 -0
  63. package/src/__tests__/dm-backfill.test.ts +121 -10
  64. package/src/__tests__/document-tool-security.test.ts +258 -0
  65. package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +0 -1
  66. package/src/__tests__/edit-propagation.test.ts +33 -0
  67. package/src/__tests__/empty-response-pipeline.test.ts +0 -4
  68. package/src/__tests__/external-plugin-loader.test.ts +60 -36
  69. package/src/__tests__/filing-service.test.ts +140 -0
  70. package/src/__tests__/get-skill-detail-audit.test.ts +0 -4
  71. package/src/__tests__/handlers-skills-memory-v2-reseed.test.ts +43 -62
  72. package/src/__tests__/helpers/tar-fixtures.ts +39 -0
  73. package/src/__tests__/helpers/wait-for.ts +21 -0
  74. package/src/__tests__/history-repair-pipeline.test.ts +0 -3
  75. package/src/__tests__/history-repair.test.ts +73 -0
  76. package/src/__tests__/host-app-control-proxy.test.ts +266 -10
  77. package/src/__tests__/image-credentials.test.ts +1 -1
  78. package/src/__tests__/inbound-slack-persistence.test.ts +2 -0
  79. package/src/__tests__/inference-no-mode-boot-e2e.test.ts +1 -1
  80. package/src/__tests__/inference-profile-reaper.test.ts +4 -2
  81. package/src/__tests__/inference-profile-session-handler.test.ts +18 -6
  82. package/src/__tests__/inference-profile-session-ipc.test.ts +17 -5
  83. package/src/__tests__/injector-chain.test.ts +10 -8
  84. package/src/__tests__/install-skill-routing.test.ts +155 -37
  85. package/src/__tests__/lifecycle-memory-v2-seed.test.ts +92 -3
  86. package/src/__tests__/list-messages-page-latest.test.ts +55 -0
  87. package/src/__tests__/llm-call-pipeline.test.ts +0 -3
  88. package/src/__tests__/llm-catalog-parity.test.ts +55 -13
  89. package/src/__tests__/llm-request-log-source-clickhouse.test.ts +34 -0
  90. package/src/__tests__/llm-request-log-source-factory.test.ts +29 -53
  91. package/src/__tests__/llm-usage-store.test.ts +114 -0
  92. package/src/__tests__/managed-profile-guard.test.ts +31 -29
  93. package/src/__tests__/managed-skill-lifecycle.test.ts +109 -18
  94. package/src/__tests__/managed-store.test.ts +84 -192
  95. package/src/__tests__/media-generate-image.test.ts +1 -1
  96. package/src/__tests__/memory-retrieval-pipeline.test.ts +0 -2
  97. package/src/__tests__/messages-after-tiebreaker.test.ts +122 -0
  98. package/src/__tests__/oauth-commands-routes.test.ts +168 -16
  99. package/src/__tests__/oauth-provider-profiles.test.ts +9 -0
  100. package/src/__tests__/openai-provider.test.ts +24 -0
  101. package/src/__tests__/openai-responses-cutover-guard.test.ts +17 -9
  102. package/src/__tests__/overflow-reduce-pipeline.test.ts +0 -2
  103. package/src/__tests__/persistence-pipeline.test.ts +0 -2
  104. package/src/__tests__/{managed-proxy-context.test.ts → platform-proxy-context.test.ts} +1 -1
  105. package/src/__tests__/platform.test.ts +2 -0
  106. package/src/__tests__/plugin-api-shim.test.ts +125 -0
  107. package/src/__tests__/plugin-bootstrap.test.ts +10 -36
  108. package/src/__tests__/plugin-external-api.test.ts +68 -0
  109. package/src/__tests__/plugin-registry.test.ts +0 -77
  110. package/src/__tests__/plugin-route-contribution.test.ts +0 -1
  111. package/src/__tests__/plugin-skill-contribution.test.ts +0 -2
  112. package/src/__tests__/plugin-tool-contribution.test.ts +16 -15
  113. package/src/__tests__/plugin-types.test.ts +3 -13
  114. package/src/__tests__/process-message-background-slack.test.ts +8 -1
  115. package/src/__tests__/process-message-display-content.test.ts +421 -0
  116. package/src/__tests__/provider-catalog-visibility.test.ts +142 -0
  117. package/src/__tests__/provider-error-scenarios.test.ts +111 -0
  118. package/src/__tests__/{provider-managed-proxy-integration.test.ts → provider-platform-proxy-integration.test.ts} +8 -8
  119. package/src/__tests__/scaffold-managed-skill-tool.test.ts +65 -13
  120. package/src/__tests__/schedule-routes.test.ts +50 -3
  121. package/src/__tests__/schedule-store.test.ts +94 -0
  122. package/src/__tests__/scheduler-reuse-conversation.test.ts +54 -7
  123. package/src/__tests__/schema-transforms.test.ts +20 -0
  124. package/src/__tests__/search-skills-unified.test.ts +0 -5
  125. package/src/__tests__/server-history-render.test.ts +43 -0
  126. package/src/__tests__/skill-load-feature-flag.test.ts +0 -12
  127. package/src/__tests__/skill-load-tool.test.ts +27 -89
  128. package/src/__tests__/skill-memory.test.ts +23 -3
  129. package/src/__tests__/skills-file-content-endpoint.test.ts +9 -38
  130. package/src/__tests__/skills-files-catalog-fallback.test.ts +0 -3
  131. package/src/__tests__/skills-install-extract.test.ts +49 -38
  132. package/src/__tests__/skills-install-staging.test.ts +159 -0
  133. package/src/__tests__/skills-uninstall.test.ts +9 -41
  134. package/src/__tests__/skills.test.ts +51 -58
  135. package/src/__tests__/slack-channel-config.test.ts +9 -0
  136. package/src/__tests__/subagent-tool-filtering.test.ts +50 -0
  137. package/src/__tests__/system-prompt.test.ts +737 -63
  138. package/src/__tests__/terminal-tools.test.ts +28 -1
  139. package/src/__tests__/thread-backfill.test.ts +557 -27
  140. package/src/__tests__/title-generate-pipeline.test.ts +0 -13
  141. package/src/__tests__/token-estimate-pipeline.test.ts +0 -3
  142. package/src/__tests__/tool-error-pipeline.test.ts +0 -3
  143. package/src/__tests__/tool-execute-pipeline.test.ts +0 -5
  144. package/src/__tests__/tool-executor-lifecycle-events.test.ts +1 -1
  145. package/src/__tests__/tool-executor.test.ts +16 -4
  146. package/src/__tests__/tool-result-truncate-pipeline.test.ts +0 -12
  147. package/src/__tests__/turn-events-store.test.ts +256 -0
  148. package/src/__tests__/twilio-routes.test.ts +4 -0
  149. package/src/__tests__/user-plugin-loader.test.ts +0 -7
  150. package/src/__tests__/voice-session-bridge.test.ts +198 -0
  151. package/src/__tests__/web-search-catalog-parity.test.ts +32 -10
  152. package/src/__tests__/workspace-migration-057-repair-stale-gemini-model-ids.test.ts +115 -3
  153. package/src/__tests__/workspace-migration-072-seed-reply-suggestion-callsite.test.ts +50 -0
  154. package/src/__tests__/workspace-migration-073-repair-recall-callsite-empty-profile.test.ts +153 -0
  155. package/src/__tests__/workspace-migration-085-memory-v2-bm25-b-reembed-disabled-v2-pages.test.ts +220 -0
  156. package/src/__tests__/workspace-migration-086-revert-stale-gemini-mis-rewrites.test.ts +269 -0
  157. package/src/__tests__/workspace-migration-remove-legacy-skills-index.test.ts +309 -0
  158. package/src/__tests__/workspace-migrations-runner.test.ts +111 -3
  159. package/src/acp/resolve-agent.ts +1 -1
  160. package/src/agent/image-optimize.ts +13 -5
  161. package/src/calls/voice-session-bridge.ts +61 -42
  162. package/src/channels/types.ts +108 -0
  163. package/src/cli/__tests__/unknown-command.test.ts +24 -0
  164. package/src/cli/commands/__tests__/changelog.test.ts +304 -319
  165. package/src/cli/commands/__tests__/schedules.test.ts +491 -0
  166. package/src/cli/commands/changelog.ts +106 -42
  167. package/src/cli/commands/conversations.ts +102 -17
  168. package/src/cli/commands/default-action.ts +10 -53
  169. package/src/cli/commands/notifications.ts +329 -317
  170. package/src/cli/commands/plugins.ts +185 -0
  171. package/src/cli/commands/schedules.ts +391 -0
  172. package/src/cli/commands/telemetry.ts +40 -0
  173. package/src/cli/lib/__tests__/cli-colors.test.ts +48 -0
  174. package/src/cli/lib/__tests__/confirm-prompt.test.ts +159 -0
  175. package/src/cli/lib/__tests__/install-from-github.test.ts +355 -0
  176. package/src/cli/lib/__tests__/list-installed-plugins.test.ts +154 -0
  177. package/src/cli/lib/__tests__/uninstall-plugin.test.ts +124 -0
  178. package/src/cli/lib/__tests__/unknown-command.test.ts +106 -0
  179. package/src/cli/lib/cli-colors.ts +12 -0
  180. package/src/cli/lib/confirm-prompt.ts +79 -0
  181. package/src/cli/lib/install-from-github.ts +304 -0
  182. package/src/cli/lib/list-installed-plugins.ts +137 -0
  183. package/src/cli/lib/uninstall-plugin.ts +82 -0
  184. package/src/cli/lib/unknown-command.ts +111 -0
  185. package/src/cli/program.ts +38 -2
  186. package/src/config/bundled-skills/app-builder/SKILL.md +23 -21
  187. package/src/config/bundled-skills/app-builder/TOOLS.json +7 -0
  188. package/src/config/bundled-skills/computer-use/TOOLS.json +15 -52
  189. package/src/config/bundled-skills/document/SKILL.md +23 -3
  190. package/src/config/bundled-skills/document/TOOLS.json +53 -0
  191. package/src/config/bundled-skills/document/tools/document-delete.ts +12 -0
  192. package/src/config/bundled-skills/document/tools/document-list.ts +12 -0
  193. package/src/config/bundled-skills/document/tools/document-read.ts +12 -0
  194. package/src/config/bundled-skills/skill-management/SKILL.md +2 -2
  195. package/src/config/bundled-skills/skill-management/TOOLS.json +7 -7
  196. package/src/config/bundled-tool-registry.ts +6 -0
  197. package/src/config/feature-flag-registry.json +41 -1
  198. package/src/config/loader.ts +64 -38
  199. package/src/config/schema.ts +7 -10
  200. package/src/config/schemas/__tests__/llm-request-logs.test.ts +36 -0
  201. package/src/config/schemas/channels.ts +8 -0
  202. package/src/config/schemas/compaction.ts +28 -0
  203. package/src/config/schemas/heartbeat.ts +9 -0
  204. package/src/config/schemas/llm-request-logs.ts +31 -7
  205. package/src/config/schemas/llm.ts +3 -0
  206. package/src/config/schemas/memory-retrieval.ts +18 -0
  207. package/src/config/schemas/tools.ts +14 -0
  208. package/src/config/skills.ts +3 -96
  209. package/src/context/compactor.ts +1047 -0
  210. package/src/context/token-estimator.ts +2 -2
  211. package/src/context/window-manager.ts +197 -1520
  212. package/src/credential-execution/managed-catalog.ts +37 -0
  213. package/src/credential-health/credential-health-service.ts +280 -19
  214. package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +34 -0
  215. package/src/daemon/__tests__/conversation-tool-setup-exclude.test.ts +138 -0
  216. package/src/daemon/__tests__/conversation-tool-setup.test.ts +74 -0
  217. package/src/daemon/approval-generators.ts +8 -6
  218. package/src/daemon/config-watcher.ts +94 -31
  219. package/src/daemon/conversation-agent-loop.ts +169 -9
  220. package/src/daemon/conversation-error.ts +171 -37
  221. package/src/daemon/conversation-lifecycle.ts +53 -40
  222. package/src/daemon/conversation-messaging.ts +25 -6
  223. package/src/daemon/conversation-process.ts +49 -12
  224. package/src/daemon/conversation-runtime-assembly.ts +16 -1
  225. package/src/daemon/conversation-slash.ts +12 -5
  226. package/src/daemon/conversation-store.ts +11 -4
  227. package/src/daemon/conversation-tool-setup.ts +39 -7
  228. package/src/daemon/conversation.ts +33 -1
  229. package/src/daemon/external-plugins-bootstrap.ts +217 -181
  230. package/src/daemon/first-greeting.ts +22 -2
  231. package/src/daemon/handlers/config-model.ts +6 -5
  232. package/src/daemon/handlers/config-slack-channel.ts +15 -3
  233. package/src/daemon/handlers/shared.ts +14 -5
  234. package/src/daemon/handlers/skills.ts +111 -108
  235. package/src/daemon/history-repair.ts +28 -1
  236. package/src/daemon/host-app-control-proxy.ts +98 -23
  237. package/src/daemon/lifecycle.ts +45 -35
  238. package/src/daemon/meet-host-supervisor.ts +5 -4
  239. package/src/daemon/memory-v2-startup.ts +49 -0
  240. package/src/daemon/message-protocol.ts +1 -0
  241. package/src/daemon/message-types/conversations.ts +25 -0
  242. package/src/daemon/message-types/messages.ts +61 -0
  243. package/src/daemon/message-types/subagents.ts +1 -0
  244. package/src/daemon/message-types/sync.ts +1 -0
  245. package/src/daemon/pkb-reminder-builder.test.ts +1 -1
  246. package/src/daemon/pkb-reminder-builder.ts +1 -1
  247. package/src/daemon/plugin-source-watcher.ts +146 -0
  248. package/src/daemon/process-message.ts +21 -3
  249. package/src/daemon/server.ts +11 -2
  250. package/src/daemon/skill-memory-refresh.ts +29 -0
  251. package/src/documents/document-store.ts +221 -3
  252. package/src/embedded/plugin-api.ts +40 -0
  253. package/src/filing/filing-service.ts +39 -0
  254. package/src/heartbeat/__tests__/heartbeat-service.test.ts +91 -6
  255. package/src/heartbeat/heartbeat-run-store.ts +2 -1
  256. package/src/heartbeat/heartbeat-service.ts +41 -0
  257. package/src/home/__tests__/feed-types.test.ts +40 -0
  258. package/src/home/feed-types.ts +22 -0
  259. package/src/home/post-connect-feed.ts +1 -0
  260. package/src/index.ts +18 -1
  261. package/src/live-voice/__tests__/live-voice-stt.test.ts +57 -0
  262. package/src/mcp/client.ts +20 -4
  263. package/src/media/image-credentials.ts +3 -3
  264. package/src/memory/__tests__/bookmark-crud.test.ts +33 -27
  265. package/src/memory/__tests__/conversation-queries.test.ts +263 -0
  266. package/src/memory/__tests__/jobs-worker-v2-graph-trigger-embed.test.ts +113 -0
  267. package/src/memory/__tests__/memory-retrospective-startup-cleanup.test.ts +119 -14
  268. package/src/memory/__tests__/message-content.test.ts +35 -0
  269. package/src/memory/bookmark-crud.ts +42 -10
  270. package/src/memory/context-search/sources/conversations.ts +62 -2
  271. package/src/memory/context-search/sources/workspace.ts +4 -0
  272. package/src/memory/conversation-crud.ts +63 -19
  273. package/src/memory/conversation-queries.ts +110 -10
  274. package/src/memory/db-init.ts +6 -0
  275. package/src/memory/delivery-crud.ts +152 -5
  276. package/src/memory/embedding-backend.ts +4 -4
  277. package/src/memory/external-conversation-store.ts +66 -5
  278. package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +66 -9
  279. package/src/memory/graph/conversation-graph-memory.ts +31 -15
  280. package/src/memory/graph/tools.ts +3 -3
  281. package/src/memory/indexer.ts +34 -29
  282. package/src/memory/jobs/__tests__/embed-concept-page.test.ts +73 -0
  283. package/src/memory/jobs/embed-concept-page.ts +20 -11
  284. package/src/memory/jobs-worker.ts +6 -1
  285. package/src/memory/llm-request-log-source-clickhouse.ts +17 -10
  286. package/src/memory/llm-request-log-source.ts +19 -52
  287. package/src/memory/llm-usage-store.ts +125 -5
  288. package/src/memory/memory-retrospective-startup-cleanup.ts +72 -5
  289. package/src/memory/message-content.ts +1 -1
  290. package/src/memory/migrations/109-external-conversation-bindings.ts +15 -4
  291. package/src/memory/migrations/229-delete-private-conversations.test.ts +38 -1
  292. package/src/memory/migrations/229-delete-private-conversations.ts +7 -0
  293. package/src/memory/migrations/247-external-conversation-binding-thread-id.ts +78 -0
  294. package/src/memory/migrations/248-create-onboarding-events.ts +21 -0
  295. package/src/memory/migrations/249-normalize-slack-external-content.ts +240 -0
  296. package/src/memory/migrations/index.ts +6 -0
  297. package/src/memory/migrations/registry.ts +8 -0
  298. package/src/memory/onboarding-events-store.ts +106 -0
  299. package/src/memory/schema/bookmarks.ts +0 -2
  300. package/src/memory/schema/calls.ts +1 -0
  301. package/src/memory/schema/inference.ts +1 -3
  302. package/src/memory/schema/infrastructure.ts +12 -0
  303. package/src/memory/turn-events-store.ts +127 -2
  304. package/src/memory/v2/__tests__/activation.test.ts +0 -8
  305. package/src/memory/v2/__tests__/injection.test.ts +98 -8
  306. package/src/memory/v2/__tests__/migration.test.ts +87 -0
  307. package/src/memory/v2/__tests__/page-index.test.ts +83 -0
  308. package/src/memory/v2/__tests__/prompts-router.test.ts +58 -6
  309. package/src/memory/v2/__tests__/qdrant.test.ts +66 -3
  310. package/src/memory/v2/__tests__/router.test.ts +15 -0
  311. package/src/memory/v2/__tests__/skill-store.test.ts +387 -8
  312. package/src/memory/v2/injection.ts +32 -6
  313. package/src/memory/v2/migration.ts +49 -19
  314. package/src/memory/v2/page-index.ts +35 -5
  315. package/src/memory/v2/prompts/router.ts +11 -8
  316. package/src/memory/v2/prompts/sweep.ts +2 -2
  317. package/src/memory/v2/qdrant.ts +135 -7
  318. package/src/memory/v2/router.ts +9 -8
  319. package/src/memory/v2/skill-store.ts +120 -35
  320. package/src/messaging/providers/slack/__tests__/adapter-token-routing.test.ts +45 -5
  321. package/src/messaging/providers/slack/__tests__/download.test.ts +231 -0
  322. package/src/messaging/providers/slack/adapter.ts +43 -5
  323. package/src/messaging/providers/slack/client.ts +27 -0
  324. package/src/messaging/providers/slack/deep-link.ts +65 -0
  325. package/src/messaging/providers/slack/download.ts +104 -0
  326. package/src/messaging/providers/slack/message-metadata.test.ts +32 -0
  327. package/src/messaging/providers/slack/message-metadata.ts +27 -0
  328. package/src/messaging/providers/slack/render-transcript.test.ts +134 -0
  329. package/src/messaging/providers/slack/render-transcript.ts +69 -5
  330. package/src/messaging/providers/slack/types.ts +20 -1
  331. package/src/notifications/conversation-pairing.ts +2 -1
  332. package/src/notifications/decision-engine.ts +2 -1
  333. package/src/notifications/emit-signal.ts +20 -1
  334. package/src/notifications/home-feed-side-effect.ts +54 -0
  335. package/src/notifications/signal.ts +3 -1
  336. package/src/oauth/connection-resolver.ts +8 -4
  337. package/src/oauth/platform-connection.ts +6 -2
  338. package/src/oauth/seed-providers.ts +10 -1
  339. package/src/permissions/checker.ts +2 -0
  340. package/src/permissions/ipc-risk-types.ts +1 -0
  341. package/src/permissions/question-prompter.test.ts +416 -0
  342. package/src/permissions/question-prompter.ts +294 -0
  343. package/src/platform/client.test.ts +1 -1
  344. package/src/platform/client.ts +1 -1
  345. package/src/plugin-api/constants.ts +26 -0
  346. package/src/plugin-api/index.ts +34 -1
  347. package/src/plugin-api/types.ts +104 -22
  348. package/src/plugins/defaults/circuit-breaker.ts +0 -5
  349. package/src/plugins/defaults/compaction.ts +0 -4
  350. package/src/plugins/defaults/empty-response.ts +0 -2
  351. package/src/plugins/defaults/history-repair.ts +0 -2
  352. package/src/plugins/defaults/injectors.ts +36 -3
  353. package/src/plugins/defaults/llm-call.ts +0 -2
  354. package/src/plugins/defaults/memory-retrieval.ts +0 -1
  355. package/src/plugins/defaults/overflow-reduce.ts +0 -1
  356. package/src/plugins/defaults/persistence.ts +0 -2
  357. package/src/plugins/defaults/title-generate.ts +0 -5
  358. package/src/plugins/defaults/token-estimate.ts +0 -2
  359. package/src/plugins/defaults/tool-error.ts +0 -7
  360. package/src/plugins/defaults/tool-execute.ts +0 -2
  361. package/src/plugins/defaults/tool-result-truncate.ts +0 -4
  362. package/src/plugins/ensure-plugin-api-shim.ts +96 -0
  363. package/src/plugins/external-api.ts +104 -0
  364. package/src/plugins/external-plugin-loader.ts +105 -32
  365. package/src/plugins/feature-gate.ts +22 -0
  366. package/src/plugins/pipeline.ts +37 -0
  367. package/src/plugins/registry.ts +48 -80
  368. package/src/plugins/types.ts +31 -26
  369. package/src/plugins/user-loader.ts +21 -2
  370. package/src/proactive-artifact/aux-message-injector.ts +11 -0
  371. package/src/proactive-artifact/job.test.ts +37 -5
  372. package/src/prompts/__tests__/system-prompt.test.ts +12 -0
  373. package/src/prompts/__tests__/task-progress-hint-section.test.ts +99 -0
  374. package/src/prompts/normalize-onboarding.ts +27 -0
  375. package/src/prompts/sections.ts +302 -0
  376. package/src/prompts/system-prompt.ts +63 -166
  377. package/src/prompts/templates/BOOTSTRAP.md +17 -1
  378. package/src/prompts/templates/system-sections.ts +173 -0
  379. package/src/providers/__tests__/inference.test.ts +22 -7
  380. package/src/providers/anthropic/client.ts +28 -28
  381. package/src/providers/connection-resolution.ts +7 -0
  382. package/src/providers/inference/adapter-factory.ts +41 -4
  383. package/src/providers/inference/connections.ts +74 -29
  384. package/src/providers/inference/resolve-auth.ts +12 -4
  385. package/src/providers/model-catalog.ts +294 -12
  386. package/src/providers/openai/chat-completions-provider.ts +10 -2
  387. package/src/providers/openrouter/client.ts +7 -0
  388. package/src/providers/{managed-proxy → platform-proxy}/constants.ts +4 -1
  389. package/src/providers/{managed-proxy → platform-proxy}/context.ts +3 -3
  390. package/src/providers/provider-availability.ts +17 -2
  391. package/src/providers/provider-catalog-visibility.ts +36 -0
  392. package/src/providers/registry.ts +22 -14
  393. package/src/providers/retry.ts +47 -1
  394. package/src/runtime/__tests__/agent-wake.test.ts +152 -0
  395. package/src/runtime/agent-wake.ts +42 -14
  396. package/src/runtime/auth/route-policy.ts +8 -1
  397. package/src/runtime/btw-sidechain.ts +2 -0
  398. package/src/runtime/http-types.ts +19 -0
  399. package/src/runtime/migrations/origin-mode.ts +1 -1
  400. package/src/runtime/pending-interactions.ts +1 -0
  401. package/src/runtime/routes/__tests__/bookmark-routes.test.ts +17 -0
  402. package/src/runtime/routes/__tests__/conversation-management-routes.test.ts +5 -1
  403. package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +107 -20
  404. package/src/runtime/routes/__tests__/question-routes.test.ts +395 -0
  405. package/src/runtime/routes/__tests__/tts-routes.test.ts +64 -1
  406. package/src/runtime/routes/acp-routes-list.test.ts +143 -0
  407. package/src/runtime/routes/acp-routes.ts +5 -3
  408. package/src/runtime/routes/auth-routes.ts +1 -1
  409. package/src/runtime/routes/bookmark-routes.ts +5 -3
  410. package/src/runtime/routes/btw-routes.ts +5 -1
  411. package/src/runtime/routes/channel-availability-routes.ts +121 -0
  412. package/src/runtime/routes/conversation-cli-routes.ts +44 -3
  413. package/src/runtime/routes/conversation-list-routes.ts +3 -20
  414. package/src/runtime/routes/conversation-management-routes.ts +17 -42
  415. package/src/runtime/routes/conversation-query-routes.ts +40 -35
  416. package/src/runtime/routes/conversation-routes.ts +90 -11
  417. package/src/runtime/routes/documents-routes.ts +25 -86
  418. package/src/runtime/routes/group-routes.ts +5 -0
  419. package/src/runtime/routes/inbound-conversation.ts +28 -8
  420. package/src/runtime/routes/inbound-message-handler.ts +236 -41
  421. package/src/runtime/routes/inbound-stages/background-dispatch.test.ts +111 -0
  422. package/src/runtime/routes/inbound-stages/background-dispatch.ts +32 -1
  423. package/src/runtime/routes/inbound-stages/edit-intercept.ts +17 -4
  424. package/src/runtime/routes/index.ts +6 -0
  425. package/src/runtime/routes/inference-profile-session-handler.ts +17 -44
  426. package/src/runtime/routes/inference-profile-session-reaper.ts +7 -21
  427. package/src/runtime/routes/inference-provider-connection-routes.ts +65 -21
  428. package/src/runtime/routes/integrations/slack/share.ts +4 -52
  429. package/src/runtime/routes/integrations/slack/token.ts +43 -0
  430. package/src/runtime/routes/integrations/twilio.ts +6 -13
  431. package/src/runtime/routes/notification-routes.ts +1 -1
  432. package/src/runtime/routes/oauth-commands-routes.ts +105 -15
  433. package/src/runtime/routes/oauth-lifecycle-routes.ts +43 -0
  434. package/src/runtime/routes/question-routes.ts +259 -0
  435. package/src/runtime/routes/rename-conversation-routes.ts +2 -33
  436. package/src/runtime/routes/schedule-routes.ts +4 -7
  437. package/src/runtime/routes/subagents-routes.ts +57 -18
  438. package/src/runtime/routes/telemetry-routes.ts +27 -0
  439. package/src/runtime/routes/tts-routes.ts +27 -2
  440. package/src/runtime/routes/workspace-routes.test.ts +43 -0
  441. package/src/runtime/routes/workspace-routes.ts +28 -0
  442. package/src/runtime/services/conversation-serializer.ts +39 -7
  443. package/src/runtime/sync/resource-sync-events.ts +93 -1
  444. package/src/schedule/schedule-store.ts +27 -2
  445. package/src/schedule/scheduler.ts +9 -1
  446. package/src/security/__tests__/untrusted-content.test.ts +86 -0
  447. package/src/security/untrusted-content.ts +93 -8
  448. package/src/skills/catalog-files.ts +1 -1
  449. package/src/skills/catalog-install.ts +233 -116
  450. package/src/skills/clawhub.ts +70 -13
  451. package/src/skills/managed-store.ts +4 -119
  452. package/src/skills/skillssh-registry.ts +27 -48
  453. package/src/subagent/manager.ts +15 -7
  454. package/src/telemetry/types.ts +113 -1
  455. package/src/telemetry/usage-telemetry-reporter.test.ts +312 -5
  456. package/src/telemetry/usage-telemetry-reporter.ts +113 -7
  457. package/src/tools/apps/executors.ts +58 -7
  458. package/src/tools/ask-question/ask-question-tool.test.ts +509 -0
  459. package/src/tools/ask-question/ask-question-tool.ts +304 -0
  460. package/src/tools/browser/browser-execution.ts +15 -11
  461. package/src/tools/computer-use/definitions.ts +3 -3
  462. package/src/tools/credentials/vault.ts +1 -1
  463. package/src/tools/document/document-tool.ts +124 -1
  464. package/src/tools/filesystem/edit.ts +1 -1
  465. package/src/tools/filesystem/list.ts +1 -1
  466. package/src/tools/filesystem/read.ts +1 -1
  467. package/src/tools/filesystem/write.ts +5 -2
  468. package/src/tools/host-filesystem/transfer.ts +1 -1
  469. package/src/tools/host-terminal/host-shell.ts +1 -1
  470. package/src/tools/permission-checker.ts +1 -1
  471. package/src/tools/registry.ts +17 -7
  472. package/src/tools/schedule/create.ts +2 -2
  473. package/src/tools/schema-transforms.ts +7 -2
  474. package/src/tools/side-effects.ts +1 -0
  475. package/src/tools/skills/delete-managed.ts +4 -4
  476. package/src/tools/skills/execute.ts +1 -1
  477. package/src/tools/skills/scaffold-managed.ts +3 -2
  478. package/src/tools/subagent/notify-parent.ts +1 -1
  479. package/src/tools/system/request-permission.ts +2 -2
  480. package/src/tools/terminal/safe-env.ts +60 -1
  481. package/src/tools/tool-manifest.ts +2 -0
  482. package/src/tools/types.ts +72 -21
  483. package/src/tools/ui-surface/definitions.ts +6 -5
  484. package/src/tts/__tests__/provider-adapters.test.ts +76 -2
  485. package/src/tts/providers/elevenlabs-provider.ts +75 -1
  486. package/src/types/onboarding-context.ts +2 -0
  487. package/src/util/errors.ts +17 -0
  488. package/src/util/platform.ts +10 -0
  489. package/src/watcher/__tests__/engine.test.ts +22 -0
  490. package/src/watcher/engine.ts +6 -2
  491. package/src/workspace/migrations/057-repair-stale-gemini-model-ids.ts +80 -15
  492. package/src/workspace/migrations/072-seed-reply-suggestion-callsite.ts +35 -22
  493. package/src/workspace/migrations/073-repair-recall-callsite-empty-profile.ts +3 -1
  494. package/src/workspace/migrations/083-system-prompt-prefix-to-file.ts +191 -0
  495. package/src/workspace/migrations/084-remove-legacy-skills-index.ts +276 -0
  496. package/src/workspace/migrations/085-memory-v2-bm25-b-reembed-disabled-v2-pages.ts +137 -0
  497. package/src/workspace/migrations/086-revert-stale-gemini-mis-rewrites.ts +198 -0
  498. package/src/workspace/migrations/registry.ts +8 -0
  499. package/src/workspace/migrations/runner.ts +39 -9
  500. package/src/workspace/migrations/types.ts +4 -0
  501. package/examples/plugins/echo/bun.lock +0 -25
  502. package/src/__tests__/context-window-manager.test.ts +0 -2481
  503. package/src/context/__tests__/compact-prompt.test.ts +0 -63
  504. package/src/context/prompts/compact.md +0 -26
  505. package/src/prompts/__tests__/build-cli-reference-section.test.ts +0 -37
  506. /package/src/__tests__/{secret-routes-managed-proxy.test.ts → secret-routes-platform-proxy.test.ts} +0 -0
@@ -86,6 +86,7 @@ export interface AppCreateInput {
86
86
  pages?: unknown;
87
87
  auto_open?: boolean;
88
88
  preview?: Record<string, unknown>;
89
+ source_files?: Record<string, string>;
89
90
  }
90
91
 
91
92
  export async function executeAppCreate(
@@ -129,6 +130,31 @@ export async function executeAppCreate(
129
130
  };
130
131
  }
131
132
 
133
+ if (input.source_files != null) {
134
+ if (
135
+ typeof input.source_files !== "object" ||
136
+ Array.isArray(input.source_files)
137
+ ) {
138
+ return {
139
+ content: JSON.stringify({
140
+ error:
141
+ "source_files must be an object mapping relative file paths to string contents",
142
+ }),
143
+ isError: true,
144
+ };
145
+ }
146
+ for (const [key, val] of Object.entries(input.source_files)) {
147
+ if (typeof val !== "string") {
148
+ return {
149
+ content: JSON.stringify({
150
+ error: `source_files["${key}"] must be a string, got ${typeof val}`,
151
+ }),
152
+ isError: true,
153
+ };
154
+ }
155
+ }
156
+ }
157
+
132
158
  // Extract icon from preview if provided - only persist emoji-like values,
133
159
  // not URLs which would render as raw strings in UI and bundle manifests.
134
160
  const rawIcon = preview?.icon as string | undefined;
@@ -172,17 +198,32 @@ function App() {
172
198
  render(<App />, document.getElementById('app')!);
173
199
  `;
174
200
 
175
- // Only write scaffold files when they don't already exist on disk.
176
- // The LLM may have written custom source files via file_write before
177
- // calling app_create, and overwriting them would destroy the real app
178
- // content, leaving only the scaffold placeholder.
201
+ if (input.source_files) {
202
+ for (const [filePath, content] of Object.entries(input.source_files)) {
203
+ store.writeAppFile(app.id, filePath, content);
204
+ }
205
+ }
206
+
207
+ const mainTsxScaffolded = !store.appFileExists(app.id, "src/main.tsx");
179
208
  if (!store.appFileExists(app.id, "src/index.html")) {
180
209
  store.writeAppFile(app.id, "src/index.html", indexHtml);
181
210
  }
182
- if (!store.appFileExists(app.id, "src/main.tsx")) {
211
+ if (mainTsxScaffolded) {
183
212
  store.writeAppFile(app.id, "src/main.tsx", mainTsx);
184
213
  }
185
214
 
215
+ // When the placeholder main.tsx was actually scaffolded, the tool result
216
+ // must steer the agent toward writing the real source files instead of
217
+ // treating success + inline AppCard as task-done. When the agent pre-wrote
218
+ // src/main.tsx before calling app_create, this directive would be false
219
+ // and risks prompting a destructive rewrite, so omit it in that case.
220
+ const nextStepsField = mainTsxScaffolded
221
+ ? {
222
+ next_steps:
223
+ "Scaffold created with a placeholder src/main.tsx only. The app is NOT built yet. You MUST now (1) write the real src/main.tsx, components under src/components/, and src/styles.css with file_write, then (2) call app_refresh once. Stopping here leaves an empty Hello-world placeholder as the only result.",
224
+ }
225
+ : {};
226
+
186
227
  // Compile src/ → dist/
187
228
  const appDir = getAppDirPath(app.id);
188
229
  const compileResult = await compileApp(appDir);
@@ -193,6 +234,7 @@ render(<App />, document.getElementById('app')!);
193
234
  compile_errors: compileResult.errors,
194
235
  compile_warnings: compileResult.warnings,
195
236
  compile_duration_ms: compileResult.durationMs,
237
+ ...nextStepsField,
196
238
  }),
197
239
  isError: false,
198
240
  };
@@ -200,7 +242,7 @@ render(<App />, document.getElementById('app')!);
200
242
 
201
243
  // Emit the inline preview card via the proxy without opening a workspace panel.
202
244
  // open_mode: "preview" signals to the client that this should be shown inline only.
203
- if (autoOpen && proxyToolResolver) {
245
+ if (autoOpen && !mainTsxScaffolded && proxyToolResolver) {
204
246
  const createPreview = {
205
247
  ...(preview ?? {}),
206
248
  context: "app_create" as const,
@@ -217,6 +259,7 @@ render(<App />, document.getElementById('app')!);
217
259
  ...app,
218
260
  auto_opened: false,
219
261
  auto_open_error: openResult.content,
262
+ ...nextStepsField,
220
263
  }),
221
264
  isError: false,
222
265
  };
@@ -226,6 +269,7 @@ render(<App />, document.getElementById('app')!);
226
269
  ...app,
227
270
  auto_opened: true,
228
271
  open_result: openResult.content,
272
+ ...nextStepsField,
229
273
  }),
230
274
  isError: false,
231
275
  };
@@ -237,13 +281,20 @@ render(<App />, document.getElementById('app')!);
237
281
  auto_opened: false,
238
282
  auto_open_error:
239
283
  "Failed to auto-open app. Use app_open to open it manually.",
284
+ ...nextStepsField,
240
285
  }),
241
286
  isError: false,
242
287
  };
243
288
  }
244
289
  }
245
290
 
246
- return { content: JSON.stringify(app), isError: false };
291
+ return {
292
+ content: JSON.stringify({
293
+ ...app,
294
+ ...nextStepsField,
295
+ }),
296
+ isError: false,
297
+ };
247
298
  }
248
299
 
249
300
  // ---------------------------------------------------------------------------
@@ -0,0 +1,509 @@
1
+ import { describe, expect, test } from "bun:test";
2
+
3
+ import type { QuestionPromptResult } from "../../permissions/question-prompter.js";
4
+ import type { ToolContext } from "../types.js";
5
+ import { AskQuestionTool } from "./ask-question-tool.js";
6
+
7
+ type PromptParams = Parameters<
8
+ import("../../permissions/question-prompter.js").QuestionPrompter["prompt"]
9
+ >[0];
10
+
11
+ function makeContext(overrides: Partial<ToolContext> = {}): ToolContext {
12
+ return {
13
+ workingDir: "/tmp",
14
+ conversationId: "conv-1",
15
+ trustClass: "guardian",
16
+ toolUseId: "tu-1",
17
+ ...overrides,
18
+ };
19
+ }
20
+
21
+ function makeToolWithStub(result: QuestionPromptResult): {
22
+ tool: AskQuestionTool;
23
+ calls: PromptParams[];
24
+ } {
25
+ const calls: PromptParams[] = [];
26
+ const tool = new AskQuestionTool(() => ({
27
+ async prompt(params: PromptParams) {
28
+ calls.push(params);
29
+ return result;
30
+ },
31
+ }));
32
+ return { tool, calls };
33
+ }
34
+
35
+ const validInput = {
36
+ question: "Which fruit?",
37
+ description: "Pick one to add to the smoothie.",
38
+ options: [
39
+ { id: "a", label: "Apple" },
40
+ { id: "b", label: "Banana", description: "Ripe" },
41
+ ],
42
+ freeTextPlaceholder: "Type a fruit",
43
+ };
44
+
45
+ const singleQ = {
46
+ question: validInput.question,
47
+ description: validInput.description,
48
+ options: validInput.options,
49
+ freeTextPlaceholder: validInput.freeTextPlaceholder,
50
+ };
51
+
52
+ describe("AskQuestionTool definition", () => {
53
+ test("exposes the expected schema shape and description language", () => {
54
+ const def = new AskQuestionTool().getDefinition();
55
+ expect(def.name).toBe("ask_question");
56
+ expect(def.description).toContain("free-text fallback is always added");
57
+ expect(def.description).toContain("do not");
58
+ expect(def.description).toContain("'something else'");
59
+ expect(def.description).toContain("plain-text clarification");
60
+ expect(def.description).toContain("obvious from context");
61
+ expect(def.description).toContain("Use this tool whenever");
62
+ expect(def.description).toContain("When in doubt");
63
+ expect(def.description).toContain("plausible interpretations");
64
+ expect(def.description).toContain("remove guessing");
65
+ expect(def.description).toContain("a question is skipped");
66
+ expect(def.description).toContain("every question in the batch is skipped");
67
+ // Batching language is back now that the prompter handles batches.
68
+ expect(def.description).toContain("Batch related clarifications");
69
+ expect(def.description).toContain("up to 5");
70
+ expect(def.description).toContain("Skip button");
71
+
72
+ const schema = def.input_schema as {
73
+ properties: Record<
74
+ string,
75
+ { type?: string; minItems?: number; maxItems?: number }
76
+ >;
77
+ required?: string[];
78
+ };
79
+ expect(schema.properties.options?.type).toBe("array");
80
+ expect(schema.properties.options?.minItems).toBe(2);
81
+ expect(schema.properties.options?.maxItems).toBe(4);
82
+ });
83
+ });
84
+
85
+ // Build a single-question completed result for tests that just need to
86
+ // exercise the formatter on a one-element batch.
87
+ function singleCompleted(
88
+ entry:
89
+ | { decision: "option"; optionId: string }
90
+ | { decision: "free_text"; text: string }
91
+ | { decision: "skipped" },
92
+ ): QuestionPromptResult {
93
+ return {
94
+ entries: [{ questionId: "q1", ...entry }],
95
+ overall: "completed",
96
+ };
97
+ }
98
+
99
+ describe("AskQuestionTool.execute", () => {
100
+ test("forwards questions array unchanged to the prompter", async () => {
101
+ const { tool, calls } = makeToolWithStub(
102
+ singleCompleted({ decision: "option", optionId: "a" }),
103
+ );
104
+
105
+ const result = await tool.execute(validInput, makeContext());
106
+
107
+ expect(calls).toHaveLength(1);
108
+ expect(calls[0]?.conversationId).toBe("conv-1");
109
+ expect(calls[0]?.questions).toHaveLength(1);
110
+ expect(calls[0]?.questions[0]?.question).toBe(validInput.question);
111
+ expect(calls[0]?.questions[0]?.description).toBe(validInput.description);
112
+ expect(calls[0]?.questions[0]?.options).toEqual(validInput.options);
113
+ expect(calls[0]?.questions[0]?.freeTextPlaceholder).toBe(
114
+ validInput.freeTextPlaceholder,
115
+ );
116
+ expect(calls[0]?.toolUseId).toBe("tu-1");
117
+
118
+ expect(result.isError).toBe(false);
119
+ expect(result.content).toBe(
120
+ `Question "${validInput.question}" → Option: a (Apple)`,
121
+ );
122
+ });
123
+
124
+ test("formats option result with looked-up label", async () => {
125
+ const { tool } = makeToolWithStub(
126
+ singleCompleted({ decision: "option", optionId: "b" }),
127
+ );
128
+ const result = await tool.execute(validInput, makeContext());
129
+ expect(result.content).toBe(
130
+ `Question "${validInput.question}" → Option: b (Banana)`,
131
+ );
132
+ expect(result.isError).toBe(false);
133
+ });
134
+
135
+ test("falls back to '(unknown)' label when optionId is not in options", async () => {
136
+ const { tool } = makeToolWithStub(
137
+ singleCompleted({ decision: "option", optionId: "ghost" }),
138
+ );
139
+ const result = await tool.execute(validInput, makeContext());
140
+ expect(result.content).toBe(
141
+ `Question "${validInput.question}" → Option: ghost ((unknown))`,
142
+ );
143
+ expect(result.isError).toBe(false);
144
+ });
145
+
146
+ test("formats free-text result", async () => {
147
+ const { tool } = makeToolWithStub(
148
+ singleCompleted({ decision: "free_text", text: "Cherry" }),
149
+ );
150
+ const result = await tool.execute(validInput, makeContext());
151
+ expect(result.content).toBe(
152
+ `Question "${validInput.question}" → Free text: Cherry`,
153
+ );
154
+ expect(result.isError).toBe(false);
155
+ });
156
+
157
+ test("formats skipped result", async () => {
158
+ const { tool } = makeToolWithStub(singleCompleted({ decision: "skipped" }));
159
+ const result = await tool.execute(validInput, makeContext());
160
+ expect(result.content).toBe(`Question "${validInput.question}" → Skipped`);
161
+ expect(result.isError).toBe(false);
162
+ });
163
+
164
+ test("timeout produces tool error", async () => {
165
+ const { tool } = makeToolWithStub({
166
+ entries: [{ questionId: "q1", decision: "timed_out" }],
167
+ overall: "timed_out",
168
+ });
169
+ const result = await tool.execute(validInput, makeContext());
170
+ expect(result.isError).toBe(true);
171
+ expect(result.content).toBe("User did not respond within timeout");
172
+ });
173
+
174
+ test("aborted produces tool error", async () => {
175
+ const { tool } = makeToolWithStub({
176
+ entries: [{ questionId: "q1", decision: "skipped" }],
177
+ overall: "aborted",
178
+ });
179
+ const result = await tool.execute(validInput, makeContext());
180
+ expect(result.isError).toBe(true);
181
+ expect(result.content).toBe("Question aborted");
182
+ });
183
+
184
+ test("rejects input with fewer than 2 options", async () => {
185
+ const { tool, calls } = makeToolWithStub(
186
+ singleCompleted({ decision: "option", optionId: "a" }),
187
+ );
188
+ const result = await tool.execute(
189
+ { ...validInput, options: [{ id: "a", label: "Apple" }] },
190
+ makeContext(),
191
+ );
192
+ expect(result.isError).toBe(true);
193
+ expect(result.content.toLowerCase()).toContain("invalid input");
194
+ expect(calls).toHaveLength(0);
195
+ });
196
+
197
+ test("rejects input with more than 4 options", async () => {
198
+ const { tool, calls } = makeToolWithStub(
199
+ singleCompleted({ decision: "option", optionId: "a" }),
200
+ );
201
+ const result = await tool.execute(
202
+ {
203
+ ...validInput,
204
+ options: [
205
+ { id: "a", label: "A" },
206
+ { id: "b", label: "B" },
207
+ { id: "c", label: "C" },
208
+ { id: "d", label: "D" },
209
+ { id: "e", label: "E" },
210
+ ],
211
+ },
212
+ makeContext(),
213
+ );
214
+ expect(result.isError).toBe(true);
215
+ expect(calls).toHaveLength(0);
216
+ });
217
+
218
+ test("rejects input with empty question", async () => {
219
+ const { tool, calls } = makeToolWithStub(
220
+ singleCompleted({ decision: "option", optionId: "a" }),
221
+ );
222
+ const result = await tool.execute(
223
+ { ...validInput, question: "" },
224
+ makeContext(),
225
+ );
226
+ expect(result.isError).toBe(true);
227
+ expect(calls).toHaveLength(0);
228
+ });
229
+
230
+ test("propagates abort signal into the prompter", async () => {
231
+ const { tool, calls } = makeToolWithStub(
232
+ singleCompleted({ decision: "option", optionId: "a" }),
233
+ );
234
+ const ac = new AbortController();
235
+ await tool.execute(validInput, makeContext({ signal: ac.signal }));
236
+ expect(calls[0]?.signal).toBe(ac.signal);
237
+ });
238
+ });
239
+
240
+ // ── Batched input ───────────────────────────────────────────────────
241
+
242
+ describe("AskQuestionTool batched input", () => {
243
+ test("normalizes legacy flat input into a one-element batch forwarded to the prompter", async () => {
244
+ const { tool, calls } = makeToolWithStub(
245
+ singleCompleted({ decision: "option", optionId: "a" }),
246
+ );
247
+
248
+ const result = await tool.execute(validInput, makeContext());
249
+
250
+ expect(calls).toHaveLength(1);
251
+ expect(calls[0]?.questions).toHaveLength(1);
252
+ expect(calls[0]?.questions[0]?.question).toBe(validInput.question);
253
+ expect(calls[0]?.questions[0]?.options).toEqual(validInput.options);
254
+ expect(result.isError).toBe(false);
255
+ });
256
+
257
+ test("accepts a single-element `questions` batch", async () => {
258
+ const { tool, calls } = makeToolWithStub(
259
+ singleCompleted({ decision: "option", optionId: "a" }),
260
+ );
261
+
262
+ const result = await tool.execute({ questions: [singleQ] }, makeContext());
263
+
264
+ expect(calls).toHaveLength(1);
265
+ expect(calls[0]?.questions).toHaveLength(1);
266
+ expect(calls[0]?.questions[0]?.question).toBe(singleQ.question);
267
+ expect(calls[0]?.questions[0]?.options).toEqual(singleQ.options);
268
+ expect(calls[0]?.questions[0]?.description).toBe(singleQ.description);
269
+ expect(calls[0]?.questions[0]?.freeTextPlaceholder).toBe(
270
+ singleQ.freeTextPlaceholder,
271
+ );
272
+ expect(result.isError).toBe(false);
273
+ });
274
+
275
+ test("forwards the full questions array for a multi-question batch", async () => {
276
+ const q2 = {
277
+ question: "Preferred time?",
278
+ options: [
279
+ { id: "morning", label: "Morning" },
280
+ { id: "afternoon", label: "Afternoon" },
281
+ ],
282
+ freeTextPlaceholder: "or specify",
283
+ };
284
+ const q3 = {
285
+ question: "Send invite?",
286
+ options: [
287
+ { id: "yes", label: "Yes" },
288
+ { id: "no", label: "No" },
289
+ ],
290
+ };
291
+
292
+ const { tool, calls } = makeToolWithStub({
293
+ entries: [
294
+ { questionId: "q1", decision: "option", optionId: "a" },
295
+ { questionId: "q2", decision: "free_text", text: "noon-ish" },
296
+ { questionId: "q3", decision: "option", optionId: "yes" },
297
+ ],
298
+ overall: "completed",
299
+ });
300
+
301
+ const result = await tool.execute(
302
+ { questions: [singleQ, q2, q3] },
303
+ makeContext(),
304
+ );
305
+
306
+ expect(calls).toHaveLength(1);
307
+ expect(calls[0]?.questions).toHaveLength(3);
308
+ expect(calls[0]?.questions.map((q) => q.question)).toEqual([
309
+ singleQ.question,
310
+ q2.question,
311
+ q3.question,
312
+ ]);
313
+
314
+ expect(result.isError).toBe(false);
315
+ expect(result.content).toBe(
316
+ [
317
+ `Question "${singleQ.question}" → Option: a (Apple)`,
318
+ `Question "${q2.question}" → Free text: noon-ish`,
319
+ `Question "${q3.question}" → Option: yes (Yes)`,
320
+ ].join("\n"),
321
+ );
322
+ });
323
+
324
+ test("formats all-skipped batch as a non-error transcript", async () => {
325
+ const q2 = {
326
+ question: "Preferred time?",
327
+ options: [
328
+ { id: "morning", label: "Morning" },
329
+ { id: "afternoon", label: "Afternoon" },
330
+ ],
331
+ };
332
+ const q3 = {
333
+ question: "Send invite?",
334
+ options: [
335
+ { id: "yes", label: "Yes" },
336
+ { id: "no", label: "No" },
337
+ ],
338
+ };
339
+ const { tool } = makeToolWithStub({
340
+ entries: [
341
+ { questionId: "q1", decision: "skipped" },
342
+ { questionId: "q2", decision: "skipped" },
343
+ { questionId: "q3", decision: "skipped" },
344
+ ],
345
+ overall: "completed",
346
+ });
347
+
348
+ const result = await tool.execute(
349
+ { questions: [singleQ, q2, q3] },
350
+ makeContext(),
351
+ );
352
+
353
+ expect(result.isError).toBe(false);
354
+ expect(result.content).toBe(
355
+ [
356
+ `Question "${singleQ.question}" → Skipped`,
357
+ `Question "${q2.question}" → Skipped`,
358
+ `Question "${q3.question}" → Skipped`,
359
+ ].join("\n"),
360
+ );
361
+ });
362
+
363
+ test("closed batch prepends a summary line and remains non-error", async () => {
364
+ const q2 = {
365
+ question: "Preferred time?",
366
+ options: [
367
+ { id: "morning", label: "Morning" },
368
+ { id: "afternoon", label: "Afternoon" },
369
+ ],
370
+ };
371
+ const { tool } = makeToolWithStub({
372
+ entries: [
373
+ { questionId: "q1", decision: "skipped" },
374
+ { questionId: "q2", decision: "skipped" },
375
+ ],
376
+ overall: "closed",
377
+ });
378
+
379
+ const result = await tool.execute(
380
+ { questions: [singleQ, q2] },
381
+ makeContext(),
382
+ );
383
+
384
+ expect(result.isError).toBe(false);
385
+ expect(result.content).toBe(
386
+ [
387
+ "User closed the question card without answering. All questions skipped.",
388
+ `Question "${singleQ.question}" → Skipped`,
389
+ `Question "${q2.question}" → Skipped`,
390
+ ].join("\n"),
391
+ );
392
+ });
393
+
394
+ test("accepts a 5-entry batch (max allowed)", async () => {
395
+ const { tool, calls } = makeToolWithStub({
396
+ entries: [
397
+ { questionId: "q1", decision: "skipped" },
398
+ { questionId: "q2", decision: "skipped" },
399
+ { questionId: "q3", decision: "skipped" },
400
+ { questionId: "q4", decision: "skipped" },
401
+ { questionId: "q5", decision: "skipped" },
402
+ ],
403
+ overall: "completed",
404
+ });
405
+ const five = [singleQ, singleQ, singleQ, singleQ, singleQ];
406
+
407
+ const result = await tool.execute({ questions: five }, makeContext());
408
+
409
+ expect(result.isError).toBe(false);
410
+ expect(calls).toHaveLength(1);
411
+ expect(calls[0]?.questions).toHaveLength(5);
412
+ });
413
+
414
+ test("rejects batches with 6+ questions", async () => {
415
+ const { tool, calls } = makeToolWithStub(
416
+ singleCompleted({ decision: "option", optionId: "a" }),
417
+ );
418
+ const six = [singleQ, singleQ, singleQ, singleQ, singleQ, singleQ];
419
+
420
+ const result = await tool.execute({ questions: six }, makeContext());
421
+
422
+ expect(result.isError).toBe(true);
423
+ expect(result.content.toLowerCase()).toContain("invalid input");
424
+ expect(calls).toHaveLength(0);
425
+ });
426
+
427
+ test("rejects empty `questions` array", async () => {
428
+ const { tool, calls } = makeToolWithStub(
429
+ singleCompleted({ decision: "option", optionId: "a" }),
430
+ );
431
+
432
+ const result = await tool.execute({ questions: [] }, makeContext());
433
+
434
+ expect(result.isError).toBe(true);
435
+ expect(result.content.toLowerCase()).toContain("invalid input");
436
+ expect(calls).toHaveLength(0);
437
+ });
438
+
439
+ test("rejects input missing both `questions` and flat fields", async () => {
440
+ const { tool, calls } = makeToolWithStub(
441
+ singleCompleted({ decision: "option", optionId: "a" }),
442
+ );
443
+
444
+ const result = await tool.execute({}, makeContext());
445
+
446
+ expect(result.isError).toBe(true);
447
+ expect(result.content.toLowerCase()).toContain("invalid input");
448
+ expect(calls).toHaveLength(0);
449
+ });
450
+
451
+ test("rejects legacy `question` without `options`", async () => {
452
+ const { tool, calls } = makeToolWithStub(
453
+ singleCompleted({ decision: "option", optionId: "a" }),
454
+ );
455
+
456
+ const result = await tool.execute({ question: "Hi?" }, makeContext());
457
+
458
+ expect(result.isError).toBe(true);
459
+ expect(result.content.toLowerCase()).toContain("invalid input");
460
+ expect(calls).toHaveLength(0);
461
+ });
462
+ });
463
+
464
+ describe("AskQuestionTool definition (batched schema)", () => {
465
+ test("exposes `questions[]` shape, keeps legacy fields, omits per-question id", () => {
466
+ const def = new AskQuestionTool().getDefinition();
467
+ const schema = def.input_schema as {
468
+ properties: Record<
469
+ string,
470
+ {
471
+ type?: string;
472
+ minItems?: number;
473
+ maxItems?: number;
474
+ items?: {
475
+ type?: string;
476
+ properties?: Record<string, unknown>;
477
+ required?: string[];
478
+ };
479
+ }
480
+ >;
481
+ required?: string[];
482
+ };
483
+
484
+ const questions = schema.properties.questions;
485
+ expect(questions?.type).toBe("array");
486
+ expect(questions?.minItems).toBe(1);
487
+ expect(questions?.maxItems).toBe(5);
488
+
489
+ const itemProps = questions?.items?.properties ?? {};
490
+ expect(Object.keys(itemProps)).toEqual(
491
+ expect.arrayContaining([
492
+ "question",
493
+ "description",
494
+ "options",
495
+ "freeTextPlaceholder",
496
+ ]),
497
+ );
498
+ expect(Object.keys(itemProps)).not.toContain("id");
499
+ expect(questions?.items?.required).toEqual(["question", "options"]);
500
+
501
+ expect(schema.properties.question?.type).toBe("string");
502
+ expect(schema.properties.options?.type).toBe("array");
503
+ expect(schema.properties.options?.minItems).toBe(2);
504
+ expect(schema.properties.options?.maxItems).toBe(4);
505
+ expect(schema.properties.freeTextPlaceholder?.type).toBe("string");
506
+
507
+ expect(schema.required).toBeUndefined();
508
+ });
509
+ });