@vellumai/assistant 0.3.4 → 0.3.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (506)
  1. package/Dockerfile +2 -0
  2. package/README.md +88 -2
  3. package/eslint.config.mjs +31 -0
  4. package/package.json +1 -1
  5. package/scripts/ipc/check-swift-decoder-drift.ts +4 -1
  6. package/scripts/ipc/generate-swift.ts +31 -2
  7. package/src/__tests__/__snapshots__/ipc-snapshot.test.ts.snap +438 -1
  8. package/src/__tests__/approval-conversation-turn.test.ts +214 -0
  9. package/src/__tests__/approval-hardcoded-copy-guard.test.ts +41 -0
  10. package/src/__tests__/approval-message-composer.test.ts +253 -0
  11. package/src/__tests__/browser-manager.test.ts +1 -0
  12. package/src/__tests__/call-conversation-messages.test.ts +130 -0
  13. package/src/__tests__/call-domain.test.ts +12 -2
  14. package/src/__tests__/call-orchestrator.test.ts +799 -249
  15. package/src/__tests__/call-pointer-messages.test.ts +148 -0
  16. package/src/__tests__/call-recovery.test.ts +3 -0
  17. package/src/__tests__/call-routes-http.test.ts +32 -2
  18. package/src/__tests__/call-store.test.ts +3 -0
  19. package/src/__tests__/channel-approval-routes.test.ts +1277 -98
  20. package/src/__tests__/channel-approval.test.ts +37 -0
  21. package/src/__tests__/channel-approvals.test.ts +36 -50
  22. package/src/__tests__/channel-guardian.test.ts +630 -22
  23. package/src/__tests__/channel-readiness-service.test.ts +324 -0
  24. package/src/__tests__/checker.test.ts +14 -7
  25. package/src/__tests__/clarification-resolver.test.ts +44 -24
  26. package/src/__tests__/commit-message-enrichment-service.test.ts +9 -4
  27. package/src/__tests__/computer-use-session-working-dir.test.ts +8 -0
  28. package/src/__tests__/config-schema.test.ts +14 -8
  29. package/src/__tests__/context-window-manager.test.ts +30 -2
  30. package/src/__tests__/contradiction-checker.test.ts +20 -5
  31. package/src/__tests__/credential-security-invariants.test.ts +7 -2
  32. package/src/__tests__/daemon-lifecycle.test.ts +13 -12
  33. package/src/__tests__/db-migration-rollback.test.ts +752 -0
  34. package/src/__tests__/dictation-mode-detection.test.ts +63 -0
  35. package/src/__tests__/dynamic-skill-workflow-prompt.test.ts +2 -0
  36. package/src/__tests__/entity-search.test.ts +615 -0
  37. package/src/__tests__/fuzzy-match-property.test.ts +5 -5
  38. package/src/__tests__/guardian-action-store.test.ts +123 -0
  39. package/src/__tests__/guardian-action-sweep.test.ts +277 -0
  40. package/src/__tests__/guardian-dispatch.test.ts +389 -0
  41. package/src/__tests__/guardian-question-copy.test.ts +47 -0
  42. package/src/__tests__/handlers-telegram-config.test.ts +4 -2
  43. package/src/__tests__/handlers-twilio-config.test.ts +533 -0
  44. package/src/__tests__/intent-routing.test.ts +2 -0
  45. package/src/__tests__/ipc-snapshot.test.ts +291 -1
  46. package/src/__tests__/memory-upsert-concurrency.test.ts +828 -0
  47. package/src/__tests__/messaging-send-tool.test.ts +65 -0
  48. package/src/__tests__/model-intents.test.ts +96 -0
  49. package/src/__tests__/no-direct-anthropic-sdk-imports.test.ts +42 -0
  50. package/src/__tests__/oauth2-gateway-transport.test.ts +130 -0
  51. package/src/__tests__/onboarding-starter-tasks.test.ts +2 -0
  52. package/src/__tests__/provider-commit-message-generator.test.ts +89 -13
  53. package/src/__tests__/provider-error-scenarios.test.ts +621 -0
  54. package/src/__tests__/provider-fail-open-selection.test.ts +119 -0
  55. package/src/__tests__/qdrant-manager.test.ts +27 -20
  56. package/src/__tests__/relay-server.test.ts +779 -40
  57. package/src/__tests__/run-orchestrator-assistant-events.test.ts +6 -0
  58. package/src/__tests__/run-orchestrator.test.ts +42 -4
  59. package/src/__tests__/runtime-runs-http.test.ts +17 -1
  60. package/src/__tests__/runtime-runs.test.ts +16 -0
  61. package/src/__tests__/schedule-store.test.ts +18 -4
  62. package/src/__tests__/scheduler-recurrence.test.ts +13 -4
  63. package/src/__tests__/session-abort-tool-results.test.ts +6 -0
  64. package/src/__tests__/session-agent-loop.test.ts +857 -0
  65. package/src/__tests__/session-conflict-gate.test.ts +6 -0
  66. package/src/__tests__/session-pre-run-repair.test.ts +6 -0
  67. package/src/__tests__/session-profile-injection.test.ts +6 -0
  68. package/src/__tests__/session-provider-retry-repair.test.ts +6 -0
  69. package/src/__tests__/session-queue.test.ts +6 -0
  70. package/src/__tests__/session-runtime-assembly.test.ts +321 -13
  71. package/src/__tests__/session-slash-known.test.ts +6 -0
  72. package/src/__tests__/session-slash-queue.test.ts +6 -0
  73. package/src/__tests__/session-slash-unknown.test.ts +6 -0
  74. package/src/__tests__/session-surfaces-task-progress.test.ts +2 -0
  75. package/src/__tests__/session-tool-setup-app-refresh.test.ts +1 -0
  76. package/src/__tests__/session-tool-setup-memory-scope.test.ts +1 -0
  77. package/src/__tests__/session-tool-setup-side-effect-flag.test.ts +1 -0
  78. package/src/__tests__/session-workspace-injection.test.ts +6 -0
  79. package/src/__tests__/session-workspace-tool-tracking.test.ts +6 -0
  80. package/src/__tests__/skills.test.ts +2 -0
  81. package/src/__tests__/sms-messaging-provider.test.ts +126 -0
  82. package/src/__tests__/starter-task-flow.test.ts +2 -0
  83. package/src/__tests__/swarm-dag-pathological.test.ts +535 -0
  84. package/src/__tests__/system-prompt.test.ts +2 -0
  85. package/src/__tests__/task-management-tools.test.ts +2 -2
  86. package/src/__tests__/task-runner.test.ts +14 -4
  87. package/src/__tests__/terminal-tools.test.ts +25 -19
  88. package/src/__tests__/tool-execution-abort-cleanup.test.ts +545 -0
  89. package/src/__tests__/tool-executor-shell-integration.test.ts +11 -11
  90. package/src/__tests__/tool-executor.test.ts +23 -24
  91. package/src/__tests__/trust-store.test.ts +3 -3
  92. package/src/__tests__/twilio-rest.test.ts +29 -0
  93. package/src/__tests__/twilio-routes-elevenlabs.test.ts +3 -0
  94. package/src/__tests__/twilio-routes-twiml.test.ts +11 -0
  95. package/src/__tests__/twilio-routes.test.ts +167 -11
  96. package/src/__tests__/twitter-cli-error-shaping.test.ts +2 -2
  97. package/src/__tests__/user-reference.test.ts +2 -0
  98. package/src/__tests__/voice-quality.test.ts +222 -0
  99. package/src/__tests__/web-search.test.ts +46 -30
  100. package/src/__tests__/work-item-output.test.ts +110 -0
  101. package/src/agent/loop.ts +1 -1
  102. package/src/agent-heartbeat/agent-heartbeat-service.ts +2 -10
  103. package/src/amazon/client.ts +1418 -0
  104. package/src/amazon/request-extractor.ts +135 -0
  105. package/src/amazon/session.ts +109 -0
  106. package/src/autonomy/autonomy-store.ts +5 -5
  107. package/src/browser-extension-relay/client.ts +124 -0
  108. package/src/browser-extension-relay/protocol.ts +63 -0
  109. package/src/browser-extension-relay/server.ts +177 -0
  110. package/src/bundler/app-bundler.ts +3 -3
  111. package/src/bundler/bundle-signer.ts +1 -1
  112. package/src/bundler/signature-verifier.ts +1 -1
  113. package/src/calls/call-conversation-messages.ts +33 -0
  114. package/src/calls/call-domain.ts +114 -10
  115. package/src/calls/call-orchestrator.ts +268 -59
  116. package/src/calls/call-pointer-messages.ts +53 -0
  117. package/src/calls/call-recovery.ts +3 -8
  118. package/src/calls/call-store.ts +69 -87
  119. package/src/calls/elevenlabs-config.ts +3 -2
  120. package/src/calls/guardian-action-sweep.ts +105 -0
  121. package/src/calls/guardian-dispatch.ts +203 -0
  122. package/src/calls/guardian-question-copy.ts +133 -0
  123. package/src/calls/relay-server.ts +466 -8
  124. package/src/calls/speaker-identification.ts +1 -1
  125. package/src/calls/twilio-config.ts +22 -14
  126. package/src/calls/twilio-provider.ts +6 -4
  127. package/src/calls/twilio-rest.ts +308 -7
  128. package/src/calls/twilio-routes.ts +65 -12
  129. package/src/calls/types.ts +3 -1
  130. package/src/channels/types.ts +25 -0
  131. package/src/cli/amazon.ts +815 -0
  132. package/src/cli/config-commands.ts +2 -2
  133. package/src/cli/core-commands.ts +4 -3
  134. package/src/cli/influencer.ts +244 -0
  135. package/src/cli/map.ts +89 -6
  136. package/src/cli.ts +1 -1
  137. package/src/config/agent-schema.ts +171 -0
  138. package/src/config/bundled-skills/amazon/SKILL.md +127 -0
  139. package/src/config/bundled-skills/amazon/icon.svg +13 -0
  140. package/src/config/bundled-skills/api-mapping/SKILL.md +78 -0
  141. package/src/config/bundled-skills/browser/SKILL.md +1 -0
  142. package/src/config/bundled-skills/browser/TOOLS.json +17 -0
  143. package/src/config/bundled-skills/browser/tools/browser-wait-for-download.ts +25 -0
  144. package/src/config/bundled-skills/doordash/SKILL.md +51 -51
  145. package/src/config/bundled-skills/email-setup/SKILL.md +14 -5
  146. package/src/config/bundled-skills/google-oauth-setup/SKILL.md +183 -0
  147. package/src/config/bundled-skills/influencer/SKILL.md +144 -0
  148. package/src/config/bundled-skills/knowledge-graph/SKILL.md +15 -0
  149. package/src/config/bundled-skills/knowledge-graph/TOOLS.json +56 -0
  150. package/src/config/bundled-skills/knowledge-graph/tools/graph-query.ts +185 -0
  151. package/src/config/bundled-skills/macos-automation/icon.svg +12 -0
  152. package/src/config/bundled-skills/media-processing/SKILL.md +176 -0
  153. package/src/config/bundled-skills/media-processing/TOOLS.json +230 -0
  154. package/src/config/bundled-skills/media-processing/__tests__/concurrency-pool.test.ts +77 -0
  155. package/src/config/bundled-skills/media-processing/__tests__/cost-tracker.test.ts +69 -0
  156. package/src/config/bundled-skills/media-processing/__tests__/preprocess.test.ts +303 -0
  157. package/src/config/bundled-skills/media-processing/services/concurrency-pool.ts +55 -0
  158. package/src/config/bundled-skills/media-processing/services/cost-tracker.ts +86 -0
  159. package/src/config/bundled-skills/media-processing/services/gemini-map.ts +339 -0
  160. package/src/config/bundled-skills/media-processing/services/preprocess.ts +551 -0
  161. package/src/config/bundled-skills/media-processing/services/processing-pipeline.ts +259 -0
  162. package/src/config/bundled-skills/media-processing/services/reduce.ts +197 -0
  163. package/src/config/bundled-skills/media-processing/tools/analyze-keyframes.ts +136 -0
  164. package/src/config/bundled-skills/media-processing/tools/extract-keyframes.ts +59 -0
  165. package/src/config/bundled-skills/media-processing/tools/generate-clip.ts +195 -0
  166. package/src/config/bundled-skills/media-processing/tools/ingest-media.ts +197 -0
  167. package/src/config/bundled-skills/media-processing/tools/media-diagnostics.ts +143 -0
  168. package/src/config/bundled-skills/media-processing/tools/media-status.ts +75 -0
  169. package/src/config/bundled-skills/media-processing/tools/query-media-events.ts +65 -0
  170. package/src/config/bundled-skills/messaging/SKILL.md +33 -8
  171. package/src/config/bundled-skills/messaging/tools/messaging-analyze-style.ts +4 -7
  172. package/src/config/bundled-skills/messaging/tools/messaging-reply.ts +2 -1
  173. package/src/config/bundled-skills/messaging/tools/messaging-send.ts +5 -1
  174. package/src/config/bundled-skills/phone-calls/SKILL.md +88 -23
  175. package/src/config/bundled-skills/twitter/SKILL.md +19 -3
  176. package/src/config/bundled-skills/twitter/icon.svg +14 -0
  177. package/src/config/bundled-tool-registry.ts +310 -0
  178. package/src/config/calls-schema.ts +181 -0
  179. package/src/config/core-schema.ts +309 -0
  180. package/src/config/defaults.ts +28 -3
  181. package/src/config/env-registry.ts +162 -0
  182. package/src/config/env.ts +175 -0
  183. package/src/config/loader.ts +6 -6
  184. package/src/config/memory-schema.ts +528 -0
  185. package/src/config/sandbox-schema.ts +55 -0
  186. package/src/config/schema.ts +158 -1133
  187. package/src/config/skill-state.ts +1 -1
  188. package/src/config/skills-schema.ts +32 -0
  189. package/src/config/skills.ts +35 -24
  190. package/src/config/system-prompt.ts +131 -56
  191. package/src/config/templates/IDENTITY.md +2 -2
  192. package/src/config/templates/SOUL.md +1 -1
  193. package/src/config/types.ts +1 -0
  194. package/src/config/user-reference.ts +4 -9
  195. package/src/config/vellum-skills/catalog.json +6 -7
  196. package/src/config/vellum-skills/chatgpt-import/tools/chatgpt-import.ts +5 -1
  197. package/src/config/vellum-skills/slack-oauth-setup/SKILL.md +4 -3
  198. package/src/config/vellum-skills/sms-setup/SKILL.md +216 -0
  199. package/src/config/vellum-skills/twilio-setup/SKILL.md +40 -8
  200. package/src/context/window-manager.ts +27 -7
  201. package/src/daemon/approval-generators.ts +186 -0
  202. package/src/daemon/approved-devices-store.ts +140 -0
  203. package/src/daemon/assistant-attachments.ts +1 -1
  204. package/src/daemon/classifier.ts +35 -32
  205. package/src/daemon/config-watcher.ts +1 -1
  206. package/src/daemon/daemon-control.ts +217 -0
  207. package/src/daemon/handlers/apps.ts +2 -3
  208. package/src/daemon/handlers/config-channels.ts +158 -0
  209. package/src/daemon/handlers/config-inbox.ts +540 -0
  210. package/src/daemon/handlers/config-ingress.ts +231 -0
  211. package/src/daemon/handlers/config-integrations.ts +258 -0
  212. package/src/daemon/handlers/config-model.ts +143 -0
  213. package/src/daemon/handlers/config-parental.ts +163 -0
  214. package/src/daemon/handlers/config-scheduling.ts +172 -0
  215. package/src/daemon/handlers/config-slack.ts +92 -0
  216. package/src/daemon/handlers/config-telegram.ts +301 -0
  217. package/src/daemon/handlers/config-tools.ts +177 -0
  218. package/src/daemon/handlers/config-trust.ts +104 -0
  219. package/src/daemon/handlers/config-twilio.ts +1080 -0
  220. package/src/daemon/handlers/config.ts +53 -1689
  221. package/src/daemon/handlers/diagnostics.ts +1 -1
  222. package/src/daemon/handlers/dictation.ts +180 -0
  223. package/src/daemon/handlers/documents.ts +18 -32
  224. package/src/daemon/handlers/identity.ts +14 -23
  225. package/src/daemon/handlers/index.ts +11 -0
  226. package/src/daemon/handlers/misc.ts +3 -5
  227. package/src/daemon/handlers/pairing.ts +98 -0
  228. package/src/daemon/handlers/sessions.ts +56 -5
  229. package/src/daemon/handlers/shared.ts +6 -1
  230. package/src/daemon/handlers/skills.ts +1 -1
  231. package/src/daemon/handlers/twitter-auth.ts +2 -0
  232. package/src/daemon/handlers/work-items.ts +17 -9
  233. package/src/daemon/handlers/workspace-files.ts +4 -3
  234. package/src/daemon/install-cli-launchers.ts +113 -0
  235. package/src/daemon/ipc-contract/apps.ts +356 -0
  236. package/src/daemon/ipc-contract/browser.ts +74 -0
  237. package/src/daemon/ipc-contract/computer-use.ts +151 -0
  238. package/src/daemon/ipc-contract/diagnostics.ts +56 -0
  239. package/src/daemon/ipc-contract/documents.ts +74 -0
  240. package/src/daemon/ipc-contract/inbox.ts +209 -0
  241. package/src/daemon/ipc-contract/integrations.ts +284 -0
  242. package/src/daemon/ipc-contract/memory.ts +48 -0
  243. package/src/daemon/ipc-contract/messages.ts +211 -0
  244. package/src/daemon/ipc-contract/pairing.ts +45 -0
  245. package/src/daemon/ipc-contract/parental-control.ts +95 -0
  246. package/src/daemon/ipc-contract/schedules.ts +97 -0
  247. package/src/daemon/ipc-contract/sessions.ts +315 -0
  248. package/src/daemon/ipc-contract/shared.ts +42 -0
  249. package/src/daemon/ipc-contract/skills.ts +120 -0
  250. package/src/daemon/ipc-contract/subagents.ts +58 -0
  251. package/src/daemon/ipc-contract/surfaces.ts +250 -0
  252. package/src/daemon/ipc-contract/trust.ts +60 -0
  253. package/src/daemon/ipc-contract/work-items.ts +225 -0
  254. package/src/daemon/ipc-contract/workspace.ts +113 -0
  255. package/src/daemon/ipc-contract-inventory.json +70 -0
  256. package/src/daemon/ipc-contract-inventory.ts +55 -29
  257. package/src/daemon/ipc-contract.ts +229 -2426
  258. package/src/daemon/ipc-protocol.ts +1 -1
  259. package/src/daemon/ipc-validate.ts +7 -0
  260. package/src/daemon/lifecycle.ts +97 -377
  261. package/src/daemon/pairing-store.ts +177 -0
  262. package/src/daemon/providers-setup.ts +43 -0
  263. package/src/daemon/ride-shotgun-handler.ts +68 -3
  264. package/src/daemon/server.ts +66 -46
  265. package/src/daemon/session-agent-loop-handlers.ts +421 -0
  266. package/src/daemon/session-agent-loop.ts +117 -275
  267. package/src/daemon/session-dynamic-profile.ts +1 -1
  268. package/src/daemon/session-history.ts +1 -1
  269. package/src/daemon/session-media-retry.ts +1 -1
  270. package/src/daemon/session-messaging.ts +37 -2
  271. package/src/daemon/session-notifiers.ts +5 -25
  272. package/src/daemon/session-process.ts +99 -59
  273. package/src/daemon/session-queue-manager.ts +96 -4
  274. package/src/daemon/session-runtime-assembly.ts +199 -10
  275. package/src/daemon/session-surfaces.ts +19 -4
  276. package/src/daemon/session-tool-setup.ts +30 -30
  277. package/src/daemon/session-workspace.ts +1 -1
  278. package/src/daemon/session.ts +35 -2
  279. package/src/daemon/shutdown-handlers.ts +122 -0
  280. package/src/daemon/trace-emitter.ts +1 -1
  281. package/src/daemon/watch-handler.ts +36 -33
  282. package/src/doordash/cart-queries.ts +787 -0
  283. package/src/doordash/client.ts +144 -127
  284. package/src/doordash/order-queries.ts +85 -0
  285. package/src/doordash/queries.ts +10 -1308
  286. package/src/doordash/search-queries.ts +203 -0
  287. package/src/doordash/session.ts +3 -2
  288. package/src/doordash/store-queries.ts +246 -0
  289. package/src/doordash/types.ts +367 -0
  290. package/src/email/providers/agentmail.ts +2 -1
  291. package/src/email/providers/index.ts +3 -2
  292. package/src/email/service.ts +3 -2
  293. package/src/errors.ts +43 -0
  294. package/src/home-base/prebuilt/seed.ts +1 -1
  295. package/src/hooks/cli.ts +6 -5
  296. package/src/hooks/config.ts +6 -8
  297. package/src/hooks/discovery.ts +6 -5
  298. package/src/hooks/manager.ts +4 -3
  299. package/src/hooks/runner.ts +2 -2
  300. package/src/hooks/templates.ts +5 -5
  301. package/src/inbound/public-ingress-urls.ts +6 -4
  302. package/src/index.ts +4 -2
  303. package/src/influencer/client.ts +1104 -0
  304. package/src/instrument.ts +4 -3
  305. package/src/logfire.ts +4 -3
  306. package/src/memory/admin.ts +25 -35
  307. package/src/memory/attachments-store.ts +4 -7
  308. package/src/memory/channel-delivery-store.ts +30 -1
  309. package/src/memory/channel-guardian-store.ts +202 -2
  310. package/src/memory/clarification-resolver.ts +37 -33
  311. package/src/memory/conflict-store.ts +67 -61
  312. package/src/memory/contradiction-checker.ts +141 -117
  313. package/src/memory/conversation-store.ts +335 -51
  314. package/src/memory/db-connection.ts +27 -4
  315. package/src/memory/db-init.ts +265 -4
  316. package/src/memory/db.ts +14 -1
  317. package/src/memory/embedding-backend.ts +27 -5
  318. package/src/memory/embedding-ollama.ts +2 -1
  319. package/src/memory/entity-extractor.ts +38 -35
  320. package/src/memory/guardian-action-store.ts +430 -0
  321. package/src/memory/inbox-escalation-projection.ts +59 -0
  322. package/src/memory/inbox-thread-store.ts +218 -0
  323. package/src/memory/ingress-invite-store.ts +338 -0
  324. package/src/memory/ingress-member-store.ts +350 -0
  325. package/src/memory/items-extractor.ts +91 -97
  326. package/src/memory/job-handlers/index-maintenance.ts +3 -3
  327. package/src/memory/job-handlers/media-processing.ts +69 -0
  328. package/src/memory/job-handlers/summarization.ts +32 -26
  329. package/src/memory/job-utils.ts +3 -10
  330. package/src/memory/jobs-store.ts +8 -10
  331. package/src/memory/jobs-worker.ts +55 -36
  332. package/src/memory/media-store.ts +759 -0
  333. package/src/memory/migrations/001-job-deferrals.ts +45 -0
  334. package/src/memory/migrations/002-tool-invocations-fk.ts +43 -0
  335. package/src/memory/migrations/003-memory-fts-backfill.ts +24 -0
  336. package/src/memory/migrations/004-entity-relation-dedup.ts +87 -0
  337. package/src/memory/migrations/005-fingerprint-scope-unique.ts +80 -0
  338. package/src/memory/migrations/006-scope-salted-fingerprints.ts +62 -0
  339. package/src/memory/migrations/007-assistant-id-to-self.ts +254 -0
  340. package/src/memory/migrations/008-remove-assistant-id-columns.ts +208 -0
  341. package/src/memory/migrations/009-llm-usage-events-drop-assistant-id.ts +83 -0
  342. package/src/memory/migrations/010-ext-conv-bindings-channel-chat-unique.ts +56 -0
  343. package/src/memory/migrations/011-call-sessions-provider-sid-dedup.ts +63 -0
  344. package/src/memory/migrations/012-call-sessions-add-initiated-from.ts +19 -0
  345. package/src/memory/migrations/013-guardian-action-tables.ts +68 -0
  346. package/src/memory/migrations/014-backfill-inbox-thread-state.ts +76 -0
  347. package/src/memory/migrations/015-drop-active-search-index.ts +27 -0
  348. package/src/memory/migrations/016-memory-segments-indexes.ts +11 -0
  349. package/src/memory/migrations/017-memory-items-indexes.ts +10 -0
  350. package/src/memory/migrations/018-remaining-table-indexes.ts +13 -0
  351. package/src/memory/migrations/index.ts +24 -0
  352. package/src/memory/migrations/registry.ts +79 -0
  353. package/src/memory/migrations/validate-migration-state.ts +69 -0
  354. package/src/memory/qdrant-manager.ts +49 -8
  355. package/src/memory/query-builder.ts +1 -1
  356. package/src/memory/raw-query.ts +119 -0
  357. package/src/memory/recall-cache.ts +4 -1
  358. package/src/memory/retriever.ts +165 -47
  359. package/src/memory/schema-migration.ts +25 -984
  360. package/src/memory/schema.ts +228 -7
  361. package/src/memory/search/entity.ts +205 -31
  362. package/src/memory/search/lexical.ts +81 -52
  363. package/src/memory/search/ranking.ts +27 -23
  364. package/src/memory/search/semantic.ts +157 -19
  365. package/src/memory/search/types.ts +24 -0
  366. package/src/memory/shared-app-links-store.ts +4 -5
  367. package/src/memory/validation.ts +19 -0
  368. package/src/messaging/draft-store.ts +5 -6
  369. package/src/messaging/provider-types.ts +2 -0
  370. package/src/messaging/providers/sms/adapter.ts +201 -0
  371. package/src/messaging/providers/sms/client.ts +93 -0
  372. package/src/messaging/providers/sms/types.ts +7 -0
  373. package/src/messaging/providers/telegram-bot/adapter.ts +2 -5
  374. package/src/messaging/providers/whatsapp/adapter.ts +136 -0
  375. package/src/messaging/providers/whatsapp/client.ts +67 -0
  376. package/src/messaging/style-analyzer.ts +5 -4
  377. package/src/messaging/thread-summarizer.ts +61 -69
  378. package/src/messaging/triage-engine.ts +62 -71
  379. package/src/migrations/config-merge.ts +53 -0
  380. package/src/migrations/data-layout.ts +68 -0
  381. package/src/migrations/data-merge.ts +33 -0
  382. package/src/migrations/hooks-merge.ts +90 -0
  383. package/src/migrations/index.ts +6 -0
  384. package/src/migrations/log.ts +23 -0
  385. package/src/migrations/skills-merge.ts +33 -0
  386. package/src/migrations/workspace-layout.ts +79 -0
  387. package/src/permissions/checker.ts +133 -11
  388. package/src/permissions/prompter.ts +14 -0
  389. package/src/permissions/shell-identity.ts +31 -1
  390. package/src/permissions/trust-store.ts +21 -1
  391. package/src/providers/anthropic/client.ts +4 -4
  392. package/src/providers/failover.ts +2 -2
  393. package/src/providers/model-intents.ts +70 -0
  394. package/src/providers/ollama/client.ts +2 -1
  395. package/src/providers/provider-send-message.ts +176 -0
  396. package/src/providers/registry.ts +71 -30
  397. package/src/providers/retry.ts +35 -1
  398. package/src/providers/types.ts +12 -1
  399. package/src/runtime/approval-conversation-turn.ts +97 -0
  400. package/src/runtime/approval-message-composer.ts +253 -0
  401. package/src/runtime/channel-approval-parser.ts +36 -2
  402. package/src/runtime/channel-approvals.ts +11 -24
  403. package/src/runtime/channel-guardian-service.ts +88 -21
  404. package/src/runtime/channel-readiness-service.ts +418 -0
  405. package/src/runtime/channel-readiness-types.ts +35 -0
  406. package/src/runtime/channel-retry-sweep.ts +184 -0
  407. package/src/runtime/guardian-context-resolver.ts +108 -0
  408. package/src/runtime/http-server.ts +275 -717
  409. package/src/runtime/http-types.ts +59 -3
  410. package/src/runtime/middleware/auth.ts +116 -0
  411. package/src/runtime/middleware/error-handler.ts +33 -0
  412. package/src/runtime/middleware/twilio-validation.ts +127 -0
  413. package/src/runtime/routes/app-routes.ts +1 -1
  414. package/src/runtime/routes/call-routes.ts +51 -7
  415. package/src/runtime/routes/channel-delivery-routes.ts +170 -0
  416. package/src/runtime/routes/channel-guardian-routes.ts +1191 -0
  417. package/src/runtime/routes/channel-inbound-routes.ts +1152 -0
  418. package/src/runtime/routes/channel-route-shared.ts +144 -0
  419. package/src/runtime/routes/channel-routes.ts +32 -1588
  420. package/src/runtime/routes/conversation-routes.ts +50 -7
  421. package/src/runtime/routes/events-routes.ts +2 -2
  422. package/src/runtime/routes/identity-routes.ts +126 -0
  423. package/src/runtime/routes/pairing-routes.ts +143 -0
  424. package/src/runtime/routes/run-routes.ts +15 -1
  425. package/src/runtime/run-orchestrator.ts +86 -35
  426. package/src/schedule/schedule-store.ts +36 -32
  427. package/src/schedule/scheduler.ts +3 -3
  428. package/src/security/encrypted-store.ts +5 -7
  429. package/src/security/oauth2.ts +45 -15
  430. package/src/security/parental-control-store.ts +183 -0
  431. package/src/security/secret-allowlist.ts +4 -3
  432. package/src/security/secret-scanner.ts +5 -5
  433. package/src/security/secure-keys.ts +1 -1
  434. package/src/security/token-manager.ts +3 -2
  435. package/src/services/vercel-deploy.ts +6 -2
  436. package/src/skills/tool-manifest.ts +3 -3
  437. package/src/skills/vellum-catalog-remote.ts +75 -16
  438. package/src/slack/slack-webhook.ts +2 -1
  439. package/src/swarm/orchestrator.ts +92 -1
  440. package/src/swarm/router-planner.ts +6 -9
  441. package/src/swarm/worker-prompts.ts +9 -12
  442. package/src/tasks/task-compiler.ts +19 -28
  443. package/src/tasks/task-runner.ts +1 -1
  444. package/src/tools/assets/materialize.ts +2 -2
  445. package/src/tools/assets/search.ts +15 -14
  446. package/src/tools/browser/__tests__/auth-detector.test.ts +1 -0
  447. package/src/tools/browser/auto-navigate.ts +1 -0
  448. package/src/tools/browser/browser-execution.ts +10 -1
  449. package/src/tools/browser/browser-manager.ts +119 -4
  450. package/src/tools/browser/network-recorder.ts +5 -0
  451. package/src/tools/calls/call-start.ts +1 -0
  452. package/src/tools/credentials/broker.ts +11 -2
  453. package/src/tools/credentials/metadata-store.ts +18 -14
  454. package/src/tools/credentials/post-connect-hooks.ts +61 -0
  455. package/src/tools/credentials/vault.ts +49 -23
  456. package/src/tools/execution-target.ts +11 -1
  457. package/src/tools/executor.ts +68 -9
  458. package/src/tools/host-terminal/cli-discover.ts +1 -1
  459. package/src/tools/network/script-proxy/http-forwarder.ts +1 -1
  460. package/src/tools/network/script-proxy/mitm-handler.ts +1 -1
  461. package/src/tools/network/script-proxy/server.ts +1 -1
  462. package/src/tools/network/script-proxy/session-manager.ts +6 -5
  463. package/src/tools/network/web-fetch.ts +18 -2
  464. package/src/tools/network/web-search.ts +8 -4
  465. package/src/tools/reminder/reminder-store.ts +14 -15
  466. package/src/tools/schedule/create.ts +1 -0
  467. package/src/tools/schedule/list.ts +2 -1
  468. package/src/tools/shared/filesystem/file-ops-service.ts +5 -7
  469. package/src/tools/skills/skill-script-runner.ts +24 -9
  470. package/src/tools/skills/skill-tool-factory.ts +1 -0
  471. package/src/tools/tasks/work-item-enqueue.ts +2 -2
  472. package/src/tools/terminal/evaluate-typescript.ts +21 -12
  473. package/src/tools/terminal/parser.ts +50 -0
  474. package/src/tools/types.ts +2 -0
  475. package/src/tools/watcher/delete.ts +6 -0
  476. package/src/tools/weather/service.ts +1 -1
  477. package/src/twitter/client.ts +190 -24
  478. package/src/twitter/router.ts +1 -1
  479. package/src/twitter/session.ts +4 -3
  480. package/src/util/clipboard.ts +1 -1
  481. package/src/util/errors.ts +65 -8
  482. package/src/util/fs.ts +40 -0
  483. package/src/util/json.ts +10 -0
  484. package/src/util/log-redact.ts +189 -0
  485. package/src/util/logger.ts +19 -17
  486. package/src/util/object.ts +3 -0
  487. package/src/util/platform.ts +105 -363
  488. package/src/util/pricing.ts +1 -1
  489. package/src/util/promise-guard.ts +1 -1
  490. package/src/util/retry.ts +19 -0
  491. package/src/util/row-mapper.ts +79 -0
  492. package/src/util/silently.ts +21 -0
  493. package/src/watcher/engine.ts +5 -1
  494. package/src/watcher/provider-types.ts +20 -0
  495. package/src/watcher/providers/github.ts +156 -0
  496. package/src/watcher/providers/gmail.ts +1 -0
  497. package/src/watcher/providers/google-calendar.ts +1 -0
  498. package/src/watcher/providers/linear.ts +460 -0
  499. package/src/watcher/providers/slack.ts +1 -0
  500. package/src/work-items/work-item-runner.ts +1 -1
  501. package/src/workspace/git-service.ts +1 -1
  502. package/src/workspace/provider-commit-message-generator.ts +51 -22
  503. package/src/__tests__/call-bridge.test.ts +0 -517
  504. package/src/__tests__/session-process-bridge.test.ts +0 -244
  505. package/src/calls/call-bridge.ts +0 -168
  506. package/src/config/vellum-skills/google-oauth-setup/SKILL.md +0 -199
@@ -0,0 +1,857 @@
1
+ import { describe, expect, mock, test, beforeEach } from 'bun:test';
2
+ import type { Message, ContentBlock } from '../providers/types.js';
3
+ import type { AgentEvent, CheckpointDecision, CheckpointInfo } from '../agent/loop.js';
4
+ import type { ServerMessage } from '../daemon/ipc-protocol.js';
5
+
6
+ // ── Module mocks (must precede imports of the module under test) ─────
7
+
8
/** Do-nothing stand-in for mocked functions whose side effects these tests never inspect. */
function noop(): void {}

/** Returns its first argument unchanged; used for mocked transforms that must leave their input alone. */
function passThrough<T>(value: T): T {
  return value;
}

/** Produces a fresh "recall disabled, nothing injected" result on every call. */
function disabledRecall() {
  return {
    enabled: false,
    degraded: false,
    injectedText: '',
    lexicalHits: 0,
    semanticHits: 0,
    recencyHits: 0,
    injectedTokens: 0,
    latencyMs: 0,
  };
}

// Logger: reading any property yields a callable that does nothing.
mock.module('../util/logger.js', () => {
  const silentLogger = () => new Proxy({} as Record<string, unknown>, { get: () => noop });
  return { getLogger: silentLogger };
});

// Platform paths point at throwaway /tmp locations.
mock.module('../util/platform.js', () => ({
  getDataDir: () => '/tmp',
  getSocketPath: () => '/tmp/test.sock',
}));

// Config: a fixed configuration object, rebuilt on each getConfig() call.
mock.module('../config/loader.js', () => {
  const buildConfig = () => ({
    provider: 'mock-provider',
    maxTokens: 4096,
    thinking: false,
    contextWindow: {
      maxInputTokens: 100000,
      thresholdTokens: 80000,
      preserveRecentMessages: 6,
      summaryModel: 'mock-model',
      maxSummaryTokens: 512,
    },
    rateLimit: { maxRequestsPerMinute: 0, maxTokensPerSession: 0 },
    apiKeys: {},
    workspaceGit: { turnCommitMaxWaitMs: 10 },
  });

  return {
    getConfig: buildConfig,
    loadRawConfig: () => ({}),
    saveRawConfig: noop,
    invalidateConfigCache: noop,
  };
});

// Toggles read by the hook-manager mock below; tests flip them to simulate a
// pre-message hook that blocks the turn.
let hookBlocked = false;
let hookBlockedBy = '';

mock.module('../hooks/manager.js', () => ({
  getHookManager: () => ({
    // Only the 'pre-message' hook can report a block, and only while the flag is set.
    trigger: async (hookName: string) =>
      hookName === 'pre-message' && hookBlocked
        ? { blocked: true, blockedBy: hookBlockedBy }
        : { blocked: false },
  }),
}));

mock.module('../memory/conversation-store.js', () => ({
  addMessage: () => ({ id: 'mock-msg-id' }),
  deleteMessageById: noop,
  updateConversationContextWindow: noop,
  updateConversationTitle: noop,
  getConversationOriginChannel: () => null,
}));

mock.module('../memory/retriever.js', () => ({
  buildMemoryRecall: async () => disabledRecall(),
  injectMemoryRecallIntoUserMessage: passThrough,
  stripMemoryRecallMessages: passThrough,
}));

mock.module('../memory/app-store.js', () => ({
  getApp: () => null,
  listAppFiles: () => [],
  getAppsDir: () => '/tmp/apps',
}));

mock.module('../memory/app-git-service.js', () => ({
  commitAppTurnChanges: async () => {},
}));

mock.module('../daemon/session-memory.js', () => ({
  prepareMemoryContext: async (_ctx: unknown, _content: string, _id: string, _signal: AbortSignal) => {
    const recall = disabledRecall();
    return {
      runMessages: [],
      recall,
      dynamicProfile: { text: '' },
      softConflictInstruction: null,
      recallInjectionStrategy: 'prepend_user_block' as const,
      conflictClarification: null,
    };
  },
}));

mock.module('../daemon/session-runtime-assembly.js', () => ({
  applyRuntimeInjections: passThrough,
  stripInjectedContext: passThrough,
}));

mock.module('../daemon/session-dynamic-profile.js', () => ({
  stripDynamicProfileMessages: passThrough,
  injectDynamicProfileIntoUserMessage: passThrough,
}));

mock.module('../daemon/date-context.js', () => ({
  buildTemporalContext: () => null,
}));

// History repair hands the messages back as-is, with zeroed (or empty) stats.
mock.module('../daemon/history-repair.js', () => ({
  repairHistory: (msgs: Message[]) => {
    const stats = {
      assistantToolResultsMigrated: 0,
      missingToolResultsInserted: 0,
      orphanToolResultsDowngraded: 0,
      consecutiveSameRoleMerged: 0,
    };
    return { messages: msgs, stats };
  },
  deepRepairHistory: (msgs: Message[]) => ({ messages: msgs, stats: {} }),
}));

mock.module('../daemon/session-history.js', () => ({
  consolidateAssistantMessages: noop,
}));

mock.module('../daemon/session-usage.js', () => ({
  recordUsage: noop,
}));

mock.module('../daemon/session-attachments.js', () => ({
  resolveAssistantAttachments: async () => ({
    assistantAttachments: [],
    emittedAttachments: [],
    directiveWarnings: [],
  }),
  approveHostAttachmentRead: async () => true,
  formatAttachmentWarnings: () => '',
}));

mock.module('../daemon/assistant-attachments.js', () => ({
  cleanAssistantContent: (content: unknown[]) => ({
    cleanedContent: content,
    directives: [],
    warnings: [],
  }),
  // The whole buffer is emitted immediately; nothing is held back.
  drainDirectiveDisplayBuffer: (buffer: string) => ({
    emitText: buffer,
    bufferedRemainder: '',
  }),
}));

mock.module('../daemon/session-media-retry.js', () => ({
  stripMediaPayloadsForRetry: (msgs: Message[]) => ({
    messages: msgs,
    modified: false,
    replacedBlocks: 0,
    latestUserIndex: null,
  }),
  raceWithTimeout: async () => 'completed' as const,
}));

mock.module('../workspace/turn-commit.js', () => ({
  commitTurnChanges: () => Promise.resolve(),
}));

mock.module('../workspace/git-service.js', () => ({
  getWorkspaceGitService: () => ({
    ensureInitialized: async () => {},
  }),
}));

mock.module('../daemon/session-error.js', () => ({
  // Every error is classified the same way, whatever the input.
  classifySessionError: (_err: unknown, _ctx: unknown) => ({
    code: 'SESSION_PROCESSING_FAILED',
    userMessage: 'Something went wrong processing your message.',
    retryable: false,
  }),
  // Counts as a cancellation only when the context is flagged aborted AND the
  // error is a DOMException/Error named 'AbortError'.
  isUserCancellation: (err: unknown, ctx: { aborted?: boolean }) =>
    Boolean(ctx.aborted) &&
    (err instanceof DOMException || err instanceof Error) &&
    err.name === 'AbortError',
  buildSessionErrorMessage: (sessionId: string, classified: Record<string, unknown>) => ({
    type: 'session_error',
    sessionId,
    ...classified,
  }),
  isContextTooLarge: (msg: string) => /context.?length.?exceeded/i.test(msg),
}));

mock.module('../daemon/session-slash.js', () => ({
  isProviderOrderingError: (msg: string) => /ordering|before.*after|messages.*order/i.test(msg),
}));

mock.module('../util/truncate.js', () => ({
  truncate: passThrough,
}));

mock.module('../agent/message-types.js', () => ({
  createAssistantMessage: (text: string) => {
    const content = [{ type: 'text', text }];
    return { role: 'assistant' as const, content };
  },
}));

mock.module('../memory/llm-request-log-store.js', () => ({
  recordRequestLog: noop,
}));
203
+
204
+ // ── Imports (after mocks) ────────────────────────────────────────────
205
+
206
+ import { runAgentLoopImpl, type AgentLoopSessionContext } from '../daemon/session-agent-loop.js';
207
+
208
+ // ── Test helpers ─────────────────────────────────────────────────────
209
+
210
/**
 * Call signature of the stubbed `agentLoop.run` used by these tests: it
 * receives the message history and an event sink (plus an optional abort
 * signal, request id and checkpoint callback) and resolves to the resulting
 * message history.
 */
type AgentLoopRun = {
  (
    messages: Message[],
    onEvent: (event: AgentEvent) => void,
    signal?: AbortSignal,
    requestId?: string,
    onCheckpoint?: (checkpoint: CheckpointInfo) => CheckpointDecision,
  ): Promise<Message[]>;
};
217
+
218
/**
 * Builds a fully-populated session context for exercising `runAgentLoopImpl`.
 *
 * Every collaborator is an inert stub (no-op emitters, a provider that answers
 * "title", a context-window manager that never compacts), so a test only has
 * to override the pieces it cares about.
 *
 * @param overrides - Context fields to replace. The extra `agentLoopRun` key is
 *   a test-only convenience: it becomes `agentLoop.run` and is NOT copied onto
 *   the returned context. When omitted, the loop appends a single assistant
 *   text message ("response") to the messages it was given.
 * @returns The assembled context, with the remaining overrides applied last.
 */
function makeCtx(overrides?: Partial<AgentLoopSessionContext> & { agentLoopRun?: AgentLoopRun }): AgentLoopSessionContext {
  // Separate the helper-only `agentLoopRun` key from genuine context fields so
  // it is wired into `agentLoop.run` without leaking onto the context object.
  const provided: Partial<AgentLoopSessionContext> & { agentLoopRun?: AgentLoopRun } = overrides ?? {};
  const { agentLoopRun: runOverride, ...contextOverrides } = provided;

  const agentLoopRun = runOverride ?? (async (messages: Message[]) => [
    ...messages,
    { role: 'assistant' as const, content: [{ type: 'text' as const, text: 'response' }] },
  ]);

  return {
    conversationId: 'test-conv',
    messages: [
      { role: 'user', content: [{ type: 'text', text: 'Hello' }] },
    ] as Message[],
    processing: true,
    abortController: new AbortController(),
    currentRequestId: 'test-req',

    agentLoop: {
      run: agentLoopRun,
    } as unknown as AgentLoopSessionContext['agentLoop'],
    provider: {
      name: 'mock-provider',
      sendMessage: async () => ({
        content: [{ type: 'text', text: 'title' }],
        model: 'mock',
        usage: { inputTokens: 0, outputTokens: 0 },
        stopReason: 'end_turn',
      }),
    } as unknown as AgentLoopSessionContext['provider'],
    systemPrompt: 'system prompt',

    contextWindowManager: {
      maybeCompact: async () => ({ compacted: false }),
    } as unknown as AgentLoopSessionContext['contextWindowManager'],
    contextCompactedMessageCount: 0,
    contextCompactedAt: null,

    conflictGate: { evaluate: async () => null } as unknown as AgentLoopSessionContext['conflictGate'],
    memoryPolicy: { scopeId: 'default', includeDefaultFallback: true },

    currentActiveSurfaceId: undefined,
    currentPage: undefined,
    surfaceState: new Map(),
    pendingSurfaceActions: new Map(),
    currentTurnSurfaces: [],

    workingDir: '/tmp',
    workspaceTopLevelContext: null,
    workspaceTopLevelDirty: false,
    channelCapabilities: undefined,
    commandIntent: undefined,
    guardianContext: undefined,

    coreToolNames: new Set(),
    allowedToolNames: undefined,
    preactivatedSkillIds: undefined,
    skillProjectionState: new Map(),
    skillProjectionCache: new Map() as unknown as AgentLoopSessionContext['skillProjectionCache'],

    traceEmitter: {
      emit: () => {},
    } as unknown as AgentLoopSessionContext['traceEmitter'],
    profiler: {
      startRequest: () => {},
      emitSummary: () => {},
    } as unknown as AgentLoopSessionContext['profiler'],
    usageStats: { totalInputTokens: 0, totalOutputTokens: 0, totalEstimatedCost: 0, model: '' },
    turnCount: 0,

    lastAssistantAttachments: [],
    lastAttachmentWarnings: [],

    hasNoClient: false,
    prompter: {} as unknown as AgentLoopSessionContext['prompter'],
    queue: {} as unknown as AgentLoopSessionContext['queue'],

    getWorkspaceGitService: () => ({ ensureInitialized: async () => {} }),
    commitTurnChanges: async () => {},

    refreshWorkspaceTopLevelContextIfNeeded: () => {},
    markWorkspaceTopLevelDirty: () => {},
    getQueueDepth: () => 0,
    hasQueuedMessages: () => false,
    canHandoffAtCheckpoint: () => false,
    drainQueue: () => {},
    getTurnChannelContext: () => ({
      userMessageChannel: 'macos' as const,
      assistantMessageChannel: 'macos' as const,
    }),

    // Applied last so any real context field supplied by the test wins.
    ...contextOverrides,
  } as AgentLoopSessionContext;
}
309
+
310
+
311
+ // ── Tests ────────────────────────────────────────────────────────────
312
+
313
// Start every test with the mocked pre-message hook letting messages through.
beforeEach(function resetHookState() {
  hookBlockedBy = '';
  hookBlocked = false;
});
317
+
318
+ describe('session-agent-loop', () => {
319
+
320
describe('pre-flight checks', () => {
  // The loop must reject when the context has no abort controller.
  test('throws if called without an abortController', async () => {
    const session = makeCtx({ abortController: null });

    const pending = runAgentLoopImpl(session, 'hello', 'msg-1', () => {});

    await expect(pending).rejects.toThrow('runAgentLoop called without prior persistUserMessage');
  });
});
329
+
330
describe('pre-message hook blocking', () => {
  /** Arms the mocked hook manager so the next 'pre-message' trigger reports a block by `hookName`. */
  const blockWith = (hookName: string): void => {
    hookBlocked = true;
    hookBlockedBy = hookName;
  };

  test('emits error and returns early when pre-message hook blocks', async () => {
    blockWith('test-hook');
    const collected: ServerMessage[] = [];
    const session = makeCtx();

    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    // The emitted error must name the hook that blocked the message.
    const blockedNotice = collected.find((entry) => entry.type === 'error');
    expect(blockedNotice).toBeDefined();
    expect((blockedNotice as { message: string }).message).toContain('test-hook');
  });

  test('removes user message when hook blocks without skipPreMessageRollback', async () => {
    blockWith('guard');
    const session = makeCtx();
    const countBefore = session.messages.length;

    await runAgentLoopImpl(session, 'hello', 'msg-1', () => {});

    expect(session.messages).toHaveLength(countBefore - 1);
  });

  test('keeps user message when hook blocks with skipPreMessageRollback', async () => {
    blockWith('guard');
    const session = makeCtx();
    const countBefore = session.messages.length;
    const options = { skipPreMessageRollback: true };

    await runAgentLoopImpl(session, 'hello', 'msg-1', () => {}, options);

    expect(session.messages).toHaveLength(countBefore);
  });
});
366
+
367
describe('tool execution errors via agent loop', () => {
  /** True when at least one collected server message carries the given `type`. */
  const sawEvent = (collected: ServerMessage[], type: string): boolean =>
    collected.some((entry) => entry.type === type);

  test('error events from agent loop are classified and emitted', async () => {
    const collected: ServerMessage[] = [];
    const replyText = 'I encountered an error';

    // Scripted turn: a bash tool call, an error event raised during execution,
    // then the assistant's closing message and usage accounting.
    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({ type: 'tool_use', id: 'tu-1', name: 'bash', input: { cmd: 'ls' } });
      emit({ type: 'error', error: new Error('Tool execution failed: permission denied') });
      emit({
        type: 'message_complete',
        message: { role: 'assistant', content: [{ type: 'text', text: replyText }] },
      });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 50, model: 'test-model', providerDurationMs: 200 });
      return [
        ...history,
        { role: 'assistant' as const, content: [{ type: 'text', text: replyText }] as ContentBlock[] },
      ];
    };

    const session = makeCtx({ agentLoopRun });
    await runAgentLoopImpl(session, 'run ls', 'msg-1', (msg) => collected.push(msg));

    expect(sawEvent(collected, 'session_error')).toBe(true);
  });

  test('non-error agent loop completion does not emit session_error', async () => {
    const collected: ServerMessage[] = [];
    const replyText = 'All good';

    // Scripted turn with no error event at all.
    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({
        type: 'message_complete',
        message: { role: 'assistant', content: [{ type: 'text', text: replyText }] },
      });
      emit({ type: 'usage', inputTokens: 50, outputTokens: 25, model: 'test-model', providerDurationMs: 100 });
      return [
        ...history,
        { role: 'assistant' as const, content: [{ type: 'text', text: replyText }] as ContentBlock[] },
      ];
    };

    const session = makeCtx({ agentLoopRun });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(sawEvent(collected, 'session_error')).toBe(false);
    expect(sawEvent(collected, 'message_complete')).toBe(true);
  });
});
426
+
427
describe('context window exhaustion (context-too-large recovery)', () => {
  test('triggers forced compaction when context-too-large is detected', async () => {
    const collected: ServerMessage[] = [];
    let runs = 0;
    let forcedCompactionSeen = false;

    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      runs += 1;
      if (runs !== 1) {
        // Any run after the first (i.e. post-compaction) succeeds.
        emit({
          type: 'message_complete',
          message: { role: 'assistant', content: [{ type: 'text', text: 'recovered' }] },
        });
        emit({ type: 'usage', inputTokens: 50, outputTokens: 25, model: 'test-model', providerDurationMs: 100 });
        return [
          ...history,
          { role: 'assistant' as const, content: [{ type: 'text', text: 'recovered' }] as ContentBlock[] },
        ];
      }
      // First run: report a context-length error and hand the history back
      // unchanged, so no progress was made.
      emit({ type: 'error', error: new Error('context_length_exceeded') });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 0, model: 'test-model', providerDurationMs: 50 });
      return history;
    };

    // Compacts only when explicitly forced, and records that it was asked to.
    const maybeCompact = async (_msgs: Message[], _signal: AbortSignal, opts?: { force?: boolean }) => {
      if (!opts?.force) {
        return { compacted: false };
      }
      forcedCompactionSeen = true;
      return {
        compacted: true,
        messages: [{ role: 'user', content: [{ type: 'text', text: 'Hello' }] }] as Message[],
        compactedPersistedMessages: 5,
        summaryText: 'Summary of prior conversation',
        previousEstimatedInputTokens: 90000,
        estimatedInputTokens: 30000,
        maxInputTokens: 100000,
        thresholdTokens: 80000,
        compactedMessages: 10,
        summaryCalls: 1,
        summaryInputTokens: 500,
        summaryOutputTokens: 200,
        summaryModel: 'mock-model',
      };
    };

    const session = makeCtx({
      agentLoopRun,
      contextWindowManager: { maybeCompact } as unknown as AgentLoopSessionContext['contextWindowManager'],
    });

    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(forcedCompactionSeen).toBe(true);
    expect(runs).toBe(2);
    expect(collected.some((entry) => entry.type === 'context_compacted')).toBe(true);
  });

  test('emits session_error when context stays too large after all recovery attempts', async () => {
    const collected: ServerMessage[] = [];

    // Every run fails with the same context-length error.
    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({ type: 'error', error: new Error('context_length_exceeded') });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 0, model: 'test-model', providerDurationMs: 50 });
      return history;
    };

    // Compaction always "succeeds", yet the loop above keeps reporting the
    // context as too large.
    const maybeCompact = async () => ({
      compacted: true,
      messages: [{ role: 'user', content: [{ type: 'text', text: 'Hello' }] }] as Message[],
      compactedPersistedMessages: 5,
      summaryText: 'Summary',
      previousEstimatedInputTokens: 90000,
      estimatedInputTokens: 85000,
      maxInputTokens: 100000,
      thresholdTokens: 80000,
      compactedMessages: 2,
      summaryCalls: 1,
      summaryInputTokens: 500,
      summaryOutputTokens: 200,
      summaryModel: 'mock-model',
    });

    const session = makeCtx({
      agentLoopRun,
      contextWindowManager: { maybeCompact } as unknown as AgentLoopSessionContext['contextWindowManager'],
    });

    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(collected.some((entry) => entry.type === 'session_error')).toBe(true);
  });
});
531
+
532
describe('provider ordering error retry', () => {
  test('retries with deep repair when ordering error is detected', async () => {
    const collected: ServerMessage[] = [];
    let runs = 0;

    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      runs += 1;
      if (runs !== 1) {
        // The retry goes through cleanly.
        emit({
          type: 'message_complete',
          message: { role: 'assistant', content: [{ type: 'text', text: 'fixed' }] },
        });
        emit({ type: 'usage', inputTokens: 50, outputTokens: 25, model: 'test-model', providerDurationMs: 100 });
        return [
          ...history,
          { role: 'assistant' as const, content: [{ type: 'text', text: 'fixed' }] as ContentBlock[] },
        ];
      }
      // First attempt: report an ordering error and return the history untouched.
      emit({ type: 'error', error: new Error('messages ordering error') });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 0, model: 'test-model', providerDurationMs: 50 });
      return history;
    };

    const session = makeCtx({ agentLoopRun });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    // Exactly one retry: the loop ran twice in total.
    expect(runs).toBe(2);
  });

  test('emits deferred ordering error when retry also fails', async () => {
    const collected: ServerMessage[] = [];

    // Every attempt reports the same ordering error.
    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({ type: 'error', error: new Error('messages ordering error') });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 0, model: 'test-model', providerDurationMs: 50 });
      return history;
    };

    const session = makeCtx({ agentLoopRun });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(collected.some((entry) => entry.type === 'session_error')).toBe(true);
  });
});
584
+
585
describe('checkpoint handoff (infinite loop prevention)', () => {
  /**
   * Builds a scripted loop for a single-tool turn: it emits the tool call and
   * its result, the assistant message and usage, invokes the checkpoint
   * callback once (when one is supplied), and resolves with the history plus
   * the assistant reply.
   */
  const singleToolTurn = (toolName: string, toolOutput: string, replyText: string): AgentLoopRun =>
    async (history, emit, _signal, _requestId, onCheckpoint) => {
      emit({ type: 'tool_use', id: 'tu-1', name: toolName, input: {} });
      emit({ type: 'tool_result', toolUseId: 'tu-1', content: toolOutput, isError: false });
      emit({
        type: 'message_complete',
        message: { role: 'assistant', content: [{ type: 'text', text: replyText }] },
      });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 50, model: 'test-model', providerDurationMs: 100 });
      // The scripted loop returns the same history whatever the decision is.
      onCheckpoint?.({ turnIndex: 0, toolCount: 1, hasToolUse: true });
      return [
        ...history,
        { role: 'assistant' as const, content: [{ type: 'text', text: replyText }] as ContentBlock[] },
      ];
    };

  /** Runs one turn with the given loop and handoff availability, returning every emitted server message. */
  const runTurn = async (agentLoopRun: AgentLoopRun, handoffAvailable: boolean): Promise<ServerMessage[]> => {
    const collected: ServerMessage[] = [];
    const session = makeCtx({
      agentLoopRun,
      canHandoffAtCheckpoint: () => handoffAvailable,
    } as unknown as Partial<AgentLoopSessionContext>);

    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));
    return collected;
  };

  const sawEvent = (collected: ServerMessage[], type: string): boolean =>
    collected.some((entry) => entry.type === type);

  test('yields at checkpoint when canHandoffAtCheckpoint returns true', async () => {
    const collected = await runTurn(singleToolTurn('file_read', 'file content', 'partial'), true);

    expect(sawEvent(collected, 'generation_handoff')).toBe(true);
  });

  test('continues when canHandoffAtCheckpoint returns false', async () => {
    const collected = await runTurn(singleToolTurn('file_read', 'content', 'done'), false);

    expect(sawEvent(collected, 'generation_handoff')).toBe(false);
    expect(sawEvent(collected, 'message_complete')).toBe(true);
  });

  test('does not yield during browser flow even when handoff is available', async () => {
    // The only tool used in this turn is browser_-prefixed.
    const collected = await runTurn(singleToolTurn('browser_navigate', 'navigated', 'browsing'), true);

    // Browser flows should NOT yield
    expect(sawEvent(collected, 'generation_handoff')).toBe(false);
  });
});
705
+
706
describe('user cancellation', () => {
  const sawEvent = (collected: ServerMessage[], type: string): boolean =>
    collected.some((entry) => entry.type === type);

  test('emits generation_cancelled when abort signal fires', async () => {
    const collected: ServerMessage[] = [];
    const controller = new AbortController();

    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({
        type: 'message_complete',
        message: { role: 'assistant', content: [{ type: 'text', text: 'partial' }] },
      });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 50, model: 'test-model', providerDurationMs: 100 });
      // The abort fires after the events above, right before the loop returns.
      controller.abort();
      return [
        ...history,
        { role: 'assistant' as const, content: [{ type: 'text', text: 'partial' }] as ContentBlock[] },
      ];
    };

    const session = makeCtx({ agentLoopRun, abortController: controller });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(sawEvent(collected, 'generation_cancelled')).toBe(true);
  });

  test('handles AbortError thrown from agent loop as user cancellation', async () => {
    const collected: ServerMessage[] = [];
    const controller = new AbortController();

    // Abort first, then fail the run with an AbortError-named DOMException.
    const agentLoopRun: AgentLoopRun = async () => {
      controller.abort();
      throw new DOMException('The operation was aborted', 'AbortError');
    };

    const session = makeCtx({ agentLoopRun, abortController: controller });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    expect(sawEvent(collected, 'generation_cancelled')).toBe(true);
    // Should NOT emit a session_error for user cancellation
    expect(sawEvent(collected, 'session_error')).toBe(false);
  });
});
752
+
753
describe('finally block cleanup', () => {
  /** Scripted loop that completes normally with a single assistant text reply. */
  const replyingWith = (replyText: string): AgentLoopRun =>
    async (history, emit) => {
      emit({
        type: 'message_complete',
        message: { role: 'assistant', content: [{ type: 'text', text: replyText }] },
      });
      emit({ type: 'usage', inputTokens: 10, outputTokens: 5, model: 'test', providerDurationMs: 50 });
      return [
        ...history,
        { role: 'assistant' as const, content: [{ type: 'text', text: replyText }] as ContentBlock[] },
      ];
    };

  test('increments turnCount after successful run', async () => {
    const session = makeCtx({ agentLoopRun: replyingWith('hi') });
    expect(session.turnCount).toBe(0);

    await runAgentLoopImpl(session, 'hi', 'msg-1', () => {});

    expect(session.turnCount).toBe(1);
  });

  test('clears processing state and abort controller', async () => {
    const session = makeCtx({ agentLoopRun: replyingWith('hi') });

    await runAgentLoopImpl(session, 'hi', 'msg-1', () => {});

    expect(session.processing).toBe(false);
    expect(session.abortController).toBeNull();
    expect(session.currentRequestId).toBeUndefined();
    expect(session.commandIntent).toBeUndefined();
  });

  test('clears state even when agent loop throws', async () => {
    const crashingLoop = async (): Promise<never> => {
      throw new Error('unexpected crash');
    };
    const session = makeCtx({ agentLoopRun: crashingLoop });

    await runAgentLoopImpl(session, 'hi', 'msg-1', () => {});

    expect(session.processing).toBe(false);
    expect(session.abortController).toBeNull();
  });

  test('drains queue after completion', async () => {
    // Every reason passed to drainQueue, in call order; the last one is checked.
    const drainReasons: string[] = [];
    const session = makeCtx({
      agentLoopRun: replyingWith('ok'),
      drainQueue: (reason: string) => { drainReasons.push(reason); },
    } as unknown as Partial<AgentLoopSessionContext>);

    await runAgentLoopImpl(session, 'hi', 'msg-1', () => {});

    expect(drainReasons[drainReasons.length - 1]).toBe('loop_complete');
  });
});
833
+
834
describe('error-only response with no assistant text', () => {
  test('synthesizes error assistant message when provider returns no response', async () => {
    const collected: ServerMessage[] = [];

    // The error text matches neither the ordering nor the context-too-large
    // pattern, and the history comes back with no assistant message appended.
    const agentLoopRun: AgentLoopRun = async (history, emit) => {
      emit({ type: 'error', error: new Error('Internal processing failure') });
      emit({ type: 'usage', inputTokens: 100, outputTokens: 0, model: 'test-model', providerDurationMs: 50 });
      return history;
    };

    const session = makeCtx({ agentLoopRun });
    await runAgentLoopImpl(session, 'hello', 'msg-1', (msg) => collected.push(msg));

    // The providerErrorUserMessage should trigger a synthesized assistant_text_delta
    const deltaCount = collected.reduce(
      (count, entry) => (entry.type === 'assistant_text_delta' ? count + 1 : count),
      0,
    );
    expect(deltaCount).toBeGreaterThanOrEqual(1);
  });
});
857
+ });