@build-astron-co/nimbus 0.4.1 → 0.4.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (435)
  1. package/CHANGELOG.md +268 -89
  2. package/README.md +26 -567
  3. package/dist/src/agent/compaction-agent.js +24 -12
  4. package/dist/src/agent/context-manager.js +2 -1
  5. package/dist/src/agent/expand-files.js +2 -1
  6. package/dist/src/agent/loop.js +71 -33
  7. package/dist/src/agent/permissions.js +4 -2
  8. package/dist/src/agent/system-prompt.js +34 -17
  9. package/dist/src/app.js +1 -1
  10. package/dist/src/auth/keychain.js +8 -4
  11. package/dist/src/auth/store.js +70 -107
  12. package/dist/src/cli/init.js +35 -19
  13. package/dist/src/cli/run.js +18 -10
  14. package/dist/src/cli/serve.js +4 -2
  15. package/dist/src/cli.js +52 -11
  16. package/dist/src/commands/alias.js +5 -3
  17. package/dist/src/commands/audit/index.js +2 -1
  18. package/dist/src/commands/aws-terraform.js +36 -18
  19. package/dist/src/commands/completions.js +1 -1
  20. package/dist/src/commands/config.js +3 -2
  21. package/dist/src/commands/connect-github.js +92 -0
  22. package/dist/src/commands/cost/index.js +3 -2
  23. package/dist/src/commands/deploy.js +15 -10
  24. package/dist/src/commands/doctor.js +9 -6
  25. package/dist/src/commands/drift/index.js +2 -1
  26. package/dist/src/commands/export.js +5 -3
  27. package/dist/src/commands/generate-terraform.js +110 -2
  28. package/dist/src/commands/import.js +3 -3
  29. package/dist/src/commands/incident.js +10 -5
  30. package/dist/src/commands/login.js +8 -93
  31. package/dist/src/commands/logs.js +16 -8
  32. package/dist/src/commands/onboarding.js +6 -4
  33. package/dist/src/commands/pipeline.js +6 -3
  34. package/dist/src/commands/plugin.js +3 -2
  35. package/dist/src/commands/profile.js +27 -14
  36. package/dist/src/commands/questionnaire.js +1 -1
  37. package/dist/src/commands/rollback.js +3 -2
  38. package/dist/src/commands/rollout.js +5 -3
  39. package/dist/src/commands/runbook.js +17 -10
  40. package/dist/src/commands/schedule.js +10 -5
  41. package/dist/src/commands/status.js +2 -1
  42. package/dist/src/commands/team-context.js +12 -7
  43. package/dist/src/commands/template.js +1 -1
  44. package/dist/src/commands/tf/index.js +6 -3
  45. package/dist/src/commands/upgrade.js +5 -3
  46. package/dist/src/commands/version.js +6 -3
  47. package/dist/src/commands/watch.js +6 -3
  48. package/dist/src/compat/sqlite.js +5 -3
  49. package/dist/src/config/mode-store.js +2 -1
  50. package/dist/src/config/profiles.js +4 -2
  51. package/dist/src/config/types.js +2 -1
  52. package/dist/src/engine/executor.js +8 -4
  53. package/dist/src/engine/planner.js +9 -5
  54. package/dist/src/llm/providers/anthropic.js +6 -3
  55. package/dist/src/llm/providers/ollama.js +1 -1
  56. package/dist/src/llm/router.js +22 -7
  57. package/dist/src/nimbus.js +1 -0
  58. package/dist/src/sessions/manager.js +6 -3
  59. package/dist/src/sharing/viewer.js +2 -1
  60. package/dist/src/tools/file-ops.js +1 -2
  61. package/dist/src/tools/schemas/devops.js +197 -108
  62. package/dist/src/tools/schemas/standard.js +1 -1
  63. package/dist/src/ui/App.js +25 -13
  64. package/dist/src/ui/FileDiffModal.js +22 -11
  65. package/dist/src/ui/HelpModal.js +2 -1
  66. package/dist/src/ui/InputBox.js +6 -3
  67. package/dist/src/ui/MessageList.js +40 -20
  68. package/dist/src/ui/TerminalPane.js +2 -1
  69. package/dist/src/ui/ToolCallDisplay.js +12 -6
  70. package/dist/src/ui/TreePane.js +2 -1
  71. package/dist/src/ui/ink/index.js +37 -21
  72. package/dist/src/version.js +1 -1
  73. package/dist/src/watcher/index.js +8 -4
  74. package/package.json +3 -5
  75. package/src/__tests__/alias.test.ts +0 -133
  76. package/src/__tests__/app.test.ts +0 -76
  77. package/src/__tests__/audit.test.ts +0 -877
  78. package/src/__tests__/circuit-breaker.test.ts +0 -116
  79. package/src/__tests__/cli-run.test.ts +0 -351
  80. package/src/__tests__/compat-sqlite.test.ts +0 -68
  81. package/src/__tests__/context-manager.test.ts +0 -632
  82. package/src/__tests__/context.test.ts +0 -242
  83. package/src/__tests__/devops-terminal-gaps.test.ts +0 -718
  84. package/src/__tests__/doctor.test.ts +0 -48
  85. package/src/__tests__/enterprise.test.ts +0 -401
  86. package/src/__tests__/export.test.ts +0 -236
  87. package/src/__tests__/gap-11-18-20.test.ts +0 -958
  88. package/src/__tests__/generator.test.ts +0 -433
  89. package/src/__tests__/helm-streaming.test.ts +0 -127
  90. package/src/__tests__/hooks.test.ts +0 -582
  91. package/src/__tests__/incident.test.ts +0 -179
  92. package/src/__tests__/init.test.ts +0 -487
  93. package/src/__tests__/intent-parser.test.ts +0 -229
  94. package/src/__tests__/llm-router.test.ts +0 -209
  95. package/src/__tests__/logs.test.ts +0 -107
  96. package/src/__tests__/loop-errors.test.ts +0 -244
  97. package/src/__tests__/lsp.test.ts +0 -293
  98. package/src/__tests__/modes.test.ts +0 -336
  99. package/src/__tests__/perf-optimizations.test.ts +0 -847
  100. package/src/__tests__/permissions.test.ts +0 -338
  101. package/src/__tests__/pipeline.test.ts +0 -50
  102. package/src/__tests__/polish-phase3.test.ts +0 -340
  103. package/src/__tests__/profile.test.ts +0 -237
  104. package/src/__tests__/rollback.test.ts +0 -83
  105. package/src/__tests__/runbook.test.ts +0 -219
  106. package/src/__tests__/schedule.test.ts +0 -206
  107. package/src/__tests__/serve.test.ts +0 -275
  108. package/src/__tests__/sessions.test.ts +0 -322
  109. package/src/__tests__/sharing.test.ts +0 -340
  110. package/src/__tests__/snapshots.test.ts +0 -581
  111. package/src/__tests__/standalone-migration.test.ts +0 -199
  112. package/src/__tests__/state-db.test.ts +0 -334
  113. package/src/__tests__/status.test.ts +0 -158
  114. package/src/__tests__/stream-with-tools.test.ts +0 -778
  115. package/src/__tests__/subagents.test.ts +0 -176
  116. package/src/__tests__/system-prompt.test.ts +0 -248
  117. package/src/__tests__/terminal-gap-v2.test.ts +0 -395
  118. package/src/__tests__/terminal-parity.test.ts +0 -393
  119. package/src/__tests__/tf-apply.test.ts +0 -187
  120. package/src/__tests__/tool-converter.test.ts +0 -256
  121. package/src/__tests__/tool-schemas.test.ts +0 -602
  122. package/src/__tests__/tools.test.ts +0 -144
  123. package/src/__tests__/version-json.test.ts +0 -184
  124. package/src/__tests__/version.test.ts +0 -49
  125. package/src/__tests__/watch.test.ts +0 -129
  126. package/src/agent/compaction-agent.ts +0 -266
  127. package/src/agent/context-manager.ts +0 -499
  128. package/src/agent/context.ts +0 -427
  129. package/src/agent/deploy-preview.ts +0 -487
  130. package/src/agent/expand-files.ts +0 -108
  131. package/src/agent/index.ts +0 -68
  132. package/src/agent/loop.ts +0 -1998
  133. package/src/agent/modes.ts +0 -429
  134. package/src/agent/permissions.ts +0 -513
  135. package/src/agent/subagents/base.ts +0 -116
  136. package/src/agent/subagents/cost.ts +0 -51
  137. package/src/agent/subagents/explore.ts +0 -42
  138. package/src/agent/subagents/general.ts +0 -54
  139. package/src/agent/subagents/index.ts +0 -102
  140. package/src/agent/subagents/infra.ts +0 -59
  141. package/src/agent/subagents/security.ts +0 -69
  142. package/src/agent/system-prompt.ts +0 -990
  143. package/src/app.ts +0 -180
  144. package/src/audit/activity-log.ts +0 -290
  145. package/src/audit/compliance-checker.ts +0 -540
  146. package/src/audit/cost-tracker.ts +0 -318
  147. package/src/audit/index.ts +0 -23
  148. package/src/audit/security-scanner.ts +0 -641
  149. package/src/auth/guard.ts +0 -75
  150. package/src/auth/index.ts +0 -56
  151. package/src/auth/keychain.ts +0 -82
  152. package/src/auth/oauth.ts +0 -465
  153. package/src/auth/providers.ts +0 -470
  154. package/src/auth/sso.ts +0 -113
  155. package/src/auth/store.ts +0 -505
  156. package/src/auth/types.ts +0 -187
  157. package/src/build.ts +0 -141
  158. package/src/cli/index.ts +0 -16
  159. package/src/cli/init.ts +0 -1227
  160. package/src/cli/openapi-spec.ts +0 -356
  161. package/src/cli/run.ts +0 -628
  162. package/src/cli/serve-auth.ts +0 -80
  163. package/src/cli/serve.ts +0 -539
  164. package/src/cli/web.ts +0 -71
  165. package/src/cli.ts +0 -1728
  166. package/src/clients/core-engine-client.ts +0 -227
  167. package/src/clients/enterprise-client.ts +0 -334
  168. package/src/clients/generator-client.ts +0 -351
  169. package/src/clients/git-client.ts +0 -627
  170. package/src/clients/github-client.ts +0 -410
  171. package/src/clients/helm-client.ts +0 -504
  172. package/src/clients/index.ts +0 -80
  173. package/src/clients/k8s-client.ts +0 -497
  174. package/src/clients/llm-client.ts +0 -161
  175. package/src/clients/rest-client.ts +0 -130
  176. package/src/clients/service-discovery.ts +0 -38
  177. package/src/clients/terraform-client.ts +0 -482
  178. package/src/clients/tools-client.ts +0 -1843
  179. package/src/clients/ws-client.ts +0 -115
  180. package/src/commands/alias.ts +0 -100
  181. package/src/commands/analyze/index.ts +0 -352
  182. package/src/commands/apply/helm.ts +0 -473
  183. package/src/commands/apply/index.ts +0 -213
  184. package/src/commands/apply/k8s.ts +0 -454
  185. package/src/commands/apply/terraform.ts +0 -582
  186. package/src/commands/ask.ts +0 -167
  187. package/src/commands/audit/index.ts +0 -357
  188. package/src/commands/auth-cloud.ts +0 -407
  189. package/src/commands/auth-list.ts +0 -134
  190. package/src/commands/auth-profile.ts +0 -121
  191. package/src/commands/auth-refresh.ts +0 -187
  192. package/src/commands/auth-status.ts +0 -141
  193. package/src/commands/aws/ec2.ts +0 -501
  194. package/src/commands/aws/iam.ts +0 -397
  195. package/src/commands/aws/index.ts +0 -133
  196. package/src/commands/aws/lambda.ts +0 -396
  197. package/src/commands/aws/rds.ts +0 -439
  198. package/src/commands/aws/s3.ts +0 -439
  199. package/src/commands/aws/vpc.ts +0 -393
  200. package/src/commands/aws-discover.ts +0 -542
  201. package/src/commands/aws-terraform.ts +0 -755
  202. package/src/commands/azure/aks.ts +0 -376
  203. package/src/commands/azure/functions.ts +0 -253
  204. package/src/commands/azure/index.ts +0 -116
  205. package/src/commands/azure/storage.ts +0 -478
  206. package/src/commands/azure/vm.ts +0 -355
  207. package/src/commands/billing/index.ts +0 -256
  208. package/src/commands/chat.ts +0 -320
  209. package/src/commands/completions.ts +0 -268
  210. package/src/commands/config.ts +0 -372
  211. package/src/commands/cost/cloud-cost-estimator.ts +0 -266
  212. package/src/commands/cost/estimator.ts +0 -79
  213. package/src/commands/cost/index.ts +0 -810
  214. package/src/commands/cost/parsers/terraform.ts +0 -273
  215. package/src/commands/cost/parsers/types.ts +0 -25
  216. package/src/commands/cost/pricing/aws.ts +0 -544
  217. package/src/commands/cost/pricing/azure.ts +0 -499
  218. package/src/commands/cost/pricing/gcp.ts +0 -396
  219. package/src/commands/cost/pricing/index.ts +0 -40
  220. package/src/commands/demo.ts +0 -250
  221. package/src/commands/deploy.ts +0 -260
  222. package/src/commands/doctor.ts +0 -1386
  223. package/src/commands/drift/index.ts +0 -787
  224. package/src/commands/explain.ts +0 -277
  225. package/src/commands/export.ts +0 -146
  226. package/src/commands/feedback.ts +0 -389
  227. package/src/commands/fix.ts +0 -324
  228. package/src/commands/fs/index.ts +0 -402
  229. package/src/commands/gcp/compute.ts +0 -325
  230. package/src/commands/gcp/functions.ts +0 -271
  231. package/src/commands/gcp/gke.ts +0 -438
  232. package/src/commands/gcp/iam.ts +0 -344
  233. package/src/commands/gcp/index.ts +0 -129
  234. package/src/commands/gcp/storage.ts +0 -284
  235. package/src/commands/generate-helm.ts +0 -1249
  236. package/src/commands/generate-k8s.ts +0 -1508
  237. package/src/commands/generate-terraform.ts +0 -1202
  238. package/src/commands/gh/index.ts +0 -863
  239. package/src/commands/git/index.ts +0 -1343
  240. package/src/commands/helm/index.ts +0 -1126
  241. package/src/commands/help.ts +0 -715
  242. package/src/commands/history.ts +0 -149
  243. package/src/commands/import.ts +0 -868
  244. package/src/commands/incident.ts +0 -166
  245. package/src/commands/index.ts +0 -367
  246. package/src/commands/init.ts +0 -1051
  247. package/src/commands/k8s/index.ts +0 -1137
  248. package/src/commands/login.ts +0 -716
  249. package/src/commands/logout.ts +0 -83
  250. package/src/commands/logs.ts +0 -167
  251. package/src/commands/onboarding.ts +0 -405
  252. package/src/commands/pipeline.ts +0 -186
  253. package/src/commands/plan/display.ts +0 -279
  254. package/src/commands/plan/index.ts +0 -599
  255. package/src/commands/plugin.ts +0 -398
  256. package/src/commands/preview.ts +0 -452
  257. package/src/commands/profile.ts +0 -342
  258. package/src/commands/questionnaire.ts +0 -1172
  259. package/src/commands/resume.ts +0 -47
  260. package/src/commands/rollback.ts +0 -315
  261. package/src/commands/rollout.ts +0 -88
  262. package/src/commands/runbook.ts +0 -346
  263. package/src/commands/schedule.ts +0 -236
  264. package/src/commands/status.ts +0 -252
  265. package/src/commands/team/index.ts +0 -346
  266. package/src/commands/team-context.ts +0 -220
  267. package/src/commands/template.ts +0 -233
  268. package/src/commands/tf/index.ts +0 -1093
  269. package/src/commands/upgrade.ts +0 -607
  270. package/src/commands/usage/index.ts +0 -134
  271. package/src/commands/version.ts +0 -174
  272. package/src/commands/watch.ts +0 -153
  273. package/src/compat/index.ts +0 -2
  274. package/src/compat/runtime.ts +0 -12
  275. package/src/compat/sqlite.ts +0 -177
  276. package/src/config/index.ts +0 -17
  277. package/src/config/manager.ts +0 -530
  278. package/src/config/mode-store.ts +0 -62
  279. package/src/config/profiles.ts +0 -84
  280. package/src/config/safety-policy.ts +0 -358
  281. package/src/config/schema.ts +0 -125
  282. package/src/config/types.ts +0 -609
  283. package/src/config/workspace-state.ts +0 -53
  284. package/src/context/context-db.ts +0 -199
  285. package/src/demo/index.ts +0 -349
  286. package/src/demo/scenarios/full-journey.ts +0 -229
  287. package/src/demo/scenarios/getting-started.ts +0 -127
  288. package/src/demo/scenarios/helm-release.ts +0 -341
  289. package/src/demo/scenarios/k8s-deployment.ts +0 -194
  290. package/src/demo/scenarios/terraform-vpc.ts +0 -170
  291. package/src/demo/types.ts +0 -92
  292. package/src/engine/cost-estimator.ts +0 -480
  293. package/src/engine/diagram-generator.ts +0 -256
  294. package/src/engine/drift-detector.ts +0 -902
  295. package/src/engine/executor.ts +0 -1066
  296. package/src/engine/index.ts +0 -76
  297. package/src/engine/orchestrator.ts +0 -636
  298. package/src/engine/planner.ts +0 -787
  299. package/src/engine/safety.ts +0 -743
  300. package/src/engine/verifier.ts +0 -770
  301. package/src/enterprise/audit.ts +0 -348
  302. package/src/enterprise/auth.ts +0 -270
  303. package/src/enterprise/billing.ts +0 -822
  304. package/src/enterprise/index.ts +0 -17
  305. package/src/enterprise/teams.ts +0 -443
  306. package/src/generator/best-practices.ts +0 -1608
  307. package/src/generator/helm.ts +0 -630
  308. package/src/generator/index.ts +0 -37
  309. package/src/generator/intent-parser.ts +0 -514
  310. package/src/generator/kubernetes.ts +0 -976
  311. package/src/generator/terraform.ts +0 -1875
  312. package/src/history/index.ts +0 -8
  313. package/src/history/manager.ts +0 -250
  314. package/src/history/types.ts +0 -34
  315. package/src/hooks/config.ts +0 -432
  316. package/src/hooks/engine.ts +0 -392
  317. package/src/hooks/index.ts +0 -4
  318. package/src/llm/auth-bridge.ts +0 -198
  319. package/src/llm/circuit-breaker.ts +0 -140
  320. package/src/llm/config-loader.ts +0 -201
  321. package/src/llm/cost-calculator.ts +0 -171
  322. package/src/llm/index.ts +0 -8
  323. package/src/llm/model-aliases.ts +0 -115
  324. package/src/llm/provider-registry.ts +0 -63
  325. package/src/llm/providers/anthropic.ts +0 -462
  326. package/src/llm/providers/bedrock.ts +0 -477
  327. package/src/llm/providers/google.ts +0 -405
  328. package/src/llm/providers/ollama.ts +0 -767
  329. package/src/llm/providers/openai-compatible.ts +0 -340
  330. package/src/llm/providers/openai.ts +0 -328
  331. package/src/llm/providers/openrouter.ts +0 -338
  332. package/src/llm/router.ts +0 -1104
  333. package/src/llm/types.ts +0 -232
  334. package/src/lsp/client.ts +0 -298
  335. package/src/lsp/languages.ts +0 -119
  336. package/src/lsp/manager.ts +0 -294
  337. package/src/mcp/client.ts +0 -402
  338. package/src/mcp/index.ts +0 -5
  339. package/src/mcp/manager.ts +0 -133
  340. package/src/nimbus.ts +0 -233
  341. package/src/plugins/index.ts +0 -27
  342. package/src/plugins/loader.ts +0 -334
  343. package/src/plugins/manager.ts +0 -376
  344. package/src/plugins/types.ts +0 -284
  345. package/src/scanners/cicd-scanner.ts +0 -258
  346. package/src/scanners/cloud-scanner.ts +0 -466
  347. package/src/scanners/framework-scanner.ts +0 -469
  348. package/src/scanners/iac-scanner.ts +0 -388
  349. package/src/scanners/index.ts +0 -539
  350. package/src/scanners/language-scanner.ts +0 -276
  351. package/src/scanners/package-manager-scanner.ts +0 -277
  352. package/src/scanners/types.ts +0 -172
  353. package/src/sessions/manager.ts +0 -472
  354. package/src/sessions/types.ts +0 -44
  355. package/src/sharing/sync.ts +0 -300
  356. package/src/sharing/viewer.ts +0 -163
  357. package/src/snapshots/index.ts +0 -2
  358. package/src/snapshots/manager.ts +0 -530
  359. package/src/state/artifacts.ts +0 -147
  360. package/src/state/audit.ts +0 -137
  361. package/src/state/billing.ts +0 -240
  362. package/src/state/checkpoints.ts +0 -117
  363. package/src/state/config.ts +0 -67
  364. package/src/state/conversations.ts +0 -14
  365. package/src/state/credentials.ts +0 -154
  366. package/src/state/db.ts +0 -58
  367. package/src/state/index.ts +0 -26
  368. package/src/state/messages.ts +0 -115
  369. package/src/state/projects.ts +0 -123
  370. package/src/state/schema.ts +0 -236
  371. package/src/state/sessions.ts +0 -147
  372. package/src/state/teams.ts +0 -200
  373. package/src/telemetry.ts +0 -108
  374. package/src/tools/aws-ops.ts +0 -952
  375. package/src/tools/azure-ops.ts +0 -579
  376. package/src/tools/file-ops.ts +0 -615
  377. package/src/tools/gcp-ops.ts +0 -625
  378. package/src/tools/git-ops.ts +0 -773
  379. package/src/tools/github-ops.ts +0 -799
  380. package/src/tools/helm-ops.ts +0 -943
  381. package/src/tools/index.ts +0 -17
  382. package/src/tools/k8s-ops.ts +0 -819
  383. package/src/tools/schemas/converter.ts +0 -184
  384. package/src/tools/schemas/devops.ts +0 -3502
  385. package/src/tools/schemas/index.ts +0 -73
  386. package/src/tools/schemas/standard.ts +0 -1148
  387. package/src/tools/schemas/types.ts +0 -735
  388. package/src/tools/spawn-exec.ts +0 -148
  389. package/src/tools/terraform-ops.ts +0 -862
  390. package/src/types/ambient.d.ts +0 -193
  391. package/src/types/config.ts +0 -83
  392. package/src/types/drift.ts +0 -116
  393. package/src/types/enterprise.ts +0 -335
  394. package/src/types/index.ts +0 -20
  395. package/src/types/plan.ts +0 -44
  396. package/src/types/request.ts +0 -65
  397. package/src/types/response.ts +0 -54
  398. package/src/types/service.ts +0 -51
  399. package/src/ui/App.tsx +0 -2114
  400. package/src/ui/DeployPreview.tsx +0 -174
  401. package/src/ui/FileDiffModal.tsx +0 -162
  402. package/src/ui/Header.tsx +0 -131
  403. package/src/ui/HelpModal.tsx +0 -57
  404. package/src/ui/InputBox.tsx +0 -503
  405. package/src/ui/MessageList.tsx +0 -1032
  406. package/src/ui/PermissionPrompt.tsx +0 -163
  407. package/src/ui/StatusBar.tsx +0 -277
  408. package/src/ui/TerminalPane.tsx +0 -84
  409. package/src/ui/ToolCallDisplay.tsx +0 -643
  410. package/src/ui/TreePane.tsx +0 -132
  411. package/src/ui/chat-ui.ts +0 -850
  412. package/src/ui/index.ts +0 -33
  413. package/src/ui/ink/index.ts +0 -1444
  414. package/src/ui/streaming.ts +0 -176
  415. package/src/ui/theme.ts +0 -104
  416. package/src/ui/types.ts +0 -75
  417. package/src/utils/analytics.ts +0 -72
  418. package/src/utils/cost-warning.ts +0 -27
  419. package/src/utils/env.ts +0 -46
  420. package/src/utils/errors.ts +0 -69
  421. package/src/utils/event-bus.ts +0 -38
  422. package/src/utils/index.ts +0 -24
  423. package/src/utils/logger.ts +0 -171
  424. package/src/utils/rate-limiter.ts +0 -121
  425. package/src/utils/service-auth.ts +0 -49
  426. package/src/utils/validation.ts +0 -53
  427. package/src/version.ts +0 -4
  428. package/src/watcher/index.ts +0 -214
  429. package/src/wizard/approval.ts +0 -383
  430. package/src/wizard/index.ts +0 -25
  431. package/src/wizard/prompts.ts +0 -338
  432. package/src/wizard/types.ts +0 -172
  433. package/src/wizard/ui.ts +0 -556
  434. package/src/wizard/wizard.ts +0 -304
  435. package/tsconfig.json +0 -24
@@ -1,778 +0,0 @@
1
- /**
2
- * streamWithTools() Tests
3
- *
4
- * Validates the streamWithTools() method added to three LLM providers:
5
- * - OllamaProvider (src/llm/providers/ollama.ts)
6
- * - OpenRouterProvider (src/llm/providers/openrouter.ts)
7
- * - OpenAICompatibleProvider (src/llm/providers/openai-compatible.ts)
8
- *
9
- * Each provider is tested for:
10
- * 1. Text-only streaming (yields text chunks then a final done chunk)
11
- * 2. Tool call streaming (yields tool calls in the final chunk)
12
- * 3. Fallback behavior (when streaming fails, falls back gracefully)
13
- *
14
- * All tests use mocks -- no real API calls are made.
15
- */
16
-
17
- import { describe, test, it, expect, vi, beforeEach } from 'vitest';
18
- import type { ToolCompletionRequest, StreamChunk } from '../llm/types';
19
-
20
- // ---------------------------------------------------------------------------
21
- // Helpers
22
- // ---------------------------------------------------------------------------
23
-
24
- /** Collect all chunks from an async generator into an array. */
25
- async function collectChunks(gen: AsyncIterable<StreamChunk>): Promise<StreamChunk[]> {
26
- const chunks: StreamChunk[] = [];
27
- for await (const chunk of gen) {
28
- chunks.push(chunk);
29
- }
30
- return chunks;
31
- }
32
-
33
- /** Minimal ToolCompletionRequest used across all tests. */
34
- function makeRequest(overrides?: Partial<ToolCompletionRequest>): ToolCompletionRequest {
35
- return {
36
- messages: [{ role: 'user', content: 'List files in the current directory' }],
37
- tools: [
38
- {
39
- type: 'function',
40
- function: {
41
- name: 'bash',
42
- description: 'Run a bash command',
43
- parameters: {
44
- type: 'object',
45
- properties: {
46
- command: { type: 'string', description: 'The command to run' },
47
- },
48
- required: ['command'],
49
- },
50
- },
51
- },
52
- ],
53
- ...overrides,
54
- };
55
- }
56
-
57
- /**
58
- * Build a ReadableStream from an array of raw strings.
59
- * Each string becomes one chunk the reader yields.
60
- */
61
- function buildReadableStream(lines: string[]): ReadableStream<Uint8Array> {
62
- const encoder = new TextEncoder();
63
- let index = 0;
64
- return new ReadableStream<Uint8Array>({
65
- pull(controller) {
66
- if (index < lines.length) {
67
- controller.enqueue(encoder.encode(lines[index]));
68
- index++;
69
- } else {
70
- controller.close();
71
- }
72
- },
73
- });
74
- }
75
-
76
- /**
77
- * Create a mock async iterable (simulating the OpenAI SDK stream object).
78
- * Accepts an array of chunk objects and yields them in order.
79
- */
80
- function createMockOpenAIStream(
81
- chunks: Array<{
82
- choices: Array<{
83
- delta: { content?: string; tool_calls?: any[] };
84
- finish_reason: string | null;
85
- }>;
86
- usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
87
- }>
88
- ) {
89
- return {
90
- async *[Symbol.asyncIterator]() {
91
- for (const chunk of chunks) {
92
- yield chunk;
93
- }
94
- },
95
- };
96
- }
97
-
98
- // ===========================================================================
99
- // OllamaProvider
100
- // ===========================================================================
101
-
102
- describe('OllamaProvider.streamWithTools', () => {
103
- let originalFetch: typeof globalThis.fetch;
104
-
105
- beforeEach(() => {
106
- originalFetch = globalThis.fetch;
107
- });
108
-
109
- // Restore fetch after each test to avoid leaking mocks
110
- function restoreFetch() {
111
- globalThis.fetch = originalFetch;
112
- }
113
-
114
- test('text-only streaming yields text chunks then a done chunk', async () => {
115
- // Mock the fetch for /v1/chat/completions (native tool streaming endpoint)
116
- const sseLines = [
117
- 'data: {"choices":[{"delta":{"content":"Hello"},"finish_reason":null}]}\n\n',
118
- 'data: {"choices":[{"delta":{"content":" world"},"finish_reason":null}]}\n\n',
119
- 'data: {"choices":[{"delta":{},"finish_reason":"stop"}],"usage":{"prompt_tokens":10,"completion_tokens":5,"total_tokens":15}}\n\n',
120
- 'data: [DONE]\n\n',
121
- ];
122
-
123
- globalThis.fetch = vi.fn(() =>
124
- Promise.resolve(
125
- new Response(buildReadableStream(sseLines), {
126
- status: 200,
127
- headers: { 'Content-Type': 'text/event-stream' },
128
- })
129
- )
130
- ) as any;
131
-
132
- try {
133
- const { OllamaProvider } = await import('../llm/providers/ollama');
134
- const provider = new OllamaProvider('http://localhost:11434');
135
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
136
-
137
- // Should have text chunks followed by a done chunk
138
- const textChunks = chunks.filter(c => c.content && !c.done);
139
- const doneChunks = chunks.filter(c => c.done);
140
-
141
- expect(textChunks.length).toBe(2);
142
- expect(textChunks[0].content).toBe('Hello');
143
- expect(textChunks[1].content).toBe(' world');
144
-
145
- expect(doneChunks.length).toBe(1);
146
- expect(doneChunks[0].done).toBe(true);
147
- expect(doneChunks[0].toolCalls).toBeUndefined();
148
-
149
- // Usage should be present on the final chunk
150
- expect(doneChunks[0].usage).toEqual({
151
- promptTokens: 10,
152
- completionTokens: 5,
153
- totalTokens: 15,
154
- });
155
- } finally {
156
- restoreFetch();
157
- }
158
- });
159
-
160
- test('tool call streaming accumulates tool calls and yields them on the done chunk', async () => {
161
- const sseLines = [
162
- // First chunk: tool call header
163
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":0,"id":"call_abc123","function":{"name":"bash","arguments":""}}]},"finish_reason":null}]}\n\n',
164
- // Second chunk: tool call arguments (streamed incrementally)
165
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\\"command\\""}}]},"finish_reason":null}]}\n\n',
166
- // Third chunk: remaining arguments
167
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":0,"function":{"arguments":":\\"ls -la\\"}"}}]},"finish_reason":null}]}\n\n',
168
- // Final chunk with finish_reason
169
- 'data: {"choices":[{"delta":{},"finish_reason":"tool_calls"}]}\n\n',
170
- 'data: [DONE]\n\n',
171
- ];
172
-
173
- globalThis.fetch = vi.fn(() =>
174
- Promise.resolve(
175
- new Response(buildReadableStream(sseLines), {
176
- status: 200,
177
- headers: { 'Content-Type': 'text/event-stream' },
178
- })
179
- )
180
- ) as any;
181
-
182
- try {
183
- const { OllamaProvider } = await import('../llm/providers/ollama');
184
- const provider = new OllamaProvider('http://localhost:11434');
185
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
186
-
187
- const doneChunk = chunks.find(c => c.done);
188
- expect(doneChunk).toBeDefined();
189
- expect(doneChunk!.toolCalls).toBeDefined();
190
- expect(doneChunk!.toolCalls!.length).toBe(1);
191
-
192
- const tc = doneChunk!.toolCalls![0];
193
- expect(tc.id).toBe('call_abc123');
194
- expect(tc.type).toBe('function');
195
- expect(tc.function.name).toBe('bash');
196
- expect(tc.function.arguments).toBe('{"command":"ls -la"}');
197
- } finally {
198
- restoreFetch();
199
- }
200
- });
201
-
202
- test('fallback: when native streaming fails, falls back to completeWithTools', async () => {
203
- let _callCount = 0;
204
-
205
- globalThis.fetch = vi.fn((url: string | URL | Request) => {
206
- _callCount++;
207
- const urlStr = typeof url === 'string' ? url : url instanceof URL ? url.toString() : url.url;
208
-
209
- // First call: /v1/chat/completions (native streaming) -- fail
210
- if (urlStr.includes('/v1/chat/completions')) {
211
- return Promise.resolve(new Response('Not found', { status: 404 }));
212
- }
213
-
214
- // Second call: /api/chat (native tool calling attempt) -- return tool call
215
- if (urlStr.includes('/api/chat')) {
216
- return Promise.resolve(
217
- new Response(
218
- JSON.stringify({
219
- message: {
220
- content: '',
221
- tool_calls: [
222
- {
223
- function: {
224
- name: 'bash',
225
- arguments: { command: 'ls -la' },
226
- },
227
- },
228
- ],
229
- },
230
- model: 'llama3.2',
231
- prompt_eval_count: 20,
232
- eval_count: 10,
233
- }),
234
- { status: 200, headers: { 'Content-Type': 'application/json' } }
235
- )
236
- );
237
- }
238
-
239
- return Promise.reject(new Error(`Unexpected fetch to ${urlStr}`));
240
- }) as any;
241
-
242
- try {
243
- const { OllamaProvider } = await import('../llm/providers/ollama');
244
- const provider = new OllamaProvider('http://localhost:11434');
245
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
246
-
247
- // Fallback should yield a final done chunk with tool calls
248
- const doneChunk = chunks.find(c => c.done);
249
- expect(doneChunk).toBeDefined();
250
- expect(doneChunk!.toolCalls).toBeDefined();
251
- expect(doneChunk!.toolCalls!.length).toBe(1);
252
- expect(doneChunk!.toolCalls![0].function.name).toBe('bash');
253
- } finally {
254
- restoreFetch();
255
- }
256
- });
257
-
258
- test('multiple tool calls are accumulated correctly', async () => {
259
- const sseLines = [
260
- // Two tool calls starting in the same delta
261
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":0,"id":"call_1","function":{"name":"bash","arguments":""}},{"index":1,"id":"call_2","function":{"name":"bash","arguments":""}}]},"finish_reason":null}]}\n\n',
262
- // Arguments for first tool call
263
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\\"command\\":\\"ls\\"}"}}]},"finish_reason":null}]}\n\n',
264
- // Arguments for second tool call
265
- 'data: {"choices":[{"delta":{"tool_calls":[{"index":1,"function":{"arguments":"{\\"command\\":\\"pwd\\"}"}}]},"finish_reason":null}]}\n\n',
266
- // Done
267
- 'data: {"choices":[{"delta":{},"finish_reason":"tool_calls"}]}\n\n',
268
- 'data: [DONE]\n\n',
269
- ];
270
-
271
- globalThis.fetch = vi.fn(() =>
272
- Promise.resolve(
273
- new Response(buildReadableStream(sseLines), {
274
- status: 200,
275
- headers: { 'Content-Type': 'text/event-stream' },
276
- })
277
- )
278
- ) as any;
279
-
280
- try {
281
- const { OllamaProvider } = await import('../llm/providers/ollama');
282
- const provider = new OllamaProvider('http://localhost:11434');
283
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
284
-
285
- const doneChunk = chunks.find(c => c.done);
286
- expect(doneChunk).toBeDefined();
287
- expect(doneChunk!.toolCalls).toBeDefined();
288
- expect(doneChunk!.toolCalls!.length).toBe(2);
289
- expect(doneChunk!.toolCalls![0].function.name).toBe('bash');
290
- expect(doneChunk!.toolCalls![0].function.arguments).toBe('{"command":"ls"}');
291
- expect(doneChunk!.toolCalls![1].function.name).toBe('bash');
292
- expect(doneChunk!.toolCalls![1].function.arguments).toBe('{"command":"pwd"}');
293
- } finally {
294
- restoreFetch();
295
- }
296
- });
297
- });
298
-
299
- // ===========================================================================
300
- // OpenRouterProvider
301
- // ===========================================================================
302
-
303
- describe('OpenRouterProvider.streamWithTools', () => {
304
- test('text-only streaming yields text chunks then a done chunk', async () => {
305
- const streamChunks = createMockOpenAIStream([
306
- { choices: [{ delta: { content: 'Here is' }, finish_reason: null }] },
307
- { choices: [{ delta: { content: ' the answer' }, finish_reason: null }] },
308
- {
309
- choices: [{ delta: {}, finish_reason: 'stop' }],
310
- usage: { prompt_tokens: 12, completion_tokens: 8, total_tokens: 20 },
311
- },
312
- ]);
313
-
314
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
315
-
316
- const { OpenRouterProvider } = await import('../llm/providers/openrouter');
317
- const provider = new OpenRouterProvider('test-api-key');
318
-
319
- // Replace the client's create method with our mock
320
- (provider as any).client = {
321
- chat: { completions: { create: mockCreate } },
322
- };
323
-
324
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
325
-
326
- // Verify text chunks
327
- const textChunks = chunks.filter(c => c.content && !c.done);
328
- expect(textChunks.length).toBe(2);
329
- expect(textChunks[0].content).toBe('Here is');
330
- expect(textChunks[1].content).toBe(' the answer');
331
-
332
- // Verify done chunk
333
- const doneChunk = chunks.find(c => c.done);
334
- expect(doneChunk).toBeDefined();
335
- expect(doneChunk!.done).toBe(true);
336
- expect(doneChunk!.toolCalls).toBeUndefined();
337
-
338
- // Verify usage
339
- expect(doneChunk!.usage).toEqual({
340
- promptTokens: 12,
341
- completionTokens: 8,
342
- totalTokens: 20,
343
- });
344
-
345
- // Verify the create call was made with stream: true and tools
346
- expect(mockCreate).toHaveBeenCalledTimes(1);
347
- const createArg = (mockCreate.mock.calls[0] as unknown[])[0] as any;
348
- expect(createArg.stream).toBe(true);
349
- expect(createArg.tools).toBeDefined();
350
- expect(createArg.tools.length).toBe(1);
351
- expect(createArg.tools[0].function.name).toBe('bash');
352
- expect(createArg.stream_options).toEqual({ include_usage: true });
353
- });
354
-
355
- test('tool call streaming accumulates tool calls and yields them on the done chunk', async () => {
356
- const streamChunks = createMockOpenAIStream([
357
- // Tool call header
358
- {
359
- choices: [
360
- {
361
- delta: {
362
- tool_calls: [{ index: 0, id: 'call_xyz', function: { name: 'bash', arguments: '' } }],
363
- },
364
- finish_reason: null,
365
- },
366
- ],
367
- },
368
- // Streamed arguments
369
- {
370
- choices: [
371
- {
372
- delta: {
373
- tool_calls: [{ index: 0, function: { arguments: '{"command"' } }],
374
- },
375
- finish_reason: null,
376
- },
377
- ],
378
- },
379
- {
380
- choices: [
381
- {
382
- delta: {
383
- tool_calls: [{ index: 0, function: { arguments: ':"ls -la"}' } }],
384
- },
385
- finish_reason: null,
386
- },
387
- ],
388
- },
389
- // Finish with tool_calls reason
390
- {
391
- choices: [{ delta: {}, finish_reason: 'tool_calls' }],
392
- },
393
- ]);
394
-
395
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
396
-
397
- const { OpenRouterProvider } = await import('../llm/providers/openrouter');
398
- const provider = new OpenRouterProvider('test-api-key');
399
- (provider as any).client = {
400
- chat: { completions: { create: mockCreate } },
401
- };
402
-
403
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
404
-
405
- const doneChunk = chunks.find(c => c.done);
406
- expect(doneChunk).toBeDefined();
407
- expect(doneChunk!.toolCalls).toBeDefined();
408
- expect(doneChunk!.toolCalls!.length).toBe(1);
409
-
410
- const tc = doneChunk!.toolCalls![0];
411
- expect(tc.id).toBe('call_xyz');
412
- expect(tc.type).toBe('function');
413
- expect(tc.function.name).toBe('bash');
414
- expect(tc.function.arguments).toBe('{"command":"ls -la"}');
415
- });
416
-
417
- test('fallback: when SDK stream creation throws, the generator yields nothing', async () => {
418
- const mockCreate = vi.fn(() => Promise.reject(new Error('API unavailable')));
419
-
420
- const { OpenRouterProvider } = await import('../llm/providers/openrouter');
421
- const provider = new OpenRouterProvider('test-api-key');
422
- (provider as any).client = {
423
- chat: { completions: { create: mockCreate } },
424
- };
425
-
426
- // The method is an async generator that will throw when it tries to create
427
- // the stream. The error propagates to the caller.
428
- try {
429
- await collectChunks(provider.streamWithTools(makeRequest()));
430
- // If we get here, it means no error was thrown (unexpected)
431
- expect(true).toBe(false);
432
- } catch (err: any) {
433
- expect(err.message).toBe('API unavailable');
434
- }
435
- });
436
-
437
- test('mixed content and tool calls are handled correctly', async () => {
438
- const streamChunks = createMockOpenAIStream([
439
- // Some text content first
440
- { choices: [{ delta: { content: 'Let me run that' }, finish_reason: null }] },
441
- // Then a tool call
442
- {
443
- choices: [
444
- {
445
- delta: {
446
- tool_calls: [
447
- {
448
- index: 0,
449
- id: 'call_mix',
450
- function: { name: 'bash', arguments: '{"command":"ls"}' },
451
- },
452
- ],
453
- },
454
- finish_reason: null,
455
- },
456
- ],
457
- },
458
- // Done
459
- {
460
- choices: [{ delta: {}, finish_reason: 'tool_calls' }],
461
- usage: { prompt_tokens: 5, completion_tokens: 3, total_tokens: 8 },
462
- },
463
- ]);
464
-
465
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
466
-
467
- const { OpenRouterProvider } = await import('../llm/providers/openrouter');
468
- const provider = new OpenRouterProvider('test-api-key');
469
- (provider as any).client = {
470
- chat: { completions: { create: mockCreate } },
471
- };
472
-
473
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
474
-
475
- // Text chunk
476
- const textChunks = chunks.filter(c => c.content && !c.done);
477
- expect(textChunks.length).toBe(1);
478
- expect(textChunks[0].content).toBe('Let me run that');
479
-
480
- // Done chunk with tool calls
481
- const doneChunk = chunks.find(c => c.done);
482
- expect(doneChunk).toBeDefined();
483
- expect(doneChunk!.toolCalls).toBeDefined();
484
- expect(doneChunk!.toolCalls![0].function.name).toBe('bash');
485
- expect(doneChunk!.usage).toEqual({
486
- promptTokens: 5,
487
- completionTokens: 3,
488
- totalTokens: 8,
489
- });
490
- });
491
- });
492
-
493
- // ===========================================================================
494
- // OpenAICompatibleProvider
495
- // ===========================================================================
496
-
497
- describe('OpenAICompatibleProvider.streamWithTools', () => {
498
- async function createProvider() {
499
- const { OpenAICompatibleProvider } = await import('../llm/providers/openai-compatible');
500
- return new OpenAICompatibleProvider({
501
- name: 'test-compat',
502
- apiKey: 'test-key',
503
- baseURL: 'https://api.test.com/v1',
504
- defaultModel: 'test-model',
505
- });
506
- }
507
-
508
- test('text-only streaming yields text chunks then a done chunk', async () => {
509
- const streamChunks = createMockOpenAIStream([
510
- { choices: [{ delta: { content: 'Response' }, finish_reason: null }] },
511
- { choices: [{ delta: { content: ' text' }, finish_reason: null }] },
512
- {
513
- choices: [{ delta: {}, finish_reason: 'stop' }],
514
- usage: { prompt_tokens: 8, completion_tokens: 4, total_tokens: 12 },
515
- },
516
- ]);
517
-
518
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
519
-
520
- const provider = await createProvider();
521
- (provider as any).client = {
522
- chat: { completions: { create: mockCreate } },
523
- };
524
-
525
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
526
-
527
- // Text chunks
528
- const textChunks = chunks.filter(c => c.content && !c.done);
529
- expect(textChunks.length).toBe(2);
530
- expect(textChunks[0].content).toBe('Response');
531
- expect(textChunks[1].content).toBe(' text');
532
-
533
- // Done chunk
534
- const doneChunk = chunks.find(c => c.done);
535
- expect(doneChunk).toBeDefined();
536
- expect(doneChunk!.done).toBe(true);
537
- expect(doneChunk!.toolCalls).toBeUndefined();
538
- expect(doneChunk!.usage).toEqual({
539
- promptTokens: 8,
540
- completionTokens: 4,
541
- totalTokens: 12,
542
- });
543
-
544
- // Verify stream options
545
- const createArg = (mockCreate.mock.calls[0] as unknown[])[0] as any;
546
- expect(createArg.stream).toBe(true);
547
- expect(createArg.stream_options).toEqual({ include_usage: true });
548
- });
549
-
550
- test('tool call streaming accumulates tool calls and yields them on the done chunk', async () => {
551
- const streamChunks = createMockOpenAIStream([
552
- {
553
- choices: [
554
- {
555
- delta: {
556
- tool_calls: [
557
- { index: 0, id: 'call_compat1', function: { name: 'bash', arguments: '' } },
558
- ],
559
- },
560
- finish_reason: null,
561
- },
562
- ],
563
- },
564
- {
565
- choices: [
566
- {
567
- delta: {
568
- tool_calls: [{ index: 0, function: { arguments: '{"command":"pwd"}' } }],
569
- },
570
- finish_reason: null,
571
- },
572
- ],
573
- },
574
- {
575
- choices: [{ delta: {}, finish_reason: 'tool_calls' }],
576
- },
577
- ]);
578
-
579
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
580
-
581
- const provider = await createProvider();
582
- (provider as any).client = {
583
- chat: { completions: { create: mockCreate } },
584
- };
585
-
586
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
587
-
588
- const doneChunk = chunks.find(c => c.done);
589
- expect(doneChunk).toBeDefined();
590
- expect(doneChunk!.toolCalls).toBeDefined();
591
- expect(doneChunk!.toolCalls!.length).toBe(1);
592
-
593
- const tc = doneChunk!.toolCalls![0];
594
- expect(tc.id).toBe('call_compat1');
595
- expect(tc.type).toBe('function');
596
- expect(tc.function.name).toBe('bash');
597
- expect(tc.function.arguments).toBe('{"command":"pwd"}');
598
- });
599
-
600
- test('fallback: when SDK stream creation throws, the error propagates', async () => {
601
- const mockCreate = vi.fn(() => Promise.reject(new Error('Provider down')));
602
-
603
- const provider = await createProvider();
604
- (provider as any).client = {
605
- chat: { completions: { create: mockCreate } },
606
- };
607
-
608
- try {
609
- await collectChunks(provider.streamWithTools(makeRequest()));
610
- expect(true).toBe(false);
611
- } catch (err: any) {
612
- expect(err.message).toBe('Provider down');
613
- }
614
- });
615
-
616
- test('multiple tool calls across different indices are accumulated', async () => {
617
- const streamChunks = createMockOpenAIStream([
618
- // Two tool calls in separate chunks
619
- {
620
- choices: [
621
- {
622
- delta: {
623
- tool_calls: [
624
- {
625
- index: 0,
626
- id: 'call_a',
627
- function: { name: 'bash', arguments: '{"command":"ls"}' },
628
- },
629
- ],
630
- },
631
- finish_reason: null,
632
- },
633
- ],
634
- },
635
- {
636
- choices: [
637
- {
638
- delta: {
639
- tool_calls: [
640
- {
641
- index: 1,
642
- id: 'call_b',
643
- function: { name: 'bash', arguments: '{"command":"cat file.txt"}' },
644
- },
645
- ],
646
- },
647
- finish_reason: null,
648
- },
649
- ],
650
- },
651
- {
652
- choices: [{ delta: {}, finish_reason: 'tool_calls' }],
653
- },
654
- ]);
655
-
656
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
657
-
658
- const provider = await createProvider();
659
- (provider as any).client = {
660
- chat: { completions: { create: mockCreate } },
661
- };
662
-
663
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
664
-
665
- const doneChunk = chunks.find(c => c.done);
666
- expect(doneChunk).toBeDefined();
667
- expect(doneChunk!.toolCalls).toBeDefined();
668
- expect(doneChunk!.toolCalls!.length).toBe(2);
669
- expect(doneChunk!.toolCalls![0].id).toBe('call_a');
670
- expect(doneChunk!.toolCalls![0].function.arguments).toBe('{"command":"ls"}');
671
- expect(doneChunk!.toolCalls![1].id).toBe('call_b');
672
- expect(doneChunk!.toolCalls![1].function.arguments).toBe('{"command":"cat file.txt"}');
673
- });
674
-
675
- test('usage from a mid-stream chunk is captured on the done chunk', async () => {
676
- const streamChunks = createMockOpenAIStream([
677
- { choices: [{ delta: { content: 'ok' }, finish_reason: null }] },
678
- {
679
- choices: [{ delta: {}, finish_reason: null }],
680
- usage: { prompt_tokens: 100, completion_tokens: 50, total_tokens: 150 },
681
- },
682
- {
683
- choices: [{ delta: {}, finish_reason: 'stop' }],
684
- },
685
- ]);
686
-
687
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
688
-
689
- const provider = await createProvider();
690
- (provider as any).client = {
691
- chat: { completions: { create: mockCreate } },
692
- };
693
-
694
- const chunks = await collectChunks(provider.streamWithTools(makeRequest()));
695
-
696
- const doneChunk = chunks.find(c => c.done);
697
- expect(doneChunk).toBeDefined();
698
- expect(doneChunk!.usage).toEqual({
699
- promptTokens: 100,
700
- completionTokens: 50,
701
- totalTokens: 150,
702
- });
703
- });
704
-
705
- test('tool_choice is forwarded to the API call', async () => {
706
- const streamChunks = createMockOpenAIStream([
707
- { choices: [{ delta: { content: 'done' }, finish_reason: 'stop' }] },
708
- ]);
709
-
710
- const mockCreate = vi.fn(() => Promise.resolve(streamChunks));
711
-
712
- const provider = await createProvider();
713
- (provider as any).client = {
714
- chat: { completions: { create: mockCreate } },
715
- };
716
-
717
- const request = makeRequest({
718
- toolChoice: { type: 'function', function: { name: 'bash' } },
719
- temperature: 0.5,
720
- maxTokens: 1024,
721
- });
722
-
723
- await collectChunks(provider.streamWithTools(request));
724
-
725
- const createArg = (mockCreate.mock.calls[0] as unknown[])[0] as any;
726
- expect(createArg.tool_choice).toEqual({ type: 'function', function: { name: 'bash' } });
727
- expect(createArg.temperature).toBe(0.5);
728
- expect(createArg.max_tokens).toBe(1024);
729
- });
730
- });
731
-
732
- // ---------------------------------------------------------------------------
733
- // PERF-2c: Unbuffered streaming in LLMRouter fallback branch
734
- // ---------------------------------------------------------------------------
735
-
736
- describe('PERF-2c: LLMRouter unbuffered streaming', () => {
737
- it('streamWithTools fallback loop no longer buffers chunks before yielding', async () => {
738
- const { readFileSync } = await import('node:fs');
739
- const { join } = await import('node:path');
740
- const src = readFileSync(join(process.cwd(), 'src/llm/router.ts'), 'utf-8');
741
- // Extract only the streamWithTools section (between the streamWithTools guards)
742
- const swStart = src.indexOf('Use native streaming-with-tools if providers support it');
743
- const swEnd = src.indexOf('If all providers with streamWithTools failed', swStart);
744
- const swSection = swStart > 0 && swEnd > swStart ? src.slice(swStart, swEnd) : '';
745
- // The streamWithTools fallback section should NOT contain buffering
746
- expect(swSection).not.toContain('bufferedChunks');
747
- // It should contain yield chunk directly
748
- expect(swSection).toContain('yield chunk;');
749
- });
750
-
751
- it('router.ts yields each chunk immediately inside the for-await loop', async () => {
752
- const { readFileSync } = await import('node:fs');
753
- const { join } = await import('node:path');
754
- const src = readFileSync(join(process.cwd(), 'src/llm/router.ts'), 'utf-8');
755
- // The yield statement should appear inside the for-await (before circuitBreaker.recordSuccess)
756
- expect(src).toContain('yield chunk;');
757
- // circuitBreaker.recordSuccess comes after the loop ends (done chunk received)
758
- expect(src).toContain('circuitBreaker.recordSuccess(p.name);');
759
- });
760
-
761
- it('circuitBreaker.recordSuccess is called after stream ends (not before yield)', async () => {
762
- const { readFileSync } = await import('node:fs');
763
- const { join } = await import('node:path');
764
- const src = readFileSync(join(process.cwd(), 'src/llm/router.ts'), 'utf-8');
765
- // Find the fallback for-loop block that has yield chunk
766
- const yieldIdx = src.indexOf('yield chunk;');
767
- const recordSuccessIdx = src.indexOf('circuitBreaker.recordSuccess(p.name);');
768
- // recordSuccess should appear AFTER the yield in the source
769
- expect(recordSuccessIdx).toBeGreaterThan(yieldIdx);
770
- });
771
-
772
- it('stream error path still calls circuitBreaker.recordFailure', async () => {
773
- const { readFileSync } = await import('node:fs');
774
- const { join } = await import('node:path');
775
- const src = readFileSync(join(process.cwd(), 'src/llm/router.ts'), 'utf-8');
776
- expect(src).toContain('circuitBreaker.recordFailure(p.name);');
777
- });
778
- });