@build-astron-co/nimbus 0.2.0 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (469) hide show
  1. package/bin/nimbus +26 -10
  2. package/bin/nimbus.cmd +41 -0
  3. package/bin/nimbus.mjs +70 -0
  4. package/completions/nimbus.bash +38 -0
  5. package/completions/nimbus.fish +48 -0
  6. package/completions/nimbus.zsh +81 -0
  7. package/dist/src/agent/compaction-agent.js +215 -0
  8. package/dist/src/agent/context-manager.js +385 -0
  9. package/dist/src/agent/context.js +322 -0
  10. package/dist/src/agent/deploy-preview.js +395 -0
  11. package/dist/src/agent/expand-files.js +95 -0
  12. package/dist/src/agent/index.js +18 -0
  13. package/dist/src/agent/loop.js +1535 -0
  14. package/dist/src/agent/modes.js +347 -0
  15. package/dist/src/agent/permissions.js +396 -0
  16. package/dist/src/agent/subagents/base.js +67 -0
  17. package/dist/src/agent/subagents/cost.js +45 -0
  18. package/dist/src/agent/subagents/explore.js +36 -0
  19. package/dist/src/agent/subagents/general.js +41 -0
  20. package/dist/src/agent/subagents/index.js +88 -0
  21. package/dist/src/agent/subagents/infra.js +52 -0
  22. package/dist/src/agent/subagents/security.js +60 -0
  23. package/dist/src/agent/system-prompt.js +860 -0
  24. package/dist/src/app.js +152 -0
  25. package/dist/src/audit/activity-log.js +209 -0
  26. package/dist/src/audit/compliance-checker.js +419 -0
  27. package/dist/src/audit/cost-tracker.js +231 -0
  28. package/dist/src/audit/index.js +10 -0
  29. package/dist/src/audit/security-scanner.js +490 -0
  30. package/dist/src/auth/guard.js +64 -0
  31. package/dist/src/auth/index.js +19 -0
  32. package/dist/src/auth/keychain.js +79 -0
  33. package/dist/src/auth/oauth.js +389 -0
  34. package/dist/src/auth/providers.js +415 -0
  35. package/dist/src/auth/sso.js +87 -0
  36. package/dist/src/auth/store.js +424 -0
  37. package/dist/src/auth/types.js +5 -0
  38. package/dist/src/cli/index.js +8 -0
  39. package/dist/src/cli/init.js +1048 -0
  40. package/dist/src/cli/openapi-spec.js +346 -0
  41. package/dist/src/cli/run.js +505 -0
  42. package/dist/src/cli/serve-auth.js +56 -0
  43. package/dist/src/cli/serve.js +432 -0
  44. package/dist/src/cli/web.js +50 -0
  45. package/dist/src/cli.js +1574 -0
  46. package/dist/src/clients/core-engine-client.js +156 -0
  47. package/dist/src/clients/enterprise-client.js +246 -0
  48. package/dist/src/clients/generator-client.js +219 -0
  49. package/dist/src/clients/git-client.js +367 -0
  50. package/dist/src/clients/github-client.js +229 -0
  51. package/dist/src/clients/helm-client.js +299 -0
  52. package/dist/src/clients/index.js +18 -0
  53. package/dist/src/clients/k8s-client.js +270 -0
  54. package/dist/src/clients/llm-client.js +119 -0
  55. package/dist/src/clients/rest-client.js +104 -0
  56. package/dist/src/clients/service-discovery.js +35 -0
  57. package/dist/src/clients/terraform-client.js +302 -0
  58. package/dist/src/clients/tools-client.js +1227 -0
  59. package/dist/src/clients/ws-client.js +93 -0
  60. package/dist/src/commands/alias.js +91 -0
  61. package/dist/src/commands/analyze/index.js +313 -0
  62. package/dist/src/commands/apply/helm.js +375 -0
  63. package/dist/src/commands/apply/index.js +176 -0
  64. package/dist/src/commands/apply/k8s.js +350 -0
  65. package/dist/src/commands/apply/terraform.js +465 -0
  66. package/dist/src/commands/ask.js +137 -0
  67. package/dist/src/commands/audit/index.js +322 -0
  68. package/dist/src/commands/auth-cloud.js +345 -0
  69. package/dist/src/commands/auth-list.js +112 -0
  70. package/dist/src/commands/auth-profile.js +104 -0
  71. package/dist/src/commands/auth-refresh.js +161 -0
  72. package/dist/src/commands/auth-status.js +122 -0
  73. package/dist/src/commands/aws/ec2.js +402 -0
  74. package/dist/src/commands/aws/iam.js +304 -0
  75. package/dist/src/commands/aws/index.js +108 -0
  76. package/dist/src/commands/aws/lambda.js +317 -0
  77. package/dist/src/commands/aws/rds.js +345 -0
  78. package/dist/src/commands/aws/s3.js +346 -0
  79. package/dist/src/commands/aws/vpc.js +302 -0
  80. package/dist/src/commands/aws-discover.js +413 -0
  81. package/dist/src/commands/aws-terraform.js +618 -0
  82. package/dist/src/commands/azure/aks.js +305 -0
  83. package/dist/src/commands/azure/functions.js +200 -0
  84. package/dist/src/commands/azure/index.js +93 -0
  85. package/dist/src/commands/azure/storage.js +378 -0
  86. package/dist/src/commands/azure/vm.js +291 -0
  87. package/dist/src/commands/billing/index.js +224 -0
  88. package/dist/src/commands/chat.js +259 -0
  89. package/dist/src/commands/completions.js +255 -0
  90. package/dist/src/commands/config.js +291 -0
  91. package/dist/src/commands/cost/cloud-cost-estimator.js +211 -0
  92. package/dist/src/commands/cost/estimator.js +73 -0
  93. package/dist/src/commands/cost/index.js +625 -0
  94. package/dist/src/commands/cost/parsers/terraform.js +234 -0
  95. package/dist/src/commands/cost/parsers/types.js +4 -0
  96. package/dist/src/commands/cost/pricing/aws.js +501 -0
  97. package/dist/src/commands/cost/pricing/azure.js +462 -0
  98. package/dist/src/commands/cost/pricing/gcp.js +359 -0
  99. package/dist/src/commands/cost/pricing/index.js +24 -0
  100. package/dist/src/commands/demo.js +196 -0
  101. package/dist/src/commands/deploy.js +215 -0
  102. package/dist/src/commands/doctor.js +1291 -0
  103. package/dist/src/commands/drift/index.js +674 -0
  104. package/dist/src/commands/explain.js +235 -0
  105. package/dist/src/commands/export.js +120 -0
  106. package/dist/src/commands/feedback.js +319 -0
  107. package/dist/src/commands/fix.js +263 -0
  108. package/dist/src/commands/fs/index.js +338 -0
  109. package/dist/src/commands/gcp/compute.js +266 -0
  110. package/dist/src/commands/gcp/functions.js +221 -0
  111. package/dist/src/commands/gcp/gke.js +357 -0
  112. package/dist/src/commands/gcp/iam.js +295 -0
  113. package/dist/src/commands/gcp/index.js +105 -0
  114. package/dist/src/commands/gcp/storage.js +232 -0
  115. package/dist/src/commands/generate-helm.js +1026 -0
  116. package/dist/src/commands/generate-k8s.js +1263 -0
  117. package/dist/src/commands/generate-terraform.js +1058 -0
  118. package/dist/src/commands/gh/index.js +663 -0
  119. package/dist/src/commands/git/index.js +1208 -0
  120. package/dist/src/commands/helm/index.js +985 -0
  121. package/dist/src/commands/help.js +639 -0
  122. package/dist/src/commands/history.js +120 -0
  123. package/dist/src/commands/import.js +782 -0
  124. package/dist/src/commands/incident.js +144 -0
  125. package/dist/src/commands/index.js +109 -0
  126. package/dist/src/commands/init.js +955 -0
  127. package/dist/src/commands/k8s/index.js +979 -0
  128. package/dist/src/commands/login.js +588 -0
  129. package/dist/src/commands/logout.js +61 -0
  130. package/dist/src/commands/logs.js +160 -0
  131. package/dist/src/commands/onboarding.js +382 -0
  132. package/dist/src/commands/pipeline.js +153 -0
  133. package/dist/src/commands/plan/display.js +216 -0
  134. package/dist/src/commands/plan/index.js +525 -0
  135. package/dist/src/commands/plugin.js +325 -0
  136. package/dist/src/commands/preview.js +356 -0
  137. package/dist/src/commands/profile.js +297 -0
  138. package/dist/src/commands/questionnaire.js +1021 -0
  139. package/dist/src/commands/resume.js +35 -0
  140. package/dist/src/commands/rollback.js +259 -0
  141. package/dist/src/commands/rollout.js +74 -0
  142. package/dist/src/commands/runbook.js +307 -0
  143. package/dist/src/commands/schedule.js +202 -0
  144. package/dist/src/commands/status.js +213 -0
  145. package/dist/src/commands/team/index.js +309 -0
  146. package/dist/src/commands/team-context.js +200 -0
  147. package/dist/src/commands/template.js +204 -0
  148. package/dist/src/commands/tf/index.js +989 -0
  149. package/dist/src/commands/upgrade.js +515 -0
  150. package/dist/src/commands/usage/index.js +118 -0
  151. package/dist/src/commands/version.js +145 -0
  152. package/dist/src/commands/watch.js +127 -0
  153. package/dist/src/compat/index.js +2 -0
  154. package/dist/src/compat/runtime.js +10 -0
  155. package/dist/src/compat/sqlite.js +144 -0
  156. package/dist/src/config/index.js +6 -0
  157. package/dist/src/config/manager.js +469 -0
  158. package/dist/src/config/mode-store.js +57 -0
  159. package/dist/src/config/profiles.js +66 -0
  160. package/dist/src/config/safety-policy.js +251 -0
  161. package/dist/src/config/schema.js +107 -0
  162. package/dist/src/config/types.js +311 -0
  163. package/dist/src/config/workspace-state.js +38 -0
  164. package/dist/src/context/context-db.js +138 -0
  165. package/dist/src/demo/index.js +295 -0
  166. package/dist/src/demo/scenarios/full-journey.js +226 -0
  167. package/dist/src/demo/scenarios/getting-started.js +124 -0
  168. package/dist/src/demo/scenarios/helm-release.js +334 -0
  169. package/dist/src/demo/scenarios/k8s-deployment.js +190 -0
  170. package/dist/src/demo/scenarios/terraform-vpc.js +167 -0
  171. package/dist/src/demo/types.js +6 -0
  172. package/dist/src/engine/cost-estimator.js +334 -0
  173. package/dist/src/engine/diagram-generator.js +192 -0
  174. package/dist/src/engine/drift-detector.js +688 -0
  175. package/dist/src/engine/executor.js +832 -0
  176. package/dist/src/engine/index.js +39 -0
  177. package/dist/src/engine/orchestrator.js +436 -0
  178. package/dist/src/engine/planner.js +616 -0
  179. package/dist/src/engine/safety.js +609 -0
  180. package/dist/src/engine/verifier.js +664 -0
  181. package/dist/src/enterprise/audit.js +241 -0
  182. package/dist/src/enterprise/auth.js +189 -0
  183. package/dist/src/enterprise/billing.js +512 -0
  184. package/dist/src/enterprise/index.js +16 -0
  185. package/dist/src/enterprise/teams.js +315 -0
  186. package/dist/src/generator/best-practices.js +1375 -0
  187. package/dist/src/generator/helm.js +495 -0
  188. package/dist/src/generator/index.js +11 -0
  189. package/dist/src/generator/intent-parser.js +420 -0
  190. package/dist/src/generator/kubernetes.js +773 -0
  191. package/dist/src/generator/terraform.js +1472 -0
  192. package/dist/src/history/index.js +6 -0
  193. package/dist/src/history/manager.js +199 -0
  194. package/dist/src/history/types.js +6 -0
  195. package/dist/src/hooks/config.js +318 -0
  196. package/dist/src/hooks/engine.js +317 -0
  197. package/dist/src/hooks/index.js +2 -0
  198. package/dist/src/llm/auth-bridge.js +157 -0
  199. package/dist/src/llm/circuit-breaker.js +116 -0
  200. package/dist/src/llm/config-loader.js +172 -0
  201. package/dist/src/llm/cost-calculator.js +137 -0
  202. package/dist/src/llm/index.js +7 -0
  203. package/dist/src/llm/model-aliases.js +99 -0
  204. package/dist/src/llm/provider-registry.js +57 -0
  205. package/dist/src/llm/providers/anthropic.js +430 -0
  206. package/dist/src/llm/providers/bedrock.js +409 -0
  207. package/dist/src/llm/providers/google.js +344 -0
  208. package/dist/src/llm/providers/ollama.js +661 -0
  209. package/dist/src/llm/providers/openai-compatible.js +289 -0
  210. package/dist/src/llm/providers/openai.js +284 -0
  211. package/dist/src/llm/providers/openrouter.js +293 -0
  212. package/dist/src/llm/router.js +844 -0
  213. package/dist/src/llm/types.js +69 -0
  214. package/dist/src/lsp/client.js +239 -0
  215. package/dist/src/lsp/languages.js +95 -0
  216. package/dist/src/lsp/manager.js +243 -0
  217. package/dist/src/mcp/client.js +289 -0
  218. package/dist/src/mcp/index.js +5 -0
  219. package/dist/src/mcp/manager.js +113 -0
  220. package/dist/src/nimbus.js +212 -0
  221. package/dist/src/plugins/index.js +13 -0
  222. package/dist/src/plugins/loader.js +280 -0
  223. package/dist/src/plugins/manager.js +282 -0
  224. package/dist/src/plugins/types.js +23 -0
  225. package/dist/src/scanners/cicd-scanner.js +230 -0
  226. package/dist/src/scanners/cloud-scanner.js +415 -0
  227. package/dist/src/scanners/framework-scanner.js +430 -0
  228. package/dist/src/scanners/iac-scanner.js +350 -0
  229. package/dist/src/scanners/index.js +454 -0
  230. package/dist/src/scanners/language-scanner.js +258 -0
  231. package/dist/src/scanners/package-manager-scanner.js +252 -0
  232. package/dist/src/scanners/types.js +6 -0
  233. package/dist/src/sessions/manager.js +395 -0
  234. package/dist/src/sessions/types.js +4 -0
  235. package/dist/src/sharing/sync.js +238 -0
  236. package/dist/src/sharing/viewer.js +131 -0
  237. package/dist/src/snapshots/index.js +1 -0
  238. package/dist/src/snapshots/manager.js +432 -0
  239. package/dist/src/state/artifacts.js +94 -0
  240. package/dist/src/state/audit.js +73 -0
  241. package/dist/src/state/billing.js +126 -0
  242. package/dist/src/state/checkpoints.js +81 -0
  243. package/dist/src/state/config.js +58 -0
  244. package/dist/src/state/conversations.js +7 -0
  245. package/dist/src/state/credentials.js +96 -0
  246. package/dist/src/state/db.js +53 -0
  247. package/dist/src/state/index.js +23 -0
  248. package/dist/src/state/messages.js +76 -0
  249. package/dist/src/state/projects.js +92 -0
  250. package/dist/src/state/schema.js +233 -0
  251. package/dist/src/state/sessions.js +79 -0
  252. package/dist/src/state/teams.js +131 -0
  253. package/dist/src/telemetry.js +91 -0
  254. package/dist/src/tools/aws-ops.js +747 -0
  255. package/dist/src/tools/azure-ops.js +491 -0
  256. package/dist/src/tools/file-ops.js +451 -0
  257. package/dist/src/tools/gcp-ops.js +559 -0
  258. package/dist/src/tools/git-ops.js +557 -0
  259. package/dist/src/tools/github-ops.js +460 -0
  260. package/dist/src/tools/helm-ops.js +634 -0
  261. package/dist/src/tools/index.js +16 -0
  262. package/dist/src/tools/k8s-ops.js +579 -0
  263. package/dist/src/tools/schemas/converter.js +129 -0
  264. package/dist/src/tools/schemas/devops.js +3319 -0
  265. package/dist/src/tools/schemas/index.js +19 -0
  266. package/dist/src/tools/schemas/standard.js +966 -0
  267. package/dist/src/tools/schemas/types.js +409 -0
  268. package/dist/src/tools/spawn-exec.js +109 -0
  269. package/dist/src/tools/terraform-ops.js +627 -0
  270. package/dist/src/types/config.js +1 -0
  271. package/dist/src/types/drift.js +4 -0
  272. package/dist/src/types/enterprise.js +5 -0
  273. package/dist/src/types/index.js +14 -0
  274. package/dist/src/types/plan.js +1 -0
  275. package/dist/src/types/request.js +1 -0
  276. package/dist/src/types/response.js +1 -0
  277. package/dist/src/types/service.js +1 -0
  278. package/dist/src/ui/App.js +1672 -0
  279. package/dist/src/ui/DeployPreview.js +60 -0
  280. package/dist/src/ui/FileDiffModal.js +108 -0
  281. package/dist/src/ui/Header.js +46 -0
  282. package/dist/src/ui/HelpModal.js +9 -0
  283. package/dist/src/ui/InputBox.js +408 -0
  284. package/dist/src/ui/MessageList.js +795 -0
  285. package/dist/src/ui/PermissionPrompt.js +72 -0
  286. package/dist/src/ui/StatusBar.js +109 -0
  287. package/dist/src/ui/TerminalPane.js +31 -0
  288. package/dist/src/ui/ToolCallDisplay.js +303 -0
  289. package/dist/src/ui/TreePane.js +83 -0
  290. package/dist/src/ui/chat-ui.js +721 -0
  291. package/dist/src/ui/index.js +11 -0
  292. package/dist/src/ui/ink/index.js +1325 -0
  293. package/dist/src/ui/streaming.js +137 -0
  294. package/dist/src/ui/theme.js +78 -0
  295. package/dist/src/ui/types.js +7 -0
  296. package/dist/src/utils/analytics.js +61 -0
  297. package/dist/src/utils/cost-warning.js +25 -0
  298. package/dist/src/utils/env.js +42 -0
  299. package/dist/src/utils/errors.js +54 -0
  300. package/dist/src/utils/event-bus.js +22 -0
  301. package/dist/src/utils/index.js +16 -0
  302. package/dist/src/utils/logger.js +150 -0
  303. package/dist/src/utils/rate-limiter.js +90 -0
  304. package/dist/src/utils/service-auth.js +36 -0
  305. package/dist/src/utils/validation.js +39 -0
  306. package/dist/src/version.js +3 -0
  307. package/dist/src/watcher/index.js +192 -0
  308. package/dist/src/wizard/approval.js +275 -0
  309. package/dist/src/wizard/index.js +13 -0
  310. package/dist/src/wizard/prompts.js +273 -0
  311. package/dist/src/wizard/types.js +4 -0
  312. package/dist/src/wizard/ui.js +453 -0
  313. package/dist/src/wizard/wizard.js +227 -0
  314. package/package.json +31 -23
  315. package/src/__tests__/alias.test.ts +133 -0
  316. package/src/__tests__/app.test.ts +1 -1
  317. package/src/__tests__/audit.test.ts +1 -1
  318. package/src/__tests__/circuit-breaker.test.ts +1 -1
  319. package/src/__tests__/cli-run.test.ts +237 -1
  320. package/src/__tests__/compat-sqlite.test.ts +68 -0
  321. package/src/__tests__/context-manager.test.ts +131 -1
  322. package/src/__tests__/context.test.ts +1 -1
  323. package/src/__tests__/devops-terminal-gaps.test.ts +718 -0
  324. package/src/__tests__/doctor.test.ts +48 -0
  325. package/src/__tests__/enterprise.test.ts +1 -1
  326. package/src/__tests__/export.test.ts +236 -0
  327. package/src/__tests__/gap-11-18-20.test.ts +958 -0
  328. package/src/__tests__/generator.test.ts +1 -1
  329. package/src/__tests__/helm-streaming.test.ts +127 -0
  330. package/src/__tests__/hooks.test.ts +1 -1
  331. package/src/__tests__/incident.test.ts +179 -0
  332. package/src/__tests__/init.test.ts +55 -4
  333. package/src/__tests__/intent-parser.test.ts +1 -1
  334. package/src/__tests__/llm-router.test.ts +1 -1
  335. package/src/__tests__/logs.test.ts +107 -0
  336. package/src/__tests__/loop-errors.test.ts +244 -0
  337. package/src/__tests__/lsp.test.ts +1 -1
  338. package/src/__tests__/modes.test.ts +1 -1
  339. package/src/__tests__/perf-optimizations.test.ts +847 -0
  340. package/src/__tests__/permissions.test.ts +1 -1
  341. package/src/__tests__/pipeline.test.ts +50 -0
  342. package/src/__tests__/polish-phase3.test.ts +340 -0
  343. package/src/__tests__/profile.test.ts +237 -0
  344. package/src/__tests__/rollback.test.ts +83 -0
  345. package/src/__tests__/runbook.test.ts +219 -0
  346. package/src/__tests__/schedule.test.ts +206 -0
  347. package/src/__tests__/serve.test.ts +1 -1
  348. package/src/__tests__/sessions.test.ts +96 -1
  349. package/src/__tests__/sharing.test.ts +53 -1
  350. package/src/__tests__/snapshots.test.ts +1 -1
  351. package/src/__tests__/standalone-migration.test.ts +199 -0
  352. package/src/__tests__/state-db.test.ts +1 -1
  353. package/src/__tests__/status.test.ts +158 -0
  354. package/src/__tests__/stream-with-tools.test.ts +71 -25
  355. package/src/__tests__/subagents.test.ts +1 -1
  356. package/src/__tests__/system-prompt.test.ts +82 -3
  357. package/src/__tests__/terminal-gap-v2.test.ts +395 -0
  358. package/src/__tests__/terminal-parity.test.ts +393 -0
  359. package/src/__tests__/tf-apply.test.ts +187 -0
  360. package/src/__tests__/tool-converter.test.ts +1 -1
  361. package/src/__tests__/tool-schemas.test.ts +209 -4
  362. package/src/__tests__/tools.test.ts +4 -3
  363. package/src/__tests__/version-json.test.ts +184 -0
  364. package/src/__tests__/version.test.ts +1 -1
  365. package/src/__tests__/watch.test.ts +129 -0
  366. package/src/agent/compaction-agent.ts +40 -1
  367. package/src/agent/context-manager.ts +67 -3
  368. package/src/agent/deploy-preview.ts +62 -1
  369. package/src/agent/expand-files.ts +108 -0
  370. package/src/agent/loop.ts +1312 -31
  371. package/src/agent/permissions.ts +51 -4
  372. package/src/agent/system-prompt.ts +573 -19
  373. package/src/app.ts +58 -0
  374. package/src/audit/security-scanner.ts +45 -0
  375. package/src/auth/keychain.ts +82 -0
  376. package/src/auth/oauth.ts +15 -5
  377. package/src/cli/init.ts +378 -5
  378. package/src/cli/run.ts +407 -16
  379. package/src/cli/serve.ts +78 -1
  380. package/src/cli/web.ts +10 -6
  381. package/src/cli.ts +312 -1
  382. package/src/clients/service-discovery.ts +30 -25
  383. package/src/commands/alias.ts +100 -0
  384. package/src/commands/audit/index.ts +121 -2
  385. package/src/commands/auth-cloud.ts +113 -0
  386. package/src/commands/auth-refresh.ts +187 -0
  387. package/src/commands/aws-discover.ts +144 -251
  388. package/src/commands/aws-terraform.ts +68 -118
  389. package/src/commands/chat.ts +9 -3
  390. package/src/commands/completions.ts +268 -0
  391. package/src/commands/config.ts +26 -0
  392. package/src/commands/cost/index.ts +218 -2
  393. package/src/commands/deploy.ts +260 -0
  394. package/src/commands/doctor.ts +744 -152
  395. package/src/commands/drift/index.ts +371 -23
  396. package/src/commands/export.ts +146 -0
  397. package/src/commands/generate-k8s.ts +9 -61
  398. package/src/commands/generate-terraform.ts +191 -449
  399. package/src/commands/help.ts +212 -36
  400. package/src/commands/history.ts +8 -1
  401. package/src/commands/incident.ts +166 -0
  402. package/src/commands/init.ts +5 -0
  403. package/src/commands/login.ts +86 -1
  404. package/src/commands/logs.ts +167 -0
  405. package/src/commands/onboarding.ts +211 -34
  406. package/src/commands/pipeline.ts +186 -0
  407. package/src/commands/plugin.ts +398 -0
  408. package/src/commands/profile.ts +342 -0
  409. package/src/commands/questionnaire.ts +0 -98
  410. package/src/commands/resume.ts +26 -34
  411. package/src/commands/rollback.ts +315 -0
  412. package/src/commands/rollout.ts +88 -0
  413. package/src/commands/runbook.ts +346 -0
  414. package/src/commands/schedule.ts +236 -0
  415. package/src/commands/status.ts +252 -0
  416. package/src/commands/team-context.ts +220 -0
  417. package/src/commands/template.ts +58 -57
  418. package/src/commands/tf/index.ts +70 -11
  419. package/src/commands/upgrade.ts +57 -0
  420. package/src/commands/version.ts +54 -50
  421. package/src/commands/watch.ts +153 -0
  422. package/src/compat/runtime.ts +1 -1
  423. package/src/compat/sqlite.ts +75 -5
  424. package/src/config/mode-store.ts +62 -0
  425. package/src/config/profiles.ts +84 -0
  426. package/src/config/types.ts +83 -1
  427. package/src/config/workspace-state.ts +53 -0
  428. package/src/engine/cost-estimator.ts +52 -10
  429. package/src/engine/executor.ts +33 -2
  430. package/src/engine/planner.ts +68 -1
  431. package/src/generator/terraform.ts +8 -0
  432. package/src/history/manager.ts +2 -74
  433. package/src/hooks/engine.ts +5 -4
  434. package/src/llm/cost-calculator.ts +2 -2
  435. package/src/llm/providers/anthropic.ts +50 -21
  436. package/src/llm/router.ts +76 -7
  437. package/src/lsp/languages.ts +3 -0
  438. package/src/lsp/manager.ts +21 -5
  439. package/src/nimbus.ts +37 -18
  440. package/src/sessions/manager.ts +108 -1
  441. package/src/sharing/sync.ts +4 -0
  442. package/src/sharing/viewer.ts +66 -0
  443. package/src/tools/file-ops.ts +22 -0
  444. package/src/tools/schemas/devops.ts +3007 -117
  445. package/src/tools/schemas/standard.ts +5 -1
  446. package/src/tools/schemas/types.ts +31 -1
  447. package/src/tools/spawn-exec.ts +148 -0
  448. package/src/ui/App.tsx +1183 -66
  449. package/src/ui/DeployPreview.tsx +62 -57
  450. package/src/ui/FileDiffModal.tsx +162 -0
  451. package/src/ui/Header.tsx +87 -24
  452. package/src/ui/HelpModal.tsx +57 -0
  453. package/src/ui/InputBox.tsx +163 -10
  454. package/src/ui/MessageList.tsx +487 -40
  455. package/src/ui/PermissionPrompt.tsx +17 -5
  456. package/src/ui/StatusBar.tsx +122 -3
  457. package/src/ui/TerminalPane.tsx +84 -0
  458. package/src/ui/ToolCallDisplay.tsx +252 -18
  459. package/src/ui/TreePane.tsx +132 -0
  460. package/src/ui/chat-ui.ts +41 -44
  461. package/src/ui/ink/index.ts +771 -38
  462. package/src/ui/streaming.ts +1 -1
  463. package/src/ui/theme.ts +104 -0
  464. package/src/ui/types.ts +18 -0
  465. package/src/version.ts +1 -1
  466. package/src/watcher/index.ts +66 -15
  467. package/src/wizard/types.ts +1 -0
  468. package/src/wizard/ui.ts +1 -1
  469. package/tsconfig.json +2 -2
@@ -0,0 +1,844 @@
1
+ /**
2
+ * LLM Router
3
+ * Routes requests to the appropriate provider based on model, cost optimization, and fallback logic.
4
+ *
5
+ * Refactored for the embedded Nimbus architecture. Key changes from the microservice version:
6
+ * - Imports providers from local ./providers/ directory
7
+ * - Integrates model alias resolution via resolveModelAlias
8
+ * - Integrates auto-detection via detectProvider
9
+ * - Supports OpenAI-compatible and Bedrock providers via env vars
10
+ * - persistUsage writes to the embedded SQLite usage table (fire-and-forget)
11
+ */
12
+ import { logger } from '../utils';
13
+ import { getTextContent, } from './types';
14
+ import { AnthropicProvider } from './providers/anthropic';
15
+ import { OpenAIProvider } from './providers/openai';
16
+ import { GoogleProvider } from './providers/google';
17
+ import { OllamaProvider } from './providers/ollama';
18
+ import { OpenRouterProvider } from './providers/openrouter';
19
+ import { OpenAICompatibleProvider } from './providers/openai-compatible';
20
+ import { BedrockProvider } from './providers/bedrock';
21
+ import { calculateCost } from './cost-calculator';
22
+ import { resolveModelAlias, stripProviderPrefix } from './model-aliases';
23
+ import { detectProvider } from './provider-registry';
24
+ import { ProviderCircuitBreaker } from './circuit-breaker';
25
+ export class LLMRouter {
26
+ providers;
27
+ config;
28
+ circuitBreaker = new ProviderCircuitBreaker();
29
+ /**
30
+ * Populated during streaming with fallback so callers (e.g. WebSocket)
31
+ * can inspect which provider ended up serving the stream. Reset on
32
+ * every call to routeStream / executeStreamWithFallback.
33
+ */
34
+ lastStreamFallbackMeta = null;
35
+ constructor(config) {
36
+ this.providers = new Map();
37
+ this.config = {
38
+ defaultProvider: config?.defaultProvider || process.env.DEFAULT_PROVIDER || 'anthropic',
39
+ defaultModel: config?.defaultModel || process.env.DEFAULT_MODEL || 'claude-sonnet-4-20250514',
40
+ costOptimization: {
41
+ enabled: config?.costOptimization?.enabled ?? process.env.ENABLE_COST_OPTIMIZATION === 'true',
42
+ cheapModelFor: config?.costOptimization?.cheapModelFor || [
43
+ 'simple_queries',
44
+ 'summarization',
45
+ 'classification',
46
+ 'explanations',
47
+ ],
48
+ expensiveModelFor: config?.costOptimization?.expensiveModelFor || [
49
+ 'code_generation',
50
+ 'complex_reasoning',
51
+ 'planning',
52
+ ],
53
+ cheapModel: config?.costOptimization?.cheapModel ||
54
+ process.env.CHEAP_MODEL ||
55
+ 'claude-haiku-4-20250514',
56
+ expensiveModel: config?.costOptimization?.expensiveModel ||
57
+ process.env.EXPENSIVE_MODEL ||
58
+ 'claude-opus-4-20250514',
59
+ },
60
+ fallback: {
61
+ enabled: config?.fallback?.enabled ?? process.env.DISABLE_FALLBACK !== 'true',
62
+ providers: config?.fallback?.providers ||
63
+ (process.env.FALLBACK_PROVIDERS?.split(',') ?? [
64
+ 'anthropic',
65
+ 'openai',
66
+ 'openrouter',
67
+ 'google',
68
+ ]),
69
+ },
70
+ };
71
+ this.initializeProviders();
72
+ }
73
+ /**
74
+ * Initialize all available providers based on API keys, auth.json, and environment variables.
75
+ *
76
+ * Resolution order per provider:
77
+ * 1. auth.json (~/.nimbus/auth.json) via the auth-bridge
78
+ * 2. Environment variables (ANTHROPIC_API_KEY, etc.)
79
+ */
80
+ initializeProviders() {
81
+ // Lazy-import the auth-bridge to avoid circular deps at module level
82
+ let isConfigured;
83
+ let getApiKey;
84
+ try {
85
+ // eslint-disable-next-line @typescript-eslint/no-var-requires
86
+ const bridge = require('./auth-bridge');
87
+ isConfigured = bridge.isProviderConfigured;
88
+ getApiKey = bridge.getProviderApiKey;
89
+ }
90
+ catch (err) {
91
+ // Auth-bridge unavailable (open-source build) — fall back to env-only
92
+ logger.debug('Auth-bridge unavailable, using environment variables only:', err instanceof Error ? err.message : String(err));
93
+ isConfigured = () => false;
94
+ getApiKey = () => undefined;
95
+ }
96
+ // Anthropic
97
+ if (process.env.ANTHROPIC_API_KEY || isConfigured('anthropic')) {
98
+ this.providers.set('anthropic', new AnthropicProvider());
99
+ logger.info('Initialized Anthropic provider');
100
+ }
101
+ // OpenAI
102
+ if (process.env.OPENAI_API_KEY || isConfigured('openai')) {
103
+ this.providers.set('openai', new OpenAIProvider());
104
+ logger.info('Initialized OpenAI provider');
105
+ }
106
+ // Google
107
+ if (process.env.GOOGLE_API_KEY || isConfigured('google')) {
108
+ this.providers.set('google', new GoogleProvider());
109
+ logger.info('Initialized Google provider');
110
+ }
111
+ // OpenRouter
112
+ if (process.env.OPENROUTER_API_KEY || isConfigured('openrouter')) {
113
+ this.providers.set('openrouter', new OpenRouterProvider());
114
+ logger.info('Initialized OpenRouter provider');
115
+ }
116
+ // Ollama (only if explicitly configured via auth.json or env var)
117
+ if (process.env.OLLAMA_BASE_URL || isConfigured('ollama')) {
118
+ this.providers.set('ollama', new OllamaProvider());
119
+ logger.info('Initialized Ollama provider');
120
+ }
121
+ // AWS Bedrock (uses IAM credentials from environment / instance profile)
122
+ if (process.env.AWS_BEDROCK_ENABLED === 'true' ||
123
+ process.env.AWS_REGION ||
124
+ isConfigured('bedrock') ||
125
+ (process.env.AWS_ACCESS_KEY_ID && process.env.AWS_SECRET_ACCESS_KEY)) {
126
+ this.providers.set('bedrock', new BedrockProvider());
127
+ logger.info('Initialized AWS Bedrock provider');
128
+ }
129
+ // Groq (OpenAI-compatible)
130
+ const groqKey = process.env.GROQ_API_KEY || getApiKey('groq');
131
+ if (groqKey) {
132
+ this.providers.set('groq', new OpenAICompatibleProvider({
133
+ name: 'groq',
134
+ apiKey: groqKey,
135
+ baseURL: 'https://api.groq.com/openai/v1',
136
+ defaultModel: 'llama-3.1-70b-versatile',
137
+ }));
138
+ logger.info('Initialized Groq provider (OpenAI-compatible)');
139
+ }
140
+ // Together AI (OpenAI-compatible)
141
+ const togetherKey = process.env.TOGETHER_API_KEY || getApiKey('together');
142
+ if (togetherKey) {
143
+ this.providers.set('together', new OpenAICompatibleProvider({
144
+ name: 'together',
145
+ apiKey: togetherKey,
146
+ baseURL: 'https://api.together.xyz/v1',
147
+ defaultModel: 'meta-llama/Llama-3.1-70B-Instruct-Turbo',
148
+ }));
149
+ logger.info('Initialized Together AI provider (OpenAI-compatible)');
150
+ }
151
+ // DeepSeek (OpenAI-compatible)
152
+ const deepseekKey = process.env.DEEPSEEK_API_KEY || getApiKey('deepseek');
153
+ if (deepseekKey) {
154
+ this.providers.set('deepseek', new OpenAICompatibleProvider({
155
+ name: 'deepseek',
156
+ apiKey: deepseekKey,
157
+ baseURL: 'https://api.deepseek.com/v1',
158
+ defaultModel: 'deepseek-chat',
159
+ }));
160
+ logger.info('Initialized DeepSeek provider (OpenAI-compatible)');
161
+ }
162
+ // Fireworks AI (OpenAI-compatible)
163
+ const fireworksKey = process.env.FIREWORKS_API_KEY || getApiKey('fireworks');
164
+ if (fireworksKey) {
165
+ this.providers.set('fireworks', new OpenAICompatibleProvider({
166
+ name: 'fireworks',
167
+ apiKey: fireworksKey,
168
+ baseURL: 'https://api.fireworks.ai/inference/v1',
169
+ defaultModel: 'accounts/fireworks/models/llama-v3p1-70b-instruct',
170
+ }));
171
+ logger.info('Initialized Fireworks AI provider (OpenAI-compatible)');
172
+ }
173
+ // Perplexity (OpenAI-compatible)
174
+ const perplexityKey = process.env.PERPLEXITY_API_KEY || getApiKey('perplexity');
175
+ if (perplexityKey) {
176
+ this.providers.set('perplexity', new OpenAICompatibleProvider({
177
+ name: 'perplexity',
178
+ apiKey: perplexityKey,
179
+ baseURL: 'https://api.perplexity.ai',
180
+ defaultModel: 'llama-3.1-sonar-large-128k-online',
181
+ }));
182
+ logger.info('Initialized Perplexity provider (OpenAI-compatible)');
183
+ }
184
+ }
185
+ /**
186
+ * Get the names of all initialized providers.
187
+ */
188
+ getAvailableProviders() {
189
+ return [...this.providers.keys()];
190
+ }
191
+ /**
192
+ * Get the names of providers whose circuit breakers are currently OPEN
193
+ * (i.e. temporarily disabled due to consecutive failures).
194
+ */
195
+ getDisabledProviders() {
196
+ return this.circuitBreaker.getOpenCircuits();
197
+ }
198
+ /**
199
+ * Register a custom provider
200
+ */
201
+ registerProvider(provider) {
202
+ this.providers.set(provider.name, provider);
203
+ logger.info(`Registered custom provider: ${provider.name}`);
204
+ }
205
+ /**
206
+ * Route a completion request to the appropriate provider
207
+ */
208
+ async route(request, taskType) {
209
+ // Resolve model alias before routing
210
+ if (request.model) {
211
+ request.model = resolveModelAlias(request.model);
212
+ }
213
+ const provider = this.selectProvider(request, taskType);
214
+ // Strip provider prefix after routing (APIs expect model ID without prefix)
215
+ if (request.model) {
216
+ request.model = stripProviderPrefix(request.model);
217
+ }
218
+ // Enforce token budget
219
+ this.enforceTokenBudget(request);
220
+ if (!provider) {
221
+ throw new Error('No LLM provider available. Run `nimbus login` to configure a provider, or set an API key via environment variable (e.g. ANTHROPIC_API_KEY).');
222
+ }
223
+ let response;
224
+ if (this.config.fallback.enabled) {
225
+ response = await this.executeWithFallback(provider, request);
226
+ }
227
+ else {
228
+ response = await provider.complete(request);
229
+ }
230
+ // Attach per-request cost calculation
231
+ const cost = this.computeCost(provider.name, response);
232
+ response.cost = cost;
233
+ // Persist usage (fire-and-forget)
234
+ if (response.usage) {
235
+ this.persistUsage(response.usage, response.model, provider.name, cost);
236
+ }
237
+ return response;
238
+ }
239
+ /**
240
+ * Route a streaming completion request.
241
+ * Collects token usage from the final chunk and persists cost data
242
+ * after the stream completes (fire-and-forget, same as route()).
243
+ */
244
+ async *routeStream(request, taskType) {
245
+ // Resolve model alias before routing
246
+ if (request.model) {
247
+ request.model = resolveModelAlias(request.model);
248
+ }
249
+ // Capture `this` and config references before yield points.
250
+ // TypeScript strict mode narrows `this` to `never` after yield in
251
+ // async generators, so all post-yield access goes through locals.
252
+ const self = this;
253
+ const defaultModel = self.config.defaultModel;
254
+ const provider = self.selectProvider(request, taskType);
255
+ // Strip provider prefix after routing (APIs expect model ID without prefix)
256
+ if (request.model) {
257
+ request.model = stripProviderPrefix(request.model);
258
+ }
259
+ // Enforce token budget
260
+ self.enforceTokenBudget(request);
261
+ if (!provider) {
262
+ throw new Error('No LLM provider available. Run `nimbus login` to configure a provider, or set an API key via environment variable (e.g. ANTHROPIC_API_KEY).');
263
+ }
264
+ // Reset fallback metadata
265
+ self.lastStreamFallbackMeta = null;
266
+ const stream = self.config.fallback.enabled
267
+ ? self.executeStreamWithFallback(provider, request)
268
+ : provider.stream(request);
269
+ let totalContent = '';
270
+ let lastUsage;
271
+ for await (const chunk of stream) {
272
+ if (chunk.content) {
273
+ totalContent += chunk.content;
274
+ }
275
+ if (chunk.usage) {
276
+ lastUsage = chunk.usage;
277
+ }
278
+ yield chunk;
279
+ }
280
+ // Determine which provider actually served the stream.
281
+ // Use type assertion because TS control-flow analysis incorrectly
282
+ // narrows lastStreamFallbackMeta to `null` -- it was mutated by
283
+ // executeStreamWithFallback during iteration above.
284
+ const fallbackMeta = self.lastStreamFallbackMeta;
285
+ const activeProviderName = fallbackMeta?.activeProvider ?? provider.name;
286
+ // Track cost after stream completes
287
+ if (lastUsage) {
288
+ const model = request.model || defaultModel;
289
+ const cost = calculateCost(activeProviderName, model, lastUsage.promptTokens, lastUsage.completionTokens);
290
+ self.persistUsage(lastUsage, model, activeProviderName, cost);
291
+ }
292
+ else {
293
+ // Estimate tokens from content length if no usage data
294
+ const estimatedOutputTokens = Math.ceil(totalContent.length / 4);
295
+ const estimatedInputTokens = request.messages.reduce((sum, m) => sum + Math.ceil(getTextContent(m.content).length / 4), 0);
296
+ const model = request.model || defaultModel;
297
+ const cost = calculateCost(activeProviderName, model, estimatedInputTokens, estimatedOutputTokens);
298
+ self.persistUsage({
299
+ promptTokens: estimatedInputTokens,
300
+ completionTokens: estimatedOutputTokens,
301
+ totalTokens: estimatedInputTokens + estimatedOutputTokens,
302
+ }, model, activeProviderName, cost);
303
+ }
304
+ }
305
+ /**
306
+ * Route a streaming tool completion request.
307
+ * Text chunks are yielded incrementally; tool calls arrive on the final
308
+ * chunk. Falls back to non-streaming completeWithTools when the selected
309
+ * provider doesn't support streamWithTools.
310
+ */
311
+ async *routeStreamWithTools(request, taskType) {
312
+ // Resolve model alias before routing
313
+ if (request.model) {
314
+ request.model = resolveModelAlias(request.model);
315
+ }
316
+ const self = this;
317
+ const defaultModel = self.config.defaultModel;
318
+ const provider = self.selectProvider(request, taskType);
319
+ // Strip provider prefix after routing
320
+ if (request.model) {
321
+ request.model = stripProviderPrefix(request.model);
322
+ }
323
+ self.enforceTokenBudget(request);
324
+ if (!provider) {
325
+ throw new Error('No LLM provider available. Run `nimbus login` to configure a provider, or set an API key via environment variable (e.g. ANTHROPIC_API_KEY).');
326
+ }
327
+ // Use native streaming-with-tools if providers support it
328
+ if (provider.streamWithTools && self.config.fallback.enabled) {
329
+ // Try primary provider first, then fallbacks
330
+ const fallbackProviders = self.config.fallback.providers
331
+ .map(name => self.providers.get(name))
332
+ .filter(Boolean);
333
+ const allProviders = [provider, ...fallbackProviders.filter(p => p !== provider)];
334
+ for (const p of allProviders) {
335
+ if (!p.streamWithTools || !self.circuitBreaker.isAvailable(p.name)) {
336
+ continue;
337
+ }
338
+ try {
339
+ let lastUsage;
340
+ // Yield each chunk immediately (no buffering) for real-time streaming UX.
341
+ for await (const chunk of p.streamWithTools(request)) {
342
+ if (chunk.usage) {
343
+ lastUsage = chunk.usage;
344
+ }
345
+ yield chunk;
346
+ }
347
+ // Record success after the `done: true` chunk has been received and yielded.
348
+ self.circuitBreaker.recordSuccess(p.name);
349
+ if (lastUsage) {
350
+ const model = request.model || defaultModel;
351
+ const cost = calculateCost(p.name, model, lastUsage.promptTokens, lastUsage.completionTokens);
352
+ self.persistUsage(lastUsage, model, p.name, cost);
353
+ }
354
+ return;
355
+ }
356
+ catch (error) {
357
+ self.circuitBreaker.recordFailure(p.name);
358
+ logger.warn(`Provider ${p.name} failed for streamWithTools, trying fallback...`, {
359
+ error,
360
+ });
361
+ continue;
362
+ }
363
+ }
364
+ // If all providers with streamWithTools failed, fall through to non-streaming fallback below
365
+ }
366
+ else if (provider.streamWithTools) {
367
+ // Fallback disabled — use provider directly
368
+ let lastUsage;
369
+ for await (const chunk of provider.streamWithTools(request)) {
370
+ if (chunk.usage) {
371
+ lastUsage = chunk.usage;
372
+ }
373
+ yield chunk;
374
+ }
375
+ if (lastUsage) {
376
+ const model = request.model || defaultModel;
377
+ const cost = calculateCost(provider.name, model, lastUsage.promptTokens, lastUsage.completionTokens);
378
+ self.persistUsage(lastUsage, model, provider.name, cost);
379
+ }
380
+ return;
381
+ }
382
+ // Fallback: non-streaming completeWithTools, yield result as a single chunk
383
+ const response = await provider.completeWithTools(request);
384
+ const cost = self.computeCost(provider.name, response);
385
+ response.cost = cost;
386
+ if (response.usage) {
387
+ self.persistUsage(response.usage, response.model, provider.name, cost);
388
+ }
389
+ if (response.content) {
390
+ yield { content: response.content, done: false };
391
+ }
392
+ yield {
393
+ done: true,
394
+ toolCalls: response.toolCalls,
395
+ usage: response.usage,
396
+ };
397
+ }
398
+ /**
399
+ * Route a tool completion request
400
+ */
401
+ async routeWithTools(request, taskType) {
402
+ // Resolve model alias before routing
403
+ if (request.model) {
404
+ request.model = resolveModelAlias(request.model);
405
+ }
406
+ const provider = this.selectProvider(request, taskType);
407
+ // Strip provider prefix after routing (APIs expect model ID without prefix)
408
+ if (request.model) {
409
+ request.model = stripProviderPrefix(request.model);
410
+ }
411
+ // Enforce token budget
412
+ this.enforceTokenBudget(request);
413
+ if (!provider) {
414
+ throw new Error('No LLM provider available. Run `nimbus login` to configure a provider, or set an API key via environment variable (e.g. ANTHROPIC_API_KEY).');
415
+ }
416
+ let response;
417
+ if (this.config.fallback.enabled) {
418
+ response = await this.executeToolsWithFallback(provider, request);
419
+ }
420
+ else {
421
+ response = await provider.completeWithTools(request);
422
+ }
423
+ // Attach per-request cost calculation
424
+ const cost = this.computeCost(provider.name, response);
425
+ response.cost = cost;
426
+ // Persist usage (fire-and-forget)
427
+ if (response.usage) {
428
+ this.persistUsage(response.usage, response.model, provider.name, cost);
429
+ }
430
+ return response;
431
+ }
432
+ /**
433
+ * Get list of available models across all providers
434
+ */
435
+ async getAvailableModels() {
436
+ const models = {};
437
+ const entries = Array.from(this.providers.entries());
438
+ const results = await Promise.allSettled(entries.map(async ([name, provider]) => {
439
+ const providerModels = await provider.listModels();
440
+ return { name, models: providerModels };
441
+ }));
442
+ for (const result of results) {
443
+ if (result.status === 'fulfilled') {
444
+ models[result.value.name] = result.value.models;
445
+ }
446
+ }
447
+ return models;
448
+ }
449
+ /**
450
+ * Get provider information including availability and models.
451
+ * Each registered provider is queried for its model list. If the query
452
+ * succeeds the provider is marked available; otherwise it is marked
453
+ * unavailable with an empty model list.
454
+ */
455
+ async getProviders() {
456
+ const entries = Array.from(this.providers.entries());
457
+ const results = await Promise.allSettled(entries.map(async ([name, provider]) => {
458
+ const models = await provider.listModels();
459
+ return { name, available: true, models };
460
+ }));
461
+ const providers = [];
462
+ for (let i = 0; i < results.length; i++) {
463
+ const result = results[i];
464
+ if (result.status === 'fulfilled') {
465
+ providers.push(result.value);
466
+ }
467
+ else {
468
+ providers.push({ name: entries[i][0], available: false, models: [] });
469
+ }
470
+ }
471
+ return providers;
472
+ }
473
+ /**
474
+ * Select the appropriate provider based on request and task type
475
+ */
476
+ selectProvider(request, taskType) {
477
+ // If model explicitly specified, use its provider
478
+ if (request.model) {
479
+ const providerName = this.getProviderForModel(request.model);
480
+ const provider = this.providers.get(providerName);
481
+ if (provider) {
482
+ logger.info(`Selected ${providerName} provider for model ${request.model}`);
483
+ return provider;
484
+ }
485
+ }
486
+ // Cost optimization
487
+ if (this.config.costOptimization.enabled && taskType) {
488
+ if (this.config.costOptimization.cheapModelFor.includes(taskType)) {
489
+ const cheapModel = this.config.costOptimization.cheapModel;
490
+ const provider = this.getProviderForModel(cheapModel)
491
+ ? this.providers.get(this.getProviderForModel(cheapModel)) || this.getCheapProvider()
492
+ : this.getCheapProvider();
493
+ if (provider) {
494
+ if (!request.model) {
495
+ request.model = cheapModel;
496
+ }
497
+ logger.info(`Selected cheap provider ${provider.name} with model ${request.model} for task type: ${taskType}`);
498
+ return provider;
499
+ }
500
+ }
501
+ if (this.config.costOptimization.expensiveModelFor.includes(taskType)) {
502
+ const expensiveModel = this.config.costOptimization.expensiveModel;
503
+ const provider = this.getProviderForModel(expensiveModel)
504
+ ? this.providers.get(this.getProviderForModel(expensiveModel)) ||
505
+ this.getExpensiveProvider()
506
+ : this.getExpensiveProvider();
507
+ if (provider) {
508
+ if (!request.model) {
509
+ request.model = expensiveModel;
510
+ }
511
+ logger.info(`Selected expensive provider ${provider.name} with model ${request.model} for task type: ${taskType}`);
512
+ return provider;
513
+ }
514
+ }
515
+ }
516
+ // Default provider
517
+ const defaultProvider = this.providers.get(this.config.defaultProvider);
518
+ if (defaultProvider) {
519
+ logger.info(`Using default provider: ${this.config.defaultProvider}`);
520
+ return defaultProvider;
521
+ }
522
+ // Fallback to any available provider
523
+ const firstAvailable = Array.from(this.providers.values())[0];
524
+ if (firstAvailable) {
525
+ logger.warn(`No default provider, using first available: ${firstAvailable.name}`);
526
+ return firstAvailable;
527
+ }
528
+ return null;
529
+ }
530
+ /**
531
+ * Check whether an error is a rate-limit (429) or server error (5xx)
532
+ * that should be retried with backoff before falling through.
533
+ */
534
+ static isRetryableError(error) {
535
+ if (error && typeof error === 'object') {
536
+ const errObj = error;
537
+ const status = (typeof errObj.status === 'number' ? errObj.status : undefined) ??
538
+ (typeof errObj.statusCode === 'number' ? errObj.statusCode : undefined);
539
+ if (status !== undefined && (status === 429 || (status >= 500 && status < 600))) {
540
+ return true;
541
+ }
542
+ const msg = typeof errObj.message === 'string' ? errObj.message : '';
543
+ if (/rate.?limit|429|too many requests|overloaded|503/i.test(msg)) {
544
+ return true;
545
+ }
546
+ }
547
+ return false;
548
+ }
549
+ /**
550
+ * Execute an async function with retry + exponential backoff for rate limits.
551
+ * Retries up to `maxRetries` times with delays of 1s, 2s, 4s, ...
552
+ */
553
+ async withRetry(fn, maxRetries = 3) {
554
+ let lastError;
555
+ for (let attempt = 0; attempt <= maxRetries; attempt++) {
556
+ try {
557
+ return await fn();
558
+ }
559
+ catch (error) {
560
+ lastError = error;
561
+ if (attempt < maxRetries && LLMRouter.isRetryableError(error)) {
562
+ const delay = Math.min(1000 * Math.pow(2, attempt), 8000);
563
+ const jitter = Math.random() * 500;
564
+ logger.info(`Rate limited — retrying in ${Math.round(delay + jitter)}ms (attempt ${attempt + 1}/${maxRetries})`);
565
+ await new Promise(resolve => setTimeout(resolve, delay + jitter));
566
+ continue;
567
+ }
568
+ throw error;
569
+ }
570
+ }
571
+ throw lastError;
572
+ }
573
+ /**
574
+ * Execute request with fallback logic
575
+ */
576
+ async executeWithFallback(primaryProvider, request) {
577
+ const fallbackProviders = this.config.fallback.providers
578
+ .map(name => this.providers.get(name))
579
+ .filter(Boolean);
580
+ const allProviders = [primaryProvider, ...fallbackProviders.filter(p => p !== primaryProvider)];
581
+ for (const provider of allProviders) {
582
+ if (!this.circuitBreaker.isAvailable(provider.name)) {
583
+ logger.info(`Skipping ${provider.name} (circuit open)`);
584
+ continue;
585
+ }
586
+ try {
587
+ logger.info(`Attempting request with ${provider.name}`);
588
+ const result = await this.withRetry(() => provider.complete(request));
589
+ this.circuitBreaker.recordSuccess(provider.name);
590
+ return result;
591
+ }
592
+ catch (error) {
593
+ this.circuitBreaker.recordFailure(provider.name);
594
+ logger.warn(`Provider ${provider.name} failed, trying fallback...`, { error });
595
+ continue;
596
+ }
597
+ }
598
+ throw new Error('All LLM providers failed. Check your API keys and network connection, or try a different provider.');
599
+ }
600
+ /**
601
+ * Execute tool request with fallback logic
602
+ */
603
+ async executeToolsWithFallback(primaryProvider, request) {
604
+ const fallbackProviders = this.config.fallback.providers
605
+ .map(name => this.providers.get(name))
606
+ .filter(Boolean);
607
+ const allProviders = [primaryProvider, ...fallbackProviders.filter(p => p !== primaryProvider)];
608
+ for (const provider of allProviders) {
609
+ if (!this.circuitBreaker.isAvailable(provider.name)) {
610
+ logger.info(`Skipping ${provider.name} for tool request (circuit open)`);
611
+ continue;
612
+ }
613
+ try {
614
+ logger.info(`Attempting tool request with ${provider.name}`);
615
+ const result = await this.withRetry(() => provider.completeWithTools(request));
616
+ this.circuitBreaker.recordSuccess(provider.name);
617
+ return result;
618
+ }
619
+ catch (error) {
620
+ this.circuitBreaker.recordFailure(provider.name);
621
+ logger.warn(`Provider ${provider.name} failed for tool request, trying fallback...`, {
622
+ error,
623
+ });
624
+ continue;
625
+ }
626
+ }
627
+ throw new Error('All LLM providers failed for tool request. Check your API keys and network connection, or try a different provider.');
628
+ }
629
+ /**
630
+ * Execute streaming request with fallback logic.
631
+ *
632
+ * Handles two failure modes:
633
+ * 1. Provider fails before producing any chunks (e.g. auth error, rate limit) --
634
+ * immediately falls through to the next provider.
635
+ * 2. Provider fails mid-stream (partial chunks already buffered) -- discards
636
+ * the partial output and starts fresh with the next provider.
637
+ *
638
+ * Chunks are buffered internally per-provider attempt. Only once a provider
639
+ * completes its full stream successfully are the buffered chunks yielded to
640
+ * the caller. This prevents the caller from receiving a garbled mix of
641
+ * partial responses from multiple providers.
642
+ */
643
+ async *executeStreamWithFallback(primaryProvider, request) {
644
+ // Capture `this` for use across yield points
645
+ const self = this;
646
+ const fallbackProviders = self.config.fallback.providers
647
+ .map(name => self.providers.get(name))
648
+ .filter(Boolean);
649
+ const allProviders = [primaryProvider, ...fallbackProviders.filter(p => p !== primaryProvider)];
650
+ let failedProvider;
651
+ for (const provider of allProviders) {
652
+ if (!self.circuitBreaker.isAvailable(provider.name)) {
653
+ logger.info(`Skipping ${provider.name} for stream (circuit open)`);
654
+ continue;
655
+ }
656
+ const bufferedChunks = [];
657
+ let streamCompleted = false;
658
+ try {
659
+ logger.info(`Attempting stream with ${provider.name}`);
660
+ for await (const chunk of provider.stream(request)) {
661
+ bufferedChunks.push(chunk);
662
+ if (chunk.done) {
663
+ streamCompleted = true;
664
+ }
665
+ }
666
+ // If we got here the stream completed without throwing.
667
+ // Even if there was no explicit done=true chunk we treat
668
+ // exhausting the iterator as success.
669
+ streamCompleted = true;
670
+ self.circuitBreaker.recordSuccess(provider.name);
671
+ }
672
+ catch (error) {
673
+ self.circuitBreaker.recordFailure(provider.name);
674
+ const partialChunkCount = bufferedChunks.length;
675
+ logger.warn(`Provider ${provider.name} failed for stream after ${partialChunkCount} chunk(s), trying fallback...`, { error });
676
+ failedProvider = provider.name;
677
+ // Discard buffered chunks from the failed provider and try next
678
+ continue;
679
+ }
680
+ if (streamCompleted) {
681
+ // Record which provider served the response
682
+ self.lastStreamFallbackMeta = {
683
+ activeProvider: provider.name,
684
+ failedProvider,
685
+ isFallback: !!failedProvider,
686
+ };
687
+ if (failedProvider) {
688
+ logger.info(`Stream fallback: ${failedProvider} -> ${provider.name} (${bufferedChunks.length} chunks)`);
689
+ }
690
+ // Yield all buffered chunks to the caller
691
+ for (const chunk of bufferedChunks) {
692
+ yield chunk;
693
+ }
694
+ return;
695
+ }
696
+ }
697
+ throw new Error('All LLM providers failed for streaming request. Check your API keys and network connection, or try a different provider.');
698
+ }
699
+ /**
700
+ * Compute cost for a response using the cost calculator
701
+ */
702
+ computeCost(providerName, response) {
703
+ return calculateCost(providerName, response.model, response.usage.promptTokens, response.usage.completionTokens);
704
+ }
705
+ /**
706
+ * Get provider name for a specific model.
707
+ * Uses the detectProvider utility for auto-detection.
708
+ */
709
+ getProviderForModel(model) {
710
+ const detected = detectProvider(model);
711
+ // If the detected provider is registered, use it
712
+ if (this.providers.has(detected)) {
713
+ return detected;
714
+ }
715
+ // For models with "/" prefix that could be OpenRouter
716
+ if (model.includes('/') && this.providers.has('openrouter')) {
717
+ return 'openrouter';
718
+ }
719
+ return this.config.defaultProvider;
720
+ }
721
+ /**
722
+ * Get the cheapest available provider
723
+ */
724
+ getCheapProvider() {
725
+ // Prefer Ollama (free) > Haiku > GPT-4o-mini
726
+ return (this.providers.get('ollama') ||
727
+ this.providers.get('anthropic') || // Will use Haiku in practice
728
+ this.providers.get('openai') || // Will use gpt-4o-mini in practice
729
+ null);
730
+ }
731
+ /**
732
+ * Persist token usage to the embedded SQLite state layer (fire-and-forget).
733
+ *
734
+ * Inserts a row into the `usage` table with token counts, cost, and metadata.
735
+ * Failures are logged but never propagated -- persistence is non-critical and
736
+ * must not break the LLM request path.
737
+ */
738
+ persistUsage(usage, model, provider, cost) {
739
+ try {
740
+ // Lazy import to avoid circular dependency between llm/ and state/
741
+ import('../state/db')
742
+ .then(({ getDb }) => {
743
+ try {
744
+ const db = getDb();
745
+ const id = crypto.randomUUID();
746
+ const metadata = JSON.stringify({
747
+ model: model ?? null,
748
+ provider: provider ?? null,
749
+ prompt_tokens: usage.promptTokens,
750
+ completion_tokens: usage.completionTokens,
751
+ });
752
+ db.run(`INSERT INTO usage (id, type, quantity, unit, cost_usd, metadata)
753
+ VALUES (?, ?, ?, ?, ?, ?)`, [id, 'llm_call', usage.totalTokens, 'tokens', cost?.costUSD ?? 0, metadata]);
754
+ }
755
+ catch (err) {
756
+ logger.debug('Failed to persist LLM usage to SQLite', { error: err });
757
+ }
758
+ })
759
+ .catch(err => {
760
+ logger.debug('Failed to import state/db for usage persistence', { error: err });
761
+ });
762
+ }
763
+ catch (err) {
764
+ logger.debug('Unexpected error in persistUsage', { error: err });
765
+ }
766
+ }
767
+ /**
768
+ * Get the most capable (expensive) provider
769
+ */
770
+ getExpensiveProvider() {
771
+ // Prefer Claude Opus/Sonnet > GPT-4o > Gemini Pro
772
+ return (this.providers.get('anthropic') ||
773
+ this.providers.get('openai') ||
774
+ this.providers.get('google') ||
775
+ null);
776
+ }
777
+ /**
778
+ * Enforce token budget on a request
779
+ */
780
+ enforceTokenBudget(request) {
781
+ const maxTokens = this.config.tokenBudget?.maxTokensPerRequest || 32768;
782
+ request.maxTokens = Math.min(request.maxTokens || 4096, maxTokens);
783
+ }
784
+ }
785
+ // ---------------------------------------------------------------------------
786
+ // Gap 6: List authenticated providers for /model command
787
+ // ---------------------------------------------------------------------------
788
/**
 * Return the names of providers that have credentials present in the
 * environment.
 *
 * Only environment variables are inspected; keys saved in the auth store are
 * not consulted here. A provider is listed when at least one of its variables
 * is set to a non-empty value. The value itself is not validated.
 *
 * @returns {string[]} Provider names in a fixed order: anthropic, openai,
 *   google, groq, openrouter, bedrock, together, deepseek, fireworks, perplexity.
 */
export function listAuthenticatedProviders() {
    // Each provider maps to the env vars that count as credentials for it.
    // The OpenAI-compatible providers (together, deepseek, fireworks,
    // perplexity) are appended after the original six so the relative order
    // of the earlier names is unchanged.
    const credentialEnvVars = [
        ['anthropic', ['ANTHROPIC_API_KEY']],
        ['openai', ['OPENAI_API_KEY']],
        ['google', ['GOOGLE_API_KEY', 'GOOGLE_GENERATIVE_AI_API_KEY']],
        ['groq', ['GROQ_API_KEY']],
        ['openrouter', ['OPENROUTER_API_KEY']],
        ['bedrock', ['AWS_ACCESS_KEY_ID', 'AWS_PROFILE']],
        ['together', ['TOGETHER_API_KEY']],
        ['deepseek', ['DEEPSEEK_API_KEY']],
        ['fireworks', ['FIREWORKS_API_KEY']],
        ['perplexity', ['PERPLEXITY_API_KEY']],
    ];
    return credentialEnvVars
        .filter(([, envVars]) => envVars.some(envVar => Boolean(process.env[envVar])))
        .map(([providerName]) => providerName);
}
808
/**
 * Bucket a user message into 'simple', 'moderate' or 'complex'.
 *
 * - 'simple': under 200 characters and opening with a status/list/describe
 *   style verb (list, show, get, check, ...). This check runs first.
 * - 'complex': over 500 characters, or containing a heavy-work keyword
 *   (implement, design, refactor, debug, ...).
 * - 'moderate': anything else.
 *
 * @param {string} message - Raw user message.
 * @returns {'simple'|'moderate'|'complex'} The complexity bucket.
 */
export function classifyTaskComplexity(message) {
    const simpleOpener = /^(list|show|get|check|status|what is|what are|describe|which|where|who|ping|echo)\b/;
    const heavyKeyword = /\b(implement|design|architect|refactor|migrate|rewrite|build|create|scaffold|generate|optimize|debug|diagnose|analyze)\b/;
    // Patterns run against the lower-cased, trimmed text; the length limits
    // use the raw message.
    const normalized = message.toLowerCase().trim();
    const charCount = message.length;
    if (charCount < 200 && simpleOpener.test(normalized)) {
        return 'simple';
    }
    const needsHeavyReasoning = charCount > 500 || heavyKeyword.test(normalized);
    return needsHeavyReasoning ? 'complex' : 'moderate';
}
829
/**
 * Pick the model string for a complexity level.
 *
 * A truthy `preferredModel` always wins (user override). Otherwise 'simple'
 * and 'complex' map to their dedicated models and every other value gets the
 * default model.
 *
 * @param {string} complexity - 'simple', 'moderate' or 'complex'.
 * @param {string} [preferredModel] - Optional user-selected model.
 * @returns {string} The model identifier to use.
 */
export function routeModel(complexity, preferredModel) {
    if (preferredModel) {
        return preferredModel;
    }
    const modelByComplexity = new Map([
        ['simple', 'anthropic/claude-haiku-4-5-20251001'],
        ['complex', 'anthropic/claude-opus-4-6'],
    ]);
    // Anything not listed above (including 'moderate') gets the default model.
    return modelByComplexity.get(complexity) ?? 'anthropic/claude-sonnet-4-20250514';
}