@build-astron-co/nimbus 0.2.0 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/nimbus +26 -10
- package/bin/nimbus.cmd +41 -0
- package/bin/nimbus.mjs +70 -0
- package/completions/nimbus.bash +38 -0
- package/completions/nimbus.fish +48 -0
- package/completions/nimbus.zsh +81 -0
- package/dist/src/agent/compaction-agent.js +215 -0
- package/dist/src/agent/context-manager.js +385 -0
- package/dist/src/agent/context.js +322 -0
- package/dist/src/agent/deploy-preview.js +395 -0
- package/dist/src/agent/expand-files.js +95 -0
- package/dist/src/agent/index.js +18 -0
- package/dist/src/agent/loop.js +1535 -0
- package/dist/src/agent/modes.js +347 -0
- package/dist/src/agent/permissions.js +396 -0
- package/dist/src/agent/subagents/base.js +67 -0
- package/dist/src/agent/subagents/cost.js +45 -0
- package/dist/src/agent/subagents/explore.js +36 -0
- package/dist/src/agent/subagents/general.js +41 -0
- package/dist/src/agent/subagents/index.js +88 -0
- package/dist/src/agent/subagents/infra.js +52 -0
- package/dist/src/agent/subagents/security.js +60 -0
- package/dist/src/agent/system-prompt.js +860 -0
- package/dist/src/app.js +152 -0
- package/dist/src/audit/activity-log.js +209 -0
- package/dist/src/audit/compliance-checker.js +419 -0
- package/dist/src/audit/cost-tracker.js +231 -0
- package/dist/src/audit/index.js +10 -0
- package/dist/src/audit/security-scanner.js +490 -0
- package/dist/src/auth/guard.js +64 -0
- package/dist/src/auth/index.js +19 -0
- package/dist/src/auth/keychain.js +79 -0
- package/dist/src/auth/oauth.js +389 -0
- package/dist/src/auth/providers.js +415 -0
- package/dist/src/auth/sso.js +87 -0
- package/dist/src/auth/store.js +424 -0
- package/dist/src/auth/types.js +5 -0
- package/dist/src/cli/index.js +8 -0
- package/dist/src/cli/init.js +1048 -0
- package/dist/src/cli/openapi-spec.js +346 -0
- package/dist/src/cli/run.js +505 -0
- package/dist/src/cli/serve-auth.js +56 -0
- package/dist/src/cli/serve.js +432 -0
- package/dist/src/cli/web.js +50 -0
- package/dist/src/cli.js +1574 -0
- package/dist/src/clients/core-engine-client.js +156 -0
- package/dist/src/clients/enterprise-client.js +246 -0
- package/dist/src/clients/generator-client.js +219 -0
- package/dist/src/clients/git-client.js +367 -0
- package/dist/src/clients/github-client.js +229 -0
- package/dist/src/clients/helm-client.js +299 -0
- package/dist/src/clients/index.js +18 -0
- package/dist/src/clients/k8s-client.js +270 -0
- package/dist/src/clients/llm-client.js +119 -0
- package/dist/src/clients/rest-client.js +104 -0
- package/dist/src/clients/service-discovery.js +35 -0
- package/dist/src/clients/terraform-client.js +302 -0
- package/dist/src/clients/tools-client.js +1227 -0
- package/dist/src/clients/ws-client.js +93 -0
- package/dist/src/commands/alias.js +91 -0
- package/dist/src/commands/analyze/index.js +313 -0
- package/dist/src/commands/apply/helm.js +375 -0
- package/dist/src/commands/apply/index.js +176 -0
- package/dist/src/commands/apply/k8s.js +350 -0
- package/dist/src/commands/apply/terraform.js +465 -0
- package/dist/src/commands/ask.js +137 -0
- package/dist/src/commands/audit/index.js +322 -0
- package/dist/src/commands/auth-cloud.js +345 -0
- package/dist/src/commands/auth-list.js +112 -0
- package/dist/src/commands/auth-profile.js +104 -0
- package/dist/src/commands/auth-refresh.js +161 -0
- package/dist/src/commands/auth-status.js +122 -0
- package/dist/src/commands/aws/ec2.js +402 -0
- package/dist/src/commands/aws/iam.js +304 -0
- package/dist/src/commands/aws/index.js +108 -0
- package/dist/src/commands/aws/lambda.js +317 -0
- package/dist/src/commands/aws/rds.js +345 -0
- package/dist/src/commands/aws/s3.js +346 -0
- package/dist/src/commands/aws/vpc.js +302 -0
- package/dist/src/commands/aws-discover.js +413 -0
- package/dist/src/commands/aws-terraform.js +618 -0
- package/dist/src/commands/azure/aks.js +305 -0
- package/dist/src/commands/azure/functions.js +200 -0
- package/dist/src/commands/azure/index.js +93 -0
- package/dist/src/commands/azure/storage.js +378 -0
- package/dist/src/commands/azure/vm.js +291 -0
- package/dist/src/commands/billing/index.js +224 -0
- package/dist/src/commands/chat.js +259 -0
- package/dist/src/commands/completions.js +255 -0
- package/dist/src/commands/config.js +291 -0
- package/dist/src/commands/cost/cloud-cost-estimator.js +211 -0
- package/dist/src/commands/cost/estimator.js +73 -0
- package/dist/src/commands/cost/index.js +625 -0
- package/dist/src/commands/cost/parsers/terraform.js +234 -0
- package/dist/src/commands/cost/parsers/types.js +4 -0
- package/dist/src/commands/cost/pricing/aws.js +501 -0
- package/dist/src/commands/cost/pricing/azure.js +462 -0
- package/dist/src/commands/cost/pricing/gcp.js +359 -0
- package/dist/src/commands/cost/pricing/index.js +24 -0
- package/dist/src/commands/demo.js +196 -0
- package/dist/src/commands/deploy.js +215 -0
- package/dist/src/commands/doctor.js +1291 -0
- package/dist/src/commands/drift/index.js +674 -0
- package/dist/src/commands/explain.js +235 -0
- package/dist/src/commands/export.js +120 -0
- package/dist/src/commands/feedback.js +319 -0
- package/dist/src/commands/fix.js +263 -0
- package/dist/src/commands/fs/index.js +338 -0
- package/dist/src/commands/gcp/compute.js +266 -0
- package/dist/src/commands/gcp/functions.js +221 -0
- package/dist/src/commands/gcp/gke.js +357 -0
- package/dist/src/commands/gcp/iam.js +295 -0
- package/dist/src/commands/gcp/index.js +105 -0
- package/dist/src/commands/gcp/storage.js +232 -0
- package/dist/src/commands/generate-helm.js +1026 -0
- package/dist/src/commands/generate-k8s.js +1263 -0
- package/dist/src/commands/generate-terraform.js +1058 -0
- package/dist/src/commands/gh/index.js +663 -0
- package/dist/src/commands/git/index.js +1208 -0
- package/dist/src/commands/helm/index.js +985 -0
- package/dist/src/commands/help.js +639 -0
- package/dist/src/commands/history.js +120 -0
- package/dist/src/commands/import.js +782 -0
- package/dist/src/commands/incident.js +144 -0
- package/dist/src/commands/index.js +109 -0
- package/dist/src/commands/init.js +955 -0
- package/dist/src/commands/k8s/index.js +979 -0
- package/dist/src/commands/login.js +588 -0
- package/dist/src/commands/logout.js +61 -0
- package/dist/src/commands/logs.js +160 -0
- package/dist/src/commands/onboarding.js +382 -0
- package/dist/src/commands/pipeline.js +153 -0
- package/dist/src/commands/plan/display.js +216 -0
- package/dist/src/commands/plan/index.js +525 -0
- package/dist/src/commands/plugin.js +325 -0
- package/dist/src/commands/preview.js +356 -0
- package/dist/src/commands/profile.js +297 -0
- package/dist/src/commands/questionnaire.js +1021 -0
- package/dist/src/commands/resume.js +35 -0
- package/dist/src/commands/rollback.js +259 -0
- package/dist/src/commands/rollout.js +74 -0
- package/dist/src/commands/runbook.js +307 -0
- package/dist/src/commands/schedule.js +202 -0
- package/dist/src/commands/status.js +213 -0
- package/dist/src/commands/team/index.js +309 -0
- package/dist/src/commands/team-context.js +200 -0
- package/dist/src/commands/template.js +204 -0
- package/dist/src/commands/tf/index.js +989 -0
- package/dist/src/commands/upgrade.js +515 -0
- package/dist/src/commands/usage/index.js +118 -0
- package/dist/src/commands/version.js +145 -0
- package/dist/src/commands/watch.js +127 -0
- package/dist/src/compat/index.js +2 -0
- package/dist/src/compat/runtime.js +10 -0
- package/dist/src/compat/sqlite.js +144 -0
- package/dist/src/config/index.js +6 -0
- package/dist/src/config/manager.js +469 -0
- package/dist/src/config/mode-store.js +57 -0
- package/dist/src/config/profiles.js +66 -0
- package/dist/src/config/safety-policy.js +251 -0
- package/dist/src/config/schema.js +107 -0
- package/dist/src/config/types.js +311 -0
- package/dist/src/config/workspace-state.js +38 -0
- package/dist/src/context/context-db.js +138 -0
- package/dist/src/demo/index.js +295 -0
- package/dist/src/demo/scenarios/full-journey.js +226 -0
- package/dist/src/demo/scenarios/getting-started.js +124 -0
- package/dist/src/demo/scenarios/helm-release.js +334 -0
- package/dist/src/demo/scenarios/k8s-deployment.js +190 -0
- package/dist/src/demo/scenarios/terraform-vpc.js +167 -0
- package/dist/src/demo/types.js +6 -0
- package/dist/src/engine/cost-estimator.js +334 -0
- package/dist/src/engine/diagram-generator.js +192 -0
- package/dist/src/engine/drift-detector.js +688 -0
- package/dist/src/engine/executor.js +832 -0
- package/dist/src/engine/index.js +39 -0
- package/dist/src/engine/orchestrator.js +436 -0
- package/dist/src/engine/planner.js +616 -0
- package/dist/src/engine/safety.js +609 -0
- package/dist/src/engine/verifier.js +664 -0
- package/dist/src/enterprise/audit.js +241 -0
- package/dist/src/enterprise/auth.js +189 -0
- package/dist/src/enterprise/billing.js +512 -0
- package/dist/src/enterprise/index.js +16 -0
- package/dist/src/enterprise/teams.js +315 -0
- package/dist/src/generator/best-practices.js +1375 -0
- package/dist/src/generator/helm.js +495 -0
- package/dist/src/generator/index.js +11 -0
- package/dist/src/generator/intent-parser.js +420 -0
- package/dist/src/generator/kubernetes.js +773 -0
- package/dist/src/generator/terraform.js +1472 -0
- package/dist/src/history/index.js +6 -0
- package/dist/src/history/manager.js +199 -0
- package/dist/src/history/types.js +6 -0
- package/dist/src/hooks/config.js +318 -0
- package/dist/src/hooks/engine.js +317 -0
- package/dist/src/hooks/index.js +2 -0
- package/dist/src/llm/auth-bridge.js +157 -0
- package/dist/src/llm/circuit-breaker.js +116 -0
- package/dist/src/llm/config-loader.js +172 -0
- package/dist/src/llm/cost-calculator.js +137 -0
- package/dist/src/llm/index.js +7 -0
- package/dist/src/llm/model-aliases.js +99 -0
- package/dist/src/llm/provider-registry.js +57 -0
- package/dist/src/llm/providers/anthropic.js +430 -0
- package/dist/src/llm/providers/bedrock.js +409 -0
- package/dist/src/llm/providers/google.js +344 -0
- package/dist/src/llm/providers/ollama.js +661 -0
- package/dist/src/llm/providers/openai-compatible.js +289 -0
- package/dist/src/llm/providers/openai.js +284 -0
- package/dist/src/llm/providers/openrouter.js +293 -0
- package/dist/src/llm/router.js +844 -0
- package/dist/src/llm/types.js +69 -0
- package/dist/src/lsp/client.js +239 -0
- package/dist/src/lsp/languages.js +95 -0
- package/dist/src/lsp/manager.js +243 -0
- package/dist/src/mcp/client.js +289 -0
- package/dist/src/mcp/index.js +5 -0
- package/dist/src/mcp/manager.js +113 -0
- package/dist/src/nimbus.js +212 -0
- package/dist/src/plugins/index.js +13 -0
- package/dist/src/plugins/loader.js +280 -0
- package/dist/src/plugins/manager.js +282 -0
- package/dist/src/plugins/types.js +23 -0
- package/dist/src/scanners/cicd-scanner.js +230 -0
- package/dist/src/scanners/cloud-scanner.js +415 -0
- package/dist/src/scanners/framework-scanner.js +430 -0
- package/dist/src/scanners/iac-scanner.js +350 -0
- package/dist/src/scanners/index.js +454 -0
- package/dist/src/scanners/language-scanner.js +258 -0
- package/dist/src/scanners/package-manager-scanner.js +252 -0
- package/dist/src/scanners/types.js +6 -0
- package/dist/src/sessions/manager.js +395 -0
- package/dist/src/sessions/types.js +4 -0
- package/dist/src/sharing/sync.js +238 -0
- package/dist/src/sharing/viewer.js +131 -0
- package/dist/src/snapshots/index.js +1 -0
- package/dist/src/snapshots/manager.js +432 -0
- package/dist/src/state/artifacts.js +94 -0
- package/dist/src/state/audit.js +73 -0
- package/dist/src/state/billing.js +126 -0
- package/dist/src/state/checkpoints.js +81 -0
- package/dist/src/state/config.js +58 -0
- package/dist/src/state/conversations.js +7 -0
- package/dist/src/state/credentials.js +96 -0
- package/dist/src/state/db.js +53 -0
- package/dist/src/state/index.js +23 -0
- package/dist/src/state/messages.js +76 -0
- package/dist/src/state/projects.js +92 -0
- package/dist/src/state/schema.js +233 -0
- package/dist/src/state/sessions.js +79 -0
- package/dist/src/state/teams.js +131 -0
- package/dist/src/telemetry.js +91 -0
- package/dist/src/tools/aws-ops.js +747 -0
- package/dist/src/tools/azure-ops.js +491 -0
- package/dist/src/tools/file-ops.js +451 -0
- package/dist/src/tools/gcp-ops.js +559 -0
- package/dist/src/tools/git-ops.js +557 -0
- package/dist/src/tools/github-ops.js +460 -0
- package/dist/src/tools/helm-ops.js +634 -0
- package/dist/src/tools/index.js +16 -0
- package/dist/src/tools/k8s-ops.js +579 -0
- package/dist/src/tools/schemas/converter.js +129 -0
- package/dist/src/tools/schemas/devops.js +3319 -0
- package/dist/src/tools/schemas/index.js +19 -0
- package/dist/src/tools/schemas/standard.js +966 -0
- package/dist/src/tools/schemas/types.js +409 -0
- package/dist/src/tools/spawn-exec.js +109 -0
- package/dist/src/tools/terraform-ops.js +627 -0
- package/dist/src/types/config.js +1 -0
- package/dist/src/types/drift.js +4 -0
- package/dist/src/types/enterprise.js +5 -0
- package/dist/src/types/index.js +14 -0
- package/dist/src/types/plan.js +1 -0
- package/dist/src/types/request.js +1 -0
- package/dist/src/types/response.js +1 -0
- package/dist/src/types/service.js +1 -0
- package/dist/src/ui/App.js +1672 -0
- package/dist/src/ui/DeployPreview.js +60 -0
- package/dist/src/ui/FileDiffModal.js +108 -0
- package/dist/src/ui/Header.js +46 -0
- package/dist/src/ui/HelpModal.js +9 -0
- package/dist/src/ui/InputBox.js +408 -0
- package/dist/src/ui/MessageList.js +795 -0
- package/dist/src/ui/PermissionPrompt.js +72 -0
- package/dist/src/ui/StatusBar.js +109 -0
- package/dist/src/ui/TerminalPane.js +31 -0
- package/dist/src/ui/ToolCallDisplay.js +303 -0
- package/dist/src/ui/TreePane.js +83 -0
- package/dist/src/ui/chat-ui.js +721 -0
- package/dist/src/ui/index.js +11 -0
- package/dist/src/ui/ink/index.js +1325 -0
- package/dist/src/ui/streaming.js +137 -0
- package/dist/src/ui/theme.js +78 -0
- package/dist/src/ui/types.js +7 -0
- package/dist/src/utils/analytics.js +61 -0
- package/dist/src/utils/cost-warning.js +25 -0
- package/dist/src/utils/env.js +42 -0
- package/dist/src/utils/errors.js +54 -0
- package/dist/src/utils/event-bus.js +22 -0
- package/dist/src/utils/index.js +16 -0
- package/dist/src/utils/logger.js +150 -0
- package/dist/src/utils/rate-limiter.js +90 -0
- package/dist/src/utils/service-auth.js +36 -0
- package/dist/src/utils/validation.js +39 -0
- package/dist/src/version.js +3 -0
- package/dist/src/watcher/index.js +192 -0
- package/dist/src/wizard/approval.js +275 -0
- package/dist/src/wizard/index.js +13 -0
- package/dist/src/wizard/prompts.js +273 -0
- package/dist/src/wizard/types.js +4 -0
- package/dist/src/wizard/ui.js +453 -0
- package/dist/src/wizard/wizard.js +227 -0
- package/package.json +31 -23
- package/src/__tests__/alias.test.ts +133 -0
- package/src/__tests__/app.test.ts +1 -1
- package/src/__tests__/audit.test.ts +1 -1
- package/src/__tests__/circuit-breaker.test.ts +1 -1
- package/src/__tests__/cli-run.test.ts +237 -1
- package/src/__tests__/compat-sqlite.test.ts +68 -0
- package/src/__tests__/context-manager.test.ts +131 -1
- package/src/__tests__/context.test.ts +1 -1
- package/src/__tests__/devops-terminal-gaps.test.ts +718 -0
- package/src/__tests__/doctor.test.ts +48 -0
- package/src/__tests__/enterprise.test.ts +1 -1
- package/src/__tests__/export.test.ts +236 -0
- package/src/__tests__/gap-11-18-20.test.ts +958 -0
- package/src/__tests__/generator.test.ts +1 -1
- package/src/__tests__/helm-streaming.test.ts +127 -0
- package/src/__tests__/hooks.test.ts +1 -1
- package/src/__tests__/incident.test.ts +179 -0
- package/src/__tests__/init.test.ts +55 -4
- package/src/__tests__/intent-parser.test.ts +1 -1
- package/src/__tests__/llm-router.test.ts +1 -1
- package/src/__tests__/logs.test.ts +107 -0
- package/src/__tests__/loop-errors.test.ts +244 -0
- package/src/__tests__/lsp.test.ts +1 -1
- package/src/__tests__/modes.test.ts +1 -1
- package/src/__tests__/perf-optimizations.test.ts +847 -0
- package/src/__tests__/permissions.test.ts +1 -1
- package/src/__tests__/pipeline.test.ts +50 -0
- package/src/__tests__/polish-phase3.test.ts +340 -0
- package/src/__tests__/profile.test.ts +237 -0
- package/src/__tests__/rollback.test.ts +83 -0
- package/src/__tests__/runbook.test.ts +219 -0
- package/src/__tests__/schedule.test.ts +206 -0
- package/src/__tests__/serve.test.ts +1 -1
- package/src/__tests__/sessions.test.ts +96 -1
- package/src/__tests__/sharing.test.ts +53 -1
- package/src/__tests__/snapshots.test.ts +1 -1
- package/src/__tests__/standalone-migration.test.ts +199 -0
- package/src/__tests__/state-db.test.ts +1 -1
- package/src/__tests__/status.test.ts +158 -0
- package/src/__tests__/stream-with-tools.test.ts +71 -25
- package/src/__tests__/subagents.test.ts +1 -1
- package/src/__tests__/system-prompt.test.ts +82 -3
- package/src/__tests__/terminal-gap-v2.test.ts +395 -0
- package/src/__tests__/terminal-parity.test.ts +393 -0
- package/src/__tests__/tf-apply.test.ts +187 -0
- package/src/__tests__/tool-converter.test.ts +1 -1
- package/src/__tests__/tool-schemas.test.ts +209 -4
- package/src/__tests__/tools.test.ts +4 -3
- package/src/__tests__/version-json.test.ts +184 -0
- package/src/__tests__/version.test.ts +1 -1
- package/src/__tests__/watch.test.ts +129 -0
- package/src/agent/compaction-agent.ts +40 -1
- package/src/agent/context-manager.ts +67 -3
- package/src/agent/deploy-preview.ts +62 -1
- package/src/agent/expand-files.ts +108 -0
- package/src/agent/loop.ts +1312 -31
- package/src/agent/permissions.ts +51 -4
- package/src/agent/system-prompt.ts +573 -19
- package/src/app.ts +58 -0
- package/src/audit/security-scanner.ts +45 -0
- package/src/auth/keychain.ts +82 -0
- package/src/auth/oauth.ts +15 -5
- package/src/cli/init.ts +378 -5
- package/src/cli/run.ts +407 -16
- package/src/cli/serve.ts +78 -1
- package/src/cli/web.ts +10 -6
- package/src/cli.ts +312 -1
- package/src/clients/service-discovery.ts +30 -25
- package/src/commands/alias.ts +100 -0
- package/src/commands/audit/index.ts +121 -2
- package/src/commands/auth-cloud.ts +113 -0
- package/src/commands/auth-refresh.ts +187 -0
- package/src/commands/aws-discover.ts +144 -251
- package/src/commands/aws-terraform.ts +68 -118
- package/src/commands/chat.ts +9 -3
- package/src/commands/completions.ts +268 -0
- package/src/commands/config.ts +26 -0
- package/src/commands/cost/index.ts +218 -2
- package/src/commands/deploy.ts +260 -0
- package/src/commands/doctor.ts +744 -152
- package/src/commands/drift/index.ts +371 -23
- package/src/commands/export.ts +146 -0
- package/src/commands/generate-k8s.ts +9 -61
- package/src/commands/generate-terraform.ts +191 -449
- package/src/commands/help.ts +212 -36
- package/src/commands/history.ts +8 -1
- package/src/commands/incident.ts +166 -0
- package/src/commands/init.ts +5 -0
- package/src/commands/login.ts +86 -1
- package/src/commands/logs.ts +167 -0
- package/src/commands/onboarding.ts +211 -34
- package/src/commands/pipeline.ts +186 -0
- package/src/commands/plugin.ts +398 -0
- package/src/commands/profile.ts +342 -0
- package/src/commands/questionnaire.ts +0 -98
- package/src/commands/resume.ts +26 -34
- package/src/commands/rollback.ts +315 -0
- package/src/commands/rollout.ts +88 -0
- package/src/commands/runbook.ts +346 -0
- package/src/commands/schedule.ts +236 -0
- package/src/commands/status.ts +252 -0
- package/src/commands/team-context.ts +220 -0
- package/src/commands/template.ts +58 -57
- package/src/commands/tf/index.ts +70 -11
- package/src/commands/upgrade.ts +57 -0
- package/src/commands/version.ts +54 -50
- package/src/commands/watch.ts +153 -0
- package/src/compat/runtime.ts +1 -1
- package/src/compat/sqlite.ts +75 -5
- package/src/config/mode-store.ts +62 -0
- package/src/config/profiles.ts +84 -0
- package/src/config/types.ts +83 -1
- package/src/config/workspace-state.ts +53 -0
- package/src/engine/cost-estimator.ts +52 -10
- package/src/engine/executor.ts +33 -2
- package/src/engine/planner.ts +68 -1
- package/src/generator/terraform.ts +8 -0
- package/src/history/manager.ts +2 -74
- package/src/hooks/engine.ts +5 -4
- package/src/llm/cost-calculator.ts +2 -2
- package/src/llm/providers/anthropic.ts +50 -21
- package/src/llm/router.ts +76 -7
- package/src/lsp/languages.ts +3 -0
- package/src/lsp/manager.ts +21 -5
- package/src/nimbus.ts +37 -18
- package/src/sessions/manager.ts +108 -1
- package/src/sharing/sync.ts +4 -0
- package/src/sharing/viewer.ts +66 -0
- package/src/tools/file-ops.ts +22 -0
- package/src/tools/schemas/devops.ts +3007 -117
- package/src/tools/schemas/standard.ts +5 -1
- package/src/tools/schemas/types.ts +31 -1
- package/src/tools/spawn-exec.ts +148 -0
- package/src/ui/App.tsx +1183 -66
- package/src/ui/DeployPreview.tsx +62 -57
- package/src/ui/FileDiffModal.tsx +162 -0
- package/src/ui/Header.tsx +87 -24
- package/src/ui/HelpModal.tsx +57 -0
- package/src/ui/InputBox.tsx +163 -10
- package/src/ui/MessageList.tsx +487 -40
- package/src/ui/PermissionPrompt.tsx +17 -5
- package/src/ui/StatusBar.tsx +122 -3
- package/src/ui/TerminalPane.tsx +84 -0
- package/src/ui/ToolCallDisplay.tsx +252 -18
- package/src/ui/TreePane.tsx +132 -0
- package/src/ui/chat-ui.ts +41 -44
- package/src/ui/ink/index.ts +771 -38
- package/src/ui/streaming.ts +1 -1
- package/src/ui/theme.ts +104 -0
- package/src/ui/types.ts +18 -0
- package/src/version.ts +1 -1
- package/src/watcher/index.ts +66 -15
- package/src/wizard/types.ts +1 -0
- package/src/wizard/ui.ts +1 -1
- package/tsconfig.json +2 -2
|
@@ -0,0 +1,661 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Ollama Provider
|
|
3
|
+
* Supports local Ollama models: Llama 3.2, CodeLlama, Mistral, etc.
|
|
4
|
+
*/
|
|
5
|
+
import { BaseProvider, getTextContent, } from '../types';
|
|
6
|
+
import { getProviderBaseUrl } from '../auth-bridge';
|
|
7
|
+
export class OllamaProvider extends BaseProvider {
|
|
8
|
+
name = 'ollama';
|
|
9
|
+
baseUrl;
|
|
10
|
+
defaultModel = 'llama3.2';
|
|
11
|
+
constructor(baseUrl) {
|
|
12
|
+
super();
|
|
13
|
+
this.baseUrl =
|
|
14
|
+
baseUrl ||
|
|
15
|
+
getProviderBaseUrl('ollama') ||
|
|
16
|
+
process.env.OLLAMA_BASE_URL ||
|
|
17
|
+
'http://localhost:11434';
|
|
18
|
+
}
|
|
19
|
+
async complete(request) {
|
|
20
|
+
const messages = this.convertMessages(request.messages);
|
|
21
|
+
const controller = new AbortController();
|
|
22
|
+
const timeoutId = setTimeout(() => controller.abort(), 120000); // 2 minute timeout
|
|
23
|
+
try {
|
|
24
|
+
const response = await fetch(`${this.baseUrl}/api/chat`, {
|
|
25
|
+
method: 'POST',
|
|
26
|
+
headers: { 'Content-Type': 'application/json' },
|
|
27
|
+
body: JSON.stringify({
|
|
28
|
+
model: request.model || this.defaultModel,
|
|
29
|
+
messages,
|
|
30
|
+
options: {
|
|
31
|
+
temperature: request.temperature,
|
|
32
|
+
num_predict: request.maxTokens,
|
|
33
|
+
stop: request.stopSequences,
|
|
34
|
+
},
|
|
35
|
+
stream: false,
|
|
36
|
+
}),
|
|
37
|
+
signal: controller.signal,
|
|
38
|
+
});
|
|
39
|
+
clearTimeout(timeoutId);
|
|
40
|
+
if (!response.ok) {
|
|
41
|
+
throw new Error(`Ollama API error: ${response.status} ${await response.text()}`);
|
|
42
|
+
}
|
|
43
|
+
const data = (await response.json());
|
|
44
|
+
return {
|
|
45
|
+
content: data.message.content,
|
|
46
|
+
usage: {
|
|
47
|
+
promptTokens: data.prompt_eval_count || 0,
|
|
48
|
+
completionTokens: data.eval_count || 0,
|
|
49
|
+
totalTokens: (data.prompt_eval_count || 0) + (data.eval_count || 0),
|
|
50
|
+
},
|
|
51
|
+
model: data.model,
|
|
52
|
+
finishReason: 'stop',
|
|
53
|
+
};
|
|
54
|
+
}
|
|
55
|
+
catch (error) {
|
|
56
|
+
clearTimeout(timeoutId);
|
|
57
|
+
if (error.name === 'AbortError') {
|
|
58
|
+
throw new Error('Ollama request timed out after 120 seconds');
|
|
59
|
+
}
|
|
60
|
+
throw error;
|
|
61
|
+
}
|
|
62
|
+
}
|
|
63
|
+
async *stream(request) {
|
|
64
|
+
const messages = this.convertMessages(request.messages);
|
|
65
|
+
const response = await fetch(`${this.baseUrl}/api/chat`, {
|
|
66
|
+
method: 'POST',
|
|
67
|
+
headers: { 'Content-Type': 'application/json' },
|
|
68
|
+
body: JSON.stringify({
|
|
69
|
+
model: request.model || this.defaultModel,
|
|
70
|
+
messages,
|
|
71
|
+
options: {
|
|
72
|
+
temperature: request.temperature,
|
|
73
|
+
num_predict: request.maxTokens,
|
|
74
|
+
},
|
|
75
|
+
stream: true,
|
|
76
|
+
}),
|
|
77
|
+
});
|
|
78
|
+
if (!response.ok) {
|
|
79
|
+
throw new Error(`Ollama API error: ${response.status} ${await response.text()}`);
|
|
80
|
+
}
|
|
81
|
+
const reader = response.body?.getReader();
|
|
82
|
+
if (!reader) {
|
|
83
|
+
throw new Error('No response body');
|
|
84
|
+
}
|
|
85
|
+
const decoder = new TextDecoder();
|
|
86
|
+
let buffer = '';
|
|
87
|
+
while (true) {
|
|
88
|
+
const { done, value } = await reader.read();
|
|
89
|
+
if (done) {
|
|
90
|
+
break;
|
|
91
|
+
}
|
|
92
|
+
buffer += decoder.decode(value, { stream: true });
|
|
93
|
+
const lines = buffer.split('\n');
|
|
94
|
+
// Keep the last incomplete line in the buffer
|
|
95
|
+
buffer = lines.pop() || '';
|
|
96
|
+
for (const line of lines) {
|
|
97
|
+
if (!line.trim()) {
|
|
98
|
+
continue;
|
|
99
|
+
}
|
|
100
|
+
try {
|
|
101
|
+
const data = JSON.parse(line);
|
|
102
|
+
if (data.message?.content) {
|
|
103
|
+
yield {
|
|
104
|
+
content: data.message.content,
|
|
105
|
+
done: false,
|
|
106
|
+
};
|
|
107
|
+
}
|
|
108
|
+
if (data.done) {
|
|
109
|
+
yield { done: true };
|
|
110
|
+
}
|
|
111
|
+
}
|
|
112
|
+
catch (e) {
|
|
113
|
+
// Ignore malformed JSON lines
|
|
114
|
+
continue;
|
|
115
|
+
}
|
|
116
|
+
}
|
|
117
|
+
}
|
|
118
|
+
}
|
|
119
|
+
async completeWithTools(request) {
|
|
120
|
+
// Try native Ollama tool calling first (supported by llama3.x, mistral, etc.)
|
|
121
|
+
try {
|
|
122
|
+
const nativeResult = await this.completeWithNativeTools(request);
|
|
123
|
+
if (nativeResult) {
|
|
124
|
+
return nativeResult;
|
|
125
|
+
}
|
|
126
|
+
}
|
|
127
|
+
catch {
|
|
128
|
+
// Native tool calling not supported by this model — fall through
|
|
129
|
+
}
|
|
130
|
+
// Fallback: prompt engineering approach for models without native tool support
|
|
131
|
+
const toolPrompt = this.buildToolPrompt(request.tools);
|
|
132
|
+
const modifiedRequest = {
|
|
133
|
+
...request,
|
|
134
|
+
messages: [{ role: 'system', content: toolPrompt }, ...request.messages],
|
|
135
|
+
};
|
|
136
|
+
const response = await this.complete(modifiedRequest);
|
|
137
|
+
// Attempt to extract tool calls from the text response. If extraction
|
|
138
|
+
// fails for any reason (malformed JSON, unexpected structure, etc.),
|
|
139
|
+
// return the raw text so the agent loop can still display it.
|
|
140
|
+
let toolCalls = [];
|
|
141
|
+
try {
|
|
142
|
+
toolCalls = this.extractToolCalls(response.content);
|
|
143
|
+
}
|
|
144
|
+
catch {
|
|
145
|
+
// Extraction failed -- return the original text as a plain response
|
|
146
|
+
return response;
|
|
147
|
+
}
|
|
148
|
+
return {
|
|
149
|
+
...response,
|
|
150
|
+
content: toolCalls.length > 0 ? '' : response.content,
|
|
151
|
+
toolCalls: toolCalls.length > 0 ? toolCalls : undefined,
|
|
152
|
+
};
|
|
153
|
+
}
|
|
154
|
+
/**
|
|
155
|
+
* Attempt native Ollama tool calling via the /api/chat tools parameter.
|
|
156
|
+
* Returns null if the model doesn't support tools (response has no tool_calls).
|
|
157
|
+
*/
|
|
158
|
+
async completeWithNativeTools(request) {
|
|
159
|
+
const messages = this.convertMessages(request.messages);
|
|
160
|
+
const tools = request.tools.map(t => ({
|
|
161
|
+
type: 'function',
|
|
162
|
+
function: {
|
|
163
|
+
name: t.function.name,
|
|
164
|
+
description: t.function.description,
|
|
165
|
+
parameters: t.function.parameters,
|
|
166
|
+
},
|
|
167
|
+
}));
|
|
168
|
+
const controller = new AbortController();
|
|
169
|
+
const timeoutId = setTimeout(() => controller.abort(), 120000);
|
|
170
|
+
try {
|
|
171
|
+
const response = await fetch(`${this.baseUrl}/api/chat`, {
|
|
172
|
+
method: 'POST',
|
|
173
|
+
headers: { 'Content-Type': 'application/json' },
|
|
174
|
+
body: JSON.stringify({
|
|
175
|
+
model: request.model || this.defaultModel,
|
|
176
|
+
messages,
|
|
177
|
+
tools,
|
|
178
|
+
options: {
|
|
179
|
+
temperature: request.temperature,
|
|
180
|
+
num_predict: request.maxTokens,
|
|
181
|
+
},
|
|
182
|
+
stream: false,
|
|
183
|
+
}),
|
|
184
|
+
signal: controller.signal,
|
|
185
|
+
});
|
|
186
|
+
clearTimeout(timeoutId);
|
|
187
|
+
if (!response.ok) {
|
|
188
|
+
return null;
|
|
189
|
+
}
|
|
190
|
+
const data = (await response.json());
|
|
191
|
+
const msg = data.message;
|
|
192
|
+
// If no tool_calls in response, native tools aren't working
|
|
193
|
+
if (!msg?.tool_calls || msg.tool_calls.length === 0) {
|
|
194
|
+
return null;
|
|
195
|
+
}
|
|
196
|
+
const toolCalls = msg.tool_calls.map(tc => ({
|
|
197
|
+
id: crypto.randomUUID(),
|
|
198
|
+
type: 'function',
|
|
199
|
+
function: {
|
|
200
|
+
name: tc.function.name,
|
|
201
|
+
arguments: JSON.stringify(tc.function.arguments),
|
|
202
|
+
},
|
|
203
|
+
}));
|
|
204
|
+
return {
|
|
205
|
+
content: msg.content || '',
|
|
206
|
+
toolCalls,
|
|
207
|
+
usage: {
|
|
208
|
+
promptTokens: data.prompt_eval_count || 0,
|
|
209
|
+
completionTokens: data.eval_count || 0,
|
|
210
|
+
totalTokens: (data.prompt_eval_count || 0) + (data.eval_count || 0),
|
|
211
|
+
},
|
|
212
|
+
model: data.model,
|
|
213
|
+
finishReason: 'tool_calls',
|
|
214
|
+
};
|
|
215
|
+
}
|
|
216
|
+
catch {
|
|
217
|
+
clearTimeout(timeoutId);
|
|
218
|
+
return null;
|
|
219
|
+
}
|
|
220
|
+
}
|
|
221
|
+
/**
|
|
222
|
+
* Stream a chat completion with tool calling support.
|
|
223
|
+
* Attempts native Ollama tool streaming via the OpenAI-compatible endpoint first.
|
|
224
|
+
* Falls back to the non-streaming completeWithTools for models without native
|
|
225
|
+
* tool support, yielding the result as a single chunk.
|
|
226
|
+
*/
|
|
227
|
+
async *streamWithTools(request) {
|
|
228
|
+
// Try native streaming with tools via the OpenAI-compatible endpoint
|
|
229
|
+
try {
|
|
230
|
+
const nativeStream = this.streamWithNativeTools(request);
|
|
231
|
+
let gotToolCalls = false;
|
|
232
|
+
for await (const chunk of nativeStream) {
|
|
233
|
+
if (chunk.toolCalls && chunk.toolCalls.length > 0) {
|
|
234
|
+
gotToolCalls = true;
|
|
235
|
+
}
|
|
236
|
+
yield chunk;
|
|
237
|
+
}
|
|
238
|
+
// If we successfully streamed (even without tool calls), we're done
|
|
239
|
+
if (gotToolCalls) {
|
|
240
|
+
return;
|
|
241
|
+
}
|
|
242
|
+
// If the native stream completed without any tool calls, it may mean
|
|
243
|
+
// the model answered with text only, which is a valid response — return.
|
|
244
|
+
return;
|
|
245
|
+
}
|
|
246
|
+
catch {
|
|
247
|
+
// Native streaming not supported — fall through to fallback
|
|
248
|
+
}
|
|
249
|
+
// Fallback: use non-streaming completeWithTools and yield as a single chunk
|
|
250
|
+
const response = await this.completeWithTools(request);
|
|
251
|
+
if (response.content) {
|
|
252
|
+
yield { content: response.content, done: false };
|
|
253
|
+
}
|
|
254
|
+
yield {
|
|
255
|
+
done: true,
|
|
256
|
+
toolCalls: response.toolCalls,
|
|
257
|
+
usage: response.usage,
|
|
258
|
+
};
|
|
259
|
+
}
|
|
260
|
+
/**
|
|
261
|
+
* Stream with native tool calling via the Ollama OpenAI-compatible endpoint.
|
|
262
|
+
* Uses fetch + SSE parsing against /v1/chat/completions with stream: true.
|
|
263
|
+
*/
|
|
264
|
+
async *streamWithNativeTools(request) {
|
|
265
|
+
const messages = this.convertMessages(request.messages);
|
|
266
|
+
const tools = request.tools.map(t => ({
|
|
267
|
+
type: 'function',
|
|
268
|
+
function: {
|
|
269
|
+
name: t.function.name,
|
|
270
|
+
description: t.function.description,
|
|
271
|
+
parameters: t.function.parameters,
|
|
272
|
+
},
|
|
273
|
+
}));
|
|
274
|
+
const response = await fetch(`${this.baseUrl}/v1/chat/completions`, {
|
|
275
|
+
method: 'POST',
|
|
276
|
+
headers: { 'Content-Type': 'application/json' },
|
|
277
|
+
body: JSON.stringify({
|
|
278
|
+
model: request.model || this.defaultModel,
|
|
279
|
+
messages,
|
|
280
|
+
tools,
|
|
281
|
+
tool_choice: request.toolChoice || 'auto',
|
|
282
|
+
max_tokens: request.maxTokens,
|
|
283
|
+
temperature: request.temperature,
|
|
284
|
+
stream: true,
|
|
285
|
+
}),
|
|
286
|
+
});
|
|
287
|
+
if (!response.ok) {
|
|
288
|
+
throw new Error(`Ollama OpenAI-compatible API error: ${response.status} ${await response.text()}`);
|
|
289
|
+
}
|
|
290
|
+
const reader = response.body?.getReader();
|
|
291
|
+
if (!reader) {
|
|
292
|
+
throw new Error('No response body');
|
|
293
|
+
}
|
|
294
|
+
const decoder = new TextDecoder();
|
|
295
|
+
let buffer = '';
|
|
296
|
+
const toolCallAccumulator = new Map();
|
|
297
|
+
let usage;
|
|
298
|
+
while (true) {
|
|
299
|
+
const { done, value } = await reader.read();
|
|
300
|
+
if (done) {
|
|
301
|
+
break;
|
|
302
|
+
}
|
|
303
|
+
buffer += decoder.decode(value, { stream: true });
|
|
304
|
+
const lines = buffer.split('\n');
|
|
305
|
+
// Keep the last incomplete line in the buffer
|
|
306
|
+
buffer = lines.pop() || '';
|
|
307
|
+
for (const line of lines) {
|
|
308
|
+
const trimmed = line.trim();
|
|
309
|
+
if (!trimmed || trimmed === 'data: [DONE]') {
|
|
310
|
+
continue;
|
|
311
|
+
}
|
|
312
|
+
if (!trimmed.startsWith('data: ')) {
|
|
313
|
+
continue;
|
|
314
|
+
}
|
|
315
|
+
try {
|
|
316
|
+
const data = JSON.parse(trimmed.slice(6));
|
|
317
|
+
const delta = data.choices?.[0]?.delta;
|
|
318
|
+
const finishReason = data.choices?.[0]?.finish_reason;
|
|
319
|
+
if (delta?.content) {
|
|
320
|
+
yield { content: delta.content, done: false };
|
|
321
|
+
}
|
|
322
|
+
if (delta?.tool_calls) {
|
|
323
|
+
for (const tc of delta.tool_calls) {
|
|
324
|
+
const index = tc.index ?? 0;
|
|
325
|
+
const existing = toolCallAccumulator.get(index);
|
|
326
|
+
if (existing) {
|
|
327
|
+
if (tc.function?.arguments) {
|
|
328
|
+
existing.arguments += tc.function.arguments;
|
|
329
|
+
}
|
|
330
|
+
}
|
|
331
|
+
else {
|
|
332
|
+
toolCallAccumulator.set(index, {
|
|
333
|
+
id: tc.id || crypto.randomUUID(),
|
|
334
|
+
name: tc.function?.name || '',
|
|
335
|
+
arguments: tc.function?.arguments || '',
|
|
336
|
+
});
|
|
337
|
+
}
|
|
338
|
+
}
|
|
339
|
+
}
|
|
340
|
+
if (data.usage) {
|
|
341
|
+
usage = {
|
|
342
|
+
promptTokens: data.usage.prompt_tokens || 0,
|
|
343
|
+
completionTokens: data.usage.completion_tokens || 0,
|
|
344
|
+
totalTokens: data.usage.total_tokens || 0,
|
|
345
|
+
};
|
|
346
|
+
}
|
|
347
|
+
if (finishReason) {
|
|
348
|
+
const toolCalls = toolCallAccumulator.size > 0
|
|
349
|
+
? Array.from(toolCallAccumulator.values()).map(tc => ({
|
|
350
|
+
id: tc.id,
|
|
351
|
+
type: 'function',
|
|
352
|
+
function: { name: tc.name, arguments: tc.arguments },
|
|
353
|
+
}))
|
|
354
|
+
: undefined;
|
|
355
|
+
yield { done: true, toolCalls, usage };
|
|
356
|
+
return;
|
|
357
|
+
}
|
|
358
|
+
}
|
|
359
|
+
catch {
|
|
360
|
+
// Ignore malformed SSE lines
|
|
361
|
+
continue;
|
|
362
|
+
}
|
|
363
|
+
}
|
|
364
|
+
}
|
|
365
|
+
// If we reach here without a finishReason, emit a final done chunk
|
|
366
|
+
const toolCalls = toolCallAccumulator.size > 0
|
|
367
|
+
? Array.from(toolCallAccumulator.values()).map(tc => ({
|
|
368
|
+
id: tc.id,
|
|
369
|
+
type: 'function',
|
|
370
|
+
function: { name: tc.name, arguments: tc.arguments },
|
|
371
|
+
}))
|
|
372
|
+
: undefined;
|
|
373
|
+
yield { done: true, toolCalls, usage };
|
|
374
|
+
}
|
|
375
|
+
async countTokens(text) {
|
|
376
|
+
try {
|
|
377
|
+
// Use gpt-tokenizer (already a dependency) for better approximation
|
|
378
|
+
const { encode } = await import('gpt-tokenizer');
|
|
379
|
+
return encode(text).length;
|
|
380
|
+
}
|
|
381
|
+
catch {
|
|
382
|
+
// Fallback to approximation if tokenizer fails
|
|
383
|
+
return Math.ceil(text.length / 4);
|
|
384
|
+
}
|
|
385
|
+
}
|
|
386
|
+
getMaxTokens(model) {
|
|
387
|
+
// Check the runtime cache first (populated by getModelInfo)
|
|
388
|
+
const cached = this.modelContextCache.get(model);
|
|
389
|
+
if (cached !== undefined) {
|
|
390
|
+
return cached;
|
|
391
|
+
}
|
|
392
|
+
const limits = {
|
|
393
|
+
// Llama 3.x family
|
|
394
|
+
llama3: 8192,
|
|
395
|
+
'llama3.1': 131072,
|
|
396
|
+
'llama3.1:8b': 131072,
|
|
397
|
+
'llama3.1:70b': 131072,
|
|
398
|
+
'llama3.1:405b': 131072,
|
|
399
|
+
'llama3.2': 131072,
|
|
400
|
+
'llama3.2:1b': 131072,
|
|
401
|
+
'llama3.2:3b': 131072,
|
|
402
|
+
'llama3.2:70b': 131072,
|
|
403
|
+
'llama3.3': 131072,
|
|
404
|
+
'llama3.3:70b': 131072,
|
|
405
|
+
// Llama 2 family
|
|
406
|
+
llama2: 4096,
|
|
407
|
+
'llama2:13b': 4096,
|
|
408
|
+
'llama2:70b': 4096,
|
|
409
|
+
// CodeLlama
|
|
410
|
+
codellama: 16384,
|
|
411
|
+
'codellama:7b': 16384,
|
|
412
|
+
'codellama:13b': 16384,
|
|
413
|
+
'codellama:34b': 16384,
|
|
414
|
+
'codellama:70b': 16384,
|
|
415
|
+
// Mistral / Mixtral
|
|
416
|
+
mistral: 32768,
|
|
417
|
+
'mistral:7b': 32768,
|
|
418
|
+
'mistral-nemo': 128000,
|
|
419
|
+
'mistral-large': 128000,
|
|
420
|
+
'mistral-small': 32768,
|
|
421
|
+
mixtral: 32768,
|
|
422
|
+
'mixtral:8x7b': 32768,
|
|
423
|
+
'mixtral:8x22b': 65536,
|
|
424
|
+
// Phi family
|
|
425
|
+
phi: 2048,
|
|
426
|
+
phi3: 131072,
|
|
427
|
+
'phi3:mini': 131072,
|
|
428
|
+
'phi3:medium': 131072,
|
|
429
|
+
'phi3.5': 131072,
|
|
430
|
+
phi4: 16384,
|
|
431
|
+
// Gemma family
|
|
432
|
+
gemma: 8192,
|
|
433
|
+
'gemma:2b': 8192,
|
|
434
|
+
'gemma:7b': 8192,
|
|
435
|
+
gemma2: 8192,
|
|
436
|
+
'gemma2:2b': 8192,
|
|
437
|
+
'gemma2:9b': 8192,
|
|
438
|
+
'gemma2:27b': 8192,
|
|
439
|
+
// Qwen family
|
|
440
|
+
qwen: 32768,
|
|
441
|
+
qwen2: 131072,
|
|
442
|
+
'qwen2:7b': 131072,
|
|
443
|
+
'qwen2:72b': 131072,
|
|
444
|
+
'qwen2.5': 131072,
|
|
445
|
+
'qwen2.5:7b': 131072,
|
|
446
|
+
'qwen2.5:14b': 131072,
|
|
447
|
+
'qwen2.5:32b': 131072,
|
|
448
|
+
'qwen2.5:72b': 131072,
|
|
449
|
+
'qwen2.5-coder': 131072,
|
|
450
|
+
// DeepSeek family
|
|
451
|
+
'deepseek-coder': 16384,
|
|
452
|
+
'deepseek-coder-v2': 131072,
|
|
453
|
+
'deepseek-r1': 131072,
|
|
454
|
+
// StarCoder
|
|
455
|
+
starcoder: 8192,
|
|
456
|
+
starcoder2: 16384,
|
|
457
|
+
// Command R
|
|
458
|
+
'command-r': 131072,
|
|
459
|
+
'command-r-plus': 131072,
|
|
460
|
+
// Others
|
|
461
|
+
'nomic-embed-text': 8192,
|
|
462
|
+
'mxbai-embed-large': 512,
|
|
463
|
+
yi: 200000,
|
|
464
|
+
solar: 4096,
|
|
465
|
+
'neural-chat': 4096,
|
|
466
|
+
'wizard-vicuna': 4096,
|
|
467
|
+
};
|
|
468
|
+
// Handle model variants (e.g., "llama3.2:7b-instruct" -> "llama3.2:7b" -> "llama3.2")
|
|
469
|
+
if (limits[model]) {
|
|
470
|
+
return limits[model];
|
|
471
|
+
}
|
|
472
|
+
const baseModel = model.split(':')[0];
|
|
473
|
+
return limits[baseModel] || 8192;
|
|
474
|
+
}
|
|
475
|
+
/**
|
|
476
|
+
* Query the Ollama `/api/show` endpoint to retrieve the actual model
|
|
477
|
+
* context length from the running server. Results are cached in memory
|
|
478
|
+
* so repeated calls for the same model are free.
|
|
479
|
+
*
|
|
480
|
+
* If the call fails (Ollama not running, model not pulled, etc.) the
|
|
481
|
+
* method returns `null` and the caller should fall back to the
|
|
482
|
+
* hardcoded map in {@link getMaxTokens}.
|
|
483
|
+
*/
|
|
484
|
+
async getModelInfo(model) {
|
|
485
|
+
const cached = this.modelContextCache.get(model);
|
|
486
|
+
if (cached !== undefined) {
|
|
487
|
+
return cached;
|
|
488
|
+
}
|
|
489
|
+
try {
|
|
490
|
+
const response = await fetch(`${this.baseUrl}/api/show`, {
|
|
491
|
+
method: 'POST',
|
|
492
|
+
headers: { 'Content-Type': 'application/json' },
|
|
493
|
+
body: JSON.stringify({ name: model }),
|
|
494
|
+
signal: AbortSignal.timeout(5000),
|
|
495
|
+
});
|
|
496
|
+
if (!response.ok) {
|
|
497
|
+
return null;
|
|
498
|
+
}
|
|
499
|
+
const data = (await response.json());
|
|
500
|
+
// Strategy 1: Check model_info for context_length or num_ctx keys
|
|
501
|
+
if (data.model_info) {
|
|
502
|
+
for (const [key, value] of Object.entries(data.model_info)) {
|
|
503
|
+
if ((key.includes('context_length') || key.includes('num_ctx')) &&
|
|
504
|
+
typeof value === 'number' &&
|
|
505
|
+
value > 0) {
|
|
506
|
+
this.modelContextCache.set(model, value);
|
|
507
|
+
return value;
|
|
508
|
+
}
|
|
509
|
+
}
|
|
510
|
+
}
|
|
511
|
+
// Strategy 2: Parse the parameters string for num_ctx
|
|
512
|
+
if (data.parameters) {
|
|
513
|
+
const match = data.parameters.match(/num_ctx\s+(\d+)/);
|
|
514
|
+
if (match) {
|
|
515
|
+
const numCtx = parseInt(match[1], 10);
|
|
516
|
+
if (numCtx > 0) {
|
|
517
|
+
this.modelContextCache.set(model, numCtx);
|
|
518
|
+
return numCtx;
|
|
519
|
+
}
|
|
520
|
+
}
|
|
521
|
+
}
|
|
522
|
+
return null;
|
|
523
|
+
}
|
|
524
|
+
catch {
|
|
525
|
+
return null;
|
|
526
|
+
}
|
|
527
|
+
}
|
|
528
|
+
/** In-memory cache for model context lengths retrieved via /api/show. */
|
|
529
|
+
modelContextCache = new Map();
|
|
530
|
+
async listModels() {
|
|
531
|
+
try {
|
|
532
|
+
const response = await fetch(`${this.baseUrl}/api/tags`, {
|
|
533
|
+
signal: AbortSignal.timeout(3000),
|
|
534
|
+
});
|
|
535
|
+
if (response.ok) {
|
|
536
|
+
const data = (await response.json());
|
|
537
|
+
if (data.models && Array.isArray(data.models)) {
|
|
538
|
+
return data.models.map(m => m.name || m.model || '').filter(Boolean);
|
|
539
|
+
}
|
|
540
|
+
}
|
|
541
|
+
}
|
|
542
|
+
catch {
|
|
543
|
+
// Ollama not available, return static fallback
|
|
544
|
+
}
|
|
545
|
+
return ['llama3.2', 'llama3.2:70b', 'codellama', 'mistral', 'mixtral', 'phi'];
|
|
546
|
+
}
|
|
547
|
+
/**
|
|
548
|
+
* Convert messages to Ollama format
|
|
549
|
+
*/
|
|
550
|
+
convertMessages(messages) {
|
|
551
|
+
return messages.map(m => ({
|
|
552
|
+
role: m.role === 'assistant' ? 'assistant' : m.role === 'system' ? 'system' : 'user',
|
|
553
|
+
content: getTextContent(m.content),
|
|
554
|
+
}));
|
|
555
|
+
}
|
|
556
|
+
/**
|
|
557
|
+
* Build tool prompt for prompt engineering approach
|
|
558
|
+
*/
|
|
559
|
+
buildToolPrompt(tools) {
|
|
560
|
+
const toolDescriptions = tools
|
|
561
|
+
.map(t => {
|
|
562
|
+
const params = t.function.parameters;
|
|
563
|
+
const required = params.required || [];
|
|
564
|
+
const props = params.properties || {};
|
|
565
|
+
const paramList = Object.entries(props)
|
|
566
|
+
.map(([k, v]) => {
|
|
567
|
+
const req = required.includes(k) ? ' (required)' : ' (optional)';
|
|
568
|
+
return ` "${k}": ${v.type || 'string'}${req} — ${v.description || ''}`;
|
|
569
|
+
})
|
|
570
|
+
.join('\n');
|
|
571
|
+
return `- ${t.function.name}: ${t.function.description}\n Parameters:\n${paramList}`;
|
|
572
|
+
})
|
|
573
|
+
.join('\n\n');
|
|
574
|
+
return `You are a helpful AI assistant with access to tools. When you need to use a tool, respond with ONLY a JSON object in this exact format (no other text before or after):
|
|
575
|
+
|
|
576
|
+
\`\`\`json
|
|
577
|
+
{"tool": "tool_name", "arguments": {"param1": "value1"}}
|
|
578
|
+
\`\`\`
|
|
579
|
+
|
|
580
|
+
Available tools:
|
|
581
|
+
|
|
582
|
+
${toolDescriptions}
|
|
583
|
+
|
|
584
|
+
IMPORTANT: When using a tool, output ONLY the JSON object. Do not include any explanation text before or after it. If you want to respond without using a tool, respond normally with plain text (no JSON).`;
|
|
585
|
+
}
|
|
586
|
+
/**
|
|
587
|
+
* Extract tool calls from response content using robust pattern matching.
|
|
588
|
+
* Handles JSON in code blocks, bare JSON, and multiple tool calls.
|
|
589
|
+
*/
|
|
590
|
+
extractToolCalls(content) {
|
|
591
|
+
const toolCalls = [];
|
|
592
|
+
// Strategy 1: Look for JSON in code blocks
|
|
593
|
+
const codeBlockRegex = /```(?:json)?\s*\n?([\s\S]*?)\n?```/g;
|
|
594
|
+
let match;
|
|
595
|
+
while ((match = codeBlockRegex.exec(content)) !== null) {
|
|
596
|
+
const parsed = this.tryParseToolCall(match[1].trim());
|
|
597
|
+
if (parsed) {
|
|
598
|
+
toolCalls.push(parsed);
|
|
599
|
+
}
|
|
600
|
+
}
|
|
601
|
+
if (toolCalls.length > 0) {
|
|
602
|
+
return toolCalls;
|
|
603
|
+
}
|
|
604
|
+
// Strategy 2: Try to parse the entire content as JSON
|
|
605
|
+
const wholeContent = content.trim();
|
|
606
|
+
if (wholeContent.startsWith('{')) {
|
|
607
|
+
const parsed = this.tryParseToolCall(wholeContent);
|
|
608
|
+
if (parsed) {
|
|
609
|
+
return [parsed];
|
|
610
|
+
}
|
|
611
|
+
}
|
|
612
|
+
// Strategy 3: Find JSON objects using balanced brace matching
|
|
613
|
+
let depth = 0;
|
|
614
|
+
let start = -1;
|
|
615
|
+
for (let i = 0; i < content.length; i++) {
|
|
616
|
+
if (content[i] === '{') {
|
|
617
|
+
if (depth === 0) {
|
|
618
|
+
start = i;
|
|
619
|
+
}
|
|
620
|
+
depth++;
|
|
621
|
+
}
|
|
622
|
+
else if (content[i] === '}') {
|
|
623
|
+
depth--;
|
|
624
|
+
if (depth === 0 && start !== -1) {
|
|
625
|
+
const candidate = content.slice(start, i + 1);
|
|
626
|
+
const parsed = this.tryParseToolCall(candidate);
|
|
627
|
+
if (parsed) {
|
|
628
|
+
toolCalls.push(parsed);
|
|
629
|
+
}
|
|
630
|
+
start = -1;
|
|
631
|
+
}
|
|
632
|
+
}
|
|
633
|
+
}
|
|
634
|
+
return toolCalls;
|
|
635
|
+
}
|
|
636
|
+
/**
|
|
637
|
+
* Try to parse a string as a tool call JSON object.
|
|
638
|
+
*/
|
|
639
|
+
tryParseToolCall(text) {
|
|
640
|
+
try {
|
|
641
|
+
const parsed = JSON.parse(text);
|
|
642
|
+
if (parsed.tool &&
|
|
643
|
+
typeof parsed.tool === 'string' &&
|
|
644
|
+
parsed.arguments &&
|
|
645
|
+
typeof parsed.arguments === 'object') {
|
|
646
|
+
return {
|
|
647
|
+
id: crypto.randomUUID(),
|
|
648
|
+
type: 'function',
|
|
649
|
+
function: {
|
|
650
|
+
name: parsed.tool,
|
|
651
|
+
arguments: JSON.stringify(parsed.arguments),
|
|
652
|
+
},
|
|
653
|
+
};
|
|
654
|
+
}
|
|
655
|
+
}
|
|
656
|
+
catch {
|
|
657
|
+
// Not valid JSON
|
|
658
|
+
}
|
|
659
|
+
return null;
|
|
660
|
+
}
|
|
661
|
+
}
|