@gguf/coder 0.3.1 → 0.3.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +5 -2
- package/.editorconfig +0 -16
- package/.env.example +0 -63
- package/.gitattributes +0 -1
- package/.semgrepignore +0 -19
- package/coder-dummy-file.ts +0 -52
- package/coder.config.example.json +0 -59
- package/coder.config.json +0 -13
- package/color_picker.html +0 -36
- package/scripts/extract-changelog.js +0 -73
- package/scripts/fetch-models.js +0 -143
- package/scripts/test.sh +0 -40
- package/scripts/update-homebrew-formula.sh +0 -125
- package/scripts/update-nix-version.sh +0 -157
- package/source/ai-sdk-client/AISDKClient.spec.ts +0 -117
- package/source/ai-sdk-client/AISDKClient.ts +0 -155
- package/source/ai-sdk-client/chat/chat-handler.spec.ts +0 -121
- package/source/ai-sdk-client/chat/chat-handler.ts +0 -276
- package/source/ai-sdk-client/chat/streaming-handler.spec.ts +0 -173
- package/source/ai-sdk-client/chat/streaming-handler.ts +0 -110
- package/source/ai-sdk-client/chat/tool-processor.spec.ts +0 -92
- package/source/ai-sdk-client/chat/tool-processor.ts +0 -70
- package/source/ai-sdk-client/converters/message-converter.spec.ts +0 -220
- package/source/ai-sdk-client/converters/message-converter.ts +0 -113
- package/source/ai-sdk-client/converters/tool-converter.spec.ts +0 -90
- package/source/ai-sdk-client/converters/tool-converter.ts +0 -46
- package/source/ai-sdk-client/error-handling/error-extractor.spec.ts +0 -55
- package/source/ai-sdk-client/error-handling/error-extractor.ts +0 -15
- package/source/ai-sdk-client/error-handling/error-parser.spec.ts +0 -169
- package/source/ai-sdk-client/error-handling/error-parser.ts +0 -161
- package/source/ai-sdk-client/index.ts +0 -7
- package/source/ai-sdk-client/providers/provider-factory.spec.ts +0 -71
- package/source/ai-sdk-client/providers/provider-factory.ts +0 -41
- package/source/ai-sdk-client/types.ts +0 -9
- package/source/ai-sdk-client-empty-message.spec.ts +0 -141
- package/source/ai-sdk-client-error-handling.spec.ts +0 -186
- package/source/ai-sdk-client-maxretries.spec.ts +0 -114
- package/source/ai-sdk-client-preparestep.spec.ts +0 -279
- package/source/app/App.spec.tsx +0 -32
- package/source/app/App.tsx +0 -480
- package/source/app/components/AppContainer.spec.tsx +0 -96
- package/source/app/components/AppContainer.tsx +0 -56
- package/source/app/components/ChatInterface.spec.tsx +0 -163
- package/source/app/components/ChatInterface.tsx +0 -144
- package/source/app/components/ModalSelectors.spec.tsx +0 -141
- package/source/app/components/ModalSelectors.tsx +0 -135
- package/source/app/helpers.spec.ts +0 -97
- package/source/app/helpers.ts +0 -63
- package/source/app/index.ts +0 -4
- package/source/app/types.ts +0 -39
- package/source/app/utils/appUtils.ts +0 -294
- package/source/app/utils/conversationState.ts +0 -310
- package/source/app.spec.tsx +0 -244
- package/source/cli.spec.ts +0 -73
- package/source/cli.tsx +0 -51
- package/source/client-factory.spec.ts +0 -48
- package/source/client-factory.ts +0 -178
- package/source/command-parser.spec.ts +0 -127
- package/source/command-parser.ts +0 -36
- package/source/commands/checkpoint.spec.tsx +0 -277
- package/source/commands/checkpoint.tsx +0 -366
- package/source/commands/clear.tsx +0 -22
- package/source/commands/custom-commands.tsx +0 -121
- package/source/commands/exit.ts +0 -21
- package/source/commands/export.spec.tsx +0 -131
- package/source/commands/export.tsx +0 -79
- package/source/commands/help.tsx +0 -120
- package/source/commands/index.ts +0 -17
- package/source/commands/init.tsx +0 -339
- package/source/commands/lsp-command.spec.tsx +0 -281
- package/source/commands/lsp.tsx +0 -120
- package/source/commands/mcp-command.spec.tsx +0 -313
- package/source/commands/mcp.tsx +0 -162
- package/source/commands/model-database.spec.tsx +0 -758
- package/source/commands/model-database.tsx +0 -418
- package/source/commands/model.ts +0 -12
- package/source/commands/provider.ts +0 -12
- package/source/commands/setup-config.tsx +0 -16
- package/source/commands/simple-commands.spec.tsx +0 -175
- package/source/commands/status.ts +0 -12
- package/source/commands/theme.ts +0 -12
- package/source/commands/update.spec.tsx +0 -261
- package/source/commands/update.tsx +0 -201
- package/source/commands/usage.spec.tsx +0 -495
- package/source/commands/usage.tsx +0 -100
- package/source/commands.spec.ts +0 -436
- package/source/commands.ts +0 -83
- package/source/components/assistant-message.spec.tsx +0 -796
- package/source/components/assistant-message.tsx +0 -34
- package/source/components/bash-execution-indicator.tsx +0 -21
- package/source/components/cancelling-indicator.tsx +0 -16
- package/source/components/chat-queue.spec.tsx +0 -83
- package/source/components/chat-queue.tsx +0 -36
- package/source/components/checkpoint-display.spec.tsx +0 -219
- package/source/components/checkpoint-display.tsx +0 -126
- package/source/components/checkpoint-selector.spec.tsx +0 -173
- package/source/components/checkpoint-selector.tsx +0 -173
- package/source/components/development-mode-indicator.spec.tsx +0 -268
- package/source/components/development-mode-indicator.tsx +0 -38
- package/source/components/message-box.spec.tsx +0 -427
- package/source/components/message-box.tsx +0 -87
- package/source/components/model-selector.tsx +0 -132
- package/source/components/provider-selector.tsx +0 -75
- package/source/components/random-spinner.tsx +0 -19
- package/source/components/security-disclaimer.tsx +0 -73
- package/source/components/status-connection-display.spec.tsx +0 -133
- package/source/components/status.tsx +0 -267
- package/source/components/theme-selector.tsx +0 -126
- package/source/components/tool-confirmation.tsx +0 -190
- package/source/components/tool-execution-indicator.tsx +0 -33
- package/source/components/tool-message.tsx +0 -85
- package/source/components/ui/titled-box.spec.tsx +0 -207
- package/source/components/ui/titled-box.tsx +0 -57
- package/source/components/usage/progress-bar.spec.tsx +0 -398
- package/source/components/usage/progress-bar.tsx +0 -30
- package/source/components/usage/usage-display.spec.tsx +0 -780
- package/source/components/usage/usage-display.tsx +0 -291
- package/source/components/user-input.spec.tsx +0 -327
- package/source/components/user-input.tsx +0 -533
- package/source/components/user-message.spec.tsx +0 -230
- package/source/components/user-message.tsx +0 -84
- package/source/components/welcome-message.tsx +0 -76
- package/source/config/env-substitution.ts +0 -65
- package/source/config/index.spec.ts +0 -171
- package/source/config/index.ts +0 -154
- package/source/config/paths.spec.ts +0 -241
- package/source/config/paths.ts +0 -55
- package/source/config/preferences.ts +0 -51
- package/source/config/themes.ts +0 -315
- package/source/constants.ts +0 -130
- package/source/context/mode-context.spec.ts +0 -79
- package/source/context/mode-context.ts +0 -24
- package/source/custom-commands/executor.spec.ts +0 -142
- package/source/custom-commands/executor.ts +0 -64
- package/source/custom-commands/loader.spec.ts +0 -314
- package/source/custom-commands/loader.ts +0 -153
- package/source/custom-commands/parser.ts +0 -196
- package/source/hooks/chat-handler/conversation/conversation-loop.spec.ts +0 -39
- package/source/hooks/chat-handler/conversation/conversation-loop.tsx +0 -511
- package/source/hooks/chat-handler/conversation/tool-executor.spec.ts +0 -50
- package/source/hooks/chat-handler/conversation/tool-executor.tsx +0 -109
- package/source/hooks/chat-handler/index.ts +0 -12
- package/source/hooks/chat-handler/state/streaming-state.spec.ts +0 -26
- package/source/hooks/chat-handler/state/streaming-state.ts +0 -19
- package/source/hooks/chat-handler/types.ts +0 -38
- package/source/hooks/chat-handler/useChatHandler.spec.tsx +0 -321
- package/source/hooks/chat-handler/useChatHandler.tsx +0 -194
- package/source/hooks/chat-handler/utils/context-checker.spec.ts +0 -60
- package/source/hooks/chat-handler/utils/context-checker.tsx +0 -73
- package/source/hooks/chat-handler/utils/message-helpers.spec.ts +0 -42
- package/source/hooks/chat-handler/utils/message-helpers.tsx +0 -36
- package/source/hooks/chat-handler/utils/tool-filters.spec.ts +0 -109
- package/source/hooks/chat-handler/utils/tool-filters.ts +0 -64
- package/source/hooks/useAppHandlers.tsx +0 -291
- package/source/hooks/useAppInitialization.tsx +0 -422
- package/source/hooks/useAppState.tsx +0 -311
- package/source/hooks/useDirectoryTrust.tsx +0 -98
- package/source/hooks/useInputState.ts +0 -414
- package/source/hooks/useModeHandlers.tsx +0 -302
- package/source/hooks/useNonInteractiveMode.ts +0 -140
- package/source/hooks/useTerminalWidth.tsx +0 -81
- package/source/hooks/useTheme.ts +0 -18
- package/source/hooks/useToolHandler.tsx +0 -349
- package/source/hooks/useUIState.ts +0 -61
- package/source/init/agents-template-generator.ts +0 -421
- package/source/init/existing-rules-extractor.ts +0 -319
- package/source/init/file-scanner.spec.ts +0 -227
- package/source/init/file-scanner.ts +0 -238
- package/source/init/framework-detector.ts +0 -382
- package/source/init/language-detector.ts +0 -269
- package/source/init/project-analyzer.spec.ts +0 -231
- package/source/init/project-analyzer.ts +0 -458
- package/source/lsp/index.ts +0 -31
- package/source/lsp/lsp-client.spec.ts +0 -508
- package/source/lsp/lsp-client.ts +0 -487
- package/source/lsp/lsp-manager.spec.ts +0 -477
- package/source/lsp/lsp-manager.ts +0 -419
- package/source/lsp/protocol.spec.ts +0 -502
- package/source/lsp/protocol.ts +0 -360
- package/source/lsp/server-discovery.spec.ts +0 -654
- package/source/lsp/server-discovery.ts +0 -515
- package/source/markdown-parser/html-entities.spec.ts +0 -88
- package/source/markdown-parser/html-entities.ts +0 -45
- package/source/markdown-parser/index.spec.ts +0 -281
- package/source/markdown-parser/index.ts +0 -126
- package/source/markdown-parser/table-parser.spec.ts +0 -133
- package/source/markdown-parser/table-parser.ts +0 -114
- package/source/markdown-parser/utils.spec.ts +0 -70
- package/source/markdown-parser/utils.ts +0 -13
- package/source/mcp/mcp-client.spec.ts +0 -81
- package/source/mcp/mcp-client.ts +0 -625
- package/source/mcp/transport-factory.spec.ts +0 -406
- package/source/mcp/transport-factory.ts +0 -312
- package/source/message-handler.ts +0 -67
- package/source/model-database/database-engine.spec.ts +0 -494
- package/source/model-database/database-engine.ts +0 -50
- package/source/model-database/model-database.spec.ts +0 -363
- package/source/model-database/model-database.ts +0 -91
- package/source/model-database/model-engine.spec.ts +0 -447
- package/source/model-database/model-engine.ts +0 -65
- package/source/model-database/model-fetcher.spec.ts +0 -583
- package/source/model-database/model-fetcher.ts +0 -330
- package/source/models/index.ts +0 -1
- package/source/models/models-cache.spec.ts +0 -214
- package/source/models/models-cache.ts +0 -78
- package/source/models/models-dev-client.spec.ts +0 -379
- package/source/models/models-dev-client.ts +0 -329
- package/source/models/models-types.ts +0 -68
- package/source/prompt-history.ts +0 -155
- package/source/security/command-injection.spec.ts +0 -240
- package/source/services/checkpoint-manager.spec.ts +0 -523
- package/source/services/checkpoint-manager.ts +0 -466
- package/source/services/file-snapshot.spec.ts +0 -569
- package/source/services/file-snapshot.ts +0 -220
- package/source/test-utils/render-with-theme.tsx +0 -48
- package/source/tokenization/index.ts +0 -1
- package/source/tokenization/tokenizer-factory.spec.ts +0 -170
- package/source/tokenization/tokenizer-factory.ts +0 -125
- package/source/tokenization/tokenizers/anthropic-tokenizer.spec.ts +0 -200
- package/source/tokenization/tokenizers/anthropic-tokenizer.ts +0 -43
- package/source/tokenization/tokenizers/fallback-tokenizer.spec.ts +0 -236
- package/source/tokenization/tokenizers/fallback-tokenizer.ts +0 -26
- package/source/tokenization/tokenizers/llama-tokenizer.spec.ts +0 -224
- package/source/tokenization/tokenizers/llama-tokenizer.ts +0 -41
- package/source/tokenization/tokenizers/openai-tokenizer.spec.ts +0 -184
- package/source/tokenization/tokenizers/openai-tokenizer.ts +0 -57
- package/source/tool-calling/index.ts +0 -5
- package/source/tool-calling/json-parser.spec.ts +0 -639
- package/source/tool-calling/json-parser.ts +0 -247
- package/source/tool-calling/tool-parser.spec.ts +0 -395
- package/source/tool-calling/tool-parser.ts +0 -120
- package/source/tool-calling/xml-parser.spec.ts +0 -662
- package/source/tool-calling/xml-parser.ts +0 -289
- package/source/tools/execute-bash.spec.tsx +0 -353
- package/source/tools/execute-bash.tsx +0 -219
- package/source/tools/execute-function.spec.ts +0 -130
- package/source/tools/fetch-url.spec.tsx +0 -342
- package/source/tools/fetch-url.tsx +0 -172
- package/source/tools/find-files.spec.tsx +0 -924
- package/source/tools/find-files.tsx +0 -293
- package/source/tools/index.ts +0 -102
- package/source/tools/lsp-get-diagnostics.tsx +0 -192
- package/source/tools/needs-approval.spec.ts +0 -282
- package/source/tools/read-file.spec.tsx +0 -801
- package/source/tools/read-file.tsx +0 -387
- package/source/tools/search-file-contents.spec.tsx +0 -1273
- package/source/tools/search-file-contents.tsx +0 -293
- package/source/tools/string-replace.spec.tsx +0 -730
- package/source/tools/string-replace.tsx +0 -548
- package/source/tools/tool-manager.ts +0 -210
- package/source/tools/tool-registry.spec.ts +0 -415
- package/source/tools/tool-registry.ts +0 -228
- package/source/tools/web-search.tsx +0 -223
- package/source/tools/write-file.spec.tsx +0 -559
- package/source/tools/write-file.tsx +0 -228
- package/source/types/app.ts +0 -37
- package/source/types/checkpoint.ts +0 -48
- package/source/types/commands.ts +0 -46
- package/source/types/components.ts +0 -27
- package/source/types/config.ts +0 -103
- package/source/types/core-connection-status.spec.ts +0 -67
- package/source/types/core.ts +0 -181
- package/source/types/hooks.ts +0 -50
- package/source/types/index.ts +0 -12
- package/source/types/markdown-parser.ts +0 -11
- package/source/types/mcp.ts +0 -52
- package/source/types/system.ts +0 -16
- package/source/types/tokenization.ts +0 -41
- package/source/types/ui.ts +0 -40
- package/source/types/usage.ts +0 -58
- package/source/types/utils.ts +0 -16
- package/source/usage/calculator.spec.ts +0 -385
- package/source/usage/calculator.ts +0 -104
- package/source/usage/storage.spec.ts +0 -703
- package/source/usage/storage.ts +0 -238
- package/source/usage/tracker.spec.ts +0 -456
- package/source/usage/tracker.ts +0 -102
- package/source/utils/atomic-deletion.spec.ts +0 -194
- package/source/utils/atomic-deletion.ts +0 -127
- package/source/utils/bounded-map.spec.ts +0 -300
- package/source/utils/bounded-map.ts +0 -193
- package/source/utils/checkpoint-utils.spec.ts +0 -222
- package/source/utils/checkpoint-utils.ts +0 -92
- package/source/utils/error-formatter.spec.ts +0 -169
- package/source/utils/error-formatter.ts +0 -194
- package/source/utils/file-autocomplete.spec.ts +0 -173
- package/source/utils/file-autocomplete.ts +0 -196
- package/source/utils/file-cache.spec.ts +0 -309
- package/source/utils/file-cache.ts +0 -195
- package/source/utils/file-content-loader.spec.ts +0 -180
- package/source/utils/file-content-loader.ts +0 -179
- package/source/utils/file-mention-handler.spec.ts +0 -261
- package/source/utils/file-mention-handler.ts +0 -84
- package/source/utils/file-mention-parser.spec.ts +0 -182
- package/source/utils/file-mention-parser.ts +0 -170
- package/source/utils/fuzzy-matching.spec.ts +0 -149
- package/source/utils/fuzzy-matching.ts +0 -146
- package/source/utils/indentation-normalizer.spec.ts +0 -216
- package/source/utils/indentation-normalizer.ts +0 -76
- package/source/utils/installation-detector.spec.ts +0 -178
- package/source/utils/installation-detector.ts +0 -153
- package/source/utils/logging/config.spec.ts +0 -311
- package/source/utils/logging/config.ts +0 -210
- package/source/utils/logging/console-facade.spec.ts +0 -184
- package/source/utils/logging/console-facade.ts +0 -384
- package/source/utils/logging/correlation.spec.ts +0 -679
- package/source/utils/logging/correlation.ts +0 -474
- package/source/utils/logging/formatters.spec.ts +0 -464
- package/source/utils/logging/formatters.ts +0 -207
- package/source/utils/logging/health-monitor/alerts/alert-manager.spec.ts +0 -93
- package/source/utils/logging/health-monitor/alerts/alert-manager.ts +0 -79
- package/source/utils/logging/health-monitor/checks/configuration-check.spec.ts +0 -56
- package/source/utils/logging/health-monitor/checks/configuration-check.ts +0 -43
- package/source/utils/logging/health-monitor/checks/logging-check.spec.ts +0 -56
- package/source/utils/logging/health-monitor/checks/logging-check.ts +0 -58
- package/source/utils/logging/health-monitor/checks/memory-check.spec.ts +0 -100
- package/source/utils/logging/health-monitor/checks/memory-check.ts +0 -78
- package/source/utils/logging/health-monitor/checks/performance-check.spec.ts +0 -56
- package/source/utils/logging/health-monitor/checks/performance-check.ts +0 -56
- package/source/utils/logging/health-monitor/checks/request-check.spec.ts +0 -56
- package/source/utils/logging/health-monitor/checks/request-check.ts +0 -76
- package/source/utils/logging/health-monitor/core/health-check-runner.spec.ts +0 -70
- package/source/utils/logging/health-monitor/core/health-check-runner.ts +0 -138
- package/source/utils/logging/health-monitor/core/health-monitor.spec.ts +0 -58
- package/source/utils/logging/health-monitor/core/health-monitor.ts +0 -344
- package/source/utils/logging/health-monitor/core/scoring.spec.ts +0 -65
- package/source/utils/logging/health-monitor/core/scoring.ts +0 -91
- package/source/utils/logging/health-monitor/index.ts +0 -15
- package/source/utils/logging/health-monitor/instances.ts +0 -48
- package/source/utils/logging/health-monitor/middleware/http-middleware.spec.ts +0 -141
- package/source/utils/logging/health-monitor/middleware/http-middleware.ts +0 -75
- package/source/utils/logging/health-monitor/types.ts +0 -126
- package/source/utils/logging/index.spec.ts +0 -284
- package/source/utils/logging/index.ts +0 -236
- package/source/utils/logging/integration.spec.ts +0 -441
- package/source/utils/logging/log-method-factory.spec.ts +0 -573
- package/source/utils/logging/log-method-factory.ts +0 -233
- package/source/utils/logging/log-query/aggregation/aggregator.spec.ts +0 -277
- package/source/utils/logging/log-query/aggregation/aggregator.ts +0 -159
- package/source/utils/logging/log-query/aggregation/facet-generator.spec.ts +0 -159
- package/source/utils/logging/log-query/aggregation/facet-generator.ts +0 -47
- package/source/utils/logging/log-query/index.ts +0 -23
- package/source/utils/logging/log-query/query/filter-predicates.spec.ts +0 -247
- package/source/utils/logging/log-query/query/filter-predicates.ts +0 -154
- package/source/utils/logging/log-query/query/query-builder.spec.ts +0 -182
- package/source/utils/logging/log-query/query/query-builder.ts +0 -151
- package/source/utils/logging/log-query/query/query-engine.spec.ts +0 -214
- package/source/utils/logging/log-query/query/query-engine.ts +0 -45
- package/source/utils/logging/log-query/storage/circular-buffer.spec.ts +0 -143
- package/source/utils/logging/log-query/storage/circular-buffer.ts +0 -75
- package/source/utils/logging/log-query/storage/index-manager.spec.ts +0 -150
- package/source/utils/logging/log-query/storage/index-manager.ts +0 -71
- package/source/utils/logging/log-query/storage/log-storage.spec.ts +0 -257
- package/source/utils/logging/log-query/storage/log-storage.ts +0 -80
- package/source/utils/logging/log-query/types.ts +0 -163
- package/source/utils/logging/log-query/utils/helpers.spec.ts +0 -263
- package/source/utils/logging/log-query/utils/helpers.ts +0 -72
- package/source/utils/logging/log-query/utils/sorting.spec.ts +0 -182
- package/source/utils/logging/log-query/utils/sorting.ts +0 -61
- package/source/utils/logging/logger-provider.spec.ts +0 -262
- package/source/utils/logging/logger-provider.ts +0 -362
- package/source/utils/logging/performance.spec.ts +0 -209
- package/source/utils/logging/performance.ts +0 -757
- package/source/utils/logging/pino-logger.spec.ts +0 -425
- package/source/utils/logging/pino-logger.ts +0 -514
- package/source/utils/logging/redaction.spec.ts +0 -490
- package/source/utils/logging/redaction.ts +0 -267
- package/source/utils/logging/request-tracker.spec.ts +0 -1198
- package/source/utils/logging/request-tracker.ts +0 -803
- package/source/utils/logging/transports.spec.ts +0 -505
- package/source/utils/logging/transports.ts +0 -305
- package/source/utils/logging/types.ts +0 -216
- package/source/utils/message-builder.spec.ts +0 -179
- package/source/utils/message-builder.ts +0 -101
- package/source/utils/message-queue.tsx +0 -486
- package/source/utils/paste-detection.spec.ts +0 -69
- package/source/utils/paste-detection.ts +0 -124
- package/source/utils/paste-roundtrip.spec.ts +0 -442
- package/source/utils/paste-utils.spec.ts +0 -128
- package/source/utils/paste-utils.ts +0 -52
- package/source/utils/programming-language-helper.spec.ts +0 -74
- package/source/utils/programming-language-helper.ts +0 -32
- package/source/utils/prompt-assembly.spec.ts +0 -221
- package/source/utils/prompt-processor.ts +0 -173
- package/source/utils/tool-args-parser.spec.ts +0 -136
- package/source/utils/tool-args-parser.ts +0 -54
- package/source/utils/tool-cancellation.spec.ts +0 -230
- package/source/utils/tool-cancellation.ts +0 -28
- package/source/utils/tool-result-display.spec.tsx +0 -469
- package/source/utils/tool-result-display.tsx +0 -90
- package/source/utils/update-checker.spec.ts +0 -383
- package/source/utils/update-checker.ts +0 -183
- package/source/wizard/config-wizard.spec.tsx +0 -103
- package/source/wizard/config-wizard.tsx +0 -382
- package/source/wizard/steps/location-step.spec.tsx +0 -186
- package/source/wizard/steps/location-step.tsx +0 -147
- package/source/wizard/steps/mcp-step.spec.tsx +0 -607
- package/source/wizard/steps/mcp-step.tsx +0 -632
- package/source/wizard/steps/provider-step.spec.tsx +0 -342
- package/source/wizard/steps/provider-step.tsx +0 -957
- package/source/wizard/steps/summary-step.spec.tsx +0 -749
- package/source/wizard/steps/summary-step.tsx +0 -228
- package/source/wizard/templates/mcp-templates.spec.ts +0 -613
- package/source/wizard/templates/mcp-templates.ts +0 -570
- package/source/wizard/templates/provider-templates.spec.ts +0 -152
- package/source/wizard/templates/provider-templates.ts +0 -485
- package/source/wizard/utils/fetch-cloud-models.spec.ts +0 -428
- package/source/wizard/utils/fetch-cloud-models.ts +0 -223
- package/source/wizard/utils/fetch-local-models.spec.ts +0 -297
- package/source/wizard/utils/fetch-local-models.ts +0 -192
- package/source/wizard/validation-array.spec.ts +0 -264
- package/source/wizard/validation.spec.ts +0 -373
- package/source/wizard/validation.ts +0 -232
|
@@ -1,379 +0,0 @@
|
|
|
1
|
-
import test from 'ava';
|
|
2
|
-
import {getModelContextLimit} from './models-dev-client.js';
|
|
3
|
-
|
|
4
|
-
console.log(`\nmodels-dev-client.spec.ts`);
|
|
5
|
-
|
|
6
|
-
/**
|
|
7
|
-
* Tests for models-dev-client.ts
|
|
8
|
-
*
|
|
9
|
-
* Note: These tests make real API calls to models.dev.
|
|
10
|
-
* The API has caching and fallback mechanisms built in.
|
|
11
|
-
* Tests are organized by:
|
|
12
|
-
* 1. Ollama cloud model fallbacks (no network required)
|
|
13
|
-
* 2. Ollama local model fallbacks (no network required)
|
|
14
|
-
* 3. models.dev API lookups (network required, cached)
|
|
15
|
-
*/
|
|
16
|
-
|
|
17
|
-
// ============================================================================
|
|
18
|
-
// Ollama Cloud Model Fallbacks
|
|
19
|
-
// ============================================================================
|
|
20
|
-
|
|
21
|
-
test('getModelContextLimit - returns 128000 for gpt-oss:20b-cloud', async t => {
|
|
22
|
-
const limit = await getModelContextLimit('gpt-oss:20b-cloud');
|
|
23
|
-
t.is(limit, 128000);
|
|
24
|
-
});
|
|
25
|
-
|
|
26
|
-
test('getModelContextLimit - returns 128000 for gpt-oss:120b-cloud', async t => {
|
|
27
|
-
const limit = await getModelContextLimit('gpt-oss:120b-cloud');
|
|
28
|
-
t.is(limit, 128000);
|
|
29
|
-
});
|
|
30
|
-
|
|
31
|
-
test('getModelContextLimit - returns 128000 for qwen3-coder:480b-cloud', async t => {
|
|
32
|
-
const limit = await getModelContextLimit('qwen3-coder:480b-cloud');
|
|
33
|
-
t.is(limit, 128000);
|
|
34
|
-
});
|
|
35
|
-
|
|
36
|
-
test('getModelContextLimit - returns 128000 for deepseek-v3.1:671b-cloud', async t => {
|
|
37
|
-
const limit = await getModelContextLimit('deepseek-v3.1:671b-cloud');
|
|
38
|
-
t.is(limit, 128000);
|
|
39
|
-
});
|
|
40
|
-
|
|
41
|
-
test('getModelContextLimit - returns 196608 for minimax-m2:cloud', async t => {
|
|
42
|
-
const limit = await getModelContextLimit('minimax-m2:cloud');
|
|
43
|
-
t.is(limit, 196608);
|
|
44
|
-
});
|
|
45
|
-
|
|
46
|
-
test('getModelContextLimit - returns 200000 for glm-4.7:cloud', async t => {
|
|
47
|
-
const limit = await getModelContextLimit('glm-4.7:cloud');
|
|
48
|
-
t.is(limit, 200000);
|
|
49
|
-
});
|
|
50
|
-
|
|
51
|
-
test('getModelContextLimit - returns 256000 for kimi-k2:1t-cloud', async t => {
|
|
52
|
-
const limit = await getModelContextLimit('kimi-k2:1t-cloud');
|
|
53
|
-
t.is(limit, 256000);
|
|
54
|
-
});
|
|
55
|
-
|
|
56
|
-
test('getModelContextLimit - returns 256000 for kimi-k2-thinking:cloud', async t => {
|
|
57
|
-
const limit = await getModelContextLimit('kimi-k2-thinking:cloud');
|
|
58
|
-
t.is(limit, 256000);
|
|
59
|
-
});
|
|
60
|
-
|
|
61
|
-
// ============================================================================
|
|
62
|
-
// Ollama Local Model Fallbacks - Llama Family
|
|
63
|
-
// ============================================================================
|
|
64
|
-
|
|
65
|
-
test('getModelContextLimit - returns 128000 for llama3.2', async t => {
|
|
66
|
-
const limit = await getModelContextLimit('llama3.2');
|
|
67
|
-
t.is(limit, 128000);
|
|
68
|
-
});
|
|
69
|
-
|
|
70
|
-
test('getModelContextLimit - returns 128000 for llama3.2:1b', async t => {
|
|
71
|
-
const limit = await getModelContextLimit('llama3.2:1b');
|
|
72
|
-
t.is(limit, 128000);
|
|
73
|
-
});
|
|
74
|
-
|
|
75
|
-
test('getModelContextLimit - returns 128000 for llama3.2:3b', async t => {
|
|
76
|
-
const limit = await getModelContextLimit('llama3.2:3b');
|
|
77
|
-
t.is(limit, 128000);
|
|
78
|
-
});
|
|
79
|
-
|
|
80
|
-
test('getModelContextLimit - returns 128000 for llama3.1', async t => {
|
|
81
|
-
const limit = await getModelContextLimit('llama3.1');
|
|
82
|
-
t.is(limit, 128000);
|
|
83
|
-
});
|
|
84
|
-
|
|
85
|
-
test('getModelContextLimit - returns 128000 for llama3.1:8b', async t => {
|
|
86
|
-
const limit = await getModelContextLimit('llama3.1:8b');
|
|
87
|
-
t.is(limit, 128000);
|
|
88
|
-
});
|
|
89
|
-
|
|
90
|
-
test('getModelContextLimit - returns 128000 for llama3.1:70b', async t => {
|
|
91
|
-
const limit = await getModelContextLimit('llama3.1:70b');
|
|
92
|
-
t.is(limit, 128000);
|
|
93
|
-
});
|
|
94
|
-
|
|
95
|
-
test('getModelContextLimit - returns 128000 for llama3.1:405b', async t => {
|
|
96
|
-
const limit = await getModelContextLimit('llama3.1:405b');
|
|
97
|
-
t.is(limit, 128000);
|
|
98
|
-
});
|
|
99
|
-
|
|
100
|
-
test('getModelContextLimit - returns 8192 for llama3', async t => {
|
|
101
|
-
const limit = await getModelContextLimit('llama3');
|
|
102
|
-
t.is(limit, 8192);
|
|
103
|
-
});
|
|
104
|
-
|
|
105
|
-
test('getModelContextLimit - returns 8192 for llama3:8b', async t => {
|
|
106
|
-
const limit = await getModelContextLimit('llama3:8b');
|
|
107
|
-
t.is(limit, 8192);
|
|
108
|
-
});
|
|
109
|
-
|
|
110
|
-
test('getModelContextLimit - returns 8192 for llama3:70b', async t => {
|
|
111
|
-
const limit = await getModelContextLimit('llama3:70b');
|
|
112
|
-
t.is(limit, 8192);
|
|
113
|
-
});
|
|
114
|
-
|
|
115
|
-
test('getModelContextLimit - returns 4096 for llama2', async t => {
|
|
116
|
-
const limit = await getModelContextLimit('llama2');
|
|
117
|
-
t.is(limit, 4096);
|
|
118
|
-
});
|
|
119
|
-
|
|
120
|
-
test('getModelContextLimit - returns 4096 for llama2:7b', async t => {
|
|
121
|
-
const limit = await getModelContextLimit('llama2:7b');
|
|
122
|
-
t.is(limit, 4096);
|
|
123
|
-
});
|
|
124
|
-
|
|
125
|
-
test('getModelContextLimit - returns 4096 for llama2:13b', async t => {
|
|
126
|
-
const limit = await getModelContextLimit('llama2:13b');
|
|
127
|
-
t.is(limit, 4096);
|
|
128
|
-
});
|
|
129
|
-
|
|
130
|
-
test('getModelContextLimit - returns 4096 for llama2:70b', async t => {
|
|
131
|
-
const limit = await getModelContextLimit('llama2:70b');
|
|
132
|
-
t.is(limit, 4096);
|
|
133
|
-
});
|
|
134
|
-
|
|
135
|
-
// ============================================================================
|
|
136
|
-
// Ollama Local Model Fallbacks - Mistral Family
|
|
137
|
-
// ============================================================================
|
|
138
|
-
|
|
139
|
-
test('getModelContextLimit - returns 32000 for mistral', async t => {
|
|
140
|
-
const limit = await getModelContextLimit('mistral');
|
|
141
|
-
t.is(limit, 32000);
|
|
142
|
-
});
|
|
143
|
-
|
|
144
|
-
test('getModelContextLimit - returns 32000 for mistral:7b', async t => {
|
|
145
|
-
const limit = await getModelContextLimit('mistral:7b');
|
|
146
|
-
t.is(limit, 32000);
|
|
147
|
-
});
|
|
148
|
-
|
|
149
|
-
test('getModelContextLimit - returns 32000 for mixtral', async t => {
|
|
150
|
-
const limit = await getModelContextLimit('mixtral');
|
|
151
|
-
t.is(limit, 32000);
|
|
152
|
-
});
|
|
153
|
-
|
|
154
|
-
test('getModelContextLimit - returns 32000 for mixtral:8x7b', async t => {
|
|
155
|
-
const limit = await getModelContextLimit('mixtral:8x7b');
|
|
156
|
-
t.is(limit, 32000);
|
|
157
|
-
});
|
|
158
|
-
|
|
159
|
-
test('getModelContextLimit - returns 32000 for mixtral:8x22b', async t => {
|
|
160
|
-
const limit = await getModelContextLimit('mixtral:8x22b');
|
|
161
|
-
t.is(limit, 32000);
|
|
162
|
-
});
|
|
163
|
-
|
|
164
|
-
// ============================================================================
|
|
165
|
-
// Ollama Local Model Fallbacks - Qwen Family
|
|
166
|
-
// ============================================================================
|
|
167
|
-
|
|
168
|
-
// One test per Qwen model name; each row is [model name, expected limit].
for (const [model, expected] of [
	['qwen', 32000],
	['qwen:7b', 32000],
	['qwen:14b', 32000],
	['qwen2', 32000],
	['qwen2:7b', 32000],
	['qwen2.5', 128000],
	['qwen2.5:7b', 128000],
	['qwen3', 128000],
	['qwen3:7b', 128000],
	['qwen3:14b', 128000],
	['qwen3:32b', 128000],
] as const) {
	test(`getModelContextLimit - returns ${expected} for ${model}`, async t => {
		t.is(await getModelContextLimit(model), expected);
	});
}
|
|
222
|
-
|
|
223
|
-
// ============================================================================
|
|
224
|
-
// Ollama Local Model Fallbacks - Gemma Family
|
|
225
|
-
// ============================================================================
|
|
226
|
-
|
|
227
|
-
// Every Gemma / Gemma 2 name below is expected to report 8192.
for (const model of [
	'gemma',
	'gemma:2b',
	'gemma:7b',
	'gemma2',
	'gemma2:9b',
	'gemma2:27b',
]) {
	test(`getModelContextLimit - returns 8192 for ${model}`, async t => {
		t.is(await getModelContextLimit(model), 8192);
	});
}
|
|
256
|
-
|
|
257
|
-
// ============================================================================
|
|
258
|
-
// Ollama Local Model Fallbacks - Other Models
|
|
259
|
-
// ============================================================================
|
|
260
|
-
|
|
261
|
-
// Command-R, DeepSeek Coder and Phi-3 names; each row is [model name, expected limit].
for (const [model, expected] of [
	['command-r', 128000],
	['command-r-plus', 128000],
	['deepseek-coder', 16000],
	['deepseek-coder-v2', 16000],
	['phi3', 128000],
	['phi3:mini', 128000],
	['phi3:medium', 128000],
] as const) {
	test(`getModelContextLimit - returns ${expected} for ${model}`, async t => {
		t.is(await getModelContextLimit(model), expected);
	});
}
|
|
295
|
-
|
|
296
|
-
// ============================================================================
|
|
297
|
-
// Ollama Model Variants (with quantization/tags)
|
|
298
|
-
// ============================================================================
|
|
299
|
-
|
|
300
|
-
// Names carrying extra instruct/quantization tags; each row is [model name, expected limit].
for (const [model, expected] of [
	['llama3.1:8b-instruct-q4_0', 128000],
	['mistral:7b-instruct', 32000],
	['qwen2.5:7b-instruct-fp16', 128000],
] as const) {
	test(`getModelContextLimit - handles ${model} variant`, async t => {
		t.is(await getModelContextLimit(model), expected);
	});
}
|
|
314
|
-
|
|
315
|
-
// ============================================================================
|
|
316
|
-
// Edge Cases
|
|
317
|
-
// ============================================================================
|
|
318
|
-
|
|
319
|
-
// Edge-case inputs: an unknown name, the empty string, and case variations.
for (const {title, input, expected} of [
	{
		title: 'returns null for completely unknown model',
		input: 'unknown-model-12345',
		expected: null,
	},
	{title: 'handles empty string', input: '', expected: 262144},
	{
		title: 'handles model names with uppercase',
		input: 'LLAMA3.1:8B',
		expected: 128000,
	},
	{
		title: 'handles model names with mixed case',
		input: 'Llama3.1:8B',
		expected: 128000,
	},
]) {
	test(`getModelContextLimit - ${title}`, async t => {
		t.is(await getModelContextLimit(input), expected);
	});
}
|
|
338
|
-
|
|
339
|
-
// ============================================================================
|
|
340
|
-
// models.dev API Lookups (Network Required)
|
|
341
|
-
// ============================================================================
|
|
342
|
-
|
|
343
|
-
test('getModelContextLimit - fetches from models.dev for popular API models', async t => {
	// Needs network access (or previously cached data). 'gpt-4' is used as a
	// model that is expected to be listed on models.dev.
	const resolved = await getModelContextLimit('gpt-4');

	// The upstream data may change, so only the result's type is checked.
	const isNumberOrNull = typeof resolved === 'number' || resolved === null;
	t.true(isNumberOrNull);
});

test('getModelContextLimit - handles models.dev API failure gracefully', async t => {
	// The name is absent from the local fallbacks, which forces the models.dev
	// lookup path; the call must resolve to null instead of throwing, even
	// when models.dev cannot be reached.
	const resolved = await getModelContextLimit('some-api-only-model-xyz');

	t.is(resolved, null);
});
|
|
360
|
-
|
|
361
|
-
// ============================================================================
|
|
362
|
-
// Cloud Model Normalization
|
|
363
|
-
// ============================================================================
|
|
364
|
-
|
|
365
|
-
test('getModelContextLimit - cloud suffix is tried first before normalization', async t => {
	// Guards the cloud-model fix: gpt-oss:20b-cloud has to hit the local
	// fallback table BEFORE the cloud suffix is stripped.
	const resolved = await getModelContextLimit('gpt-oss:20b-cloud');

	t.is(resolved, 128000);
});

test('getModelContextLimit - handles -cloud suffix (hyphen variant)', async t => {
	// The hyphenated "-cloud" form is accepted as well as ":cloud". No
	// fallback entry currently relies on it, so this only checks that the
	// call completes with a well-typed result.
	const resolved = await getModelContextLimit('unknown-model-cloud');

	const isNumberOrNull = typeof resolved === 'number' || resolved === null;
	t.true(isNumberOrNull);
});
|
|
@@ -1,329 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* API client for models.dev
|
|
3
|
-
* Fetches and caches model metadata
|
|
4
|
-
*/
|
|
5
|
-
|
|
6
|
-
import {TIMEOUT_HTTP_BODY_MS, TIMEOUT_HTTP_HEADERS_MS} from '@/constants';
|
|
7
|
-
import {formatError} from '@/utils/error-formatter';
|
|
8
|
-
import {getLogger} from '@/utils/logging';
|
|
9
|
-
import {request} from 'undici';
|
|
10
|
-
import {readCache, writeCache} from './models-cache.js';
|
|
11
|
-
import type {ModelInfo, ModelsDevDatabase} from './models-types.js';
|
|
12
|
-
|
|
13
|
-
const MODELS_DEV_API_URL = 'https://models.dev/api.json';
|
|
14
|
-
|
|
15
|
-
/**
 * Fallback context limits for common Ollama model architectures
 * Used when models.dev doesn't have the model data
 *
 * Keys are lower-case model names; lookups lower-case the incoming name
 * before comparing against them.
 */
const OLLAMA_MODEL_CONTEXT_LIMITS: Record<string, number> = {
	// Llama 3.2 models
	'llama3.2': 128000,
	'llama3.2:1b': 128000,
	'llama3.2:3b': 128000,

	// Llama 3.1 models
	'llama3.1': 128000,
	'llama3.1:8b': 128000,
	'llama3.1:70b': 128000,
	'llama3.1:405b': 128000,

	// Llama 3 models
	llama3: 8192,
	'llama3:8b': 8192,
	'llama3:70b': 8192,

	// Llama 2 models
	llama2: 4096,
	'llama2:7b': 4096,
	'llama2:13b': 4096,
	'llama2:70b': 4096,

	// Mistral models
	mistral: 32000,
	'mistral:7b': 32000,
	'mistral-large': 256000,
	mixtral: 32000,
	'mixtral:8x7b': 32000,
	'mixtral:8x22b': 64000,
	ministral: 256000,
	'ministral:3b': 256000,
	'ministral:8b': 256000,
	'devstral-small-2:24b': 256000,
	'devstral-2': 256000,

	// Essentials AI models
	'rnj-1:8b': 32000,

	// Qwen models
	qwen: 32000,
	'qwen:7b': 32000,
	'qwen:14b': 32000,
	qwen2: 32000,
	'qwen2:7b': 32000,
	'qwen2.5': 128000,
	'qwen2.5:7b': 128000,
	qwen3: 128000,
	'qwen3:7b': 128000,
	'qwen3:14b': 128000,
	'qwen3:32b': 128000,
	'qwen3-coder:480b': 256000,

	// Gemma models
	gemma: 8192,
	'gemma:2b': 8192,
	'gemma:7b': 8192,
	gemma2: 8192,
	'gemma2:9b': 8192,
	'gemma2:27b': 8192,

	// Command-R models
	'command-r': 128000,
	'command-r-plus': 128000,

	// DeepSeek models
	'deepseek-coder': 16000,
	'deepseek-coder-v2': 128000,
	'deepseek-v3.1': 128000,
	'deepseek-v3.2': 128000,

	// Phi models
	phi3: 128000,
	'phi3:mini': 128000,
	'phi3:medium': 128000,

	// OpenAI models
	'gpt-oss:120b': 128000,
	'gpt-oss:20b': 128000,

	// Z.ai models
	'glm-4.7': 200000,

	// Moonshot AI models
	'kimi-k2:1t-cloud': 256000,
	'kimi-k2-thinking:cloud': 256000,

	// Cloud models
	'minimax-m2:cloud': 196608,
};

/**
 * Last-resort substring rules as [needle, table key] pairs.
 * Evaluated top to bottom, so a more specific needle must appear before any
 * shorter needle it contains (e.g. 'llama3.1' before 'llama3').
 */
const OLLAMA_ARCHITECTURE_FALLBACKS: ReadonlyArray<readonly [string, string]> =
	[
		['llama3.2', 'llama3.2'],
		['llama3.1', 'llama3.1'],
		['llama3', 'llama3'],
		['llama2', 'llama2'],
		['mixtral:8x22b', 'mixtral:8x22b'],
		['mixtral', 'mixtral'],
		['ministral', 'ministral'],
		['mistral-large', 'mistral-large'],
		['mistral', 'mistral'],
		['qwen2.5', 'qwen2.5'],
		['qwen2', 'qwen2'],
		['qwen', 'qwen'],
		['gemma2', 'gemma2'],
		['gemma', 'gemma'],
		['command-r-plus', 'command-r-plus'],
		['command-r', 'command-r'],
		['deepseek-coder-v2', 'deepseek-coder-v2'],
		['deepseek', 'deepseek-coder'],
		['phi3', 'phi3'],
	];

/**
 * Extract base model architecture from Ollama model name
 * e.g., "llama3.1:8b-instruct-q4_0" -> "llama3.1:8b"
 *
 * Resolution order (the name is lower-cased first):
 *   1. a table key equal to the whole name;
 *   2. the LONGEST table key that the name starts with, followed by '-' or ':';
 *   3. the first substring rule in OLLAMA_ARCHITECTURE_FALLBACKS that matches.
 *
 * @param modelName - Model name as supplied by the caller (any casing).
 * @returns A key of OLLAMA_MODEL_CONTEXT_LIMITS, or null when nothing matches.
 */
function extractOllamaModelBase(modelName: string): string | null {
	const lower = modelName.toLowerCase();

	// 1. Exact key. The own-property check keeps names such as "constructor"
	// from resolving through Object.prototype.
	if (Object.prototype.hasOwnProperty.call(OLLAMA_MODEL_CONTEXT_LIMITS, lower)) {
		return lower;
	}

	// 2. Longest boundary prefix. Picking the longest key (instead of the first
	// one in declaration order) keeps 'mixtral' from shadowing 'mixtral:8x22b'
	// and 'mistral' from shadowing 'mistral-large' when tags are appended.
	let longestPrefix: string | null = null;
	for (const key of Object.keys(OLLAMA_MODEL_CONTEXT_LIMITS)) {
		const isBoundaryPrefix =
			lower.startsWith(`${key}-`) || lower.startsWith(`${key}:`);
		if (!isBoundaryPrefix) {
			continue;
		}

		if (longestPrefix === null || key.length > longestPrefix.length) {
			longestPrefix = key;
		}
	}

	if (longestPrefix !== null) {
		return longestPrefix;
	}

	// 3. Architecture name appearing anywhere in the model name.
	for (const [needle, key] of OLLAMA_ARCHITECTURE_FALLBACKS) {
		if (lower.includes(needle)) {
			return key;
		}
	}

	return null;
}
|
|
151
|
-
|
|
152
|
-
/**
 * Look up the hard-coded context limit for an Ollama model name.
 *
 * @param modelName - Model name to resolve through extractOllamaModelBase.
 * @returns The table value for the resolved key, or null when no key is
 * resolved or the table holds no truthy value for it.
 */
function getOllamaFallbackContextLimit(modelName: string): number | null {
	const resolvedKey = extractOllamaModelBase(modelName);

	return resolvedKey
		? OLLAMA_MODEL_CONTEXT_LIMITS[resolvedKey] || null
		: null;
}
|
|
163
|
-
|
|
164
|
-
/**
 * Fetch models data from models.dev API
 * Falls back to cache if API is unavailable
 *
 * On success the payload is handed to writeCache(); a failure to write the
 * cache is logged and does not discard the freshly fetched data.
 *
 * @returns The fetched database; when the request fails, returns a non-200
 * status, or yields a non-object body, the cached copy from readCache() if
 * one exists, otherwise null.
 */
async function fetchModelsData(): Promise<ModelsDevDatabase | null> {
	let data: ModelsDevDatabase;

	try {
		const response = await request(MODELS_DEV_API_URL, {
			method: 'GET',
			headersTimeout: TIMEOUT_HTTP_HEADERS_MS,
			bodyTimeout: TIMEOUT_HTTP_BODY_MS,
		});

		if (response.statusCode !== 200) {
			// undici keeps the connection busy until the body is consumed, so
			// drain it before giving up on this response.
			try {
				await response.body.dump();
			} catch {
				// Draining is best-effort; the status error below is what matters.
			}

			throw new Error(
				`Failed to fetch models data: HTTP ${response.statusCode}`,
			);
		}

		const body: unknown = await response.body.json();

		// Reject payloads that cannot be a provider map (e.g. JSON `null`) so
		// they are never cached or iterated by the lookup helpers.
		if (typeof body !== 'object' || body === null) {
			throw new Error('Failed to fetch models data: unexpected response body');
		}

		data = body as ModelsDevDatabase;
	} catch (error) {
		const logger = getLogger();
		logger.warn({error: formatError(error)}, 'Failed to fetch from models.dev');

		// Try to use cached data as fallback
		const cached = await readCache();
		if (cached) {
			logger.info('Using cached models data');
			return cached.data;
		}

		return null;
	}

	// Cache the successful response. Kept outside the fetch try-block so a
	// cache write error is not reported as a fetch failure.
	try {
		await writeCache(data);
	} catch (error) {
		getLogger().warn(
			{error: formatError(error)},
			'Failed to cache models.dev data',
		);
	}

	return data;
}
|
|
203
|
-
|
|
204
|
-
/**
 * Resolve the models database, consulting the cache before the network.
 *
 * @returns The cached data whenever readCache() yields an entry; otherwise
 * whatever fetchModelsData() resolves to (which may be null).
 */
async function getModelsData(): Promise<ModelsDevDatabase | null> {
	const cacheEntry = await readCache();

	// Only hit the API when the cache has nothing usable to offer.
	return cacheEntry ? cacheEntry.data : fetchModelsData();
}
|
|
217
|
-
|
|
218
|
-
/**
 * Find a model by ID across all providers
 * Returns the model info and provider name
 *
 * Providers are scanned in the iteration order of the database object and
 * the first provider that owns an entry keyed exactly by `modelId` wins.
 *
 * @param modelId - Exact model key to look up in each provider's `models` map.
 * @returns The matching model's info, or null when no data is available or
 * no provider lists the ID.
 */
async function findModelById(modelId: string): Promise<ModelInfo | null> {
	const data = await getModelsData();
	if (!data) {
		return null;
	}

	// Search through all providers
	for (const provider of Object.values(data)) {
		// Only accept keys the provider actually defines. A plain index lookup
		// would also resolve inherited names such as "constructor" or
		// "__proto__" to truthy values and then throw on `model.limit`.
		if (!Object.prototype.hasOwnProperty.call(provider.models, modelId)) {
			continue;
		}

		const model = provider.models[modelId];
		if (!model) {
			continue;
		}

		return {
			id: model.id,
			name: model.name,
			provider: provider.name,
			contextLimit: model.limit.context,
			outputLimit: model.limit.output,
			supportsToolCalls: model.tool_call,
			cost: {
				input: model.cost.input,
				output: model.cost.output,
			},
		};
	}

	return null;
}
|
|
249
|
-
|
|
250
|
-
/**
 * Locate a model whose id or display name contains the given text.
 * Intended for local models whose exact ID may not be listed.
 *
 * The comparison is case-insensitive and the first hit in iteration order
 * (providers, then each provider's models) is returned. Because every string
 * contains the empty string, an empty `modelName` matches the first model.
 *
 * @param modelName - Text to search for inside each model's id and name.
 * @returns Info for the first matching model, or null when no data is
 * available or nothing matches.
 */
async function findModelByName(modelName: string): Promise<ModelInfo | null> {
	const database = await getModelsData();
	if (!database) {
		return null;
	}

	const needle = modelName.toLowerCase();

	for (const provider of Object.values(database)) {
		for (const candidate of Object.values(provider.models)) {
			const idMatches = candidate.id.toLowerCase().includes(needle);
			if (!idMatches && !candidate.name.toLowerCase().includes(needle)) {
				continue;
			}

			const {limit, cost} = candidate;
			return {
				id: candidate.id,
				name: candidate.name,
				provider: provider.name,
				contextLimit: limit.context,
				outputLimit: limit.output,
				supportsToolCalls: candidate.tool_call,
				cost: {
					input: cost.input,
					output: cost.output,
				},
			};
		}
	}

	return null;
}
|
|
287
|
-
|
|
288
|
-
/**
 * Resolve the context limit for a model.
 *
 * Lookup order:
 *   1. the local Ollama fallback table, using the ID exactly as given
 *      (this is what lets IDs such as gpt-oss:20b-cloud resolve);
 *   2. models.dev by exact ID, then by partial name, after a trailing
 *      ":cloud" / "-cloud" has been removed;
 *   3. the local Ollama fallback table again, using the stripped ID.
 *
 * @param modelId - Model identifier as configured by the caller.
 * @returns The context limit, or null if no source knows the model.
 */
export async function getModelContextLimit(
	modelId: string,
): Promise<number | null> {
	const limitForRawId = getOllamaFallbackContextLimit(modelId);
	if (limitForRawId) {
		return limitForRawId;
	}

	// ":cloud" and "-cloud" are both six characters long, so a single slice
	// removes either suffix.
	const hasCloudSuffix =
		modelId.endsWith(':cloud') || modelId.endsWith('-cloud');
	const lookupId = hasCloudSuffix ? modelId.slice(0, -6) : modelId;

	// Exact ID first; the partial-name search only runs when that misses.
	const match =
		(await findModelById(lookupId)) || (await findModelByName(lookupId));
	if (match) {
		return match.contextLimit;
	}

	// Nothing on models.dev: retry the local table with the stripped ID.
	return getOllamaFallbackContextLimit(lookupId) || null;
}
|