@juspay/neurolink 9.15.0 → 9.17.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +12 -0
- package/README.md +22 -20
- package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/adapters/video/videoAnalyzer.js +10 -8
- package/dist/cli/commands/setup-anthropic.js +1 -14
- package/dist/cli/commands/setup-azure.js +1 -12
- package/dist/cli/commands/setup-bedrock.js +1 -9
- package/dist/cli/commands/setup-google-ai.js +1 -12
- package/dist/cli/commands/setup-openai.js +1 -14
- package/dist/cli/commands/workflow.d.ts +27 -0
- package/dist/cli/commands/workflow.js +216 -0
- package/dist/cli/factories/commandFactory.js +79 -20
- package/dist/cli/index.js +0 -1
- package/dist/cli/parser.js +4 -1
- package/dist/cli/utils/maskCredential.d.ts +11 -0
- package/dist/cli/utils/maskCredential.js +23 -0
- package/dist/constants/contextWindows.js +107 -16
- package/dist/constants/enums.d.ts +99 -15
- package/dist/constants/enums.js +152 -22
- package/dist/context/budgetChecker.js +1 -1
- package/dist/context/contextCompactor.js +31 -4
- package/dist/context/emergencyTruncation.d.ts +21 -0
- package/dist/context/emergencyTruncation.js +88 -0
- package/dist/context/errorDetection.d.ts +16 -0
- package/dist/context/errorDetection.js +48 -1
- package/dist/context/errors.d.ts +19 -0
- package/dist/context/errors.js +21 -0
- package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/context/stages/structuredSummarizer.js +2 -2
- package/dist/core/baseProvider.js +306 -200
- package/dist/core/conversationMemoryManager.js +104 -61
- package/dist/core/evaluationProviders.js +16 -33
- package/dist/core/factory.js +237 -164
- package/dist/core/modules/GenerationHandler.js +175 -116
- package/dist/core/modules/MessageBuilder.js +222 -170
- package/dist/core/modules/StreamHandler.d.ts +1 -0
- package/dist/core/modules/StreamHandler.js +95 -27
- package/dist/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/core/modules/TelemetryHandler.js +25 -7
- package/dist/core/modules/ToolsManager.js +115 -191
- package/dist/core/redisConversationMemoryManager.js +418 -282
- package/dist/factories/providerRegistry.d.ts +5 -0
- package/dist/factories/providerRegistry.js +20 -2
- package/dist/index.d.ts +2 -2
- package/dist/index.js +4 -2
- package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
- package/dist/lib/constants/contextWindows.js +107 -16
- package/dist/lib/constants/enums.d.ts +99 -15
- package/dist/lib/constants/enums.js +152 -22
- package/dist/lib/context/budgetChecker.js +1 -1
- package/dist/lib/context/contextCompactor.js +31 -4
- package/dist/lib/context/emergencyTruncation.d.ts +21 -0
- package/dist/lib/context/emergencyTruncation.js +89 -0
- package/dist/lib/context/errorDetection.d.ts +16 -0
- package/dist/lib/context/errorDetection.js +48 -1
- package/dist/lib/context/errors.d.ts +19 -0
- package/dist/lib/context/errors.js +22 -0
- package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/lib/context/stages/structuredSummarizer.js +2 -2
- package/dist/lib/core/baseProvider.js +306 -200
- package/dist/lib/core/conversationMemoryManager.js +104 -61
- package/dist/lib/core/evaluationProviders.js +16 -33
- package/dist/lib/core/factory.js +237 -164
- package/dist/lib/core/modules/GenerationHandler.js +175 -116
- package/dist/lib/core/modules/MessageBuilder.js +222 -170
- package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
- package/dist/lib/core/modules/StreamHandler.js +95 -27
- package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/lib/core/modules/TelemetryHandler.js +25 -7
- package/dist/lib/core/modules/ToolsManager.js +115 -191
- package/dist/lib/core/redisConversationMemoryManager.js +418 -282
- package/dist/lib/factories/providerRegistry.d.ts +5 -0
- package/dist/lib/factories/providerRegistry.js +20 -2
- package/dist/lib/index.d.ts +2 -2
- package/dist/lib/index.js +4 -2
- package/dist/lib/mcp/externalServerManager.js +66 -0
- package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/lib/mcp/mcpClientFactory.js +16 -0
- package/dist/lib/mcp/toolDiscoveryService.js +32 -6
- package/dist/lib/mcp/toolRegistry.js +193 -123
- package/dist/lib/neurolink.d.ts +6 -0
- package/dist/lib/neurolink.js +1162 -646
- package/dist/lib/providers/amazonBedrock.d.ts +1 -1
- package/dist/lib/providers/amazonBedrock.js +521 -319
- package/dist/lib/providers/anthropic.js +73 -17
- package/dist/lib/providers/anthropicBaseProvider.js +77 -17
- package/dist/lib/providers/googleAiStudio.d.ts +1 -1
- package/dist/lib/providers/googleAiStudio.js +292 -227
- package/dist/lib/providers/googleVertex.d.ts +36 -1
- package/dist/lib/providers/googleVertex.js +553 -260
- package/dist/lib/providers/ollama.js +329 -278
- package/dist/lib/providers/openAI.js +77 -19
- package/dist/lib/providers/sagemaker/parsers.js +3 -3
- package/dist/lib/providers/sagemaker/streaming.js +3 -3
- package/dist/lib/proxy/proxyFetch.js +81 -48
- package/dist/lib/rag/ChunkerFactory.js +1 -1
- package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/lib/rag/chunking/markdownChunker.js +174 -2
- package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
- package/dist/lib/rag/ragIntegration.d.ts +18 -1
- package/dist/lib/rag/ragIntegration.js +94 -14
- package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
- package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
- package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/lib/telemetry/attributes.d.ts +52 -0
- package/dist/lib/telemetry/attributes.js +61 -0
- package/dist/lib/telemetry/index.d.ts +3 -0
- package/dist/lib/telemetry/index.js +3 -0
- package/dist/lib/telemetry/telemetryService.d.ts +6 -0
- package/dist/lib/telemetry/telemetryService.js +6 -0
- package/dist/lib/telemetry/tracers.d.ts +15 -0
- package/dist/lib/telemetry/tracers.js +17 -0
- package/dist/lib/telemetry/withSpan.d.ts +9 -0
- package/dist/lib/telemetry/withSpan.js +35 -0
- package/dist/lib/types/contextTypes.d.ts +10 -0
- package/dist/lib/types/streamTypes.d.ts +14 -0
- package/dist/lib/utils/conversationMemory.js +123 -84
- package/dist/lib/utils/logger.d.ts +5 -0
- package/dist/lib/utils/logger.js +50 -2
- package/dist/lib/utils/messageBuilder.js +22 -42
- package/dist/lib/utils/modelDetection.js +3 -3
- package/dist/lib/utils/providerRetry.d.ts +41 -0
- package/dist/lib/utils/providerRetry.js +114 -0
- package/dist/lib/utils/retryability.d.ts +14 -0
- package/dist/lib/utils/retryability.js +23 -0
- package/dist/lib/utils/sanitizers/svg.js +4 -5
- package/dist/lib/utils/tokenEstimation.d.ts +11 -1
- package/dist/lib/utils/tokenEstimation.js +19 -4
- package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
- package/dist/mcp/externalServerManager.js +66 -0
- package/dist/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/mcp/mcpClientFactory.js +16 -0
- package/dist/mcp/toolDiscoveryService.js +32 -6
- package/dist/mcp/toolRegistry.js +193 -123
- package/dist/neurolink.d.ts +6 -0
- package/dist/neurolink.js +1162 -646
- package/dist/providers/amazonBedrock.d.ts +1 -1
- package/dist/providers/amazonBedrock.js +521 -319
- package/dist/providers/anthropic.js +73 -17
- package/dist/providers/anthropicBaseProvider.js +77 -17
- package/dist/providers/googleAiStudio.d.ts +1 -1
- package/dist/providers/googleAiStudio.js +292 -227
- package/dist/providers/googleVertex.d.ts +36 -1
- package/dist/providers/googleVertex.js +553 -260
- package/dist/providers/ollama.js +329 -278
- package/dist/providers/openAI.js +77 -19
- package/dist/providers/sagemaker/parsers.js +3 -3
- package/dist/providers/sagemaker/streaming.js +3 -3
- package/dist/proxy/proxyFetch.js +81 -48
- package/dist/rag/ChunkerFactory.js +1 -1
- package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/rag/chunking/markdownChunker.js +174 -2
- package/dist/rag/pipeline/contextAssembly.js +2 -1
- package/dist/rag/ragIntegration.d.ts +18 -1
- package/dist/rag/ragIntegration.js +94 -14
- package/dist/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/server/abstract/baseServerAdapter.js +4 -1
- package/dist/server/adapters/fastifyAdapter.js +35 -30
- package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/telemetry/attributes.d.ts +52 -0
- package/dist/telemetry/attributes.js +60 -0
- package/dist/telemetry/index.d.ts +3 -0
- package/dist/telemetry/index.js +3 -0
- package/dist/telemetry/telemetryService.d.ts +6 -0
- package/dist/telemetry/telemetryService.js +6 -0
- package/dist/telemetry/tracers.d.ts +15 -0
- package/dist/telemetry/tracers.js +16 -0
- package/dist/telemetry/withSpan.d.ts +9 -0
- package/dist/telemetry/withSpan.js +34 -0
- package/dist/types/contextTypes.d.ts +10 -0
- package/dist/types/streamTypes.d.ts +14 -0
- package/dist/utils/conversationMemory.js +123 -84
- package/dist/utils/logger.d.ts +5 -0
- package/dist/utils/logger.js +50 -2
- package/dist/utils/messageBuilder.js +22 -42
- package/dist/utils/modelDetection.js +3 -3
- package/dist/utils/providerRetry.d.ts +41 -0
- package/dist/utils/providerRetry.js +113 -0
- package/dist/utils/retryability.d.ts +14 -0
- package/dist/utils/retryability.js +22 -0
- package/dist/utils/sanitizers/svg.js +4 -5
- package/dist/utils/tokenEstimation.d.ts +11 -1
- package/dist/utils/tokenEstimation.js +19 -4
- package/dist/utils/videoAnalysisProcessor.js +7 -3
- package/dist/workflow/config.d.ts +26 -26
- package/package.json +1 -1
package/dist/cli/parser.js
CHANGED
|
@@ -12,6 +12,7 @@ import { ServeCommandFactory } from "./commands/serve.js";
|
|
|
12
12
|
import { ragCommand } from "./commands/rag.js";
|
|
13
13
|
import { DocsCommandFactory } from "./commands/docs.js";
|
|
14
14
|
import { AuthCommandFactory } from "./factories/authCommandFactory.js";
|
|
15
|
+
import { WorkflowCommandFactory } from "./commands/workflow.js";
|
|
15
16
|
// Enhanced CLI with Professional UX
|
|
16
17
|
export function initializeCliParser() {
|
|
17
18
|
return (yargs(hideBin(process.argv))
|
|
@@ -178,6 +179,8 @@ export function initializeCliParser() {
|
|
|
178
179
|
// Docs MCP Server Command
|
|
179
180
|
.command(DocsCommandFactory.createDocsCommand())
|
|
180
181
|
// Auth Commands - Using AuthCommandFactory
|
|
181
|
-
.command(AuthCommandFactory.createAuthCommands())
|
|
182
|
+
.command(AuthCommandFactory.createAuthCommands())
|
|
183
|
+
// Workflow Commands
|
|
184
|
+
.command(WorkflowCommandFactory.createWorkflowCommands())); // Close the main return statement
|
|
182
185
|
}
|
|
183
186
|
//# sourceMappingURL=parser.js.map
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Unified credential masking utility for CLI setup commands.
|
|
3
|
+
*
|
|
4
|
+
* Preserves known provider prefixes (sk-, sk-ant-, AIza, AKIA) so
|
|
5
|
+
* users can identify which key is configured, while hiding the secret
|
|
6
|
+
* portion with asterisks.
|
|
7
|
+
*
|
|
8
|
+
* @param credential - Raw API key or secret
|
|
9
|
+
* @returns Masked string, e.g. "sk-****abcd"
|
|
10
|
+
*/
|
|
11
|
+
export declare function maskCredential(credential: string): string;
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
/**
 * Unified credential masking utility for CLI setup commands.
 *
 * Preserves known provider prefixes (sk-, sk-ant-, AIza, AKIA) so
 * users can identify which key is configured, while hiding the secret
 * portion with asterisks.
 *
 * The trailing four characters are only shown when at least four
 * characters remain hidden between the prefix and the tail. For shorter
 * values the prefix and tail would overlap or jointly expose almost the
 * whole secret, so only the (public) provider prefix is kept, or the
 * value is fully masked when no known prefix matches.
 *
 * @param credential - Raw API key or secret
 * @returns Masked string, e.g. "sk-****abcd"; "****" for empty,
 *          non-string, or very short input
 */
export function maskCredential(credential) {
    // Non-strings would throw on startsWith/slice below; treat them like
    // an empty credential instead of crashing the CLI output path.
    if (typeof credential !== "string" || credential.length <= 8) {
        return "****";
    }
    const visibleTail = 4;
    const minHidden = 4;
    // Provider-specific prefixes ordered longest-first so "sk-ant-" wins over "sk-"
    const knownPrefixes = ["sk-ant-", "sk-", "AIza", "AKIA"];
    const knownPrefix = knownPrefixes.find((p) => credential.startsWith(p));
    const prefix = knownPrefix ?? credential.slice(0, 4);
    const hiddenCount = credential.length - prefix.length - visibleTail;
    if (hiddenCount < minHidden) {
        // Showing both ends here would reveal (nearly) every character,
        // e.g. "sk-ant-ab" -> "sk-ant-****t-ab". Keep only the provider
        // prefix, which carries no secret material.
        return knownPrefix ? `${knownPrefix}****` : "****";
    }
    const end = credential.slice(-visibleTail);
    return `${prefix}${"*".repeat(hiddenCount)}${end}`;
}
|
|
23
|
+
//# sourceMappingURL=maskCredential.js.map
|
|
@@ -25,8 +25,18 @@ export const DEFAULT_OUTPUT_RESERVE_RATIO = 0.35;
|
|
|
25
25
|
export const MODEL_CONTEXT_WINDOWS = {
|
|
26
26
|
anthropic: {
|
|
27
27
|
_default: 200_000,
|
|
28
|
+
// Claude 4.6 (Feb 2026) — 200K standard, 1M with beta header
|
|
29
|
+
"claude-opus-4-6": 200_000,
|
|
30
|
+
"claude-sonnet-4-6": 200_000,
|
|
31
|
+
// Claude 4.5
|
|
32
|
+
"claude-opus-4-5-20251101": 200_000,
|
|
33
|
+
"claude-sonnet-4-5-20250929": 200_000,
|
|
34
|
+
"claude-haiku-4-5-20251001": 200_000,
|
|
35
|
+
// Claude 4.x
|
|
36
|
+
"claude-opus-4-1-20250805": 200_000,
|
|
28
37
|
"claude-opus-4-20250514": 200_000,
|
|
29
38
|
"claude-sonnet-4-20250514": 200_000,
|
|
39
|
+
// Claude 3.x
|
|
30
40
|
"claude-3-7-sonnet-20250219": 200_000,
|
|
31
41
|
"claude-3-5-sonnet-20241022": 200_000,
|
|
32
42
|
"claude-3-5-haiku-20241022": 200_000,
|
|
@@ -36,67 +46,144 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
36
46
|
},
|
|
37
47
|
openai: {
|
|
38
48
|
_default: 128_000,
|
|
49
|
+
// GPT-5.x family — 400K context
|
|
50
|
+
"gpt-5.3-codex": 400_000,
|
|
51
|
+
"gpt-5.2": 400_000,
|
|
52
|
+
"gpt-5.2-pro": 400_000,
|
|
53
|
+
"gpt-5.2-codex": 400_000,
|
|
54
|
+
"gpt-5.2-chat-latest": 128_000,
|
|
55
|
+
"gpt-5.1": 400_000,
|
|
56
|
+
"gpt-5.1-codex": 400_000,
|
|
57
|
+
"gpt-5.1-codex-max": 400_000,
|
|
58
|
+
"gpt-5.1-codex-mini": 400_000,
|
|
59
|
+
"gpt-5.1-chat-latest": 128_000,
|
|
60
|
+
"gpt-5": 400_000,
|
|
61
|
+
"gpt-5-mini": 400_000,
|
|
62
|
+
"gpt-5-nano": 400_000,
|
|
63
|
+
"gpt-5-pro": 400_000,
|
|
64
|
+
"gpt-5-codex": 400_000,
|
|
65
|
+
"gpt-5-chat-latest": 128_000,
|
|
66
|
+
// GPT Open Source
|
|
67
|
+
"gpt-oss-120b": 128_000,
|
|
68
|
+
"gpt-oss-20b": 128_000,
|
|
69
|
+
// GPT-4.1 family — 1M context
|
|
70
|
+
"gpt-4.1": 1_047_576,
|
|
71
|
+
"gpt-4.1-mini": 1_047_576,
|
|
72
|
+
"gpt-4.1-nano": 1_047_576,
|
|
73
|
+
// GPT-4o
|
|
39
74
|
"gpt-4o": 128_000,
|
|
40
75
|
"gpt-4o-mini": 128_000,
|
|
41
|
-
|
|
42
|
-
"gpt-4": 8_192,
|
|
43
|
-
"gpt-3.5-turbo": 16_385,
|
|
76
|
+
// O-series reasoning — 200K context
|
|
44
77
|
o1: 200_000,
|
|
45
78
|
"o1-mini": 128_000,
|
|
46
79
|
"o1-pro": 200_000,
|
|
47
80
|
o3: 200_000,
|
|
48
81
|
"o3-mini": 200_000,
|
|
82
|
+
"o3-pro": 200_000,
|
|
49
83
|
"o4-mini": 200_000,
|
|
50
|
-
|
|
51
|
-
"gpt-4
|
|
52
|
-
"gpt-4
|
|
53
|
-
"gpt-5":
|
|
84
|
+
// Legacy
|
|
85
|
+
"gpt-4-turbo": 128_000,
|
|
86
|
+
"gpt-4": 8_192,
|
|
87
|
+
"gpt-3.5-turbo": 16_385,
|
|
54
88
|
},
|
|
55
89
|
"google-ai": {
|
|
56
90
|
_default: 1_048_576,
|
|
91
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
92
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
93
|
+
"gemini-3-pro-image-preview": 65_536,
|
|
94
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
95
|
+
"gemini-3-flash": 1_048_576,
|
|
57
96
|
"gemini-2.5-pro": 1_048_576,
|
|
58
97
|
"gemini-2.5-flash": 1_048_576,
|
|
98
|
+
"gemini-2.5-flash-lite": 1_048_576,
|
|
99
|
+
"gemini-2.5-flash-image": 32_768,
|
|
59
100
|
"gemini-2.0-flash": 1_048_576,
|
|
60
101
|
"gemini-1.5-pro": 2_097_152,
|
|
61
102
|
"gemini-1.5-flash": 1_048_576,
|
|
62
|
-
"gemini-3-flash-preview": 1_048_576,
|
|
63
|
-
"gemini-3-pro-preview": 1_048_576,
|
|
64
103
|
},
|
|
65
104
|
vertex: {
|
|
66
105
|
_default: 1_048_576,
|
|
106
|
+
// Claude on Vertex
|
|
107
|
+
"claude-opus-4-6": 200_000,
|
|
108
|
+
"claude-sonnet-4-6": 200_000,
|
|
109
|
+
"claude-sonnet-4-5": 200_000,
|
|
110
|
+
"claude-opus-4-5": 200_000,
|
|
111
|
+
"claude-haiku-4-5": 200_000,
|
|
112
|
+
"claude-sonnet-4": 200_000,
|
|
113
|
+
"claude-sonnet-4-20250514": 200_000,
|
|
114
|
+
"claude-opus-4-20250514": 200_000,
|
|
115
|
+
"claude-opus-4": 200_000,
|
|
116
|
+
// Gemini on Vertex
|
|
117
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
118
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
119
|
+
"gemini-3-pro-latest": 1_048_576,
|
|
120
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
121
|
+
"gemini-3-flash-latest": 1_048_576,
|
|
67
122
|
"gemini-2.5-pro": 1_048_576,
|
|
68
123
|
"gemini-2.5-flash": 1_048_576,
|
|
69
124
|
"gemini-2.0-flash": 1_048_576,
|
|
70
125
|
"gemini-1.5-pro": 2_097_152,
|
|
71
126
|
"gemini-1.5-flash": 1_048_576,
|
|
72
|
-
"claude-sonnet-4-5": 200_000,
|
|
73
|
-
"claude-sonnet-4-20250514": 200_000,
|
|
74
|
-
"claude-opus-4": 200_000,
|
|
75
|
-
"claude-opus-4-20250514": 200_000,
|
|
76
127
|
},
|
|
77
128
|
bedrock: {
|
|
78
129
|
_default: 200_000,
|
|
79
|
-
|
|
130
|
+
// Claude 4.6
|
|
131
|
+
"anthropic.claude-opus-4-6-v1:0": 200_000,
|
|
132
|
+
"anthropic.claude-sonnet-4-6": 200_000,
|
|
133
|
+
// Claude 4.5
|
|
134
|
+
"anthropic.claude-opus-4-5-20251124-v1:0": 200_000,
|
|
135
|
+
"anthropic.claude-sonnet-4-5-20250929-v1:0": 200_000,
|
|
136
|
+
"anthropic.claude-haiku-4-5-20251001-v1:0": 200_000,
|
|
137
|
+
// Claude legacy
|
|
138
|
+
"anthropic.claude-3-5-sonnet-20241022-v1:0": 200_000,
|
|
80
139
|
"anthropic.claude-3-5-haiku-20241022-v1:0": 200_000,
|
|
81
140
|
"anthropic.claude-3-opus-20240229-v1:0": 200_000,
|
|
82
141
|
"anthropic.claude-3-sonnet-20240229-v1:0": 200_000,
|
|
83
142
|
"anthropic.claude-3-haiku-20240307-v1:0": 200_000,
|
|
143
|
+
// Amazon Nova
|
|
84
144
|
"amazon.nova-pro-v1:0": 300_000,
|
|
85
145
|
"amazon.nova-lite-v1:0": 300_000,
|
|
146
|
+
"amazon.nova-2-lite-v1:0": 1_000_000,
|
|
147
|
+
// Writer
|
|
148
|
+
"writer.palmyra-x5-v1:0": 1_000_000,
|
|
149
|
+
"writer.palmyra-x4-v1:0": 128_000,
|
|
150
|
+
// NVIDIA
|
|
151
|
+
"nvidia.nemotron-nano-3-30b": 256_000,
|
|
86
152
|
},
|
|
87
153
|
azure: {
|
|
88
154
|
_default: 128_000,
|
|
155
|
+
// GPT-5.x
|
|
156
|
+
"gpt-5.2": 400_000,
|
|
157
|
+
"gpt-5.2-pro": 400_000,
|
|
158
|
+
"gpt-5.2-codex": 400_000,
|
|
159
|
+
"gpt-5.1": 400_000,
|
|
160
|
+
"gpt-5": 400_000,
|
|
161
|
+
"gpt-5-mini": 400_000,
|
|
162
|
+
// GPT-4.1
|
|
163
|
+
"gpt-4.1": 1_047_576,
|
|
164
|
+
"gpt-4.1-mini": 1_047_576,
|
|
165
|
+
// GPT-4o
|
|
89
166
|
"gpt-4o": 128_000,
|
|
90
167
|
"gpt-4o-mini": 128_000,
|
|
168
|
+
// O-series
|
|
169
|
+
o3: 200_000,
|
|
170
|
+
"o3-mini": 200_000,
|
|
171
|
+
"o4-mini": 200_000,
|
|
172
|
+
// Legacy
|
|
91
173
|
"gpt-4-turbo": 128_000,
|
|
92
174
|
"gpt-4": 8_192,
|
|
93
175
|
},
|
|
94
176
|
mistral: {
|
|
95
177
|
_default: 128_000,
|
|
96
|
-
"mistral-large-latest":
|
|
97
|
-
"mistral-
|
|
178
|
+
"mistral-large-latest": 256_000,
|
|
179
|
+
"mistral-large-2512": 256_000,
|
|
180
|
+
"mistral-medium-latest": 128_000,
|
|
98
181
|
"mistral-small-latest": 128_000,
|
|
99
182
|
"codestral-latest": 256_000,
|
|
183
|
+
"codestral-2508": 256_000,
|
|
184
|
+
"devstral-2512": 256_000,
|
|
185
|
+
"devstral-small-2512": 256_000,
|
|
186
|
+
"magistral-medium-latest": 128_000,
|
|
100
187
|
},
|
|
101
188
|
ollama: {
|
|
102
189
|
_default: 128_000,
|
|
@@ -109,6 +196,10 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
109
196
|
},
|
|
110
197
|
sagemaker: {
|
|
111
198
|
_default: 128_000,
|
|
199
|
+
// NVIDIA Nemotron 3 Nano (February 2026) — 1M context
|
|
200
|
+
"nvidia-nemotron-3-nano-30b": 1_000_000,
|
|
201
|
+
// Qwen3 VL — 32K context
|
|
202
|
+
"qwen3-vl-8b-instruct": 32_768,
|
|
112
203
|
},
|
|
113
204
|
};
|
|
114
205
|
/**
|
|
@@ -22,23 +22,37 @@ export declare enum AIProviderName {
|
|
|
22
22
|
* OpenRouter uses 'provider/model' format
|
|
23
23
|
*/
|
|
24
24
|
export declare enum OpenRouterModels {
|
|
25
|
+
CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
|
|
26
|
+
CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
|
|
27
|
+
CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
|
|
28
|
+
CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
|
|
25
29
|
CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet",
|
|
26
30
|
CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
|
|
27
31
|
CLAUDE_3_OPUS = "anthropic/claude-3-opus",
|
|
32
|
+
GPT_5_2 = "openai/gpt-5.2",
|
|
33
|
+
GPT_5 = "openai/gpt-5",
|
|
28
34
|
GPT_4O = "openai/gpt-4o",
|
|
29
35
|
GPT_4O_MINI = "openai/gpt-4o-mini",
|
|
30
36
|
GPT_4_TURBO = "openai/gpt-4-turbo",
|
|
37
|
+
GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
|
|
38
|
+
GEMINI_3_PRO_PREVIEW = "google/gemini-3-pro-preview",
|
|
39
|
+
GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
|
|
40
|
+
GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
|
|
41
|
+
GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
|
|
31
42
|
GEMINI_2_0_FLASH = "google/gemini-2.0-flash",
|
|
32
|
-
GEMINI_1_5_PRO = "google/gemini-1.5-pro",
|
|
33
43
|
LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
|
|
34
44
|
LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",
|
|
35
45
|
MISTRAL_LARGE = "mistralai/mistral-large",
|
|
36
|
-
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct"
|
|
46
|
+
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",
|
|
47
|
+
DEEPSEEK_R1 = "deepseek/deepseek-r1",
|
|
48
|
+
GROK_4_1_FAST = "xai/grok-4.1-fast"
|
|
37
49
|
}
|
|
38
50
|
/**
|
|
39
51
|
* Supported Models for Amazon Bedrock
|
|
40
52
|
*/
|
|
41
53
|
export declare enum BedrockModels {
|
|
54
|
+
CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
|
|
55
|
+
CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
|
|
42
56
|
CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
|
|
43
57
|
CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
44
58
|
CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
|
|
@@ -104,18 +118,49 @@ export declare enum BedrockModels {
|
|
|
104
118
|
GEMMA_3_12B_IT = "google.gemma-3-12b-it",
|
|
105
119
|
GEMMA_3_4B_IT = "google.gemma-3-4b-it",
|
|
106
120
|
JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
|
|
107
|
-
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0"
|
|
121
|
+
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",
|
|
122
|
+
WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
|
|
123
|
+
WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",
|
|
124
|
+
MINIMAX_M2_1 = "minimax.minimax-m2.1",
|
|
125
|
+
MINIMAX_M2 = "minimax.minimax-m2",
|
|
126
|
+
KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
|
|
127
|
+
KIMI_K2_5 = "moonshotai.kimi-k2.5",
|
|
128
|
+
NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
|
|
129
|
+
NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
|
|
130
|
+
NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",
|
|
131
|
+
OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
|
|
132
|
+
OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",
|
|
133
|
+
GLM_4_7 = "zai.glm-4.7",
|
|
134
|
+
GLM_4_7_FLASH = "zai.glm-4.7-flash",
|
|
135
|
+
COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
|
|
136
|
+
COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
|
|
137
|
+
COHERE_EMBED_V4 = "cohere.embed-v4:0",
|
|
138
|
+
COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
|
|
139
|
+
AMAZON_RERANK_V1 = "amazon.rerank-v1:0",
|
|
140
|
+
DEVSTRAL_2_123B = "mistral.devstral-2-123b"
|
|
108
141
|
}
|
|
109
142
|
/**
|
|
110
143
|
* Supported Models for OpenAI
|
|
111
144
|
*/
|
|
112
145
|
export declare enum OpenAIModels {
|
|
146
|
+
GPT_5_3_CODEX = "gpt-5.3-codex",
|
|
113
147
|
GPT_5_2 = "gpt-5.2",
|
|
114
148
|
GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
|
|
115
149
|
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
150
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
151
|
+
GPT_5_1 = "gpt-5.1",
|
|
152
|
+
GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
|
|
153
|
+
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
154
|
+
GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
|
|
155
|
+
GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
|
|
116
156
|
GPT_5 = "gpt-5",
|
|
117
157
|
GPT_5_MINI = "gpt-5-mini",
|
|
118
158
|
GPT_5_NANO = "gpt-5-nano",
|
|
159
|
+
GPT_5_PRO = "gpt-5-pro",
|
|
160
|
+
GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
|
|
161
|
+
GPT_5_CODEX = "gpt-5-codex",
|
|
162
|
+
GPT_OSS_120B = "gpt-oss-120b",
|
|
163
|
+
GPT_OSS_20B = "gpt-oss-20b",
|
|
119
164
|
GPT_4_1 = "gpt-4.1",
|
|
120
165
|
GPT_4_1_MINI = "gpt-4.1-mini",
|
|
121
166
|
GPT_4_1_NANO = "gpt-4.1-nano",
|
|
@@ -137,6 +182,10 @@ export declare enum OpenAIModels {
|
|
|
137
182
|
* Note: Azure uses deployment names, these are model identifiers
|
|
138
183
|
*/
|
|
139
184
|
export declare enum AzureOpenAIModels {
|
|
185
|
+
GPT_5_2 = "gpt-5.2",
|
|
186
|
+
GPT_5_2_CHAT = "gpt-5.2-chat",
|
|
187
|
+
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
188
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
140
189
|
GPT_5_1 = "gpt-5.1",
|
|
141
190
|
GPT_5_1_CHAT = "gpt-5.1-chat",
|
|
142
191
|
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
@@ -172,6 +221,8 @@ export declare enum AzureOpenAIModels {
|
|
|
172
221
|
* Supported Models for Google Vertex AI
|
|
173
222
|
*/
|
|
174
223
|
export declare enum VertexModels {
|
|
224
|
+
CLAUDE_4_6_OPUS = "claude-opus-4-6",
|
|
225
|
+
CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
|
|
175
226
|
CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
|
|
176
227
|
CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
|
|
177
228
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
|
|
@@ -183,19 +234,13 @@ export declare enum VertexModels {
|
|
|
183
234
|
CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
|
|
184
235
|
CLAUDE_3_OPUS = "claude-3-opus-20240229",
|
|
185
236
|
CLAUDE_3_HAIKU = "claude-3-haiku-20240307",
|
|
186
|
-
|
|
237
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
187
238
|
GEMINI_3_PRO = "gemini-3-pro",
|
|
188
|
-
/** Gemini 3 Pro Preview - Versioned preview (November 2025) */
|
|
189
239
|
GEMINI_3_PRO_PREVIEW_11_2025 = "gemini-3-pro-preview-11-2025",
|
|
190
|
-
/** Gemini 3 Pro Latest - Auto-updated alias (always points to latest preview) */
|
|
191
240
|
GEMINI_3_PRO_LATEST = "gemini-3-pro-latest",
|
|
192
|
-
/** Gemini 3 Pro Preview - Generic preview (legacy) */
|
|
193
241
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
194
|
-
/** Gemini 3 Flash - Base model with adaptive thinking */
|
|
195
242
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
196
|
-
/** Gemini 3 Flash Preview - Versioned preview */
|
|
197
243
|
GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
|
|
198
|
-
/** Gemini 3 Flash Latest - Auto-updated alias (always points to latest preview) */
|
|
199
244
|
GEMINI_3_FLASH_LATEST = "gemini-3-flash-latest",
|
|
200
245
|
GEMINI_2_5_PRO = "gemini-2.5-pro",
|
|
201
246
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
@@ -203,15 +248,17 @@ export declare enum VertexModels {
|
|
|
203
248
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
204
249
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
205
250
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
206
|
-
/** Gemini 2.0 Flash Lite - GA, production-ready, cost-optimized */
|
|
207
251
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
252
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
208
253
|
GEMINI_1_5_PRO = "gemini-1.5-pro-002",
|
|
254
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
209
255
|
GEMINI_1_5_FLASH = "gemini-1.5-flash-002"
|
|
210
256
|
}
|
|
211
257
|
/**
|
|
212
258
|
* Supported Models for Google AI Studio
|
|
213
259
|
*/
|
|
214
260
|
export declare enum GoogleAIModels {
|
|
261
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
215
262
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
216
263
|
GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
|
|
217
264
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
@@ -220,20 +267,26 @@ export declare enum GoogleAIModels {
|
|
|
220
267
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
221
268
|
GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
|
|
222
269
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
223
|
-
|
|
270
|
+
GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
|
|
271
|
+
GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",
|
|
224
272
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
225
273
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
226
274
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
227
275
|
GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",
|
|
276
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
228
277
|
GEMINI_1_5_PRO = "gemini-1.5-pro",
|
|
278
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
229
279
|
GEMINI_1_5_FLASH = "gemini-1.5-flash",
|
|
230
280
|
GEMINI_EMBEDDING = "gemini-embedding-001",
|
|
281
|
+
/** @deprecated Shutdown Jan 2026. Use gemini-embedding-001 */
|
|
231
282
|
TEXT_EMBEDDING_004 = "text-embedding-004"
|
|
232
283
|
}
|
|
233
284
|
/**
|
|
234
285
|
* Supported Models for Anthropic (Direct API)
|
|
235
286
|
*/
|
|
236
287
|
export declare enum AnthropicModels {
|
|
288
|
+
CLAUDE_OPUS_4_6 = "claude-opus-4-6",
|
|
289
|
+
CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
|
|
237
290
|
CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
|
|
238
291
|
CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
|
|
239
292
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
|
|
@@ -271,6 +324,13 @@ export declare enum MistralModels {
|
|
|
271
324
|
PIXTRAL_12B = "pixtral-12b",
|
|
272
325
|
VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
|
|
273
326
|
VOXTRAL_MINI_LATEST = "voxtral-mini-latest",
|
|
327
|
+
DEVSTRAL_2 = "devstral-2512",
|
|
328
|
+
DEVSTRAL_SMALL_2 = "devstral-small-2512",
|
|
329
|
+
MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
|
|
330
|
+
MAGISTRAL_SMALL_2509 = "magistral-small-2509",
|
|
331
|
+
VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",
|
|
332
|
+
MISTRAL_OCR_3 = "mistral-ocr-2512",
|
|
333
|
+
MISTRAL_OCR_LATEST = "mistral-ocr-latest",
|
|
274
334
|
MISTRAL_NEMO = "mistral-nemo",
|
|
275
335
|
MISTRAL_EMBED = "mistral-embed",
|
|
276
336
|
MISTRAL_MODERATION_LATEST = "mistral-moderation-latest"
|
|
@@ -341,7 +401,17 @@ export declare enum OllamaModels {
|
|
|
341
401
|
STARCODER2_15B = "starcoder2:15b",
|
|
342
402
|
MIXTRAL_8X7B = "mixtral:8x7b",
|
|
343
403
|
MIXTRAL_8X22B = "mixtral:8x22b",
|
|
344
|
-
COMMAND_R_PLUS = "command-r-plus:104b"
|
|
404
|
+
COMMAND_R_PLUS = "command-r-plus:104b",
|
|
405
|
+
GLM_5_LATEST = "glm-5:latest",
|
|
406
|
+
KIMI_K2_5_LATEST = "kimi-k2.5:latest",
|
|
407
|
+
QWEN3_5_LATEST = "qwen3.5:latest",
|
|
408
|
+
QWEN3_CODER_LATEST = "qwen3-coder:latest",
|
|
409
|
+
QWEN3_CODER_30B = "qwen3-coder:30b",
|
|
410
|
+
DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
|
|
411
|
+
NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
|
|
412
|
+
NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
|
|
413
|
+
SMOLLM3_3B = "smollm3:3b",
|
|
414
|
+
GPT_OSS_LATEST = "gpt-oss:latest"
|
|
345
415
|
}
|
|
346
416
|
/**
|
|
347
417
|
* Common Models for LiteLLM Proxy
|
|
@@ -381,6 +451,12 @@ export declare enum LiteLLMModels {
|
|
|
381
451
|
MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",
|
|
382
452
|
BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
|
|
383
453
|
BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",
|
|
454
|
+
OPENAI_GPT_5_2 = "openai/gpt-5.2",
|
|
455
|
+
OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
|
|
456
|
+
ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
|
|
457
|
+
ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
|
|
458
|
+
GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
|
|
459
|
+
XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",
|
|
384
460
|
PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
|
|
385
461
|
PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro"
|
|
386
462
|
}
|
|
@@ -433,7 +509,13 @@ export declare enum HuggingFaceModels {
|
|
|
433
509
|
STARCODER2_15B = "bigcode/starcoder2-15b",
|
|
434
510
|
CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
|
|
435
511
|
BLOOM_7B1 = "bigscience/bloom-7b1",
|
|
436
|
-
BLOOM_1B3 = "bigscience/bloom-1b3"
|
|
512
|
+
BLOOM_1B3 = "bigscience/bloom-1b3",
|
|
513
|
+
GLM_5 = "zai-org/GLM-5",
|
|
514
|
+
QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
|
|
515
|
+
NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
|
|
516
|
+
SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
|
|
517
|
+
FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
|
|
518
|
+
FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct"
|
|
437
519
|
}
|
|
438
520
|
/**
|
|
439
521
|
* Supported Models for AWS SageMaker JumpStart
|
|
@@ -455,7 +537,9 @@ export declare enum SageMakerModels {
|
|
|
455
537
|
FALCON_3_7B = "tii-falcon-3-7b-instruct",
|
|
456
538
|
FALCON_3_10B = "tii-falcon-3-10b-instruct",
|
|
457
539
|
FALCON_40B = "tii-falcon-40b-instruct",
|
|
458
|
-
FALCON_180B = "tii-falcon-180b"
|
|
540
|
+
FALCON_180B = "tii-falcon-180b",
|
|
541
|
+
NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
|
|
542
|
+
QWEN3_VL_8B = "qwen3-vl-8b-instruct"
|
|
459
543
|
}
|
|
460
544
|
/**
|
|
461
545
|
* API Versions for various providers
|