@juspay/neurolink 9.15.0 → 9.16.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +6 -0
- package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/adapters/video/videoAnalyzer.js +10 -8
- package/dist/cli/commands/setup-anthropic.js +1 -14
- package/dist/cli/commands/setup-azure.js +1 -12
- package/dist/cli/commands/setup-bedrock.js +1 -9
- package/dist/cli/commands/setup-google-ai.js +1 -12
- package/dist/cli/commands/setup-openai.js +1 -14
- package/dist/cli/commands/workflow.d.ts +27 -0
- package/dist/cli/commands/workflow.js +216 -0
- package/dist/cli/factories/commandFactory.js +79 -20
- package/dist/cli/index.js +0 -1
- package/dist/cli/parser.js +4 -1
- package/dist/cli/utils/maskCredential.d.ts +11 -0
- package/dist/cli/utils/maskCredential.js +23 -0
- package/dist/constants/contextWindows.js +107 -16
- package/dist/constants/enums.d.ts +99 -15
- package/dist/constants/enums.js +152 -22
- package/dist/context/budgetChecker.js +1 -1
- package/dist/context/contextCompactor.js +31 -4
- package/dist/context/emergencyTruncation.d.ts +21 -0
- package/dist/context/emergencyTruncation.js +88 -0
- package/dist/context/errorDetection.d.ts +16 -0
- package/dist/context/errorDetection.js +48 -1
- package/dist/context/errors.d.ts +19 -0
- package/dist/context/errors.js +21 -0
- package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/core/baseProvider.js +306 -200
- package/dist/core/conversationMemoryManager.js +104 -61
- package/dist/core/evaluationProviders.js +16 -33
- package/dist/core/factory.js +237 -164
- package/dist/core/modules/GenerationHandler.js +175 -116
- package/dist/core/modules/MessageBuilder.js +222 -170
- package/dist/core/modules/StreamHandler.d.ts +1 -0
- package/dist/core/modules/StreamHandler.js +95 -27
- package/dist/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/core/modules/TelemetryHandler.js +25 -7
- package/dist/core/modules/ToolsManager.js +115 -191
- package/dist/core/redisConversationMemoryManager.js +418 -282
- package/dist/factories/providerRegistry.d.ts +5 -0
- package/dist/factories/providerRegistry.js +20 -2
- package/dist/index.d.ts +2 -2
- package/dist/index.js +4 -2
- package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
- package/dist/lib/constants/contextWindows.js +107 -16
- package/dist/lib/constants/enums.d.ts +99 -15
- package/dist/lib/constants/enums.js +152 -22
- package/dist/lib/context/budgetChecker.js +1 -1
- package/dist/lib/context/contextCompactor.js +31 -4
- package/dist/lib/context/emergencyTruncation.d.ts +21 -0
- package/dist/lib/context/emergencyTruncation.js +89 -0
- package/dist/lib/context/errorDetection.d.ts +16 -0
- package/dist/lib/context/errorDetection.js +48 -1
- package/dist/lib/context/errors.d.ts +19 -0
- package/dist/lib/context/errors.js +22 -0
- package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/lib/core/baseProvider.js +306 -200
- package/dist/lib/core/conversationMemoryManager.js +104 -61
- package/dist/lib/core/evaluationProviders.js +16 -33
- package/dist/lib/core/factory.js +237 -164
- package/dist/lib/core/modules/GenerationHandler.js +175 -116
- package/dist/lib/core/modules/MessageBuilder.js +222 -170
- package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
- package/dist/lib/core/modules/StreamHandler.js +95 -27
- package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/lib/core/modules/TelemetryHandler.js +25 -7
- package/dist/lib/core/modules/ToolsManager.js +115 -191
- package/dist/lib/core/redisConversationMemoryManager.js +418 -282
- package/dist/lib/factories/providerRegistry.d.ts +5 -0
- package/dist/lib/factories/providerRegistry.js +20 -2
- package/dist/lib/index.d.ts +2 -2
- package/dist/lib/index.js +4 -2
- package/dist/lib/mcp/externalServerManager.js +66 -0
- package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/lib/mcp/mcpClientFactory.js +16 -0
- package/dist/lib/mcp/toolDiscoveryService.js +32 -6
- package/dist/lib/mcp/toolRegistry.js +193 -123
- package/dist/lib/neurolink.d.ts +6 -0
- package/dist/lib/neurolink.js +1162 -646
- package/dist/lib/providers/amazonBedrock.d.ts +1 -1
- package/dist/lib/providers/amazonBedrock.js +521 -319
- package/dist/lib/providers/anthropic.js +73 -17
- package/dist/lib/providers/anthropicBaseProvider.js +77 -17
- package/dist/lib/providers/googleAiStudio.d.ts +1 -1
- package/dist/lib/providers/googleAiStudio.js +292 -227
- package/dist/lib/providers/googleVertex.d.ts +36 -1
- package/dist/lib/providers/googleVertex.js +553 -260
- package/dist/lib/providers/ollama.js +329 -278
- package/dist/lib/providers/openAI.js +77 -19
- package/dist/lib/providers/sagemaker/parsers.js +3 -3
- package/dist/lib/providers/sagemaker/streaming.js +3 -3
- package/dist/lib/proxy/proxyFetch.js +81 -48
- package/dist/lib/rag/ChunkerFactory.js +1 -1
- package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/lib/rag/chunking/markdownChunker.js +174 -2
- package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
- package/dist/lib/rag/ragIntegration.d.ts +18 -1
- package/dist/lib/rag/ragIntegration.js +94 -14
- package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
- package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
- package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/lib/telemetry/attributes.d.ts +52 -0
- package/dist/lib/telemetry/attributes.js +61 -0
- package/dist/lib/telemetry/index.d.ts +3 -0
- package/dist/lib/telemetry/index.js +3 -0
- package/dist/lib/telemetry/telemetryService.d.ts +6 -0
- package/dist/lib/telemetry/telemetryService.js +6 -0
- package/dist/lib/telemetry/tracers.d.ts +15 -0
- package/dist/lib/telemetry/tracers.js +17 -0
- package/dist/lib/telemetry/withSpan.d.ts +9 -0
- package/dist/lib/telemetry/withSpan.js +35 -0
- package/dist/lib/types/contextTypes.d.ts +10 -0
- package/dist/lib/types/streamTypes.d.ts +14 -0
- package/dist/lib/utils/conversationMemory.js +121 -82
- package/dist/lib/utils/logger.d.ts +5 -0
- package/dist/lib/utils/logger.js +50 -2
- package/dist/lib/utils/messageBuilder.js +22 -42
- package/dist/lib/utils/modelDetection.js +3 -3
- package/dist/lib/utils/providerRetry.d.ts +41 -0
- package/dist/lib/utils/providerRetry.js +114 -0
- package/dist/lib/utils/retryability.d.ts +14 -0
- package/dist/lib/utils/retryability.js +23 -0
- package/dist/lib/utils/sanitizers/svg.js +4 -5
- package/dist/lib/utils/tokenEstimation.d.ts +11 -1
- package/dist/lib/utils/tokenEstimation.js +19 -4
- package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
- package/dist/mcp/externalServerManager.js +66 -0
- package/dist/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/mcp/mcpClientFactory.js +16 -0
- package/dist/mcp/toolDiscoveryService.js +32 -6
- package/dist/mcp/toolRegistry.js +193 -123
- package/dist/neurolink.d.ts +6 -0
- package/dist/neurolink.js +1162 -646
- package/dist/providers/amazonBedrock.d.ts +1 -1
- package/dist/providers/amazonBedrock.js +521 -319
- package/dist/providers/anthropic.js +73 -17
- package/dist/providers/anthropicBaseProvider.js +77 -17
- package/dist/providers/googleAiStudio.d.ts +1 -1
- package/dist/providers/googleAiStudio.js +292 -227
- package/dist/providers/googleVertex.d.ts +36 -1
- package/dist/providers/googleVertex.js +553 -260
- package/dist/providers/ollama.js +329 -278
- package/dist/providers/openAI.js +77 -19
- package/dist/providers/sagemaker/parsers.js +3 -3
- package/dist/providers/sagemaker/streaming.js +3 -3
- package/dist/proxy/proxyFetch.js +81 -48
- package/dist/rag/ChunkerFactory.js +1 -1
- package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/rag/chunking/markdownChunker.js +174 -2
- package/dist/rag/pipeline/contextAssembly.js +2 -1
- package/dist/rag/ragIntegration.d.ts +18 -1
- package/dist/rag/ragIntegration.js +94 -14
- package/dist/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/server/abstract/baseServerAdapter.js +4 -1
- package/dist/server/adapters/fastifyAdapter.js +35 -30
- package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/telemetry/attributes.d.ts +52 -0
- package/dist/telemetry/attributes.js +60 -0
- package/dist/telemetry/index.d.ts +3 -0
- package/dist/telemetry/index.js +3 -0
- package/dist/telemetry/telemetryService.d.ts +6 -0
- package/dist/telemetry/telemetryService.js +6 -0
- package/dist/telemetry/tracers.d.ts +15 -0
- package/dist/telemetry/tracers.js +16 -0
- package/dist/telemetry/withSpan.d.ts +9 -0
- package/dist/telemetry/withSpan.js +34 -0
- package/dist/types/contextTypes.d.ts +10 -0
- package/dist/types/streamTypes.d.ts +14 -0
- package/dist/utils/conversationMemory.js +121 -82
- package/dist/utils/logger.d.ts +5 -0
- package/dist/utils/logger.js +50 -2
- package/dist/utils/messageBuilder.js +22 -42
- package/dist/utils/modelDetection.js +3 -3
- package/dist/utils/providerRetry.d.ts +41 -0
- package/dist/utils/providerRetry.js +113 -0
- package/dist/utils/retryability.d.ts +14 -0
- package/dist/utils/retryability.js +22 -0
- package/dist/utils/sanitizers/svg.js +4 -5
- package/dist/utils/tokenEstimation.d.ts +11 -1
- package/dist/utils/tokenEstimation.js +19 -4
- package/dist/utils/videoAnalysisProcessor.js +7 -3
- package/dist/workflow/config.d.ts +26 -26
- package/package.json +1 -1
|
@@ -25,8 +25,18 @@ export const DEFAULT_OUTPUT_RESERVE_RATIO = 0.35;
|
|
|
25
25
|
export const MODEL_CONTEXT_WINDOWS = {
|
|
26
26
|
anthropic: {
|
|
27
27
|
_default: 200_000,
|
|
28
|
+
// Claude 4.6 (Feb 2026) — 200K standard, 1M with beta header
|
|
29
|
+
"claude-opus-4-6": 200_000,
|
|
30
|
+
"claude-sonnet-4-6": 200_000,
|
|
31
|
+
// Claude 4.5
|
|
32
|
+
"claude-opus-4-5-20251101": 200_000,
|
|
33
|
+
"claude-sonnet-4-5-20250929": 200_000,
|
|
34
|
+
"claude-haiku-4-5-20251001": 200_000,
|
|
35
|
+
// Claude 4.x
|
|
36
|
+
"claude-opus-4-1-20250805": 200_000,
|
|
28
37
|
"claude-opus-4-20250514": 200_000,
|
|
29
38
|
"claude-sonnet-4-20250514": 200_000,
|
|
39
|
+
// Claude 3.x
|
|
30
40
|
"claude-3-7-sonnet-20250219": 200_000,
|
|
31
41
|
"claude-3-5-sonnet-20241022": 200_000,
|
|
32
42
|
"claude-3-5-haiku-20241022": 200_000,
|
|
@@ -36,67 +46,144 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
36
46
|
},
|
|
37
47
|
openai: {
|
|
38
48
|
_default: 128_000,
|
|
49
|
+
// GPT-5.x family — 400K context
|
|
50
|
+
"gpt-5.3-codex": 400_000,
|
|
51
|
+
"gpt-5.2": 400_000,
|
|
52
|
+
"gpt-5.2-pro": 400_000,
|
|
53
|
+
"gpt-5.2-codex": 400_000,
|
|
54
|
+
"gpt-5.2-chat-latest": 128_000,
|
|
55
|
+
"gpt-5.1": 400_000,
|
|
56
|
+
"gpt-5.1-codex": 400_000,
|
|
57
|
+
"gpt-5.1-codex-max": 400_000,
|
|
58
|
+
"gpt-5.1-codex-mini": 400_000,
|
|
59
|
+
"gpt-5.1-chat-latest": 128_000,
|
|
60
|
+
"gpt-5": 400_000,
|
|
61
|
+
"gpt-5-mini": 400_000,
|
|
62
|
+
"gpt-5-nano": 400_000,
|
|
63
|
+
"gpt-5-pro": 400_000,
|
|
64
|
+
"gpt-5-codex": 400_000,
|
|
65
|
+
"gpt-5-chat-latest": 128_000,
|
|
66
|
+
// GPT Open Source
|
|
67
|
+
"gpt-oss-120b": 128_000,
|
|
68
|
+
"gpt-oss-20b": 128_000,
|
|
69
|
+
// GPT-4.1 family — 1M context
|
|
70
|
+
"gpt-4.1": 1_047_576,
|
|
71
|
+
"gpt-4.1-mini": 1_047_576,
|
|
72
|
+
"gpt-4.1-nano": 1_047_576,
|
|
73
|
+
// GPT-4o
|
|
39
74
|
"gpt-4o": 128_000,
|
|
40
75
|
"gpt-4o-mini": 128_000,
|
|
41
|
-
|
|
42
|
-
"gpt-4": 8_192,
|
|
43
|
-
"gpt-3.5-turbo": 16_385,
|
|
76
|
+
// O-series reasoning — 200K context
|
|
44
77
|
o1: 200_000,
|
|
45
78
|
"o1-mini": 128_000,
|
|
46
79
|
"o1-pro": 200_000,
|
|
47
80
|
o3: 200_000,
|
|
48
81
|
"o3-mini": 200_000,
|
|
82
|
+
"o3-pro": 200_000,
|
|
49
83
|
"o4-mini": 200_000,
|
|
50
|
-
|
|
51
|
-
"gpt-4
|
|
52
|
-
"gpt-4
|
|
53
|
-
"gpt-5":
|
|
84
|
+
// Legacy
|
|
85
|
+
"gpt-4-turbo": 128_000,
|
|
86
|
+
"gpt-4": 8_192,
|
|
87
|
+
"gpt-3.5-turbo": 16_385,
|
|
54
88
|
},
|
|
55
89
|
"google-ai": {
|
|
56
90
|
_default: 1_048_576,
|
|
91
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
92
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
93
|
+
"gemini-3-pro-image-preview": 65_536,
|
|
94
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
95
|
+
"gemini-3-flash": 1_048_576,
|
|
57
96
|
"gemini-2.5-pro": 1_048_576,
|
|
58
97
|
"gemini-2.5-flash": 1_048_576,
|
|
98
|
+
"gemini-2.5-flash-lite": 1_048_576,
|
|
99
|
+
"gemini-2.5-flash-image": 32_768,
|
|
59
100
|
"gemini-2.0-flash": 1_048_576,
|
|
60
101
|
"gemini-1.5-pro": 2_097_152,
|
|
61
102
|
"gemini-1.5-flash": 1_048_576,
|
|
62
|
-
"gemini-3-flash-preview": 1_048_576,
|
|
63
|
-
"gemini-3-pro-preview": 1_048_576,
|
|
64
103
|
},
|
|
65
104
|
vertex: {
|
|
66
105
|
_default: 1_048_576,
|
|
106
|
+
// Claude on Vertex
|
|
107
|
+
"claude-opus-4-6": 200_000,
|
|
108
|
+
"claude-sonnet-4-6": 200_000,
|
|
109
|
+
"claude-sonnet-4-5": 200_000,
|
|
110
|
+
"claude-opus-4-5": 200_000,
|
|
111
|
+
"claude-haiku-4-5": 200_000,
|
|
112
|
+
"claude-sonnet-4": 200_000,
|
|
113
|
+
"claude-sonnet-4-20250514": 200_000,
|
|
114
|
+
"claude-opus-4-20250514": 200_000,
|
|
115
|
+
"claude-opus-4": 200_000,
|
|
116
|
+
// Gemini on Vertex
|
|
117
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
118
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
119
|
+
"gemini-3-pro-latest": 1_048_576,
|
|
120
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
121
|
+
"gemini-3-flash-latest": 1_048_576,
|
|
67
122
|
"gemini-2.5-pro": 1_048_576,
|
|
68
123
|
"gemini-2.5-flash": 1_048_576,
|
|
69
124
|
"gemini-2.0-flash": 1_048_576,
|
|
70
125
|
"gemini-1.5-pro": 2_097_152,
|
|
71
126
|
"gemini-1.5-flash": 1_048_576,
|
|
72
|
-
"claude-sonnet-4-5": 200_000,
|
|
73
|
-
"claude-sonnet-4-20250514": 200_000,
|
|
74
|
-
"claude-opus-4": 200_000,
|
|
75
|
-
"claude-opus-4-20250514": 200_000,
|
|
76
127
|
},
|
|
77
128
|
bedrock: {
|
|
78
129
|
_default: 200_000,
|
|
79
|
-
|
|
130
|
+
// Claude 4.6
|
|
131
|
+
"anthropic.claude-opus-4-6-v1:0": 200_000,
|
|
132
|
+
"anthropic.claude-sonnet-4-6": 200_000,
|
|
133
|
+
// Claude 4.5
|
|
134
|
+
"anthropic.claude-opus-4-5-20251124-v1:0": 200_000,
|
|
135
|
+
"anthropic.claude-sonnet-4-5-20250929-v1:0": 200_000,
|
|
136
|
+
"anthropic.claude-haiku-4-5-20251001-v1:0": 200_000,
|
|
137
|
+
// Claude legacy
|
|
138
|
+
"anthropic.claude-3-5-sonnet-20241022-v1:0": 200_000,
|
|
80
139
|
"anthropic.claude-3-5-haiku-20241022-v1:0": 200_000,
|
|
81
140
|
"anthropic.claude-3-opus-20240229-v1:0": 200_000,
|
|
82
141
|
"anthropic.claude-3-sonnet-20240229-v1:0": 200_000,
|
|
83
142
|
"anthropic.claude-3-haiku-20240307-v1:0": 200_000,
|
|
143
|
+
// Amazon Nova
|
|
84
144
|
"amazon.nova-pro-v1:0": 300_000,
|
|
85
145
|
"amazon.nova-lite-v1:0": 300_000,
|
|
146
|
+
"amazon.nova-2-lite-v1:0": 1_000_000,
|
|
147
|
+
// Writer
|
|
148
|
+
"writer.palmyra-x5-v1:0": 1_000_000,
|
|
149
|
+
"writer.palmyra-x4-v1:0": 128_000,
|
|
150
|
+
// NVIDIA
|
|
151
|
+
"nvidia.nemotron-nano-3-30b": 256_000,
|
|
86
152
|
},
|
|
87
153
|
azure: {
|
|
88
154
|
_default: 128_000,
|
|
155
|
+
// GPT-5.x
|
|
156
|
+
"gpt-5.2": 400_000,
|
|
157
|
+
"gpt-5.2-pro": 400_000,
|
|
158
|
+
"gpt-5.2-codex": 400_000,
|
|
159
|
+
"gpt-5.1": 400_000,
|
|
160
|
+
"gpt-5": 400_000,
|
|
161
|
+
"gpt-5-mini": 400_000,
|
|
162
|
+
// GPT-4.1
|
|
163
|
+
"gpt-4.1": 1_047_576,
|
|
164
|
+
"gpt-4.1-mini": 1_047_576,
|
|
165
|
+
// GPT-4o
|
|
89
166
|
"gpt-4o": 128_000,
|
|
90
167
|
"gpt-4o-mini": 128_000,
|
|
168
|
+
// O-series
|
|
169
|
+
o3: 200_000,
|
|
170
|
+
"o3-mini": 200_000,
|
|
171
|
+
"o4-mini": 200_000,
|
|
172
|
+
// Legacy
|
|
91
173
|
"gpt-4-turbo": 128_000,
|
|
92
174
|
"gpt-4": 8_192,
|
|
93
175
|
},
|
|
94
176
|
mistral: {
|
|
95
177
|
_default: 128_000,
|
|
96
|
-
"mistral-large-latest":
|
|
97
|
-
"mistral-
|
|
178
|
+
"mistral-large-latest": 256_000,
|
|
179
|
+
"mistral-large-2512": 256_000,
|
|
180
|
+
"mistral-medium-latest": 128_000,
|
|
98
181
|
"mistral-small-latest": 128_000,
|
|
99
182
|
"codestral-latest": 256_000,
|
|
183
|
+
"codestral-2508": 256_000,
|
|
184
|
+
"devstral-2512": 256_000,
|
|
185
|
+
"devstral-small-2512": 256_000,
|
|
186
|
+
"magistral-medium-latest": 128_000,
|
|
100
187
|
},
|
|
101
188
|
ollama: {
|
|
102
189
|
_default: 128_000,
|
|
@@ -109,6 +196,10 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
109
196
|
},
|
|
110
197
|
sagemaker: {
|
|
111
198
|
_default: 128_000,
|
|
199
|
+
// NVIDIA Nemotron 3 Nano (February 2026) — 1M context
|
|
200
|
+
"nvidia-nemotron-3-nano-30b": 1_000_000,
|
|
201
|
+
// Qwen3 VL — 32K context
|
|
202
|
+
"qwen3-vl-8b-instruct": 32_768,
|
|
112
203
|
},
|
|
113
204
|
};
|
|
114
205
|
/**
|
|
@@ -22,23 +22,37 @@ export declare enum AIProviderName {
|
|
|
22
22
|
* OpenRouter uses 'provider/model' format
|
|
23
23
|
*/
|
|
24
24
|
export declare enum OpenRouterModels {
|
|
25
|
+
CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
|
|
26
|
+
CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
|
|
27
|
+
CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
|
|
28
|
+
CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
|
|
25
29
|
CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet",
|
|
26
30
|
CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
|
|
27
31
|
CLAUDE_3_OPUS = "anthropic/claude-3-opus",
|
|
32
|
+
GPT_5_2 = "openai/gpt-5.2",
|
|
33
|
+
GPT_5 = "openai/gpt-5",
|
|
28
34
|
GPT_4O = "openai/gpt-4o",
|
|
29
35
|
GPT_4O_MINI = "openai/gpt-4o-mini",
|
|
30
36
|
GPT_4_TURBO = "openai/gpt-4-turbo",
|
|
37
|
+
GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
|
|
38
|
+
GEMINI_3_PRO_PREVIEW = "google/gemini-3-pro-preview",
|
|
39
|
+
GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
|
|
40
|
+
GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
|
|
41
|
+
GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
|
|
31
42
|
GEMINI_2_0_FLASH = "google/gemini-2.0-flash",
|
|
32
|
-
GEMINI_1_5_PRO = "google/gemini-1.5-pro",
|
|
33
43
|
LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
|
|
34
44
|
LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",
|
|
35
45
|
MISTRAL_LARGE = "mistralai/mistral-large",
|
|
36
|
-
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct"
|
|
46
|
+
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",
|
|
47
|
+
DEEPSEEK_R1 = "deepseek/deepseek-r1",
|
|
48
|
+
GROK_4_1_FAST = "xai/grok-4.1-fast"
|
|
37
49
|
}
|
|
38
50
|
/**
|
|
39
51
|
* Supported Models for Amazon Bedrock
|
|
40
52
|
*/
|
|
41
53
|
export declare enum BedrockModels {
|
|
54
|
+
CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
|
|
55
|
+
CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
|
|
42
56
|
CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
|
|
43
57
|
CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
44
58
|
CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
|
|
@@ -104,18 +118,49 @@ export declare enum BedrockModels {
|
|
|
104
118
|
GEMMA_3_12B_IT = "google.gemma-3-12b-it",
|
|
105
119
|
GEMMA_3_4B_IT = "google.gemma-3-4b-it",
|
|
106
120
|
JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
|
|
107
|
-
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0"
|
|
121
|
+
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",
|
|
122
|
+
WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
|
|
123
|
+
WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",
|
|
124
|
+
MINIMAX_M2_1 = "minimax.minimax-m2.1",
|
|
125
|
+
MINIMAX_M2 = "minimax.minimax-m2",
|
|
126
|
+
KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
|
|
127
|
+
KIMI_K2_5 = "moonshotai.kimi-k2.5",
|
|
128
|
+
NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
|
|
129
|
+
NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
|
|
130
|
+
NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",
|
|
131
|
+
OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
|
|
132
|
+
OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",
|
|
133
|
+
GLM_4_7 = "zai.glm-4.7",
|
|
134
|
+
GLM_4_7_FLASH = "zai.glm-4.7-flash",
|
|
135
|
+
COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
|
|
136
|
+
COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
|
|
137
|
+
COHERE_EMBED_V4 = "cohere.embed-v4:0",
|
|
138
|
+
COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
|
|
139
|
+
AMAZON_RERANK_V1 = "amazon.rerank-v1:0",
|
|
140
|
+
DEVSTRAL_2_123B = "mistral.devstral-2-123b"
|
|
108
141
|
}
|
|
109
142
|
/**
|
|
110
143
|
* Supported Models for OpenAI
|
|
111
144
|
*/
|
|
112
145
|
export declare enum OpenAIModels {
|
|
146
|
+
GPT_5_3_CODEX = "gpt-5.3-codex",
|
|
113
147
|
GPT_5_2 = "gpt-5.2",
|
|
114
148
|
GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
|
|
115
149
|
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
150
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
151
|
+
GPT_5_1 = "gpt-5.1",
|
|
152
|
+
GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
|
|
153
|
+
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
154
|
+
GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
|
|
155
|
+
GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
|
|
116
156
|
GPT_5 = "gpt-5",
|
|
117
157
|
GPT_5_MINI = "gpt-5-mini",
|
|
118
158
|
GPT_5_NANO = "gpt-5-nano",
|
|
159
|
+
GPT_5_PRO = "gpt-5-pro",
|
|
160
|
+
GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
|
|
161
|
+
GPT_5_CODEX = "gpt-5-codex",
|
|
162
|
+
GPT_OSS_120B = "gpt-oss-120b",
|
|
163
|
+
GPT_OSS_20B = "gpt-oss-20b",
|
|
119
164
|
GPT_4_1 = "gpt-4.1",
|
|
120
165
|
GPT_4_1_MINI = "gpt-4.1-mini",
|
|
121
166
|
GPT_4_1_NANO = "gpt-4.1-nano",
|
|
@@ -137,6 +182,10 @@ export declare enum OpenAIModels {
|
|
|
137
182
|
* Note: Azure uses deployment names, these are model identifiers
|
|
138
183
|
*/
|
|
139
184
|
export declare enum AzureOpenAIModels {
|
|
185
|
+
GPT_5_2 = "gpt-5.2",
|
|
186
|
+
GPT_5_2_CHAT = "gpt-5.2-chat",
|
|
187
|
+
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
188
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
140
189
|
GPT_5_1 = "gpt-5.1",
|
|
141
190
|
GPT_5_1_CHAT = "gpt-5.1-chat",
|
|
142
191
|
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
@@ -172,6 +221,8 @@ export declare enum AzureOpenAIModels {
|
|
|
172
221
|
* Supported Models for Google Vertex AI
|
|
173
222
|
*/
|
|
174
223
|
export declare enum VertexModels {
|
|
224
|
+
CLAUDE_4_6_OPUS = "claude-opus-4-6",
|
|
225
|
+
CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
|
|
175
226
|
CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
|
|
176
227
|
CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
|
|
177
228
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
|
|
@@ -183,19 +234,13 @@ export declare enum VertexModels {
|
|
|
183
234
|
CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
|
|
184
235
|
CLAUDE_3_OPUS = "claude-3-opus-20240229",
|
|
185
236
|
CLAUDE_3_HAIKU = "claude-3-haiku-20240307",
|
|
186
|
-
|
|
237
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
187
238
|
GEMINI_3_PRO = "gemini-3-pro",
|
|
188
|
-
/** Gemini 3 Pro Preview - Versioned preview (November 2025) */
|
|
189
239
|
GEMINI_3_PRO_PREVIEW_11_2025 = "gemini-3-pro-preview-11-2025",
|
|
190
|
-
/** Gemini 3 Pro Latest - Auto-updated alias (always points to latest preview) */
|
|
191
240
|
GEMINI_3_PRO_LATEST = "gemini-3-pro-latest",
|
|
192
|
-
/** Gemini 3 Pro Preview - Generic preview (legacy) */
|
|
193
241
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
194
|
-
/** Gemini 3 Flash - Base model with adaptive thinking */
|
|
195
242
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
196
|
-
/** Gemini 3 Flash Preview - Versioned preview */
|
|
197
243
|
GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
|
|
198
|
-
/** Gemini 3 Flash Latest - Auto-updated alias (always points to latest preview) */
|
|
199
244
|
GEMINI_3_FLASH_LATEST = "gemini-3-flash-latest",
|
|
200
245
|
GEMINI_2_5_PRO = "gemini-2.5-pro",
|
|
201
246
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
@@ -203,15 +248,17 @@ export declare enum VertexModels {
|
|
|
203
248
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
204
249
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
205
250
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
206
|
-
/** Gemini 2.0 Flash Lite - GA, production-ready, cost-optimized */
|
|
207
251
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
252
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
208
253
|
GEMINI_1_5_PRO = "gemini-1.5-pro-002",
|
|
254
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
209
255
|
GEMINI_1_5_FLASH = "gemini-1.5-flash-002"
|
|
210
256
|
}
|
|
211
257
|
/**
|
|
212
258
|
* Supported Models for Google AI Studio
|
|
213
259
|
*/
|
|
214
260
|
export declare enum GoogleAIModels {
|
|
261
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
215
262
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
216
263
|
GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
|
|
217
264
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
@@ -220,20 +267,26 @@ export declare enum GoogleAIModels {
|
|
|
220
267
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
221
268
|
GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
|
|
222
269
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
223
|
-
|
|
270
|
+
GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
|
|
271
|
+
GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",
|
|
224
272
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
225
273
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
226
274
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
227
275
|
GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",
|
|
276
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
228
277
|
GEMINI_1_5_PRO = "gemini-1.5-pro",
|
|
278
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
229
279
|
GEMINI_1_5_FLASH = "gemini-1.5-flash",
|
|
230
280
|
GEMINI_EMBEDDING = "gemini-embedding-001",
|
|
281
|
+
/** @deprecated Shutdown Jan 2026. Use gemini-embedding-001 */
|
|
231
282
|
TEXT_EMBEDDING_004 = "text-embedding-004"
|
|
232
283
|
}
|
|
233
284
|
/**
|
|
234
285
|
* Supported Models for Anthropic (Direct API)
|
|
235
286
|
*/
|
|
236
287
|
export declare enum AnthropicModels {
|
|
288
|
+
CLAUDE_OPUS_4_6 = "claude-opus-4-6",
|
|
289
|
+
CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
|
|
237
290
|
CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
|
|
238
291
|
CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
|
|
239
292
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
|
|
@@ -271,6 +324,13 @@ export declare enum MistralModels {
|
|
|
271
324
|
PIXTRAL_12B = "pixtral-12b",
|
|
272
325
|
VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
|
|
273
326
|
VOXTRAL_MINI_LATEST = "voxtral-mini-latest",
|
|
327
|
+
DEVSTRAL_2 = "devstral-2512",
|
|
328
|
+
DEVSTRAL_SMALL_2 = "devstral-small-2512",
|
|
329
|
+
MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
|
|
330
|
+
MAGISTRAL_SMALL_2509 = "magistral-small-2509",
|
|
331
|
+
VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",
|
|
332
|
+
MISTRAL_OCR_3 = "mistral-ocr-2512",
|
|
333
|
+
MISTRAL_OCR_LATEST = "mistral-ocr-latest",
|
|
274
334
|
MISTRAL_NEMO = "mistral-nemo",
|
|
275
335
|
MISTRAL_EMBED = "mistral-embed",
|
|
276
336
|
MISTRAL_MODERATION_LATEST = "mistral-moderation-latest"
|
|
@@ -341,7 +401,17 @@ export declare enum OllamaModels {
|
|
|
341
401
|
STARCODER2_15B = "starcoder2:15b",
|
|
342
402
|
MIXTRAL_8X7B = "mixtral:8x7b",
|
|
343
403
|
MIXTRAL_8X22B = "mixtral:8x22b",
|
|
344
|
-
COMMAND_R_PLUS = "command-r-plus:104b"
|
|
404
|
+
COMMAND_R_PLUS = "command-r-plus:104b",
|
|
405
|
+
GLM_5_LATEST = "glm-5:latest",
|
|
406
|
+
KIMI_K2_5_LATEST = "kimi-k2.5:latest",
|
|
407
|
+
QWEN3_5_LATEST = "qwen3.5:latest",
|
|
408
|
+
QWEN3_CODER_LATEST = "qwen3-coder:latest",
|
|
409
|
+
QWEN3_CODER_30B = "qwen3-coder:30b",
|
|
410
|
+
DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
|
|
411
|
+
NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
|
|
412
|
+
NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
|
|
413
|
+
SMOLLM3_3B = "smollm3:3b",
|
|
414
|
+
GPT_OSS_LATEST = "gpt-oss:latest"
|
|
345
415
|
}
|
|
346
416
|
/**
|
|
347
417
|
* Common Models for LiteLLM Proxy
|
|
@@ -381,6 +451,12 @@ export declare enum LiteLLMModels {
|
|
|
381
451
|
MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",
|
|
382
452
|
BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
|
|
383
453
|
BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",
|
|
454
|
+
OPENAI_GPT_5_2 = "openai/gpt-5.2",
|
|
455
|
+
OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
|
|
456
|
+
ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
|
|
457
|
+
ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
|
|
458
|
+
GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
|
|
459
|
+
XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",
|
|
384
460
|
PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
|
|
385
461
|
PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro"
|
|
386
462
|
}
|
|
@@ -433,7 +509,13 @@ export declare enum HuggingFaceModels {
|
|
|
433
509
|
STARCODER2_15B = "bigcode/starcoder2-15b",
|
|
434
510
|
CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
|
|
435
511
|
BLOOM_7B1 = "bigscience/bloom-7b1",
|
|
436
|
-
BLOOM_1B3 = "bigscience/bloom-1b3"
|
|
512
|
+
BLOOM_1B3 = "bigscience/bloom-1b3",
|
|
513
|
+
GLM_5 = "zai-org/GLM-5",
|
|
514
|
+
QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
|
|
515
|
+
NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
|
|
516
|
+
SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
|
|
517
|
+
FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
|
|
518
|
+
FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct"
|
|
437
519
|
}
|
|
438
520
|
/**
|
|
439
521
|
* Supported Models for AWS SageMaker JumpStart
|
|
@@ -455,7 +537,9 @@ export declare enum SageMakerModels {
|
|
|
455
537
|
FALCON_3_7B = "tii-falcon-3-7b-instruct",
|
|
456
538
|
FALCON_3_10B = "tii-falcon-3-10b-instruct",
|
|
457
539
|
FALCON_40B = "tii-falcon-40b-instruct",
|
|
458
|
-
FALCON_180B = "tii-falcon-180b"
|
|
540
|
+
FALCON_180B = "tii-falcon-180b",
|
|
541
|
+
NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
|
|
542
|
+
QWEN3_VL_8B = "qwen3-vl-8b-instruct"
|
|
459
543
|
}
|
|
460
544
|
/**
|
|
461
545
|
* API Versions for various providers
|