@juspay/neurolink 9.15.0 → 9.17.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (196)
  1. package/CHANGELOG.md +12 -0
  2. package/README.md +22 -20
  3. package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
  4. package/dist/adapters/video/videoAnalyzer.js +10 -8
  5. package/dist/cli/commands/setup-anthropic.js +1 -14
  6. package/dist/cli/commands/setup-azure.js +1 -12
  7. package/dist/cli/commands/setup-bedrock.js +1 -9
  8. package/dist/cli/commands/setup-google-ai.js +1 -12
  9. package/dist/cli/commands/setup-openai.js +1 -14
  10. package/dist/cli/commands/workflow.d.ts +27 -0
  11. package/dist/cli/commands/workflow.js +216 -0
  12. package/dist/cli/factories/commandFactory.js +79 -20
  13. package/dist/cli/index.js +0 -1
  14. package/dist/cli/parser.js +4 -1
  15. package/dist/cli/utils/maskCredential.d.ts +11 -0
  16. package/dist/cli/utils/maskCredential.js +23 -0
  17. package/dist/constants/contextWindows.js +107 -16
  18. package/dist/constants/enums.d.ts +99 -15
  19. package/dist/constants/enums.js +152 -22
  20. package/dist/context/budgetChecker.js +1 -1
  21. package/dist/context/contextCompactor.js +31 -4
  22. package/dist/context/emergencyTruncation.d.ts +21 -0
  23. package/dist/context/emergencyTruncation.js +88 -0
  24. package/dist/context/errorDetection.d.ts +16 -0
  25. package/dist/context/errorDetection.js +48 -1
  26. package/dist/context/errors.d.ts +19 -0
  27. package/dist/context/errors.js +21 -0
  28. package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
  29. package/dist/context/stages/slidingWindowTruncator.js +159 -24
  30. package/dist/context/stages/structuredSummarizer.js +2 -2
  31. package/dist/core/baseProvider.js +306 -200
  32. package/dist/core/conversationMemoryManager.js +104 -61
  33. package/dist/core/evaluationProviders.js +16 -33
  34. package/dist/core/factory.js +237 -164
  35. package/dist/core/modules/GenerationHandler.js +175 -116
  36. package/dist/core/modules/MessageBuilder.js +222 -170
  37. package/dist/core/modules/StreamHandler.d.ts +1 -0
  38. package/dist/core/modules/StreamHandler.js +95 -27
  39. package/dist/core/modules/TelemetryHandler.d.ts +10 -1
  40. package/dist/core/modules/TelemetryHandler.js +25 -7
  41. package/dist/core/modules/ToolsManager.js +115 -191
  42. package/dist/core/redisConversationMemoryManager.js +418 -282
  43. package/dist/factories/providerRegistry.d.ts +5 -0
  44. package/dist/factories/providerRegistry.js +20 -2
  45. package/dist/index.d.ts +2 -2
  46. package/dist/index.js +4 -2
  47. package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
  48. package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
  49. package/dist/lib/constants/contextWindows.js +107 -16
  50. package/dist/lib/constants/enums.d.ts +99 -15
  51. package/dist/lib/constants/enums.js +152 -22
  52. package/dist/lib/context/budgetChecker.js +1 -1
  53. package/dist/lib/context/contextCompactor.js +31 -4
  54. package/dist/lib/context/emergencyTruncation.d.ts +21 -0
  55. package/dist/lib/context/emergencyTruncation.js +89 -0
  56. package/dist/lib/context/errorDetection.d.ts +16 -0
  57. package/dist/lib/context/errorDetection.js +48 -1
  58. package/dist/lib/context/errors.d.ts +19 -0
  59. package/dist/lib/context/errors.js +22 -0
  60. package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
  61. package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
  62. package/dist/lib/context/stages/structuredSummarizer.js +2 -2
  63. package/dist/lib/core/baseProvider.js +306 -200
  64. package/dist/lib/core/conversationMemoryManager.js +104 -61
  65. package/dist/lib/core/evaluationProviders.js +16 -33
  66. package/dist/lib/core/factory.js +237 -164
  67. package/dist/lib/core/modules/GenerationHandler.js +175 -116
  68. package/dist/lib/core/modules/MessageBuilder.js +222 -170
  69. package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
  70. package/dist/lib/core/modules/StreamHandler.js +95 -27
  71. package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
  72. package/dist/lib/core/modules/TelemetryHandler.js +25 -7
  73. package/dist/lib/core/modules/ToolsManager.js +115 -191
  74. package/dist/lib/core/redisConversationMemoryManager.js +418 -282
  75. package/dist/lib/factories/providerRegistry.d.ts +5 -0
  76. package/dist/lib/factories/providerRegistry.js +20 -2
  77. package/dist/lib/index.d.ts +2 -2
  78. package/dist/lib/index.js +4 -2
  79. package/dist/lib/mcp/externalServerManager.js +66 -0
  80. package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
  81. package/dist/lib/mcp/mcpClientFactory.js +16 -0
  82. package/dist/lib/mcp/toolDiscoveryService.js +32 -6
  83. package/dist/lib/mcp/toolRegistry.js +193 -123
  84. package/dist/lib/neurolink.d.ts +6 -0
  85. package/dist/lib/neurolink.js +1162 -646
  86. package/dist/lib/providers/amazonBedrock.d.ts +1 -1
  87. package/dist/lib/providers/amazonBedrock.js +521 -319
  88. package/dist/lib/providers/anthropic.js +73 -17
  89. package/dist/lib/providers/anthropicBaseProvider.js +77 -17
  90. package/dist/lib/providers/googleAiStudio.d.ts +1 -1
  91. package/dist/lib/providers/googleAiStudio.js +292 -227
  92. package/dist/lib/providers/googleVertex.d.ts +36 -1
  93. package/dist/lib/providers/googleVertex.js +553 -260
  94. package/dist/lib/providers/ollama.js +329 -278
  95. package/dist/lib/providers/openAI.js +77 -19
  96. package/dist/lib/providers/sagemaker/parsers.js +3 -3
  97. package/dist/lib/providers/sagemaker/streaming.js +3 -3
  98. package/dist/lib/proxy/proxyFetch.js +81 -48
  99. package/dist/lib/rag/ChunkerFactory.js +1 -1
  100. package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
  101. package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
  102. package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
  103. package/dist/lib/rag/chunking/markdownChunker.js +174 -2
  104. package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
  105. package/dist/lib/rag/ragIntegration.d.ts +18 -1
  106. package/dist/lib/rag/ragIntegration.js +94 -14
  107. package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
  108. package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
  109. package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
  110. package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
  111. package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
  112. package/dist/lib/telemetry/attributes.d.ts +52 -0
  113. package/dist/lib/telemetry/attributes.js +61 -0
  114. package/dist/lib/telemetry/index.d.ts +3 -0
  115. package/dist/lib/telemetry/index.js +3 -0
  116. package/dist/lib/telemetry/telemetryService.d.ts +6 -0
  117. package/dist/lib/telemetry/telemetryService.js +6 -0
  118. package/dist/lib/telemetry/tracers.d.ts +15 -0
  119. package/dist/lib/telemetry/tracers.js +17 -0
  120. package/dist/lib/telemetry/withSpan.d.ts +9 -0
  121. package/dist/lib/telemetry/withSpan.js +35 -0
  122. package/dist/lib/types/contextTypes.d.ts +10 -0
  123. package/dist/lib/types/streamTypes.d.ts +14 -0
  124. package/dist/lib/utils/conversationMemory.js +123 -84
  125. package/dist/lib/utils/logger.d.ts +5 -0
  126. package/dist/lib/utils/logger.js +50 -2
  127. package/dist/lib/utils/messageBuilder.js +22 -42
  128. package/dist/lib/utils/modelDetection.js +3 -3
  129. package/dist/lib/utils/providerRetry.d.ts +41 -0
  130. package/dist/lib/utils/providerRetry.js +114 -0
  131. package/dist/lib/utils/retryability.d.ts +14 -0
  132. package/dist/lib/utils/retryability.js +23 -0
  133. package/dist/lib/utils/sanitizers/svg.js +4 -5
  134. package/dist/lib/utils/tokenEstimation.d.ts +11 -1
  135. package/dist/lib/utils/tokenEstimation.js +19 -4
  136. package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
  137. package/dist/mcp/externalServerManager.js +66 -0
  138. package/dist/mcp/mcpCircuitBreaker.js +24 -0
  139. package/dist/mcp/mcpClientFactory.js +16 -0
  140. package/dist/mcp/toolDiscoveryService.js +32 -6
  141. package/dist/mcp/toolRegistry.js +193 -123
  142. package/dist/neurolink.d.ts +6 -0
  143. package/dist/neurolink.js +1162 -646
  144. package/dist/providers/amazonBedrock.d.ts +1 -1
  145. package/dist/providers/amazonBedrock.js +521 -319
  146. package/dist/providers/anthropic.js +73 -17
  147. package/dist/providers/anthropicBaseProvider.js +77 -17
  148. package/dist/providers/googleAiStudio.d.ts +1 -1
  149. package/dist/providers/googleAiStudio.js +292 -227
  150. package/dist/providers/googleVertex.d.ts +36 -1
  151. package/dist/providers/googleVertex.js +553 -260
  152. package/dist/providers/ollama.js +329 -278
  153. package/dist/providers/openAI.js +77 -19
  154. package/dist/providers/sagemaker/parsers.js +3 -3
  155. package/dist/providers/sagemaker/streaming.js +3 -3
  156. package/dist/proxy/proxyFetch.js +81 -48
  157. package/dist/rag/ChunkerFactory.js +1 -1
  158. package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
  159. package/dist/rag/chunkers/MarkdownChunker.js +213 -9
  160. package/dist/rag/chunking/markdownChunker.d.ts +16 -0
  161. package/dist/rag/chunking/markdownChunker.js +174 -2
  162. package/dist/rag/pipeline/contextAssembly.js +2 -1
  163. package/dist/rag/ragIntegration.d.ts +18 -1
  164. package/dist/rag/ragIntegration.js +94 -14
  165. package/dist/rag/retrieval/vectorQueryTool.js +21 -4
  166. package/dist/server/abstract/baseServerAdapter.js +4 -1
  167. package/dist/server/adapters/fastifyAdapter.js +35 -30
  168. package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
  169. package/dist/services/server/ai/observability/instrumentation.js +39 -0
  170. package/dist/telemetry/attributes.d.ts +52 -0
  171. package/dist/telemetry/attributes.js +60 -0
  172. package/dist/telemetry/index.d.ts +3 -0
  173. package/dist/telemetry/index.js +3 -0
  174. package/dist/telemetry/telemetryService.d.ts +6 -0
  175. package/dist/telemetry/telemetryService.js +6 -0
  176. package/dist/telemetry/tracers.d.ts +15 -0
  177. package/dist/telemetry/tracers.js +16 -0
  178. package/dist/telemetry/withSpan.d.ts +9 -0
  179. package/dist/telemetry/withSpan.js +34 -0
  180. package/dist/types/contextTypes.d.ts +10 -0
  181. package/dist/types/streamTypes.d.ts +14 -0
  182. package/dist/utils/conversationMemory.js +123 -84
  183. package/dist/utils/logger.d.ts +5 -0
  184. package/dist/utils/logger.js +50 -2
  185. package/dist/utils/messageBuilder.js +22 -42
  186. package/dist/utils/modelDetection.js +3 -3
  187. package/dist/utils/providerRetry.d.ts +41 -0
  188. package/dist/utils/providerRetry.js +113 -0
  189. package/dist/utils/retryability.d.ts +14 -0
  190. package/dist/utils/retryability.js +22 -0
  191. package/dist/utils/sanitizers/svg.js +4 -5
  192. package/dist/utils/tokenEstimation.d.ts +11 -1
  193. package/dist/utils/tokenEstimation.js +19 -4
  194. package/dist/utils/videoAnalysisProcessor.js +7 -3
  195. package/dist/workflow/config.d.ts +26 -26
  196. package/package.json +1 -1
@@ -12,6 +12,7 @@ import { ServeCommandFactory } from "./commands/serve.js";
12
12
  import { ragCommand } from "./commands/rag.js";
13
13
  import { DocsCommandFactory } from "./commands/docs.js";
14
14
  import { AuthCommandFactory } from "./factories/authCommandFactory.js";
15
+ import { WorkflowCommandFactory } from "./commands/workflow.js";
15
16
  // Enhanced CLI with Professional UX
16
17
  export function initializeCliParser() {
17
18
  return (yargs(hideBin(process.argv))
@@ -178,6 +179,8 @@ export function initializeCliParser() {
178
179
  // Docs MCP Server Command
179
180
  .command(DocsCommandFactory.createDocsCommand())
180
181
  // Auth Commands - Using AuthCommandFactory
181
- .command(AuthCommandFactory.createAuthCommands())); // Close the main return statement
182
+ .command(AuthCommandFactory.createAuthCommands())
183
+ // Workflow Commands
184
+ .command(WorkflowCommandFactory.createWorkflowCommands())); // Close the main return statement
182
185
  }
183
186
  //# sourceMappingURL=parser.js.map
@@ -0,0 +1,11 @@
1
+ /**
2
+ * Unified credential masking utility for CLI setup commands.
3
+ *
4
+ * Preserves known provider prefixes (sk-, sk-ant-, AIza, AKIA) so
5
+ * users can identify which key is configured, while hiding the secret
6
+ * portion with asterisks.
7
+ *
8
+ * @param credential - Raw API key or secret
9
+ * @returns Masked string, e.g. "sk-****abcd"
10
+ */
11
+ export declare function maskCredential(credential: string): string;
@@ -0,0 +1,23 @@
1
+ /**
2
+ * Unified credential masking utility for CLI setup commands.
3
+ *
4
+ * Preserves known provider prefixes (sk-, sk-ant-, AIza, AKIA) so
5
+ * users can identify which key is configured, while hiding the secret
6
+ * portion with asterisks.
7
+ *
8
+ * @param credential - Raw API key or secret
9
+ * @returns Masked string, e.g. "sk-****abcd"
10
+ */
11
+ export function maskCredential(credential) {
12
+ if (!credential || credential.length <= 8) {
13
+ return "****";
14
+ }
15
+ // Provider-specific prefixes ordered longest-first so "sk-ant-" wins over "sk-"
16
+ const knownPrefixes = ["sk-ant-", "sk-", "AIza", "AKIA"];
17
+ const prefix = knownPrefixes.find((p) => credential.startsWith(p)) ??
18
+ credential.slice(0, 4);
19
+ const end = credential.slice(-4);
20
+ const stars = "*".repeat(Math.max(4, credential.length - prefix.length - 4));
21
+ return `${prefix}${stars}${end}`;
22
+ }
23
+ //# sourceMappingURL=maskCredential.js.map
@@ -25,8 +25,18 @@ export const DEFAULT_OUTPUT_RESERVE_RATIO = 0.35;
25
25
  export const MODEL_CONTEXT_WINDOWS = {
26
26
  anthropic: {
27
27
  _default: 200_000,
28
+ // Claude 4.6 (Feb 2026) — 200K standard, 1M with beta header
29
+ "claude-opus-4-6": 200_000,
30
+ "claude-sonnet-4-6": 200_000,
31
+ // Claude 4.5
32
+ "claude-opus-4-5-20251101": 200_000,
33
+ "claude-sonnet-4-5-20250929": 200_000,
34
+ "claude-haiku-4-5-20251001": 200_000,
35
+ // Claude 4.x
36
+ "claude-opus-4-1-20250805": 200_000,
28
37
  "claude-opus-4-20250514": 200_000,
29
38
  "claude-sonnet-4-20250514": 200_000,
39
+ // Claude 3.x
30
40
  "claude-3-7-sonnet-20250219": 200_000,
31
41
  "claude-3-5-sonnet-20241022": 200_000,
32
42
  "claude-3-5-haiku-20241022": 200_000,
@@ -36,67 +46,144 @@ export const MODEL_CONTEXT_WINDOWS = {
36
46
  },
37
47
  openai: {
38
48
  _default: 128_000,
49
+ // GPT-5.x family — 400K context
50
+ "gpt-5.3-codex": 400_000,
51
+ "gpt-5.2": 400_000,
52
+ "gpt-5.2-pro": 400_000,
53
+ "gpt-5.2-codex": 400_000,
54
+ "gpt-5.2-chat-latest": 128_000,
55
+ "gpt-5.1": 400_000,
56
+ "gpt-5.1-codex": 400_000,
57
+ "gpt-5.1-codex-max": 400_000,
58
+ "gpt-5.1-codex-mini": 400_000,
59
+ "gpt-5.1-chat-latest": 128_000,
60
+ "gpt-5": 400_000,
61
+ "gpt-5-mini": 400_000,
62
+ "gpt-5-nano": 400_000,
63
+ "gpt-5-pro": 400_000,
64
+ "gpt-5-codex": 400_000,
65
+ "gpt-5-chat-latest": 128_000,
66
+ // GPT Open Source
67
+ "gpt-oss-120b": 128_000,
68
+ "gpt-oss-20b": 128_000,
69
+ // GPT-4.1 family — 1M context
70
+ "gpt-4.1": 1_047_576,
71
+ "gpt-4.1-mini": 1_047_576,
72
+ "gpt-4.1-nano": 1_047_576,
73
+ // GPT-4o
39
74
  "gpt-4o": 128_000,
40
75
  "gpt-4o-mini": 128_000,
41
- "gpt-4-turbo": 128_000,
42
- "gpt-4": 8_192,
43
- "gpt-3.5-turbo": 16_385,
76
+ // O-series reasoning — 200K context
44
77
  o1: 200_000,
45
78
  "o1-mini": 128_000,
46
79
  "o1-pro": 200_000,
47
80
  o3: 200_000,
48
81
  "o3-mini": 200_000,
82
+ "o3-pro": 200_000,
49
83
  "o4-mini": 200_000,
50
- "gpt-4.1": 1_047_576,
51
- "gpt-4.1-mini": 1_047_576,
52
- "gpt-4.1-nano": 1_047_576,
53
- "gpt-5": 1_047_576,
84
+ // Legacy
85
+ "gpt-4-turbo": 128_000,
86
+ "gpt-4": 8_192,
87
+ "gpt-3.5-turbo": 16_385,
54
88
  },
55
89
  "google-ai": {
56
90
  _default: 1_048_576,
91
+ "gemini-3.1-pro-preview": 1_048_576,
92
+ "gemini-3-pro-preview": 1_048_576,
93
+ "gemini-3-pro-image-preview": 65_536,
94
+ "gemini-3-flash-preview": 1_048_576,
95
+ "gemini-3-flash": 1_048_576,
57
96
  "gemini-2.5-pro": 1_048_576,
58
97
  "gemini-2.5-flash": 1_048_576,
98
+ "gemini-2.5-flash-lite": 1_048_576,
99
+ "gemini-2.5-flash-image": 32_768,
59
100
  "gemini-2.0-flash": 1_048_576,
60
101
  "gemini-1.5-pro": 2_097_152,
61
102
  "gemini-1.5-flash": 1_048_576,
62
- "gemini-3-flash-preview": 1_048_576,
63
- "gemini-3-pro-preview": 1_048_576,
64
103
  },
65
104
  vertex: {
66
105
  _default: 1_048_576,
106
+ // Claude on Vertex
107
+ "claude-opus-4-6": 200_000,
108
+ "claude-sonnet-4-6": 200_000,
109
+ "claude-sonnet-4-5": 200_000,
110
+ "claude-opus-4-5": 200_000,
111
+ "claude-haiku-4-5": 200_000,
112
+ "claude-sonnet-4": 200_000,
113
+ "claude-sonnet-4-20250514": 200_000,
114
+ "claude-opus-4-20250514": 200_000,
115
+ "claude-opus-4": 200_000,
116
+ // Gemini on Vertex
117
+ "gemini-3.1-pro-preview": 1_048_576,
118
+ "gemini-3-pro-preview": 1_048_576,
119
+ "gemini-3-pro-latest": 1_048_576,
120
+ "gemini-3-flash-preview": 1_048_576,
121
+ "gemini-3-flash-latest": 1_048_576,
67
122
  "gemini-2.5-pro": 1_048_576,
68
123
  "gemini-2.5-flash": 1_048_576,
69
124
  "gemini-2.0-flash": 1_048_576,
70
125
  "gemini-1.5-pro": 2_097_152,
71
126
  "gemini-1.5-flash": 1_048_576,
72
- "claude-sonnet-4-5": 200_000,
73
- "claude-sonnet-4-20250514": 200_000,
74
- "claude-opus-4": 200_000,
75
- "claude-opus-4-20250514": 200_000,
76
127
  },
77
128
  bedrock: {
78
129
  _default: 200_000,
79
- "anthropic.claude-3-5-sonnet-20241022-v2:0": 200_000,
130
+ // Claude 4.6
131
+ "anthropic.claude-opus-4-6-v1:0": 200_000,
132
+ "anthropic.claude-sonnet-4-6": 200_000,
133
+ // Claude 4.5
134
+ "anthropic.claude-opus-4-5-20251124-v1:0": 200_000,
135
+ "anthropic.claude-sonnet-4-5-20250929-v1:0": 200_000,
136
+ "anthropic.claude-haiku-4-5-20251001-v1:0": 200_000,
137
+ // Claude legacy
138
+ "anthropic.claude-3-5-sonnet-20241022-v1:0": 200_000,
80
139
  "anthropic.claude-3-5-haiku-20241022-v1:0": 200_000,
81
140
  "anthropic.claude-3-opus-20240229-v1:0": 200_000,
82
141
  "anthropic.claude-3-sonnet-20240229-v1:0": 200_000,
83
142
  "anthropic.claude-3-haiku-20240307-v1:0": 200_000,
143
+ // Amazon Nova
84
144
  "amazon.nova-pro-v1:0": 300_000,
85
145
  "amazon.nova-lite-v1:0": 300_000,
146
+ "amazon.nova-2-lite-v1:0": 1_000_000,
147
+ // Writer
148
+ "writer.palmyra-x5-v1:0": 1_000_000,
149
+ "writer.palmyra-x4-v1:0": 128_000,
150
+ // NVIDIA
151
+ "nvidia.nemotron-nano-3-30b": 256_000,
86
152
  },
87
153
  azure: {
88
154
  _default: 128_000,
155
+ // GPT-5.x
156
+ "gpt-5.2": 400_000,
157
+ "gpt-5.2-pro": 400_000,
158
+ "gpt-5.2-codex": 400_000,
159
+ "gpt-5.1": 400_000,
160
+ "gpt-5": 400_000,
161
+ "gpt-5-mini": 400_000,
162
+ // GPT-4.1
163
+ "gpt-4.1": 1_047_576,
164
+ "gpt-4.1-mini": 1_047_576,
165
+ // GPT-4o
89
166
  "gpt-4o": 128_000,
90
167
  "gpt-4o-mini": 128_000,
168
+ // O-series
169
+ o3: 200_000,
170
+ "o3-mini": 200_000,
171
+ "o4-mini": 200_000,
172
+ // Legacy
91
173
  "gpt-4-turbo": 128_000,
92
174
  "gpt-4": 8_192,
93
175
  },
94
176
  mistral: {
95
177
  _default: 128_000,
96
- "mistral-large-latest": 128_000,
97
- "mistral-medium-latest": 32_000,
178
+ "mistral-large-latest": 256_000,
179
+ "mistral-large-2512": 256_000,
180
+ "mistral-medium-latest": 128_000,
98
181
  "mistral-small-latest": 128_000,
99
182
  "codestral-latest": 256_000,
183
+ "codestral-2508": 256_000,
184
+ "devstral-2512": 256_000,
185
+ "devstral-small-2512": 256_000,
186
+ "magistral-medium-latest": 128_000,
100
187
  },
101
188
  ollama: {
102
189
  _default: 128_000,
@@ -109,6 +196,10 @@ export const MODEL_CONTEXT_WINDOWS = {
109
196
  },
110
197
  sagemaker: {
111
198
  _default: 128_000,
199
+ // NVIDIA Nemotron 3 Nano (February 2026) — 1M context
200
+ "nvidia-nemotron-3-nano-30b": 1_000_000,
201
+ // Qwen3 VL — 32K context
202
+ "qwen3-vl-8b-instruct": 32_768,
112
203
  },
113
204
  };
114
205
  /**
@@ -22,23 +22,37 @@ export declare enum AIProviderName {
22
22
  * OpenRouter uses 'provider/model' format
23
23
  */
24
24
  export declare enum OpenRouterModels {
25
+ CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
26
+ CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
27
+ CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
28
+ CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
25
29
  CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet",
26
30
  CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
27
31
  CLAUDE_3_OPUS = "anthropic/claude-3-opus",
32
+ GPT_5_2 = "openai/gpt-5.2",
33
+ GPT_5 = "openai/gpt-5",
28
34
  GPT_4O = "openai/gpt-4o",
29
35
  GPT_4O_MINI = "openai/gpt-4o-mini",
30
36
  GPT_4_TURBO = "openai/gpt-4-turbo",
37
+ GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
38
+ GEMINI_3_PRO_PREVIEW = "google/gemini-3-pro-preview",
39
+ GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
40
+ GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
41
+ GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
31
42
  GEMINI_2_0_FLASH = "google/gemini-2.0-flash",
32
- GEMINI_1_5_PRO = "google/gemini-1.5-pro",
33
43
  LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
34
44
  LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",
35
45
  MISTRAL_LARGE = "mistralai/mistral-large",
36
- MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct"
46
+ MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",
47
+ DEEPSEEK_R1 = "deepseek/deepseek-r1",
48
+ GROK_4_1_FAST = "xai/grok-4.1-fast"
37
49
  }
38
50
  /**
39
51
  * Supported Models for Amazon Bedrock
40
52
  */
41
53
  export declare enum BedrockModels {
54
+ CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
55
+ CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
42
56
  CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
43
57
  CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
44
58
  CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
@@ -104,18 +118,49 @@ export declare enum BedrockModels {
104
118
  GEMMA_3_12B_IT = "google.gemma-3-12b-it",
105
119
  GEMMA_3_4B_IT = "google.gemma-3-4b-it",
106
120
  JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
107
- JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0"
121
+ JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",
122
+ WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
123
+ WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",
124
+ MINIMAX_M2_1 = "minimax.minimax-m2.1",
125
+ MINIMAX_M2 = "minimax.minimax-m2",
126
+ KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
127
+ KIMI_K2_5 = "moonshotai.kimi-k2.5",
128
+ NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
129
+ NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
130
+ NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",
131
+ OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
132
+ OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",
133
+ GLM_4_7 = "zai.glm-4.7",
134
+ GLM_4_7_FLASH = "zai.glm-4.7-flash",
135
+ COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
136
+ COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
137
+ COHERE_EMBED_V4 = "cohere.embed-v4:0",
138
+ COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
139
+ AMAZON_RERANK_V1 = "amazon.rerank-v1:0",
140
+ DEVSTRAL_2_123B = "mistral.devstral-2-123b"
108
141
  }
109
142
  /**
110
143
  * Supported Models for OpenAI
111
144
  */
112
145
  export declare enum OpenAIModels {
146
+ GPT_5_3_CODEX = "gpt-5.3-codex",
113
147
  GPT_5_2 = "gpt-5.2",
114
148
  GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
115
149
  GPT_5_2_PRO = "gpt-5.2-pro",
150
+ GPT_5_2_CODEX = "gpt-5.2-codex",
151
+ GPT_5_1 = "gpt-5.1",
152
+ GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
153
+ GPT_5_1_CODEX = "gpt-5.1-codex",
154
+ GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
155
+ GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
116
156
  GPT_5 = "gpt-5",
117
157
  GPT_5_MINI = "gpt-5-mini",
118
158
  GPT_5_NANO = "gpt-5-nano",
159
+ GPT_5_PRO = "gpt-5-pro",
160
+ GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
161
+ GPT_5_CODEX = "gpt-5-codex",
162
+ GPT_OSS_120B = "gpt-oss-120b",
163
+ GPT_OSS_20B = "gpt-oss-20b",
119
164
  GPT_4_1 = "gpt-4.1",
120
165
  GPT_4_1_MINI = "gpt-4.1-mini",
121
166
  GPT_4_1_NANO = "gpt-4.1-nano",
@@ -137,6 +182,10 @@ export declare enum OpenAIModels {
137
182
  * Note: Azure uses deployment names, these are model identifiers
138
183
  */
139
184
  export declare enum AzureOpenAIModels {
185
+ GPT_5_2 = "gpt-5.2",
186
+ GPT_5_2_CHAT = "gpt-5.2-chat",
187
+ GPT_5_2_PRO = "gpt-5.2-pro",
188
+ GPT_5_2_CODEX = "gpt-5.2-codex",
140
189
  GPT_5_1 = "gpt-5.1",
141
190
  GPT_5_1_CHAT = "gpt-5.1-chat",
142
191
  GPT_5_1_CODEX = "gpt-5.1-codex",
@@ -172,6 +221,8 @@ export declare enum AzureOpenAIModels {
172
221
  * Supported Models for Google Vertex AI
173
222
  */
174
223
  export declare enum VertexModels {
224
+ CLAUDE_4_6_OPUS = "claude-opus-4-6",
225
+ CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
175
226
  CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
176
227
  CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
177
228
  CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
@@ -183,19 +234,13 @@ export declare enum VertexModels {
183
234
  CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
184
235
  CLAUDE_3_OPUS = "claude-3-opus-20240229",
185
236
  CLAUDE_3_HAIKU = "claude-3-haiku-20240307",
186
- /** Gemini 3 Pro - Base model with adaptive thinking */
237
+ GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
187
238
  GEMINI_3_PRO = "gemini-3-pro",
188
- /** Gemini 3 Pro Preview - Versioned preview (November 2025) */
189
239
  GEMINI_3_PRO_PREVIEW_11_2025 = "gemini-3-pro-preview-11-2025",
190
- /** Gemini 3 Pro Latest - Auto-updated alias (always points to latest preview) */
191
240
  GEMINI_3_PRO_LATEST = "gemini-3-pro-latest",
192
- /** Gemini 3 Pro Preview - Generic preview (legacy) */
193
241
  GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
194
- /** Gemini 3 Flash - Base model with adaptive thinking */
195
242
  GEMINI_3_FLASH = "gemini-3-flash",
196
- /** Gemini 3 Flash Preview - Versioned preview */
197
243
  GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
198
- /** Gemini 3 Flash Latest - Auto-updated alias (always points to latest preview) */
199
244
  GEMINI_3_FLASH_LATEST = "gemini-3-flash-latest",
200
245
  GEMINI_2_5_PRO = "gemini-2.5-pro",
201
246
  GEMINI_2_5_FLASH = "gemini-2.5-flash",
@@ -203,15 +248,17 @@ export declare enum VertexModels {
203
248
  GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
204
249
  GEMINI_2_0_FLASH = "gemini-2.0-flash",
205
250
  GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
206
- /** Gemini 2.0 Flash Lite - GA, production-ready, cost-optimized */
207
251
  GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
252
+ /** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
208
253
  GEMINI_1_5_PRO = "gemini-1.5-pro-002",
254
+ /** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
209
255
  GEMINI_1_5_FLASH = "gemini-1.5-flash-002"
210
256
  }
211
257
  /**
212
258
  * Supported Models for Google AI Studio
213
259
  */
214
260
  export declare enum GoogleAIModels {
261
+ GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
215
262
  GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
216
263
  GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
217
264
  GEMINI_3_FLASH = "gemini-3-flash",
@@ -220,20 +267,26 @@ export declare enum GoogleAIModels {
220
267
  GEMINI_2_5_FLASH = "gemini-2.5-flash",
221
268
  GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
222
269
  GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
223
- GEMINI_2_5_FLASH_LIVE = "gemini-2.5-flash-native-audio-preview-09-2025",
270
+ GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
271
+ GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",
224
272
  GEMINI_2_0_FLASH = "gemini-2.0-flash",
225
273
  GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
226
274
  GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
227
275
  GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",
276
+ /** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
228
277
  GEMINI_1_5_PRO = "gemini-1.5-pro",
278
+ /** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
229
279
  GEMINI_1_5_FLASH = "gemini-1.5-flash",
230
280
  GEMINI_EMBEDDING = "gemini-embedding-001",
281
+ /** @deprecated Shutdown Jan 2026. Use gemini-embedding-001 */
231
282
  TEXT_EMBEDDING_004 = "text-embedding-004"
232
283
  }
233
284
  /**
234
285
  * Supported Models for Anthropic (Direct API)
235
286
  */
236
287
  export declare enum AnthropicModels {
288
+ CLAUDE_OPUS_4_6 = "claude-opus-4-6",
289
+ CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
237
290
  CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
238
291
  CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
239
292
  CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
@@ -271,6 +324,13 @@ export declare enum MistralModels {
271
324
  PIXTRAL_12B = "pixtral-12b",
272
325
  VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
273
326
  VOXTRAL_MINI_LATEST = "voxtral-mini-latest",
327
+ DEVSTRAL_2 = "devstral-2512",
328
+ DEVSTRAL_SMALL_2 = "devstral-small-2512",
329
+ MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
330
+ MAGISTRAL_SMALL_2509 = "magistral-small-2509",
331
+ VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",
332
+ MISTRAL_OCR_3 = "mistral-ocr-2512",
333
+ MISTRAL_OCR_LATEST = "mistral-ocr-latest",
274
334
  MISTRAL_NEMO = "mistral-nemo",
275
335
  MISTRAL_EMBED = "mistral-embed",
276
336
  MISTRAL_MODERATION_LATEST = "mistral-moderation-latest"
@@ -341,7 +401,17 @@ export declare enum OllamaModels {
341
401
  STARCODER2_15B = "starcoder2:15b",
342
402
  MIXTRAL_8X7B = "mixtral:8x7b",
343
403
  MIXTRAL_8X22B = "mixtral:8x22b",
344
- COMMAND_R_PLUS = "command-r-plus:104b"
404
+ COMMAND_R_PLUS = "command-r-plus:104b",
405
+ GLM_5_LATEST = "glm-5:latest",
406
+ KIMI_K2_5_LATEST = "kimi-k2.5:latest",
407
+ QWEN3_5_LATEST = "qwen3.5:latest",
408
+ QWEN3_CODER_LATEST = "qwen3-coder:latest",
409
+ QWEN3_CODER_30B = "qwen3-coder:30b",
410
+ DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
411
+ NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
412
+ NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
413
+ SMOLLM3_3B = "smollm3:3b",
414
+ GPT_OSS_LATEST = "gpt-oss:latest"
345
415
  }
346
416
  /**
347
417
  * Common Models for LiteLLM Proxy
@@ -381,6 +451,12 @@ export declare enum LiteLLMModels {
381
451
  MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",
382
452
  BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
383
453
  BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",
454
+ OPENAI_GPT_5_2 = "openai/gpt-5.2",
455
+ OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
456
+ ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
457
+ ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
458
+ GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
459
+ XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",
384
460
  PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
385
461
  PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro"
386
462
  }
@@ -433,7 +509,13 @@ export declare enum HuggingFaceModels {
433
509
  STARCODER2_15B = "bigcode/starcoder2-15b",
434
510
  CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
435
511
  BLOOM_7B1 = "bigscience/bloom-7b1",
436
- BLOOM_1B3 = "bigscience/bloom-1b3"
512
+ BLOOM_1B3 = "bigscience/bloom-1b3",
513
+ GLM_5 = "zai-org/GLM-5",
514
+ QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
515
+ NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
516
+ SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
517
+ FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
518
+ FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct"
437
519
  }
438
520
  /**
439
521
  * Supported Models for AWS SageMaker JumpStart
@@ -455,7 +537,9 @@ export declare enum SageMakerModels {
455
537
  FALCON_3_7B = "tii-falcon-3-7b-instruct",
456
538
  FALCON_3_10B = "tii-falcon-3-10b-instruct",
457
539
  FALCON_40B = "tii-falcon-40b-instruct",
458
- FALCON_180B = "tii-falcon-180b"
540
+ FALCON_180B = "tii-falcon-180b",
541
+ NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
542
+ QWEN3_VL_8B = "qwen3-vl-8b-instruct"
459
543
  }
460
544
  /**
461
545
  * API Versions for various providers