@juspay/neurolink 9.15.0 → 9.17.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +12 -0
- package/README.md +22 -20
- package/dist/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/adapters/video/videoAnalyzer.js +10 -8
- package/dist/cli/commands/setup-anthropic.js +1 -14
- package/dist/cli/commands/setup-azure.js +1 -12
- package/dist/cli/commands/setup-bedrock.js +1 -9
- package/dist/cli/commands/setup-google-ai.js +1 -12
- package/dist/cli/commands/setup-openai.js +1 -14
- package/dist/cli/commands/workflow.d.ts +27 -0
- package/dist/cli/commands/workflow.js +216 -0
- package/dist/cli/factories/commandFactory.js +79 -20
- package/dist/cli/index.js +0 -1
- package/dist/cli/parser.js +4 -1
- package/dist/cli/utils/maskCredential.d.ts +11 -0
- package/dist/cli/utils/maskCredential.js +23 -0
- package/dist/constants/contextWindows.js +107 -16
- package/dist/constants/enums.d.ts +99 -15
- package/dist/constants/enums.js +152 -22
- package/dist/context/budgetChecker.js +1 -1
- package/dist/context/contextCompactor.js +31 -4
- package/dist/context/emergencyTruncation.d.ts +21 -0
- package/dist/context/emergencyTruncation.js +88 -0
- package/dist/context/errorDetection.d.ts +16 -0
- package/dist/context/errorDetection.js +48 -1
- package/dist/context/errors.d.ts +19 -0
- package/dist/context/errors.js +21 -0
- package/dist/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/context/stages/structuredSummarizer.js +2 -2
- package/dist/core/baseProvider.js +306 -200
- package/dist/core/conversationMemoryManager.js +104 -61
- package/dist/core/evaluationProviders.js +16 -33
- package/dist/core/factory.js +237 -164
- package/dist/core/modules/GenerationHandler.js +175 -116
- package/dist/core/modules/MessageBuilder.js +222 -170
- package/dist/core/modules/StreamHandler.d.ts +1 -0
- package/dist/core/modules/StreamHandler.js +95 -27
- package/dist/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/core/modules/TelemetryHandler.js +25 -7
- package/dist/core/modules/ToolsManager.js +115 -191
- package/dist/core/redisConversationMemoryManager.js +418 -282
- package/dist/factories/providerRegistry.d.ts +5 -0
- package/dist/factories/providerRegistry.js +20 -2
- package/dist/index.d.ts +2 -2
- package/dist/index.js +4 -2
- package/dist/lib/adapters/video/videoAnalyzer.d.ts +1 -1
- package/dist/lib/adapters/video/videoAnalyzer.js +10 -8
- package/dist/lib/constants/contextWindows.js +107 -16
- package/dist/lib/constants/enums.d.ts +99 -15
- package/dist/lib/constants/enums.js +152 -22
- package/dist/lib/context/budgetChecker.js +1 -1
- package/dist/lib/context/contextCompactor.js +31 -4
- package/dist/lib/context/emergencyTruncation.d.ts +21 -0
- package/dist/lib/context/emergencyTruncation.js +89 -0
- package/dist/lib/context/errorDetection.d.ts +16 -0
- package/dist/lib/context/errorDetection.js +48 -1
- package/dist/lib/context/errors.d.ts +19 -0
- package/dist/lib/context/errors.js +22 -0
- package/dist/lib/context/stages/slidingWindowTruncator.d.ts +6 -0
- package/dist/lib/context/stages/slidingWindowTruncator.js +159 -24
- package/dist/lib/context/stages/structuredSummarizer.js +2 -2
- package/dist/lib/core/baseProvider.js +306 -200
- package/dist/lib/core/conversationMemoryManager.js +104 -61
- package/dist/lib/core/evaluationProviders.js +16 -33
- package/dist/lib/core/factory.js +237 -164
- package/dist/lib/core/modules/GenerationHandler.js +175 -116
- package/dist/lib/core/modules/MessageBuilder.js +222 -170
- package/dist/lib/core/modules/StreamHandler.d.ts +1 -0
- package/dist/lib/core/modules/StreamHandler.js +95 -27
- package/dist/lib/core/modules/TelemetryHandler.d.ts +10 -1
- package/dist/lib/core/modules/TelemetryHandler.js +25 -7
- package/dist/lib/core/modules/ToolsManager.js +115 -191
- package/dist/lib/core/redisConversationMemoryManager.js +418 -282
- package/dist/lib/factories/providerRegistry.d.ts +5 -0
- package/dist/lib/factories/providerRegistry.js +20 -2
- package/dist/lib/index.d.ts +2 -2
- package/dist/lib/index.js +4 -2
- package/dist/lib/mcp/externalServerManager.js +66 -0
- package/dist/lib/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/lib/mcp/mcpClientFactory.js +16 -0
- package/dist/lib/mcp/toolDiscoveryService.js +32 -6
- package/dist/lib/mcp/toolRegistry.js +193 -123
- package/dist/lib/neurolink.d.ts +6 -0
- package/dist/lib/neurolink.js +1162 -646
- package/dist/lib/providers/amazonBedrock.d.ts +1 -1
- package/dist/lib/providers/amazonBedrock.js +521 -319
- package/dist/lib/providers/anthropic.js +73 -17
- package/dist/lib/providers/anthropicBaseProvider.js +77 -17
- package/dist/lib/providers/googleAiStudio.d.ts +1 -1
- package/dist/lib/providers/googleAiStudio.js +292 -227
- package/dist/lib/providers/googleVertex.d.ts +36 -1
- package/dist/lib/providers/googleVertex.js +553 -260
- package/dist/lib/providers/ollama.js +329 -278
- package/dist/lib/providers/openAI.js +77 -19
- package/dist/lib/providers/sagemaker/parsers.js +3 -3
- package/dist/lib/providers/sagemaker/streaming.js +3 -3
- package/dist/lib/proxy/proxyFetch.js +81 -48
- package/dist/lib/rag/ChunkerFactory.js +1 -1
- package/dist/lib/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/lib/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/lib/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/lib/rag/chunking/markdownChunker.js +174 -2
- package/dist/lib/rag/pipeline/contextAssembly.js +2 -1
- package/dist/lib/rag/ragIntegration.d.ts +18 -1
- package/dist/lib/rag/ragIntegration.js +94 -14
- package/dist/lib/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/lib/server/abstract/baseServerAdapter.js +4 -1
- package/dist/lib/server/adapters/fastifyAdapter.js +35 -30
- package/dist/lib/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/lib/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/lib/telemetry/attributes.d.ts +52 -0
- package/dist/lib/telemetry/attributes.js +61 -0
- package/dist/lib/telemetry/index.d.ts +3 -0
- package/dist/lib/telemetry/index.js +3 -0
- package/dist/lib/telemetry/telemetryService.d.ts +6 -0
- package/dist/lib/telemetry/telemetryService.js +6 -0
- package/dist/lib/telemetry/tracers.d.ts +15 -0
- package/dist/lib/telemetry/tracers.js +17 -0
- package/dist/lib/telemetry/withSpan.d.ts +9 -0
- package/dist/lib/telemetry/withSpan.js +35 -0
- package/dist/lib/types/contextTypes.d.ts +10 -0
- package/dist/lib/types/streamTypes.d.ts +14 -0
- package/dist/lib/utils/conversationMemory.js +123 -84
- package/dist/lib/utils/logger.d.ts +5 -0
- package/dist/lib/utils/logger.js +50 -2
- package/dist/lib/utils/messageBuilder.js +22 -42
- package/dist/lib/utils/modelDetection.js +3 -3
- package/dist/lib/utils/providerRetry.d.ts +41 -0
- package/dist/lib/utils/providerRetry.js +114 -0
- package/dist/lib/utils/retryability.d.ts +14 -0
- package/dist/lib/utils/retryability.js +23 -0
- package/dist/lib/utils/sanitizers/svg.js +4 -5
- package/dist/lib/utils/tokenEstimation.d.ts +11 -1
- package/dist/lib/utils/tokenEstimation.js +19 -4
- package/dist/lib/utils/videoAnalysisProcessor.js +7 -3
- package/dist/mcp/externalServerManager.js +66 -0
- package/dist/mcp/mcpCircuitBreaker.js +24 -0
- package/dist/mcp/mcpClientFactory.js +16 -0
- package/dist/mcp/toolDiscoveryService.js +32 -6
- package/dist/mcp/toolRegistry.js +193 -123
- package/dist/neurolink.d.ts +6 -0
- package/dist/neurolink.js +1162 -646
- package/dist/providers/amazonBedrock.d.ts +1 -1
- package/dist/providers/amazonBedrock.js +521 -319
- package/dist/providers/anthropic.js +73 -17
- package/dist/providers/anthropicBaseProvider.js +77 -17
- package/dist/providers/googleAiStudio.d.ts +1 -1
- package/dist/providers/googleAiStudio.js +292 -227
- package/dist/providers/googleVertex.d.ts +36 -1
- package/dist/providers/googleVertex.js +553 -260
- package/dist/providers/ollama.js +329 -278
- package/dist/providers/openAI.js +77 -19
- package/dist/providers/sagemaker/parsers.js +3 -3
- package/dist/providers/sagemaker/streaming.js +3 -3
- package/dist/proxy/proxyFetch.js +81 -48
- package/dist/rag/ChunkerFactory.js +1 -1
- package/dist/rag/chunkers/MarkdownChunker.d.ts +22 -0
- package/dist/rag/chunkers/MarkdownChunker.js +213 -9
- package/dist/rag/chunking/markdownChunker.d.ts +16 -0
- package/dist/rag/chunking/markdownChunker.js +174 -2
- package/dist/rag/pipeline/contextAssembly.js +2 -1
- package/dist/rag/ragIntegration.d.ts +18 -1
- package/dist/rag/ragIntegration.js +94 -14
- package/dist/rag/retrieval/vectorQueryTool.js +21 -4
- package/dist/server/abstract/baseServerAdapter.js +4 -1
- package/dist/server/adapters/fastifyAdapter.js +35 -30
- package/dist/services/server/ai/observability/instrumentation.d.ts +32 -0
- package/dist/services/server/ai/observability/instrumentation.js +39 -0
- package/dist/telemetry/attributes.d.ts +52 -0
- package/dist/telemetry/attributes.js +60 -0
- package/dist/telemetry/index.d.ts +3 -0
- package/dist/telemetry/index.js +3 -0
- package/dist/telemetry/telemetryService.d.ts +6 -0
- package/dist/telemetry/telemetryService.js +6 -0
- package/dist/telemetry/tracers.d.ts +15 -0
- package/dist/telemetry/tracers.js +16 -0
- package/dist/telemetry/withSpan.d.ts +9 -0
- package/dist/telemetry/withSpan.js +34 -0
- package/dist/types/contextTypes.d.ts +10 -0
- package/dist/types/streamTypes.d.ts +14 -0
- package/dist/utils/conversationMemory.js +123 -84
- package/dist/utils/logger.d.ts +5 -0
- package/dist/utils/logger.js +50 -2
- package/dist/utils/messageBuilder.js +22 -42
- package/dist/utils/modelDetection.js +3 -3
- package/dist/utils/providerRetry.d.ts +41 -0
- package/dist/utils/providerRetry.js +113 -0
- package/dist/utils/retryability.d.ts +14 -0
- package/dist/utils/retryability.js +22 -0
- package/dist/utils/sanitizers/svg.js +4 -5
- package/dist/utils/tokenEstimation.d.ts +11 -1
- package/dist/utils/tokenEstimation.js +19 -4
- package/dist/utils/videoAnalysisProcessor.js +7 -3
- package/dist/workflow/config.d.ts +26 -26
- package/package.json +1 -1
|
@@ -5,11 +5,16 @@ import type { ProviderRegistryOptions } from "../types/index.js";
|
|
|
5
5
|
*/
|
|
6
6
|
export declare class ProviderRegistry {
|
|
7
7
|
private static registered;
|
|
8
|
+
private static registrationPromise;
|
|
8
9
|
private static options;
|
|
9
10
|
/**
|
|
10
11
|
* Register all providers with the factory
|
|
11
12
|
*/
|
|
12
13
|
static registerAllProviders(): Promise<void>;
|
|
14
|
+
/**
|
|
15
|
+
* Internal registration implementation
|
|
16
|
+
*/
|
|
17
|
+
private static _doRegister;
|
|
13
18
|
/**
|
|
14
19
|
* Check if providers are registered
|
|
15
20
|
*/
|
|
@@ -7,6 +7,7 @@ import { AIProviderName, GoogleAIModels, OpenAIModels, AnthropicModels, VertexMo
|
|
|
7
7
|
*/
|
|
8
8
|
export class ProviderRegistry {
|
|
9
9
|
static registered = false;
|
|
10
|
+
static registrationPromise = null;
|
|
10
11
|
static options = {
|
|
11
12
|
enableManualMCP: false, // Default to disabled for safety
|
|
12
13
|
};
|
|
@@ -17,6 +18,22 @@ export class ProviderRegistry {
|
|
|
17
18
|
if (this.registered) {
|
|
18
19
|
return;
|
|
19
20
|
}
|
|
21
|
+
if (this.registrationPromise) {
|
|
22
|
+
return this.registrationPromise;
|
|
23
|
+
}
|
|
24
|
+
this.registrationPromise = this._doRegister();
|
|
25
|
+
try {
|
|
26
|
+
await this.registrationPromise;
|
|
27
|
+
}
|
|
28
|
+
catch (error) {
|
|
29
|
+
this.registrationPromise = null; // Allow retry on failure
|
|
30
|
+
throw error;
|
|
31
|
+
}
|
|
32
|
+
}
|
|
33
|
+
/**
|
|
34
|
+
* Internal registration implementation
|
|
35
|
+
*/
|
|
36
|
+
static async _doRegister() {
|
|
20
37
|
try {
|
|
21
38
|
// Register providers with dynamic import factory functions
|
|
22
39
|
const { ProviderFactory } = await import("./providerFactory.js");
|
|
@@ -34,7 +51,7 @@ export class ProviderRegistry {
|
|
|
34
51
|
ProviderFactory.registerProvider(AIProviderName.ANTHROPIC, async (modelName, _providerName, sdk) => {
|
|
35
52
|
const { AnthropicProvider } = await import("../providers/anthropic.js");
|
|
36
53
|
return new AnthropicProvider(modelName, sdk);
|
|
37
|
-
}, AnthropicModels.
|
|
54
|
+
}, AnthropicModels.CLAUDE_SONNET_4_6, ["claude", "anthropic"]);
|
|
38
55
|
// Register Amazon Bedrock provider
|
|
39
56
|
ProviderFactory.registerProvider(AIProviderName.BEDROCK, async (modelName, _providerName, sdk, region) => {
|
|
40
57
|
const { AmazonBedrockProvider } = await import("../providers/amazonBedrock.js");
|
|
@@ -54,7 +71,7 @@ export class ProviderRegistry {
|
|
|
54
71
|
ProviderFactory.registerProvider(AIProviderName.VERTEX, async (modelName, providerName, sdk, region) => {
|
|
55
72
|
const { GoogleVertexProvider } = await import("../providers/googleVertex.js");
|
|
56
73
|
return new GoogleVertexProvider(modelName, providerName, sdk, region);
|
|
57
|
-
}, VertexModels.
|
|
74
|
+
}, VertexModels.CLAUDE_4_6_SONNET, ["vertex", "googleVertex"]);
|
|
58
75
|
// Register Hugging Face provider (Unified Router implementation)
|
|
59
76
|
ProviderFactory.registerProvider(AIProviderName.HUGGINGFACE, async (modelName) => {
|
|
60
77
|
const { HuggingFaceProvider } = await import("../providers/huggingFace.js");
|
|
@@ -130,6 +147,7 @@ export class ProviderRegistry {
|
|
|
130
147
|
static clearRegistrations() {
|
|
131
148
|
ProviderFactory.clearRegistrations();
|
|
132
149
|
this.registered = false;
|
|
150
|
+
this.registrationPromise = null;
|
|
133
151
|
}
|
|
134
152
|
/**
|
|
135
153
|
* Set registry options (should be called before initialization)
|
package/dist/index.d.ts
CHANGED
|
@@ -49,9 +49,9 @@ export { NeuroLink };
|
|
|
49
49
|
export type { MCPServerInfo } from "./types/mcpTypes.js";
|
|
50
50
|
export type { LangfuseConfig, LangfuseSpanAttributes, ObservabilityConfig, OpenTelemetryConfig, TraceNameFormat, } from "./types/observability.js";
|
|
51
51
|
export { buildObservabilityConfigFromEnv } from "./utils/observabilityHelpers.js";
|
|
52
|
-
import { createContextEnricher, flushOpenTelemetry, getLangfuseContext, getLangfuseHealthStatus, getLangfuseSpanProcessor, getSpanProcessors, getTracer, getTracerProvider, initializeOpenTelemetry, isOpenTelemetryInitialized, isUsingExternalTracerProvider, setLangfuseContext, shutdownOpenTelemetry } from "./services/server/ai/observability/instrumentation.js";
|
|
52
|
+
import { createContextEnricher, flushOpenTelemetry, getLangfuseContext, getLangfuseHealthStatus, getLangfuseSpanProcessor, getSpanProcessors, getTracer, getTracerProvider, initializeOpenTelemetry, isOpenTelemetryInitialized, isUsingExternalTracerProvider, runWithCurrentLangfuseContext, setLangfuseContext, shutdownOpenTelemetry } from "./services/server/ai/observability/instrumentation.js";
|
|
53
53
|
export type { LangfuseContext } from "./services/server/ai/observability/instrumentation.js";
|
|
54
|
-
export { initializeOpenTelemetry, shutdownOpenTelemetry, flushOpenTelemetry, getLangfuseHealthStatus, setLangfuseContext, getLangfuseSpanProcessor, getTracerProvider, isOpenTelemetryInitialized, getSpanProcessors, createContextEnricher, isUsingExternalTracerProvider, getLangfuseContext, getTracer, };
|
|
54
|
+
export { initializeOpenTelemetry, shutdownOpenTelemetry, flushOpenTelemetry, getLangfuseHealthStatus, setLangfuseContext, getLangfuseSpanProcessor, getTracerProvider, isOpenTelemetryInitialized, getSpanProcessors, createContextEnricher, isUsingExternalTracerProvider, getLangfuseContext, getTracer, runWithCurrentLangfuseContext, };
|
|
55
55
|
export { clearAnalyticsMetrics, createAnalyticsMiddleware, getAnalyticsMetrics, } from "./middleware/builtin/analytics.js";
|
|
56
56
|
export { MiddlewareFactory } from "./middleware/factory.js";
|
|
57
57
|
export type { MiddlewareConfig, MiddlewareContext, MiddlewareFactoryOptions, MiddlewarePreset, NeuroLinkMiddleware, } from "./types/middlewareTypes.js";
|
package/dist/index.js
CHANGED
|
@@ -60,13 +60,15 @@ import { createContextEnricher, flushOpenTelemetry,
|
|
|
60
60
|
// Enhanced context and tracing
|
|
61
61
|
getLangfuseContext, getLangfuseHealthStatus, getLangfuseSpanProcessor,
|
|
62
62
|
// NEW EXPORTS - External TracerProvider Support
|
|
63
|
-
getSpanProcessors, getTracer, getTracerProvider, initializeOpenTelemetry, isOpenTelemetryInitialized, isUsingExternalTracerProvider, setLangfuseContext, shutdownOpenTelemetry, } from "./services/server/ai/observability/instrumentation.js";
|
|
63
|
+
getSpanProcessors, getTracer, getTracerProvider, initializeOpenTelemetry, isOpenTelemetryInitialized, isUsingExternalTracerProvider, runWithCurrentLangfuseContext, setLangfuseContext, shutdownOpenTelemetry, } from "./services/server/ai/observability/instrumentation.js";
|
|
64
64
|
import { getTelemetryStatus as getStatus, initializeTelemetry as init, } from "./telemetry/index.js";
|
|
65
65
|
export { initializeOpenTelemetry, shutdownOpenTelemetry, flushOpenTelemetry, getLangfuseHealthStatus, setLangfuseContext, getLangfuseSpanProcessor, getTracerProvider, isOpenTelemetryInitialized,
|
|
66
66
|
// NEW EXPORTS - External TracerProvider Support
|
|
67
67
|
getSpanProcessors, createContextEnricher, isUsingExternalTracerProvider,
|
|
68
68
|
// Enhanced context and tracing
|
|
69
|
-
getLangfuseContext, getTracer,
|
|
69
|
+
getLangfuseContext, getTracer,
|
|
70
|
+
// ALS context propagation helper
|
|
71
|
+
runWithCurrentLangfuseContext, };
|
|
70
72
|
// Analytics Middleware exports
|
|
71
73
|
export { clearAnalyticsMetrics, createAnalyticsMiddleware, getAnalyticsMetrics, } from "./middleware/builtin/analytics.js";
|
|
72
74
|
export { MiddlewareFactory } from "./middleware/factory.js";
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
/**
|
|
2
2
|
* Video Analysis Handler
|
|
3
3
|
*
|
|
4
|
-
* Provides video analysis using Google's Gemini 2.
|
|
4
|
+
* Provides video analysis using Google's Gemini 2.5 Flash model.
|
|
5
5
|
* Supports both Vertex AI and Gemini API providers.
|
|
6
6
|
*
|
|
7
7
|
* @module adapters/video/geminiVideoAnalyzer
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
/**
|
|
2
2
|
* Video Analysis Handler
|
|
3
3
|
*
|
|
4
|
-
* Provides video analysis using Google's Gemini 2.
|
|
4
|
+
* Provides video analysis using Google's Gemini 2.5 Flash model.
|
|
5
5
|
* Supports both Vertex AI and Gemini API providers.
|
|
6
6
|
*
|
|
7
7
|
* @module adapters/video/geminiVideoAnalyzer
|
|
@@ -13,7 +13,7 @@ import { NeuroLinkError, ErrorFactory } from "../../utils/errorHandling.js";
|
|
|
13
13
|
// ---------------------------------------------------------------------------
|
|
14
14
|
// Shared config
|
|
15
15
|
// ---------------------------------------------------------------------------
|
|
16
|
-
const DEFAULT_MODEL = "gemini-2.
|
|
16
|
+
const DEFAULT_MODEL = "gemini-2.5-flash";
|
|
17
17
|
const DEFAULT_LOCATION = "us-central1";
|
|
18
18
|
/**
|
|
19
19
|
* Extract content items from user messages
|
|
@@ -223,15 +223,17 @@ async function getVertexConfig() {
|
|
|
223
223
|
}
|
|
224
224
|
export async function analyzeVideo(messages, options = {}) {
|
|
225
225
|
const provider = options.provider || AIProviderName.AUTO;
|
|
226
|
-
// Vertex — only when
|
|
227
|
-
if (provider === AIProviderName.VERTEX ||
|
|
226
|
+
// Vertex — only when Vertex credentials are configured
|
|
227
|
+
if (provider === AIProviderName.VERTEX ||
|
|
228
|
+
(provider === AIProviderName.AUTO &&
|
|
229
|
+
(process.env.GOOGLE_VERTEX_PROJECT || process.env.GOOGLE_CLOUD_PROJECT))) {
|
|
228
230
|
return analyzeVideoWithVertexAI(messages, options);
|
|
229
231
|
}
|
|
230
|
-
// Gemini API — when
|
|
231
|
-
if (provider === AIProviderName.GOOGLE_AI
|
|
232
|
+
// Gemini API — when Google AI API key is available
|
|
233
|
+
if (provider === AIProviderName.GOOGLE_AI ||
|
|
234
|
+
(provider === AIProviderName.AUTO && process.env.GOOGLE_AI_API_KEY)) {
|
|
232
235
|
return analyzeVideoWithGeminiAPI(messages, options);
|
|
233
236
|
}
|
|
234
|
-
throw
|
|
235
|
-
"Set GOOGLE_VERTEX_PROJECT for Vertex AI or GOOGLE_AI_API_KEY for Gemini API.");
|
|
237
|
+
throw ErrorFactory.invalidConfiguration("video analysis provider", "No valid provider configuration found. Set GOOGLE_VERTEX_PROJECT for Vertex AI or GOOGLE_AI_API_KEY for Gemini API.");
|
|
236
238
|
}
|
|
237
239
|
//# sourceMappingURL=videoAnalyzer.js.map
|
|
@@ -25,8 +25,18 @@ export const DEFAULT_OUTPUT_RESERVE_RATIO = 0.35;
|
|
|
25
25
|
export const MODEL_CONTEXT_WINDOWS = {
|
|
26
26
|
anthropic: {
|
|
27
27
|
_default: 200_000,
|
|
28
|
+
// Claude 4.6 (Feb 2026) — 200K standard, 1M with beta header
|
|
29
|
+
"claude-opus-4-6": 200_000,
|
|
30
|
+
"claude-sonnet-4-6": 200_000,
|
|
31
|
+
// Claude 4.5
|
|
32
|
+
"claude-opus-4-5-20251101": 200_000,
|
|
33
|
+
"claude-sonnet-4-5-20250929": 200_000,
|
|
34
|
+
"claude-haiku-4-5-20251001": 200_000,
|
|
35
|
+
// Claude 4.x
|
|
36
|
+
"claude-opus-4-1-20250805": 200_000,
|
|
28
37
|
"claude-opus-4-20250514": 200_000,
|
|
29
38
|
"claude-sonnet-4-20250514": 200_000,
|
|
39
|
+
// Claude 3.x
|
|
30
40
|
"claude-3-7-sonnet-20250219": 200_000,
|
|
31
41
|
"claude-3-5-sonnet-20241022": 200_000,
|
|
32
42
|
"claude-3-5-haiku-20241022": 200_000,
|
|
@@ -36,67 +46,144 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
36
46
|
},
|
|
37
47
|
openai: {
|
|
38
48
|
_default: 128_000,
|
|
49
|
+
// GPT-5.x family — 400K context
|
|
50
|
+
"gpt-5.3-codex": 400_000,
|
|
51
|
+
"gpt-5.2": 400_000,
|
|
52
|
+
"gpt-5.2-pro": 400_000,
|
|
53
|
+
"gpt-5.2-codex": 400_000,
|
|
54
|
+
"gpt-5.2-chat-latest": 128_000,
|
|
55
|
+
"gpt-5.1": 400_000,
|
|
56
|
+
"gpt-5.1-codex": 400_000,
|
|
57
|
+
"gpt-5.1-codex-max": 400_000,
|
|
58
|
+
"gpt-5.1-codex-mini": 400_000,
|
|
59
|
+
"gpt-5.1-chat-latest": 128_000,
|
|
60
|
+
"gpt-5": 400_000,
|
|
61
|
+
"gpt-5-mini": 400_000,
|
|
62
|
+
"gpt-5-nano": 400_000,
|
|
63
|
+
"gpt-5-pro": 400_000,
|
|
64
|
+
"gpt-5-codex": 400_000,
|
|
65
|
+
"gpt-5-chat-latest": 128_000,
|
|
66
|
+
// GPT Open Source
|
|
67
|
+
"gpt-oss-120b": 128_000,
|
|
68
|
+
"gpt-oss-20b": 128_000,
|
|
69
|
+
// GPT-4.1 family — 1M context
|
|
70
|
+
"gpt-4.1": 1_047_576,
|
|
71
|
+
"gpt-4.1-mini": 1_047_576,
|
|
72
|
+
"gpt-4.1-nano": 1_047_576,
|
|
73
|
+
// GPT-4o
|
|
39
74
|
"gpt-4o": 128_000,
|
|
40
75
|
"gpt-4o-mini": 128_000,
|
|
41
|
-
|
|
42
|
-
"gpt-4": 8_192,
|
|
43
|
-
"gpt-3.5-turbo": 16_385,
|
|
76
|
+
// O-series reasoning — 200K context
|
|
44
77
|
o1: 200_000,
|
|
45
78
|
"o1-mini": 128_000,
|
|
46
79
|
"o1-pro": 200_000,
|
|
47
80
|
o3: 200_000,
|
|
48
81
|
"o3-mini": 200_000,
|
|
82
|
+
"o3-pro": 200_000,
|
|
49
83
|
"o4-mini": 200_000,
|
|
50
|
-
|
|
51
|
-
"gpt-4
|
|
52
|
-
"gpt-4
|
|
53
|
-
"gpt-5":
|
|
84
|
+
// Legacy
|
|
85
|
+
"gpt-4-turbo": 128_000,
|
|
86
|
+
"gpt-4": 8_192,
|
|
87
|
+
"gpt-3.5-turbo": 16_385,
|
|
54
88
|
},
|
|
55
89
|
"google-ai": {
|
|
56
90
|
_default: 1_048_576,
|
|
91
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
92
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
93
|
+
"gemini-3-pro-image-preview": 65_536,
|
|
94
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
95
|
+
"gemini-3-flash": 1_048_576,
|
|
57
96
|
"gemini-2.5-pro": 1_048_576,
|
|
58
97
|
"gemini-2.5-flash": 1_048_576,
|
|
98
|
+
"gemini-2.5-flash-lite": 1_048_576,
|
|
99
|
+
"gemini-2.5-flash-image": 32_768,
|
|
59
100
|
"gemini-2.0-flash": 1_048_576,
|
|
60
101
|
"gemini-1.5-pro": 2_097_152,
|
|
61
102
|
"gemini-1.5-flash": 1_048_576,
|
|
62
|
-
"gemini-3-flash-preview": 1_048_576,
|
|
63
|
-
"gemini-3-pro-preview": 1_048_576,
|
|
64
103
|
},
|
|
65
104
|
vertex: {
|
|
66
105
|
_default: 1_048_576,
|
|
106
|
+
// Claude on Vertex
|
|
107
|
+
"claude-opus-4-6": 200_000,
|
|
108
|
+
"claude-sonnet-4-6": 200_000,
|
|
109
|
+
"claude-sonnet-4-5": 200_000,
|
|
110
|
+
"claude-opus-4-5": 200_000,
|
|
111
|
+
"claude-haiku-4-5": 200_000,
|
|
112
|
+
"claude-sonnet-4": 200_000,
|
|
113
|
+
"claude-sonnet-4-20250514": 200_000,
|
|
114
|
+
"claude-opus-4-20250514": 200_000,
|
|
115
|
+
"claude-opus-4": 200_000,
|
|
116
|
+
// Gemini on Vertex
|
|
117
|
+
"gemini-3.1-pro-preview": 1_048_576,
|
|
118
|
+
"gemini-3-pro-preview": 1_048_576,
|
|
119
|
+
"gemini-3-pro-latest": 1_048_576,
|
|
120
|
+
"gemini-3-flash-preview": 1_048_576,
|
|
121
|
+
"gemini-3-flash-latest": 1_048_576,
|
|
67
122
|
"gemini-2.5-pro": 1_048_576,
|
|
68
123
|
"gemini-2.5-flash": 1_048_576,
|
|
69
124
|
"gemini-2.0-flash": 1_048_576,
|
|
70
125
|
"gemini-1.5-pro": 2_097_152,
|
|
71
126
|
"gemini-1.5-flash": 1_048_576,
|
|
72
|
-
"claude-sonnet-4-5": 200_000,
|
|
73
|
-
"claude-sonnet-4-20250514": 200_000,
|
|
74
|
-
"claude-opus-4": 200_000,
|
|
75
|
-
"claude-opus-4-20250514": 200_000,
|
|
76
127
|
},
|
|
77
128
|
bedrock: {
|
|
78
129
|
_default: 200_000,
|
|
79
|
-
|
|
130
|
+
// Claude 4.6
|
|
131
|
+
"anthropic.claude-opus-4-6-v1:0": 200_000,
|
|
132
|
+
"anthropic.claude-sonnet-4-6": 200_000,
|
|
133
|
+
// Claude 4.5
|
|
134
|
+
"anthropic.claude-opus-4-5-20251124-v1:0": 200_000,
|
|
135
|
+
"anthropic.claude-sonnet-4-5-20250929-v1:0": 200_000,
|
|
136
|
+
"anthropic.claude-haiku-4-5-20251001-v1:0": 200_000,
|
|
137
|
+
// Claude legacy
|
|
138
|
+
"anthropic.claude-3-5-sonnet-20241022-v1:0": 200_000,
|
|
80
139
|
"anthropic.claude-3-5-haiku-20241022-v1:0": 200_000,
|
|
81
140
|
"anthropic.claude-3-opus-20240229-v1:0": 200_000,
|
|
82
141
|
"anthropic.claude-3-sonnet-20240229-v1:0": 200_000,
|
|
83
142
|
"anthropic.claude-3-haiku-20240307-v1:0": 200_000,
|
|
143
|
+
// Amazon Nova
|
|
84
144
|
"amazon.nova-pro-v1:0": 300_000,
|
|
85
145
|
"amazon.nova-lite-v1:0": 300_000,
|
|
146
|
+
"amazon.nova-2-lite-v1:0": 1_000_000,
|
|
147
|
+
// Writer
|
|
148
|
+
"writer.palmyra-x5-v1:0": 1_000_000,
|
|
149
|
+
"writer.palmyra-x4-v1:0": 128_000,
|
|
150
|
+
// NVIDIA
|
|
151
|
+
"nvidia.nemotron-nano-3-30b": 256_000,
|
|
86
152
|
},
|
|
87
153
|
azure: {
|
|
88
154
|
_default: 128_000,
|
|
155
|
+
// GPT-5.x
|
|
156
|
+
"gpt-5.2": 400_000,
|
|
157
|
+
"gpt-5.2-pro": 400_000,
|
|
158
|
+
"gpt-5.2-codex": 400_000,
|
|
159
|
+
"gpt-5.1": 400_000,
|
|
160
|
+
"gpt-5": 400_000,
|
|
161
|
+
"gpt-5-mini": 400_000,
|
|
162
|
+
// GPT-4.1
|
|
163
|
+
"gpt-4.1": 1_047_576,
|
|
164
|
+
"gpt-4.1-mini": 1_047_576,
|
|
165
|
+
// GPT-4o
|
|
89
166
|
"gpt-4o": 128_000,
|
|
90
167
|
"gpt-4o-mini": 128_000,
|
|
168
|
+
// O-series
|
|
169
|
+
o3: 200_000,
|
|
170
|
+
"o3-mini": 200_000,
|
|
171
|
+
"o4-mini": 200_000,
|
|
172
|
+
// Legacy
|
|
91
173
|
"gpt-4-turbo": 128_000,
|
|
92
174
|
"gpt-4": 8_192,
|
|
93
175
|
},
|
|
94
176
|
mistral: {
|
|
95
177
|
_default: 128_000,
|
|
96
|
-
"mistral-large-latest":
|
|
97
|
-
"mistral-
|
|
178
|
+
"mistral-large-latest": 256_000,
|
|
179
|
+
"mistral-large-2512": 256_000,
|
|
180
|
+
"mistral-medium-latest": 128_000,
|
|
98
181
|
"mistral-small-latest": 128_000,
|
|
99
182
|
"codestral-latest": 256_000,
|
|
183
|
+
"codestral-2508": 256_000,
|
|
184
|
+
"devstral-2512": 256_000,
|
|
185
|
+
"devstral-small-2512": 256_000,
|
|
186
|
+
"magistral-medium-latest": 128_000,
|
|
100
187
|
},
|
|
101
188
|
ollama: {
|
|
102
189
|
_default: 128_000,
|
|
@@ -109,6 +196,10 @@ export const MODEL_CONTEXT_WINDOWS = {
|
|
|
109
196
|
},
|
|
110
197
|
sagemaker: {
|
|
111
198
|
_default: 128_000,
|
|
199
|
+
// NVIDIA Nemotron 3 Nano (February 2026) — 1M context
|
|
200
|
+
"nvidia-nemotron-3-nano-30b": 1_000_000,
|
|
201
|
+
// Qwen3 VL — 32K context
|
|
202
|
+
"qwen3-vl-8b-instruct": 32_768,
|
|
112
203
|
},
|
|
113
204
|
};
|
|
114
205
|
/**
|
|
@@ -22,23 +22,37 @@ export declare enum AIProviderName {
|
|
|
22
22
|
* OpenRouter uses 'provider/model' format
|
|
23
23
|
*/
|
|
24
24
|
export declare enum OpenRouterModels {
|
|
25
|
+
CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
|
|
26
|
+
CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
|
|
27
|
+
CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
|
|
28
|
+
CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
|
|
25
29
|
CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet",
|
|
26
30
|
CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
|
|
27
31
|
CLAUDE_3_OPUS = "anthropic/claude-3-opus",
|
|
32
|
+
GPT_5_2 = "openai/gpt-5.2",
|
|
33
|
+
GPT_5 = "openai/gpt-5",
|
|
28
34
|
GPT_4O = "openai/gpt-4o",
|
|
29
35
|
GPT_4O_MINI = "openai/gpt-4o-mini",
|
|
30
36
|
GPT_4_TURBO = "openai/gpt-4-turbo",
|
|
37
|
+
GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
|
|
38
|
+
GEMINI_3_PRO_PREVIEW = "google/gemini-3-pro-preview",
|
|
39
|
+
GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
|
|
40
|
+
GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
|
|
41
|
+
GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
|
|
31
42
|
GEMINI_2_0_FLASH = "google/gemini-2.0-flash",
|
|
32
|
-
GEMINI_1_5_PRO = "google/gemini-1.5-pro",
|
|
33
43
|
LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
|
|
34
44
|
LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",
|
|
35
45
|
MISTRAL_LARGE = "mistralai/mistral-large",
|
|
36
|
-
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct"
|
|
46
|
+
MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",
|
|
47
|
+
DEEPSEEK_R1 = "deepseek/deepseek-r1",
|
|
48
|
+
GROK_4_1_FAST = "xai/grok-4.1-fast"
|
|
37
49
|
}
|
|
38
50
|
/**
|
|
39
51
|
* Supported Models for Amazon Bedrock
|
|
40
52
|
*/
|
|
41
53
|
export declare enum BedrockModels {
|
|
54
|
+
CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
|
|
55
|
+
CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
|
|
42
56
|
CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
|
|
43
57
|
CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
44
58
|
CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
|
|
@@ -104,18 +118,49 @@ export declare enum BedrockModels {
|
|
|
104
118
|
GEMMA_3_12B_IT = "google.gemma-3-12b-it",
|
|
105
119
|
GEMMA_3_4B_IT = "google.gemma-3-4b-it",
|
|
106
120
|
JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
|
|
107
|
-
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0"
|
|
121
|
+
JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",
|
|
122
|
+
WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
|
|
123
|
+
WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",
|
|
124
|
+
MINIMAX_M2_1 = "minimax.minimax-m2.1",
|
|
125
|
+
MINIMAX_M2 = "minimax.minimax-m2",
|
|
126
|
+
KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
|
|
127
|
+
KIMI_K2_5 = "moonshotai.kimi-k2.5",
|
|
128
|
+
NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
|
|
129
|
+
NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
|
|
130
|
+
NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",
|
|
131
|
+
OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
|
|
132
|
+
OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",
|
|
133
|
+
GLM_4_7 = "zai.glm-4.7",
|
|
134
|
+
GLM_4_7_FLASH = "zai.glm-4.7-flash",
|
|
135
|
+
COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
|
|
136
|
+
COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
|
|
137
|
+
COHERE_EMBED_V4 = "cohere.embed-v4:0",
|
|
138
|
+
COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
|
|
139
|
+
AMAZON_RERANK_V1 = "amazon.rerank-v1:0",
|
|
140
|
+
DEVSTRAL_2_123B = "mistral.devstral-2-123b"
|
|
108
141
|
}
|
|
109
142
|
/**
|
|
110
143
|
* Supported Models for OpenAI
|
|
111
144
|
*/
|
|
112
145
|
export declare enum OpenAIModels {
|
|
146
|
+
GPT_5_3_CODEX = "gpt-5.3-codex",
|
|
113
147
|
GPT_5_2 = "gpt-5.2",
|
|
114
148
|
GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
|
|
115
149
|
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
150
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
151
|
+
GPT_5_1 = "gpt-5.1",
|
|
152
|
+
GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
|
|
153
|
+
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
154
|
+
GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
|
|
155
|
+
GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
|
|
116
156
|
GPT_5 = "gpt-5",
|
|
117
157
|
GPT_5_MINI = "gpt-5-mini",
|
|
118
158
|
GPT_5_NANO = "gpt-5-nano",
|
|
159
|
+
GPT_5_PRO = "gpt-5-pro",
|
|
160
|
+
GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
|
|
161
|
+
GPT_5_CODEX = "gpt-5-codex",
|
|
162
|
+
GPT_OSS_120B = "gpt-oss-120b",
|
|
163
|
+
GPT_OSS_20B = "gpt-oss-20b",
|
|
119
164
|
GPT_4_1 = "gpt-4.1",
|
|
120
165
|
GPT_4_1_MINI = "gpt-4.1-mini",
|
|
121
166
|
GPT_4_1_NANO = "gpt-4.1-nano",
|
|
@@ -137,6 +182,10 @@ export declare enum OpenAIModels {
|
|
|
137
182
|
* Note: Azure uses deployment names, these are model identifiers
|
|
138
183
|
*/
|
|
139
184
|
export declare enum AzureOpenAIModels {
|
|
185
|
+
GPT_5_2 = "gpt-5.2",
|
|
186
|
+
GPT_5_2_CHAT = "gpt-5.2-chat",
|
|
187
|
+
GPT_5_2_PRO = "gpt-5.2-pro",
|
|
188
|
+
GPT_5_2_CODEX = "gpt-5.2-codex",
|
|
140
189
|
GPT_5_1 = "gpt-5.1",
|
|
141
190
|
GPT_5_1_CHAT = "gpt-5.1-chat",
|
|
142
191
|
GPT_5_1_CODEX = "gpt-5.1-codex",
|
|
@@ -172,6 +221,8 @@ export declare enum AzureOpenAIModels {
|
|
|
172
221
|
* Supported Models for Google Vertex AI
|
|
173
222
|
*/
|
|
174
223
|
export declare enum VertexModels {
|
|
224
|
+
CLAUDE_4_6_OPUS = "claude-opus-4-6",
|
|
225
|
+
CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
|
|
175
226
|
CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
|
|
176
227
|
CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
|
|
177
228
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
|
|
@@ -183,19 +234,13 @@ export declare enum VertexModels {
|
|
|
183
234
|
CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
|
|
184
235
|
CLAUDE_3_OPUS = "claude-3-opus-20240229",
|
|
185
236
|
CLAUDE_3_HAIKU = "claude-3-haiku-20240307",
|
|
186
|
-
|
|
237
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
187
238
|
GEMINI_3_PRO = "gemini-3-pro",
|
|
188
|
-
/** Gemini 3 Pro Preview - Versioned preview (November 2025) */
|
|
189
239
|
GEMINI_3_PRO_PREVIEW_11_2025 = "gemini-3-pro-preview-11-2025",
|
|
190
|
-
/** Gemini 3 Pro Latest - Auto-updated alias (always points to latest preview) */
|
|
191
240
|
GEMINI_3_PRO_LATEST = "gemini-3-pro-latest",
|
|
192
|
-
/** Gemini 3 Pro Preview - Generic preview (legacy) */
|
|
193
241
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
194
|
-
/** Gemini 3 Flash - Base model with adaptive thinking */
|
|
195
242
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
196
|
-
/** Gemini 3 Flash Preview - Versioned preview */
|
|
197
243
|
GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
|
|
198
|
-
/** Gemini 3 Flash Latest - Auto-updated alias (always points to latest preview) */
|
|
199
244
|
GEMINI_3_FLASH_LATEST = "gemini-3-flash-latest",
|
|
200
245
|
GEMINI_2_5_PRO = "gemini-2.5-pro",
|
|
201
246
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
@@ -203,15 +248,17 @@ export declare enum VertexModels {
|
|
|
203
248
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
204
249
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
205
250
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
206
|
-
/** Gemini 2.0 Flash Lite - GA, production-ready, cost-optimized */
|
|
207
251
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
252
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
208
253
|
GEMINI_1_5_PRO = "gemini-1.5-pro-002",
|
|
254
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
209
255
|
GEMINI_1_5_FLASH = "gemini-1.5-flash-002"
|
|
210
256
|
}
|
|
211
257
|
/**
|
|
212
258
|
* Supported Models for Google AI Studio
|
|
213
259
|
*/
|
|
214
260
|
export declare enum GoogleAIModels {
|
|
261
|
+
GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
|
|
215
262
|
GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
|
|
216
263
|
GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
|
|
217
264
|
GEMINI_3_FLASH = "gemini-3-flash",
|
|
@@ -220,20 +267,26 @@ export declare enum GoogleAIModels {
|
|
|
220
267
|
GEMINI_2_5_FLASH = "gemini-2.5-flash",
|
|
221
268
|
GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
|
|
222
269
|
GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
|
|
223
|
-
|
|
270
|
+
GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
|
|
271
|
+
GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",
|
|
224
272
|
GEMINI_2_0_FLASH = "gemini-2.0-flash",
|
|
225
273
|
GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
|
|
226
274
|
GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
|
|
227
275
|
GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",
|
|
276
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
228
277
|
GEMINI_1_5_PRO = "gemini-1.5-pro",
|
|
278
|
+
/** @deprecated Retired Sep 2025. Use Gemini 2.5+ */
|
|
229
279
|
GEMINI_1_5_FLASH = "gemini-1.5-flash",
|
|
230
280
|
GEMINI_EMBEDDING = "gemini-embedding-001",
|
|
281
|
+
/** @deprecated Shutdown Jan 2026. Use gemini-embedding-001 */
|
|
231
282
|
TEXT_EMBEDDING_004 = "text-embedding-004"
|
|
232
283
|
}
|
|
233
284
|
/**
|
|
234
285
|
* Supported Models for Anthropic (Direct API)
|
|
235
286
|
*/
|
|
236
287
|
export declare enum AnthropicModels {
|
|
288
|
+
CLAUDE_OPUS_4_6 = "claude-opus-4-6",
|
|
289
|
+
CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
|
|
237
290
|
CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
|
|
238
291
|
CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
|
|
239
292
|
CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
|
|
@@ -271,6 +324,13 @@ export declare enum MistralModels {
|
|
|
271
324
|
PIXTRAL_12B = "pixtral-12b",
|
|
272
325
|
VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
|
|
273
326
|
VOXTRAL_MINI_LATEST = "voxtral-mini-latest",
|
|
327
|
+
DEVSTRAL_2 = "devstral-2512",
|
|
328
|
+
DEVSTRAL_SMALL_2 = "devstral-small-2512",
|
|
329
|
+
MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
|
|
330
|
+
MAGISTRAL_SMALL_2509 = "magistral-small-2509",
|
|
331
|
+
VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",
|
|
332
|
+
MISTRAL_OCR_3 = "mistral-ocr-2512",
|
|
333
|
+
MISTRAL_OCR_LATEST = "mistral-ocr-latest",
|
|
274
334
|
MISTRAL_NEMO = "mistral-nemo",
|
|
275
335
|
MISTRAL_EMBED = "mistral-embed",
|
|
276
336
|
MISTRAL_MODERATION_LATEST = "mistral-moderation-latest"
|
|
@@ -341,7 +401,17 @@ export declare enum OllamaModels {
|
|
|
341
401
|
STARCODER2_15B = "starcoder2:15b",
|
|
342
402
|
MIXTRAL_8X7B = "mixtral:8x7b",
|
|
343
403
|
MIXTRAL_8X22B = "mixtral:8x22b",
|
|
344
|
-
COMMAND_R_PLUS = "command-r-plus:104b"
|
|
404
|
+
COMMAND_R_PLUS = "command-r-plus:104b",
|
|
405
|
+
GLM_5_LATEST = "glm-5:latest",
|
|
406
|
+
KIMI_K2_5_LATEST = "kimi-k2.5:latest",
|
|
407
|
+
QWEN3_5_LATEST = "qwen3.5:latest",
|
|
408
|
+
QWEN3_CODER_LATEST = "qwen3-coder:latest",
|
|
409
|
+
QWEN3_CODER_30B = "qwen3-coder:30b",
|
|
410
|
+
DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
|
|
411
|
+
NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
|
|
412
|
+
NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
|
|
413
|
+
SMOLLM3_3B = "smollm3:3b",
|
|
414
|
+
GPT_OSS_LATEST = "gpt-oss:latest"
|
|
345
415
|
}
|
|
346
416
|
/**
|
|
347
417
|
* Common Models for LiteLLM Proxy
|
|
@@ -381,6 +451,12 @@ export declare enum LiteLLMModels {
|
|
|
381
451
|
MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",
|
|
382
452
|
BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
|
|
383
453
|
BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",
|
|
454
|
+
OPENAI_GPT_5_2 = "openai/gpt-5.2",
|
|
455
|
+
OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
|
|
456
|
+
ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
|
|
457
|
+
ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
|
|
458
|
+
GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
|
|
459
|
+
XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",
|
|
384
460
|
PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
|
|
385
461
|
PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro"
|
|
386
462
|
}
|
|
@@ -433,7 +509,13 @@ export declare enum HuggingFaceModels {
|
|
|
433
509
|
STARCODER2_15B = "bigcode/starcoder2-15b",
|
|
434
510
|
CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
|
|
435
511
|
BLOOM_7B1 = "bigscience/bloom-7b1",
|
|
436
|
-
BLOOM_1B3 = "bigscience/bloom-1b3"
|
|
512
|
+
BLOOM_1B3 = "bigscience/bloom-1b3",
|
|
513
|
+
GLM_5 = "zai-org/GLM-5",
|
|
514
|
+
QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
|
|
515
|
+
NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
|
|
516
|
+
SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
|
|
517
|
+
FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
|
|
518
|
+
FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct"
|
|
437
519
|
}
|
|
438
520
|
/**
|
|
439
521
|
* Supported Models for AWS SageMaker JumpStart
|
|
@@ -455,7 +537,9 @@ export declare enum SageMakerModels {
|
|
|
455
537
|
FALCON_3_7B = "tii-falcon-3-7b-instruct",
|
|
456
538
|
FALCON_3_10B = "tii-falcon-3-10b-instruct",
|
|
457
539
|
FALCON_40B = "tii-falcon-40b-instruct",
|
|
458
|
-
FALCON_180B = "tii-falcon-180b"
|
|
540
|
+
FALCON_180B = "tii-falcon-180b",
|
|
541
|
+
NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
|
|
542
|
+
QWEN3_VL_8B = "qwen3-vl-8b-instruct"
|
|
459
543
|
}
|
|
460
544
|
/**
|
|
461
545
|
* API Versions for various providers
|