@juspay/neurolink 9.30.0 → 9.31.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +14 -0
- package/README.md +2 -3
- package/dist/adapters/providerImageAdapter.js +13 -22
- package/dist/adapters/video/videoAnalyzer.d.ts +4 -4
- package/dist/adapters/video/videoAnalyzer.js +3 -3
- package/dist/agent/directTools.d.ts +20 -289
- package/dist/agent/directTools.js +11 -10
- package/dist/auth/accountPool.d.ts +68 -0
- package/dist/auth/accountPool.js +178 -0
- package/dist/auth/anthropicOAuth.d.ts +15 -5
- package/dist/auth/anthropicOAuth.js +117 -57
- package/dist/auth/index.d.ts +7 -5
- package/dist/auth/index.js +6 -2
- package/dist/auth/tokenStore.d.ts +71 -27
- package/dist/auth/tokenStore.js +342 -64
- package/dist/cli/commands/auth.d.ts +39 -2
- package/dist/cli/commands/auth.js +585 -36
- package/dist/cli/commands/config.d.ts +47 -574
- package/dist/cli/commands/config.js +142 -24
- package/dist/cli/commands/docs.d.ts +1 -5
- package/dist/cli/commands/observability.d.ts +1 -17
- package/dist/cli/commands/ollama.js +1 -1
- package/dist/cli/commands/proxy.d.ts +20 -0
- package/dist/cli/commands/proxy.js +1254 -0
- package/dist/cli/commands/setup-anthropic.js +1 -1
- package/dist/cli/commands/setup-azure.js +1 -1
- package/dist/cli/commands/setup-bedrock.js +2 -2
- package/dist/cli/commands/setup-gcp.js +1 -1
- package/dist/cli/commands/setup-google-ai.js +1 -1
- package/dist/cli/commands/setup-huggingface.js +2 -2
- package/dist/cli/commands/setup-mistral.js +1 -1
- package/dist/cli/commands/setup-openai.js +1 -1
- package/dist/cli/commands/setup.js +3 -3
- package/dist/cli/commands/telemetry.d.ts +1 -22
- package/dist/cli/factories/authCommandFactory.d.ts +16 -11
- package/dist/cli/factories/authCommandFactory.js +96 -1
- package/dist/cli/factories/ollamaCommandFactory.js +1 -1
- package/dist/cli/factories/sagemakerCommandFactory.js +25 -6
- package/dist/cli/index.d.ts +0 -6
- package/dist/cli/index.js +5 -2
- package/dist/cli/loop/conversationSelector.js +7 -2
- package/dist/cli/parser.js +19 -1
- package/dist/cli/utils/envManager.js +2 -2
- package/dist/cli/utils/ollamaUtils.d.ts +1 -2
- package/dist/client/adapters/providerImageAdapter.js +588 -0
- package/dist/client/adapters/tts/googleTTSHandler.js +344 -0
- package/dist/client/adapters/video/directorPipeline.js +516 -0
- package/dist/client/adapters/video/ffmpegAdapter.js +206 -0
- package/dist/client/adapters/video/frameExtractor.js +143 -0
- package/dist/client/adapters/video/vertexVideoHandler.js +763 -0
- package/dist/client/adapters/video/videoAnalyzer.js +238 -0
- package/dist/client/adapters/video/videoMerger.js +171 -0
- package/dist/client/agent/directTools.js +840 -0
- package/dist/client/aiSdkAdapter.d.ts +196 -0
- package/dist/client/aiSdkAdapter.js +487 -0
- package/dist/client/auth/anthropicOAuth.js +974 -0
- package/dist/client/auth/tokenStore.js +799 -0
- package/dist/client/auth.d.ts +248 -0
- package/dist/client/auth.js +473 -0
- package/dist/client/client/aiSdkAdapter.js +487 -0
- package/dist/client/client/auth.js +473 -0
- package/dist/client/client/errors.js +552 -0
- package/dist/client/client/httpClient.js +837 -0
- package/dist/client/client/index.js +172 -0
- package/dist/client/client/interceptors.js +601 -0
- package/dist/client/client/reactHooks.js +1159 -0
- package/dist/client/client/sseClient.js +545 -0
- package/dist/client/client/streamingClient.js +917 -0
- package/dist/client/client/wsClient.js +369 -0
- package/dist/client/config/configManager.js +303 -0
- package/dist/client/config/conversationMemory.js +86 -0
- package/dist/client/config/taskClassificationConfig.js +148 -0
- package/dist/client/constants/contextWindows.js +295 -0
- package/dist/client/constants/enums.js +853 -0
- package/dist/client/constants/index.js +207 -0
- package/dist/client/constants/performance.js +389 -0
- package/dist/client/constants/retry.js +266 -0
- package/dist/client/constants/timeouts.js +182 -0
- package/dist/client/constants/tokens.js +380 -0
- package/dist/client/constants/videoErrors.js +46 -0
- package/dist/client/context/budgetChecker.js +98 -0
- package/dist/client/context/contextCompactor.js +205 -0
- package/dist/client/context/emergencyTruncation.js +88 -0
- package/dist/client/context/errorDetection.js +171 -0
- package/dist/client/context/errors.js +21 -0
- package/dist/client/context/fileTokenBudget.js +127 -0
- package/dist/client/context/prompts/summarizationPrompt.js +117 -0
- package/dist/client/context/stages/fileReadDeduplicator.js +66 -0
- package/dist/client/context/stages/slidingWindowTruncator.js +190 -0
- package/dist/client/context/stages/structuredSummarizer.js +99 -0
- package/dist/client/context/stages/toolOutputPruner.js +52 -0
- package/dist/client/context/summarizationEngine.js +136 -0
- package/dist/client/context/toolOutputLimits.js +78 -0
- package/dist/client/context/toolPairRepair.js +66 -0
- package/dist/client/core/analytics.js +88 -0
- package/dist/client/core/baseProvider.js +1385 -0
- package/dist/client/core/constants.js +140 -0
- package/dist/client/core/conversationMemoryFactory.js +141 -0
- package/dist/client/core/conversationMemoryInitializer.js +128 -0
- package/dist/client/core/conversationMemoryManager.js +344 -0
- package/dist/client/core/dynamicModels.js +358 -0
- package/dist/client/core/evaluation.js +309 -0
- package/dist/client/core/evaluationProviders.js +248 -0
- package/dist/client/core/factory.js +412 -0
- package/dist/client/core/infrastructure/baseError.js +22 -0
- package/dist/client/core/infrastructure/baseFactory.js +54 -0
- package/dist/client/core/infrastructure/baseRegistry.js +49 -0
- package/dist/client/core/infrastructure/index.js +5 -0
- package/dist/client/core/infrastructure/retry.js +20 -0
- package/dist/client/core/infrastructure/typedEventEmitter.js +23 -0
- package/dist/client/core/modelConfiguration.js +851 -0
- package/dist/client/core/modules/GenerationHandler.js +588 -0
- package/dist/client/core/modules/MessageBuilder.js +273 -0
- package/dist/client/core/modules/StreamHandler.js +185 -0
- package/dist/client/core/modules/TelemetryHandler.js +203 -0
- package/dist/client/core/modules/ToolsManager.js +499 -0
- package/dist/client/core/modules/Utilities.js +331 -0
- package/dist/client/core/redisConversationMemoryManager.js +1435 -0
- package/dist/client/core/streamAnalytics.js +131 -0
- package/dist/client/errors.d.ts +299 -0
- package/dist/client/errors.js +552 -0
- package/dist/client/evaluation/contextBuilder.js +134 -0
- package/dist/client/evaluation/index.js +61 -0
- package/dist/client/evaluation/prompts.js +73 -0
- package/dist/client/evaluation/ragasEvaluator.js +110 -0
- package/dist/client/evaluation/retryManager.js +78 -0
- package/dist/client/evaluation/scoring.js +61 -0
- package/dist/client/factories/providerFactory.js +166 -0
- package/dist/client/factories/providerRegistry.js +166 -0
- package/dist/client/features/ppt/constants.js +896 -0
- package/dist/client/features/ppt/contentPlanner.js +529 -0
- package/dist/client/features/ppt/presentationOrchestrator.js +236 -0
- package/dist/client/features/ppt/slideGenerator.js +532 -0
- package/dist/client/features/ppt/slideRenderers.js +2383 -0
- package/dist/client/features/ppt/slideTypeInference.js +405 -0
- package/dist/client/features/ppt/types.js +13 -0
- package/dist/client/features/ppt/utils.js +443 -0
- package/dist/client/files/fileReferenceRegistry.js +1543 -0
- package/dist/client/files/fileTools.js +450 -0
- package/dist/client/files/streamingReader.js +321 -0
- package/dist/client/files/types.js +23 -0
- package/dist/client/hitl/hitlErrors.js +54 -0
- package/dist/client/hitl/hitlManager.js +460 -0
- package/dist/client/httpClient.d.ts +297 -0
- package/dist/client/httpClient.js +837 -0
- package/dist/client/index.d.ts +111 -0
- package/dist/client/index.js +511 -0
- package/dist/client/interceptors.d.ts +283 -0
- package/dist/client/interceptors.js +601 -0
- package/dist/client/mcp/agentExposure.js +356 -0
- package/dist/client/mcp/auth/index.js +11 -0
- package/dist/client/mcp/auth/oauthClientProvider.js +325 -0
- package/dist/client/mcp/auth/tokenStorage.js +134 -0
- package/dist/client/mcp/batching/index.js +10 -0
- package/dist/client/mcp/batching/requestBatcher.js +441 -0
- package/dist/client/mcp/caching/index.js +10 -0
- package/dist/client/mcp/caching/toolCache.js +433 -0
- package/dist/client/mcp/elicitation/elicitationManager.js +376 -0
- package/dist/client/mcp/elicitation/index.js +11 -0
- package/dist/client/mcp/elicitation/types.js +10 -0
- package/dist/client/mcp/elicitationProtocol.js +375 -0
- package/dist/client/mcp/enhancedToolDiscovery.js +481 -0
- package/dist/client/mcp/externalServerManager.js +1478 -0
- package/dist/client/mcp/factory.js +161 -0
- package/dist/client/mcp/flexibleToolValidator.js +161 -0
- package/dist/client/mcp/httpRateLimiter.js +391 -0
- package/dist/client/mcp/httpRetryHandler.js +178 -0
- package/dist/client/mcp/index.js +74 -0
- package/dist/client/mcp/mcpCircuitBreaker.js +427 -0
- package/dist/client/mcp/mcpClientFactory.js +708 -0
- package/dist/client/mcp/mcpRegistryClient.js +488 -0
- package/dist/client/mcp/mcpServerBase.js +373 -0
- package/dist/client/mcp/multiServerManager.js +579 -0
- package/dist/client/mcp/registry.js +158 -0
- package/dist/client/mcp/routing/index.js +10 -0
- package/dist/client/mcp/routing/toolRouter.js +416 -0
- package/dist/client/mcp/serverCapabilities.js +502 -0
- package/dist/client/mcp/servers/agent/directToolsServer.js +150 -0
- package/dist/client/mcp/toolAnnotations.js +239 -0
- package/dist/client/mcp/toolConverter.js +258 -0
- package/dist/client/mcp/toolDiscoveryService.js +798 -0
- package/dist/client/mcp/toolIntegration.js +334 -0
- package/dist/client/mcp/toolRegistry.js +719 -0
- package/dist/client/memory/hippocampusInitializer.js +19 -0
- package/dist/client/memory/memoryRetrievalTools.js +166 -0
- package/dist/client/middleware/builtin/analytics.js +132 -0
- package/dist/client/middleware/builtin/autoEvaluation.js +203 -0
- package/dist/client/middleware/builtin/guardrails.js +109 -0
- package/dist/client/middleware/builtin/lifecycle.js +168 -0
- package/dist/client/middleware/factory.js +327 -0
- package/dist/client/middleware/registry.js +295 -0
- package/dist/client/middleware/utils/guardrailsUtils.js +396 -0
- package/dist/client/models/anthropicModels.js +527 -0
- package/dist/client/neurolink.js +8015 -0
- package/dist/client/observability/exporterRegistry.js +413 -0
- package/dist/client/observability/exporters/arizeExporter.js +138 -0
- package/dist/client/observability/exporters/baseExporter.js +190 -0
- package/dist/client/observability/exporters/braintrustExporter.js +154 -0
- package/dist/client/observability/exporters/datadogExporter.js +196 -0
- package/dist/client/observability/exporters/laminarExporter.js +302 -0
- package/dist/client/observability/exporters/langfuseExporter.js +209 -0
- package/dist/client/observability/exporters/langsmithExporter.js +143 -0
- package/dist/client/observability/exporters/otelExporter.js +164 -0
- package/dist/client/observability/exporters/posthogExporter.js +287 -0
- package/dist/client/observability/exporters/sentryExporter.js +165 -0
- package/dist/client/observability/index.js +31 -0
- package/dist/client/observability/metricsAggregator.js +556 -0
- package/dist/client/observability/otelBridge.js +131 -0
- package/dist/client/observability/retryPolicy.js +383 -0
- package/dist/client/observability/sampling/samplers.js +216 -0
- package/dist/client/observability/spanProcessor.js +303 -0
- package/dist/client/observability/tokenTracker.js +413 -0
- package/dist/client/observability/types/exporterTypes.js +5 -0
- package/dist/client/observability/types/index.js +4 -0
- package/dist/client/observability/types/spanTypes.js +92 -0
- package/dist/client/observability/utils/safeMetadata.js +25 -0
- package/dist/client/observability/utils/spanSerializer.js +292 -0
- package/dist/client/processors/archive/ArchiveProcessor.js +1308 -0
- package/dist/client/processors/base/BaseFileProcessor.js +614 -0
- package/dist/client/processors/base/types.js +82 -0
- package/dist/client/processors/config/fileTypes.js +520 -0
- package/dist/client/processors/config/index.js +92 -0
- package/dist/client/processors/config/languageMap.js +410 -0
- package/dist/client/processors/config/mimeTypes.js +363 -0
- package/dist/client/processors/config/sizeLimits.js +258 -0
- package/dist/client/processors/document/ExcelProcessor.js +590 -0
- package/dist/client/processors/document/OpenDocumentProcessor.js +212 -0
- package/dist/client/processors/document/PptxProcessor.js +157 -0
- package/dist/client/processors/document/RtfProcessor.js +361 -0
- package/dist/client/processors/document/WordProcessor.js +353 -0
- package/dist/client/processors/errors/FileErrorCode.js +255 -0
- package/dist/client/processors/errors/errorHelpers.js +386 -0
- package/dist/client/processors/errors/errorSerializer.js +507 -0
- package/dist/client/processors/errors/index.js +49 -0
- package/dist/client/processors/markup/SvgProcessor.js +240 -0
- package/dist/client/processors/media/AudioProcessor.js +707 -0
- package/dist/client/processors/media/VideoProcessor.js +1045 -0
- package/dist/client/providers/amazonBedrock.js +1512 -0
- package/dist/client/providers/amazonSagemaker.js +162 -0
- package/dist/client/providers/anthropic.js +831 -0
- package/dist/client/providers/azureOpenai.js +143 -0
- package/dist/client/providers/googleAiStudio.js +1200 -0
- package/dist/client/providers/googleNativeGemini3.js +543 -0
- package/dist/client/providers/googleVertex.js +2936 -0
- package/dist/client/providers/huggingFace.js +315 -0
- package/dist/client/providers/litellm.js +488 -0
- package/dist/client/providers/mistral.js +157 -0
- package/dist/client/providers/ollama.js +1579 -0
- package/dist/client/providers/openAI.js +627 -0
- package/dist/client/providers/openRouter.js +543 -0
- package/dist/client/providers/openaiCompatible.js +290 -0
- package/dist/client/providers/providerTypeUtils.js +46 -0
- package/dist/client/providers/sagemaker/adaptive-semaphore.js +215 -0
- package/dist/client/providers/sagemaker/client.js +472 -0
- package/dist/client/providers/sagemaker/config.js +317 -0
- package/dist/client/providers/sagemaker/detection.js +606 -0
- package/dist/client/providers/sagemaker/error-constants.js +227 -0
- package/dist/client/providers/sagemaker/errors.js +299 -0
- package/dist/client/providers/sagemaker/language-model.js +775 -0
- package/dist/client/providers/sagemaker/parsers.js +634 -0
- package/dist/client/providers/sagemaker/streaming.js +331 -0
- package/dist/client/providers/sagemaker/structured-parser.js +625 -0
- package/dist/client/proxy/accountQuota.js +162 -0
- package/dist/client/proxy/claudeFormat.js +595 -0
- package/dist/client/proxy/modelRouter.js +29 -0
- package/dist/client/proxy/oauthFetch.js +367 -0
- package/dist/client/proxy/proxyFetch.js +586 -0
- package/dist/client/proxy/requestLogger.js +207 -0
- package/dist/client/proxy/tokenRefresh.js +124 -0
- package/dist/client/proxy/usageStats.js +74 -0
- package/dist/client/proxy/utils/noProxyUtils.js +149 -0
- package/dist/client/rag/ChunkerFactory.js +320 -0
- package/dist/client/rag/ChunkerRegistry.js +421 -0
- package/dist/client/rag/chunkers/BaseChunker.js +143 -0
- package/dist/client/rag/chunkers/CharacterChunker.js +28 -0
- package/dist/client/rag/chunkers/HTMLChunker.js +38 -0
- package/dist/client/rag/chunkers/JSONChunker.js +68 -0
- package/dist/client/rag/chunkers/LaTeXChunker.js +63 -0
- package/dist/client/rag/chunkers/MarkdownChunker.js +306 -0
- package/dist/client/rag/chunkers/RecursiveChunker.js +139 -0
- package/dist/client/rag/chunkers/SemanticMarkdownChunker.js +138 -0
- package/dist/client/rag/chunkers/SentenceChunker.js +66 -0
- package/dist/client/rag/chunkers/TokenChunker.js +61 -0
- package/dist/client/rag/chunkers/index.js +15 -0
- package/dist/client/rag/chunking/characterChunker.js +142 -0
- package/dist/client/rag/chunking/chunkerRegistry.js +194 -0
- package/dist/client/rag/chunking/htmlChunker.js +247 -0
- package/dist/client/rag/chunking/index.js +17 -0
- package/dist/client/rag/chunking/jsonChunker.js +281 -0
- package/dist/client/rag/chunking/latexChunker.js +251 -0
- package/dist/client/rag/chunking/markdownChunker.js +373 -0
- package/dist/client/rag/chunking/recursiveChunker.js +148 -0
- package/dist/client/rag/chunking/semanticChunker.js +306 -0
- package/dist/client/rag/chunking/sentenceChunker.js +230 -0
- package/dist/client/rag/chunking/tokenChunker.js +183 -0
- package/dist/client/rag/document/MDocument.js +392 -0
- package/dist/client/rag/document/index.js +5 -0
- package/dist/client/rag/document/loaders.js +500 -0
- package/dist/client/rag/errors/RAGError.js +274 -0
- package/dist/client/rag/errors/index.js +6 -0
- package/dist/client/rag/graphRag/graphRAG.js +401 -0
- package/dist/client/rag/graphRag/index.js +4 -0
- package/dist/client/rag/index.js +141 -0
- package/dist/client/rag/metadata/MetadataExtractorFactory.js +418 -0
- package/dist/client/rag/metadata/MetadataExtractorRegistry.js +362 -0
- package/dist/client/rag/metadata/index.js +9 -0
- package/dist/client/rag/metadata/metadataExtractor.js +280 -0
- package/dist/client/rag/pipeline/RAGPipeline.js +436 -0
- package/dist/client/rag/pipeline/contextAssembly.js +341 -0
- package/dist/client/rag/pipeline/index.js +5 -0
- package/dist/client/rag/ragIntegration.js +321 -0
- package/dist/client/rag/reranker/RerankerFactory.js +430 -0
- package/dist/client/rag/reranker/RerankerRegistry.js +402 -0
- package/dist/client/rag/reranker/index.js +9 -0
- package/dist/client/rag/reranker/reranker.js +277 -0
- package/dist/client/rag/resilience/CircuitBreaker.js +431 -0
- package/dist/client/rag/resilience/RetryHandler.js +304 -0
- package/dist/client/rag/resilience/index.js +7 -0
- package/dist/client/rag/retrieval/hybridSearch.js +335 -0
- package/dist/client/rag/retrieval/index.js +5 -0
- package/dist/client/rag/retrieval/vectorQueryTool.js +307 -0
- package/dist/client/rag/types.js +8 -0
- package/dist/client/reactHooks.d.ts +239 -0
- package/dist/client/reactHooks.tsx +1483 -0
- package/dist/client/sdk/toolRegistration.js +377 -0
- package/dist/client/server/abstract/baseServerAdapter.js +575 -0
- package/dist/client/server/adapters/expressAdapter.js +486 -0
- package/dist/client/server/adapters/fastifyAdapter.js +472 -0
- package/dist/client/server/adapters/honoAdapter.js +632 -0
- package/dist/client/server/adapters/koaAdapter.js +510 -0
- package/dist/client/server/errors.js +486 -0
- package/dist/client/server/factory/serverAdapterFactory.js +160 -0
- package/dist/client/server/index.js +108 -0
- package/dist/client/server/middleware/abortSignal.js +111 -0
- package/dist/client/server/middleware/auth.js +388 -0
- package/dist/client/server/middleware/cache.js +359 -0
- package/dist/client/server/middleware/common.js +281 -0
- package/dist/client/server/middleware/deprecation.js +190 -0
- package/dist/client/server/middleware/mcpBodyAttachment.js +63 -0
- package/dist/client/server/middleware/rateLimit.js +227 -0
- package/dist/client/server/middleware/validation.js +388 -0
- package/dist/client/server/openapi/generator.js +398 -0
- package/dist/client/server/openapi/index.js +36 -0
- package/dist/client/server/openapi/schemas.js +695 -0
- package/dist/client/server/openapi/templates.js +374 -0
- package/dist/client/server/routes/agentRoutes.js +171 -0
- package/dist/client/server/routes/claudeProxyRoutes.js +1600 -0
- package/dist/client/server/routes/healthRoutes.js +187 -0
- package/dist/client/server/routes/index.js +57 -0
- package/dist/client/server/routes/mcpRoutes.js +342 -0
- package/dist/client/server/routes/memoryRoutes.js +350 -0
- package/dist/client/server/routes/openApiRoutes.js +126 -0
- package/dist/client/server/routes/toolRoutes.js +199 -0
- package/dist/client/server/streaming/dataStream.js +486 -0
- package/dist/client/server/streaming/index.js +11 -0
- package/dist/client/server/types.js +67 -0
- package/dist/client/server/utils/redaction.js +334 -0
- package/dist/client/server/utils/validation.js +243 -0
- package/dist/client/server/websocket/WebSocketHandler.js +383 -0
- package/dist/client/server/websocket/index.js +4 -0
- package/dist/client/services/server/ai/observability/instrumentation.js +808 -0
- package/dist/client/sseClient.d.ts +156 -0
- package/dist/client/sseClient.js +545 -0
- package/dist/client/streamingClient.d.ts +327 -0
- package/dist/client/streamingClient.js +917 -0
- package/dist/client/telemetry/attributes.js +100 -0
- package/dist/client/telemetry/index.js +26 -0
- package/dist/client/telemetry/telemetryService.js +308 -0
- package/dist/client/telemetry/tracers.js +17 -0
- package/dist/client/telemetry/withSpan.js +34 -0
- package/dist/client/types/actionTypes.js +6 -0
- package/dist/client/types/analytics.js +5 -0
- package/dist/client/types/authTypes.js +8 -0
- package/dist/client/types/circuitBreakerErrors.js +34 -0
- package/dist/client/types/cli.js +21 -0
- package/dist/client/types/clientTypes.js +10 -0
- package/dist/client/types/common.js +51 -0
- package/dist/client/types/configTypes.js +49 -0
- package/dist/client/types/content.js +19 -0
- package/dist/client/types/contextTypes.js +400 -0
- package/dist/client/types/conversation.js +47 -0
- package/dist/client/types/conversationMemoryInterface.js +6 -0
- package/dist/client/types/domainTypes.js +5 -0
- package/dist/client/types/errors.js +167 -0
- package/dist/client/types/evaluation.js +5 -0
- package/dist/client/types/evaluationProviders.js +5 -0
- package/dist/client/types/evaluationTypes.js +1 -0
- package/dist/client/types/externalMcp.js +6 -0
- package/dist/client/types/fileReferenceTypes.js +8 -0
- package/dist/client/types/fileTypes.js +4 -0
- package/dist/client/types/generateTypes.js +1 -0
- package/dist/client/types/guardrails.js +1 -0
- package/dist/client/types/hitlTypes.js +8 -0
- package/dist/client/types/index.js +57 -0
- package/dist/client/types/mcpTypes.js +5 -0
- package/dist/client/types/middlewareTypes.js +1 -0
- package/dist/client/types/modelTypes.js +30 -0
- package/dist/client/types/multimodal.js +135 -0
- package/dist/client/types/observability.js +6 -0
- package/dist/client/types/pptTypes.js +82 -0
- package/dist/client/types/providers.js +111 -0
- package/dist/client/types/proxyTypes.js +16 -0
- package/dist/client/types/ragTypes.js +7 -0
- package/dist/client/types/sdkTypes.js +8 -0
- package/dist/client/types/serviceTypes.js +5 -0
- package/dist/client/types/streamTypes.js +1 -0
- package/dist/client/types/subscriptionTypes.js +9 -0
- package/dist/client/types/taskClassificationTypes.js +5 -0
- package/dist/client/types/tools.js +24 -0
- package/dist/client/types/ttsTypes.js +57 -0
- package/dist/client/types/typeAliases.js +48 -0
- package/dist/client/types/utilities.js +4 -0
- package/dist/client/types/workflowTypes.js +30 -0
- package/dist/client/utils/async/withTimeout.js +98 -0
- package/dist/client/utils/asyncMutex.js +60 -0
- package/dist/client/utils/conversationMemory.js +431 -0
- package/dist/client/utils/csvProcessor.js +846 -0
- package/dist/client/utils/errorHandling.js +936 -0
- package/dist/client/utils/evaluationUtils.js +131 -0
- package/dist/client/utils/factoryProcessing.js +589 -0
- package/dist/client/utils/fileDetector.js +2161 -0
- package/dist/client/utils/imageCache.js +376 -0
- package/dist/client/utils/imageProcessor.js +704 -0
- package/dist/client/utils/logger.js +491 -0
- package/dist/client/utils/mcpDefaults.js +134 -0
- package/dist/client/utils/messageBuilder.js +1653 -0
- package/dist/client/utils/modelAliasResolver.js +54 -0
- package/dist/client/utils/modelDetection.js +80 -0
- package/dist/client/utils/modelRouter.js +292 -0
- package/dist/client/utils/multimodalOptionsBuilder.js +65 -0
- package/dist/client/utils/observabilityHelpers.js +47 -0
- package/dist/client/utils/parameterValidation.js +966 -0
- package/dist/client/utils/pdfProcessor.js +410 -0
- package/dist/client/utils/performance.js +222 -0
- package/dist/client/utils/pricing.js +340 -0
- package/dist/client/utils/promptRedaction.js +62 -0
- package/dist/client/utils/providerConfig.js +1009 -0
- package/dist/client/utils/providerHealth.js +1237 -0
- package/dist/client/utils/providerRetry.js +112 -0
- package/dist/client/utils/providerUtils.js +434 -0
- package/dist/client/utils/rateLimiter.js +200 -0
- package/dist/client/utils/redis.js +368 -0
- package/dist/client/utils/retryHandler.js +269 -0
- package/dist/client/utils/retryability.js +22 -0
- package/dist/client/utils/sanitizers/svg.js +481 -0
- package/dist/client/utils/schemaConversion.js +255 -0
- package/dist/client/utils/taskClassificationUtils.js +149 -0
- package/dist/client/utils/taskClassifier.js +94 -0
- package/dist/client/utils/thinkingConfig.js +104 -0
- package/dist/client/utils/timeout.js +359 -0
- package/dist/client/utils/tokenEstimation.js +142 -0
- package/dist/client/utils/tokenLimits.js +125 -0
- package/dist/client/utils/tokenUtils.js +239 -0
- package/dist/client/utils/toolUtils.js +75 -0
- package/dist/client/utils/transformationUtils.js +554 -0
- package/dist/client/utils/ttsProcessor.js +286 -0
- package/dist/client/utils/typeUtils.js +97 -0
- package/dist/client/utils/videoAnalysisProcessor.js +67 -0
- package/dist/client/workflow/config.js +398 -0
- package/dist/client/workflow/core/ensembleExecutor.js +407 -0
- package/dist/client/workflow/core/judgeScorer.js +544 -0
- package/dist/client/workflow/core/responseConditioner.js +225 -0
- package/dist/client/workflow/core/types/conditionerTypes.js +7 -0
- package/dist/client/workflow/core/types/ensembleTypes.js +7 -0
- package/dist/client/workflow/core/types/index.js +7 -0
- package/dist/client/workflow/core/types/judgeTypes.js +7 -0
- package/dist/client/workflow/core/types/layerTypes.js +7 -0
- package/dist/client/workflow/core/types/registryTypes.js +7 -0
- package/dist/client/workflow/core/workflowRegistry.js +304 -0
- package/dist/client/workflow/core/workflowRunner.js +586 -0
- package/dist/client/workflow/index.js +50 -0
- package/dist/client/workflow/types.js +9 -0
- package/dist/client/workflow/utils/types/index.js +7 -0
- package/dist/client/workflow/utils/workflowMetrics.js +311 -0
- package/dist/client/workflow/utils/workflowValidation.js +420 -0
- package/dist/client/workflow/workflows/adaptiveWorkflow.js +366 -0
- package/dist/client/workflow/workflows/consensusWorkflow.js +192 -0
- package/dist/client/workflow/workflows/fallbackWorkflow.js +225 -0
- package/dist/client/workflow/workflows/multiJudgeWorkflow.js +351 -0
- package/dist/client/wsClient.d.ts +130 -0
- package/dist/client/wsClient.js +369 -0
- package/dist/config/configManager.js +2 -2
- package/dist/constants/contextWindows.js +15 -13
- package/dist/constants/enums.d.ts +10 -16
- package/dist/constants/enums.js +12 -18
- package/dist/constants/index.d.ts +0 -10
- package/dist/constants/index.js +1 -1
- package/dist/constants/tokens.d.ts +29 -16
- package/dist/constants/tokens.js +23 -16
- package/dist/core/baseProvider.d.ts +5 -5
- package/dist/core/baseProvider.js +6 -6
- package/dist/core/constants.js +6 -1
- package/dist/core/dynamicModels.js +10 -6
- package/dist/core/evaluationProviders.js +1 -1
- package/dist/core/infrastructure/baseError.d.ts +1 -1
- package/dist/core/infrastructure/baseFactory.d.ts +1 -6
- package/dist/core/infrastructure/baseRegistry.d.ts +6 -5
- package/dist/core/infrastructure/index.d.ts +6 -4
- package/dist/core/infrastructure/index.js +2 -2
- package/dist/core/modelConfiguration.js +3 -1
- package/dist/core/modules/GenerationHandler.d.ts +3 -3
- package/dist/core/modules/GenerationHandler.js +49 -41
- package/dist/core/modules/MessageBuilder.d.ts +5 -5
- package/dist/core/modules/MessageBuilder.js +4 -6
- package/dist/core/modules/StreamHandler.js +26 -12
- package/dist/core/modules/TelemetryHandler.d.ts +4 -6
- package/dist/core/modules/TelemetryHandler.js +7 -6
- package/dist/core/modules/ToolsManager.d.ts +2 -12
- package/dist/core/modules/ToolsManager.js +20 -4
- package/dist/core/modules/Utilities.js +3 -1
- package/dist/core/redisConversationMemoryManager.js +3 -3
- package/dist/core/streamAnalytics.js +23 -9
- package/dist/evaluation/contextBuilder.d.ts +2 -2
- package/dist/evaluation/contextBuilder.js +2 -2
- package/dist/evaluation/index.d.ts +2 -2
- package/dist/evaluation/retryManager.js +1 -1
- package/dist/factories/providerFactory.js +2 -2
- package/dist/features/ppt/constants.js +1 -1
- package/dist/features/ppt/presentationOrchestrator.js +7 -3
- package/dist/features/ppt/slideGenerator.d.ts +2 -1
- package/dist/features/ppt/slideGenerator.js +6 -1
- package/dist/files/fileTools.d.ts +16 -247
- package/dist/files/fileTools.js +16 -15
- package/dist/index.d.ts +5 -3
- package/dist/index.js +20 -3
- package/dist/lib/adapters/providerImageAdapter.js +13 -22
- package/dist/lib/adapters/video/videoAnalyzer.d.ts +4 -4
- package/dist/lib/adapters/video/videoAnalyzer.js +3 -3
- package/dist/lib/agent/directTools.d.ts +20 -289
- package/dist/lib/agent/directTools.js +11 -10
- package/dist/lib/auth/accountPool.d.ts +68 -0
- package/dist/lib/auth/accountPool.js +179 -0
- package/dist/lib/auth/anthropicOAuth.d.ts +15 -5
- package/dist/lib/auth/anthropicOAuth.js +117 -57
- package/dist/lib/auth/index.d.ts +7 -5
- package/dist/lib/auth/index.js +6 -2
- package/dist/lib/auth/tokenStore.d.ts +71 -27
- package/dist/lib/auth/tokenStore.js +342 -64
- package/dist/lib/client/aiSdkAdapter.d.ts +196 -0
- package/dist/lib/client/aiSdkAdapter.js +488 -0
- package/dist/lib/client/auth.d.ts +248 -0
- package/dist/lib/client/auth.js +474 -0
- package/dist/lib/client/errors.d.ts +299 -0
- package/dist/lib/client/errors.js +553 -0
- package/dist/lib/client/httpClient.d.ts +297 -0
- package/dist/lib/client/httpClient.js +838 -0
- package/dist/lib/client/index.d.ts +111 -0
- package/dist/lib/client/index.js +173 -0
- package/dist/lib/client/interceptors.d.ts +283 -0
- package/dist/lib/client/interceptors.js +602 -0
- package/dist/lib/client/reactHooks.d.ts +239 -0
- package/dist/lib/client/reactHooks.js +1160 -0
- package/dist/lib/client/sseClient.d.ts +156 -0
- package/dist/lib/client/sseClient.js +546 -0
- package/dist/lib/client/streamingClient.d.ts +327 -0
- package/dist/lib/client/streamingClient.js +918 -0
- package/dist/lib/client/wsClient.d.ts +130 -0
- package/dist/lib/client/wsClient.js +370 -0
- package/dist/lib/config/configManager.js +2 -2
- package/dist/lib/constants/contextWindows.js +15 -13
- package/dist/lib/constants/enums.d.ts +10 -16
- package/dist/lib/constants/enums.js +12 -18
- package/dist/lib/constants/index.d.ts +0 -10
- package/dist/lib/constants/index.js +1 -1
- package/dist/lib/constants/tokens.d.ts +29 -16
- package/dist/lib/constants/tokens.js +23 -16
- package/dist/lib/core/baseProvider.d.ts +5 -5
- package/dist/lib/core/baseProvider.js +6 -6
- package/dist/lib/core/constants.js +6 -1
- package/dist/lib/core/dynamicModels.js +10 -6
- package/dist/lib/core/evaluationProviders.js +1 -1
- package/dist/lib/core/infrastructure/baseError.d.ts +1 -1
- package/dist/lib/core/infrastructure/baseFactory.d.ts +1 -6
- package/dist/lib/core/infrastructure/baseRegistry.d.ts +6 -5
- package/dist/lib/core/infrastructure/index.d.ts +6 -4
- package/dist/lib/core/infrastructure/index.js +2 -2
- package/dist/lib/core/modelConfiguration.js +3 -1
- package/dist/lib/core/modules/GenerationHandler.d.ts +3 -3
- package/dist/lib/core/modules/GenerationHandler.js +49 -41
- package/dist/lib/core/modules/MessageBuilder.d.ts +5 -5
- package/dist/lib/core/modules/MessageBuilder.js +4 -6
- package/dist/lib/core/modules/StreamHandler.js +26 -12
- package/dist/lib/core/modules/TelemetryHandler.d.ts +4 -6
- package/dist/lib/core/modules/TelemetryHandler.js +7 -6
- package/dist/lib/core/modules/ToolsManager.d.ts +2 -12
- package/dist/lib/core/modules/ToolsManager.js +20 -4
- package/dist/lib/core/modules/Utilities.js +3 -1
- package/dist/lib/core/redisConversationMemoryManager.js +3 -3
- package/dist/lib/core/streamAnalytics.js +23 -9
- package/dist/lib/evaluation/contextBuilder.d.ts +2 -2
- package/dist/lib/evaluation/contextBuilder.js +2 -2
- package/dist/lib/evaluation/index.d.ts +2 -2
- package/dist/lib/evaluation/retryManager.js +1 -1
- package/dist/lib/factories/providerFactory.js +2 -2
- package/dist/lib/features/ppt/constants.js +1 -1
- package/dist/lib/features/ppt/presentationOrchestrator.js +7 -3
- package/dist/lib/features/ppt/slideGenerator.d.ts +2 -1
- package/dist/lib/features/ppt/slideGenerator.js +6 -1
- package/dist/lib/files/fileTools.d.ts +16 -247
- package/dist/lib/files/fileTools.js +16 -15
- package/dist/lib/index.d.ts +5 -3
- package/dist/lib/index.js +20 -3
- package/dist/lib/mcp/batching/requestBatcher.js +1 -1
- package/dist/lib/mcp/externalServerManager.js +5 -2
- package/dist/lib/mcp/factory.js +1 -1
- package/dist/lib/mcp/index.d.ts +1 -1
- package/dist/lib/mcp/index.js +1 -1
- package/dist/lib/mcp/mcpCircuitBreaker.d.ts +1 -0
- package/dist/lib/mcp/mcpCircuitBreaker.js +30 -4
- package/dist/lib/mcp/mcpClientFactory.js +33 -4
- package/dist/lib/mcp/toolDiscoveryService.js +52 -5
- package/dist/lib/mcp/toolRegistry.js +7 -1
- package/dist/lib/memory/memoryRetrievalTools.d.ts +5 -89
- package/dist/lib/memory/memoryRetrievalTools.js +1 -1
- package/dist/lib/middleware/builtin/analytics.js +3 -0
- package/dist/lib/middleware/builtin/autoEvaluation.js +46 -24
- package/dist/lib/middleware/builtin/guardrails.js +4 -0
- package/dist/lib/middleware/builtin/lifecycle.js +10 -6
- package/dist/lib/middleware/factory.d.ts +3 -3
- package/dist/lib/middleware/factory.js +3 -2
- package/dist/lib/middleware/index.d.ts +1 -1
- package/dist/lib/middleware/registry.d.ts +2 -2
- package/dist/lib/middleware/registry.js +1 -0
- package/dist/lib/middleware/utils/guardrailsUtils.d.ts +5 -6
- package/dist/lib/middleware/utils/guardrailsUtils.js +15 -6
- package/dist/lib/neurolink.d.ts +9 -20
- package/dist/lib/neurolink.js +278 -186
- package/dist/lib/observability/retryPolicy.d.ts +2 -13
- package/dist/lib/observability/sampling/samplers.d.ts +2 -11
- package/dist/lib/observability/spanProcessor.d.ts +2 -14
- package/dist/lib/processors/base/BaseFileProcessor.js +1 -1
- package/dist/lib/processors/document/OpenDocumentProcessor.js +5 -3
- package/dist/lib/processors/media/VideoProcessor.js +157 -101
- package/dist/lib/providers/amazonBedrock.js +12 -5
- package/dist/lib/providers/amazonSagemaker.d.ts +5 -5
- package/dist/lib/providers/amazonSagemaker.js +6 -2
- package/dist/lib/providers/anthropic.d.ts +3 -3
- package/dist/lib/providers/anthropic.js +23 -192
- package/dist/lib/providers/anthropicBaseProvider.d.ts +4 -4
- package/dist/lib/providers/anthropicBaseProvider.js +24 -13
- package/dist/lib/providers/azureOpenai.d.ts +2 -2
- package/dist/lib/providers/azureOpenai.js +6 -6
- package/dist/lib/providers/googleAiStudio.d.ts +2 -2
- package/dist/lib/providers/googleAiStudio.js +15 -7
- package/dist/lib/providers/googleNativeGemini3.d.ts +3 -54
- package/dist/lib/providers/googleNativeGemini3.js +14 -10
- package/dist/lib/providers/googleVertex.d.ts +6 -6
- package/dist/lib/providers/googleVertex.js +32 -26
- package/dist/lib/providers/huggingFace.d.ts +4 -4
- package/dist/lib/providers/huggingFace.js +15 -5
- package/dist/lib/providers/litellm.d.ts +4 -4
- package/dist/lib/providers/litellm.js +54 -42
- package/dist/lib/providers/mistral.d.ts +2 -2
- package/dist/lib/providers/mistral.js +5 -4
- package/dist/lib/providers/ollama.d.ts +7 -4
- package/dist/lib/providers/ollama.js +30 -8
- package/dist/lib/providers/openAI.d.ts +2 -2
- package/dist/lib/providers/openAI.js +46 -21
- package/dist/lib/providers/openRouter.d.ts +4 -4
- package/dist/lib/providers/openRouter.js +63 -35
- package/dist/lib/providers/openaiCompatible.d.ts +2 -2
- package/dist/lib/providers/openaiCompatible.js +18 -9
- package/dist/lib/providers/providerTypeUtils.d.ts +28 -0
- package/dist/lib/providers/providerTypeUtils.js +47 -0
- package/dist/lib/providers/sagemaker/config.js +5 -5
- package/dist/lib/providers/sagemaker/language-model.d.ts +23 -13
- package/dist/lib/providers/sagemaker/language-model.js +20 -8
- package/dist/lib/proxy/accountQuota.d.ts +33 -0
- package/dist/lib/proxy/accountQuota.js +163 -0
- package/dist/lib/proxy/claudeFormat.d.ts +143 -0
- package/dist/lib/proxy/claudeFormat.js +596 -0
- package/dist/lib/proxy/cloaking/index.d.ts +44 -0
- package/dist/lib/proxy/cloaking/index.js +87 -0
- package/dist/lib/proxy/cloaking/plugins/headerScrubber.d.ts +9 -0
- package/dist/lib/proxy/cloaking/plugins/headerScrubber.js +87 -0
- package/dist/lib/proxy/cloaking/plugins/sessionIdentity.d.ts +15 -0
- package/dist/lib/proxy/cloaking/plugins/sessionIdentity.js +66 -0
- package/dist/lib/proxy/cloaking/plugins/systemPromptInjector.d.ts +11 -0
- package/dist/lib/proxy/cloaking/plugins/systemPromptInjector.js +84 -0
- package/dist/lib/proxy/cloaking/plugins/tlsFingerprint.d.ts +14 -0
- package/dist/lib/proxy/cloaking/plugins/tlsFingerprint.js +39 -0
- package/dist/lib/proxy/cloaking/plugins/wordObfuscator.d.ts +9 -0
- package/dist/lib/proxy/cloaking/plugins/wordObfuscator.js +122 -0
- package/dist/lib/proxy/cloaking/types.d.ts +1 -0
- package/dist/lib/proxy/cloaking/types.js +2 -0
- package/dist/lib/proxy/modelRouter.d.ts +10 -0
- package/dist/lib/proxy/modelRouter.js +30 -0
- package/dist/lib/proxy/oauthFetch.d.ts +36 -0
- package/dist/lib/proxy/oauthFetch.js +368 -0
- package/dist/lib/proxy/proxyConfig.d.ts +42 -0
- package/dist/lib/proxy/proxyConfig.js +500 -0
- package/dist/lib/proxy/proxyFetch.js +2 -1
- package/dist/lib/proxy/requestLogger.d.ts +50 -0
- package/dist/lib/proxy/requestLogger.js +208 -0
- package/dist/lib/proxy/tokenRefresh.d.ts +4 -0
- package/dist/lib/proxy/tokenRefresh.js +125 -0
- package/dist/lib/proxy/usageStats.d.ts +13 -0
- package/dist/lib/proxy/usageStats.js +75 -0
- package/dist/lib/rag/document/loaders.js +1 -1
- package/dist/lib/rag/pipeline/contextAssembly.d.ts +4 -7
- package/dist/lib/rag/ragIntegration.d.ts +2 -14
- package/dist/lib/rag/ragIntegration.js +1 -1
- package/dist/lib/rag/resilience/CircuitBreaker.d.ts +5 -44
- package/dist/lib/rag/resilience/RetryHandler.js +1 -1
- package/dist/lib/rag/retrieval/vectorQueryTool.d.ts +1 -9
- package/dist/lib/rag/retrieval/vectorQueryTool.js +1 -1
- package/dist/lib/sdk/toolRegistration.js +12 -1
- package/dist/lib/server/abstract/baseServerAdapter.js +2 -2
- package/dist/lib/server/adapters/honoAdapter.d.ts +6 -0
- package/dist/lib/server/adapters/honoAdapter.js +76 -10
- package/dist/lib/server/middleware/cache.js +3 -0
- package/dist/lib/server/routes/claudeProxyRoutes.d.ts +44 -0
- package/dist/lib/server/routes/claudeProxyRoutes.js +1601 -0
- package/dist/lib/server/routes/healthRoutes.js +18 -1
- package/dist/lib/server/routes/index.d.ts +7 -0
- package/dist/lib/server/routes/index.js +8 -0
- package/dist/lib/server/streaming/dataStream.d.ts +1 -5
- package/dist/lib/server/streaming/dataStream.js +3 -0
- package/dist/lib/server/utils/validation.d.ts +24 -124
- package/dist/lib/server/utils/validation.js +2 -2
- package/dist/lib/services/server/ai/observability/instrumentation.js +4 -0
- package/dist/lib/telemetry/attributes.d.ts +38 -0
- package/dist/lib/telemetry/attributes.js +40 -0
- package/dist/lib/telemetry/tracers.d.ts +1 -0
- package/dist/lib/telemetry/tracers.js +1 -0
- package/dist/lib/types/authTypes.d.ts +56 -0
- package/dist/lib/types/authTypes.js +9 -0
- package/dist/lib/types/circuitBreakerErrors.d.ts +30 -0
- package/dist/lib/types/circuitBreakerErrors.js +35 -0
- package/dist/lib/types/cli.d.ts +258 -0
- package/dist/lib/types/clientTypes.d.ts +1050 -0
- package/dist/lib/types/clientTypes.js +11 -0
- package/dist/lib/types/common.d.ts +123 -0
- package/dist/lib/types/configTypes.d.ts +49 -0
- package/dist/lib/types/configTypes.js +4 -0
- package/dist/lib/types/conversation.d.ts +0 -5
- package/dist/lib/types/evaluationTypes.d.ts +2 -2
- package/dist/lib/types/fileTypes.d.ts +47 -0
- package/dist/lib/types/generateTypes.d.ts +7 -3
- package/dist/lib/types/guardrails.d.ts +2 -2
- package/dist/lib/types/index.d.ts +4 -1
- package/dist/lib/types/index.js +5 -0
- package/dist/lib/types/middlewareTypes.d.ts +3 -3
- package/dist/lib/types/modelTypes.d.ts +7 -97
- package/dist/lib/types/modelTypes.js +3 -3
- package/dist/lib/types/observability.d.ts +37 -0
- package/dist/lib/types/providers.d.ts +107 -0
- package/dist/lib/types/proxyTypes.d.ts +536 -0
- package/dist/lib/types/proxyTypes.js +17 -0
- package/dist/lib/types/ragTypes.d.ts +49 -1
- package/dist/lib/types/streamTypes.d.ts +37 -13
- package/dist/lib/types/subscriptionTypes.d.ts +77 -0
- package/dist/lib/types/subscriptionTypes.js +2 -0
- package/dist/lib/types/tools.d.ts +45 -1
- package/dist/lib/types/typeAliases.d.ts +8 -0
- package/dist/lib/types/typeAliases.js +1 -0
- package/dist/lib/utils/async/retry.d.ts +4 -33
- package/dist/lib/utils/asyncMutex.d.ts +14 -0
- package/dist/lib/utils/asyncMutex.js +61 -0
- package/dist/lib/utils/errorHandling.d.ts +2 -1
- package/dist/lib/utils/errorHandling.js +14 -6
- package/dist/lib/utils/fileDetector.d.ts +13 -1
- package/dist/lib/utils/fileDetector.js +114 -32
- package/dist/lib/utils/imageProcessor.js +7 -7
- package/dist/lib/utils/json/safeParse.d.ts +1 -8
- package/dist/lib/utils/mcpDefaults.d.ts +1 -1
- package/dist/lib/utils/mcpDefaults.js +11 -2
- package/dist/lib/utils/messageBuilder.d.ts +5 -5
- package/dist/lib/utils/messageBuilder.js +106 -80
- package/dist/lib/utils/modelChoices.d.ts +1 -8
- package/dist/lib/utils/pdfProcessor.d.ts +1 -25
- package/dist/lib/utils/pdfProcessor.js +5 -4
- package/dist/lib/utils/pricing.js +28 -5
- package/dist/lib/utils/providerHealth.d.ts +1 -1
- package/dist/lib/utils/rateLimiter.d.ts +1 -15
- package/dist/lib/utils/redis.d.ts +1 -1
- package/dist/lib/utils/redis.js +3 -3
- package/dist/lib/utils/sanitizers/filename.d.ts +2 -22
- package/dist/lib/utils/sanitizers/index.d.ts +4 -2
- package/dist/lib/utils/sanitizers/svg.d.ts +1 -11
- package/dist/lib/utils/schemaConversion.js +4 -1
- package/dist/lib/utils/thinkingConfig.d.ts +1 -33
- package/dist/lib/utils/tokenUtils.d.ts +1 -39
- package/dist/lib/utils/videoAnalysisProcessor.d.ts +5 -5
- package/dist/lib/utils/videoAnalysisProcessor.js +2 -2
- package/dist/lib/workflow/config.d.ts +89 -1257
- package/dist/lib/workflow/utils/workflowValidation.js +1 -1
- package/dist/mcp/batching/requestBatcher.js +1 -1
- package/dist/mcp/externalServerManager.js +5 -2
- package/dist/mcp/factory.js +1 -1
- package/dist/mcp/index.d.ts +1 -1
- package/dist/mcp/index.js +1 -1
- package/dist/mcp/mcpCircuitBreaker.d.ts +1 -0
- package/dist/mcp/mcpCircuitBreaker.js +30 -4
- package/dist/mcp/mcpClientFactory.js +33 -4
- package/dist/mcp/toolDiscoveryService.js +52 -5
- package/dist/mcp/toolRegistry.js +7 -1
- package/dist/memory/memoryRetrievalTools.d.ts +5 -89
- package/dist/memory/memoryRetrievalTools.js +1 -1
- package/dist/middleware/builtin/analytics.js +3 -0
- package/dist/middleware/builtin/autoEvaluation.js +46 -24
- package/dist/middleware/builtin/guardrails.js +4 -0
- package/dist/middleware/builtin/lifecycle.js +10 -6
- package/dist/middleware/factory.d.ts +3 -3
- package/dist/middleware/factory.js +3 -2
- package/dist/middleware/index.d.ts +1 -1
- package/dist/middleware/registry.d.ts +2 -2
- package/dist/middleware/registry.js +1 -0
- package/dist/middleware/utils/guardrailsUtils.d.ts +5 -6
- package/dist/middleware/utils/guardrailsUtils.js +15 -6
- package/dist/neurolink.d.ts +9 -20
- package/dist/neurolink.js +278 -186
- package/dist/observability/retryPolicy.d.ts +2 -13
- package/dist/observability/sampling/samplers.d.ts +2 -11
- package/dist/observability/spanProcessor.d.ts +2 -14
- package/dist/processors/base/BaseFileProcessor.js +1 -1
- package/dist/processors/document/OpenDocumentProcessor.js +5 -3
- package/dist/processors/media/VideoProcessor.js +157 -101
- package/dist/providers/amazonBedrock.js +12 -5
- package/dist/providers/amazonSagemaker.d.ts +5 -5
- package/dist/providers/amazonSagemaker.js +6 -2
- package/dist/providers/anthropic.d.ts +3 -3
- package/dist/providers/anthropic.js +23 -192
- package/dist/providers/anthropicBaseProvider.d.ts +4 -4
- package/dist/providers/anthropicBaseProvider.js +24 -13
- package/dist/providers/azureOpenai.d.ts +2 -2
- package/dist/providers/azureOpenai.js +6 -6
- package/dist/providers/googleAiStudio.d.ts +2 -2
- package/dist/providers/googleAiStudio.js +15 -7
- package/dist/providers/googleNativeGemini3.d.ts +3 -54
- package/dist/providers/googleNativeGemini3.js +14 -10
- package/dist/providers/googleVertex.d.ts +6 -6
- package/dist/providers/googleVertex.js +32 -26
- package/dist/providers/huggingFace.d.ts +4 -4
- package/dist/providers/huggingFace.js +15 -5
- package/dist/providers/litellm.d.ts +4 -4
- package/dist/providers/litellm.js +54 -42
- package/dist/providers/mistral.d.ts +2 -2
- package/dist/providers/mistral.js +5 -4
- package/dist/providers/ollama.d.ts +7 -4
- package/dist/providers/ollama.js +30 -8
- package/dist/providers/openAI.d.ts +2 -2
- package/dist/providers/openAI.js +46 -21
- package/dist/providers/openRouter.d.ts +4 -4
- package/dist/providers/openRouter.js +63 -35
- package/dist/providers/openaiCompatible.d.ts +2 -2
- package/dist/providers/openaiCompatible.js +18 -9
- package/dist/providers/providerTypeUtils.d.ts +28 -0
- package/dist/providers/providerTypeUtils.js +46 -0
- package/dist/providers/sagemaker/config.js +5 -5
- package/dist/providers/sagemaker/language-model.d.ts +23 -13
- package/dist/providers/sagemaker/language-model.js +20 -8
- package/dist/proxy/accountQuota.d.ts +33 -0
- package/dist/proxy/accountQuota.js +162 -0
- package/dist/proxy/claudeFormat.d.ts +143 -0
- package/dist/proxy/claudeFormat.js +595 -0
- package/dist/proxy/cloaking/index.d.ts +44 -0
- package/dist/proxy/cloaking/index.js +86 -0
- package/dist/proxy/cloaking/plugins/headerScrubber.d.ts +9 -0
- package/dist/proxy/cloaking/plugins/headerScrubber.js +86 -0
- package/dist/proxy/cloaking/plugins/sessionIdentity.d.ts +15 -0
- package/dist/proxy/cloaking/plugins/sessionIdentity.js +65 -0
- package/dist/proxy/cloaking/plugins/systemPromptInjector.d.ts +11 -0
- package/dist/proxy/cloaking/plugins/systemPromptInjector.js +83 -0
- package/dist/proxy/cloaking/plugins/tlsFingerprint.d.ts +14 -0
- package/dist/proxy/cloaking/plugins/tlsFingerprint.js +38 -0
- package/dist/proxy/cloaking/plugins/wordObfuscator.d.ts +9 -0
- package/dist/proxy/cloaking/plugins/wordObfuscator.js +121 -0
- package/dist/proxy/cloaking/types.d.ts +1 -0
- package/dist/proxy/cloaking/types.js +1 -0
- package/dist/proxy/modelRouter.d.ts +10 -0
- package/dist/proxy/modelRouter.js +29 -0
- package/dist/proxy/oauthFetch.d.ts +36 -0
- package/dist/proxy/oauthFetch.js +367 -0
- package/dist/proxy/proxyConfig.d.ts +42 -0
- package/dist/proxy/proxyConfig.js +499 -0
- package/dist/proxy/proxyFetch.js +2 -1
- package/dist/proxy/requestLogger.d.ts +50 -0
- package/dist/proxy/requestLogger.js +207 -0
- package/dist/proxy/tokenRefresh.d.ts +4 -0
- package/dist/proxy/tokenRefresh.js +124 -0
- package/dist/proxy/usageStats.d.ts +13 -0
- package/dist/proxy/usageStats.js +74 -0
- package/dist/rag/document/loaders.js +1 -1
- package/dist/rag/pipeline/contextAssembly.d.ts +4 -7
- package/dist/rag/ragIntegration.d.ts +2 -14
- package/dist/rag/ragIntegration.js +1 -1
- package/dist/rag/resilience/CircuitBreaker.d.ts +5 -44
- package/dist/rag/resilience/RetryHandler.js +1 -1
- package/dist/rag/retrieval/vectorQueryTool.d.ts +1 -9
- package/dist/rag/retrieval/vectorQueryTool.js +1 -1
- package/dist/sdk/toolRegistration.js +12 -1
- package/dist/server/abstract/baseServerAdapter.js +2 -2
- package/dist/server/adapters/honoAdapter.d.ts +6 -0
- package/dist/server/adapters/honoAdapter.js +76 -10
- package/dist/server/middleware/cache.js +3 -0
- package/dist/server/routes/claudeProxyRoutes.d.ts +44 -0
- package/dist/server/routes/claudeProxyRoutes.js +1600 -0
- package/dist/server/routes/healthRoutes.js +18 -1
- package/dist/server/routes/index.d.ts +7 -0
- package/dist/server/routes/index.js +8 -0
- package/dist/server/streaming/dataStream.d.ts +1 -5
- package/dist/server/streaming/dataStream.js +3 -0
- package/dist/server/utils/validation.d.ts +24 -124
- package/dist/server/utils/validation.js +2 -2
- package/dist/services/server/ai/observability/instrumentation.js +4 -0
- package/dist/telemetry/attributes.d.ts +38 -0
- package/dist/telemetry/attributes.js +40 -0
- package/dist/telemetry/tracers.d.ts +1 -0
- package/dist/telemetry/tracers.js +1 -0
- package/dist/types/authTypes.d.ts +56 -0
- package/dist/types/authTypes.js +8 -0
- package/dist/types/circuitBreakerErrors.d.ts +30 -0
- package/dist/types/circuitBreakerErrors.js +34 -0
- package/dist/types/cli.d.ts +258 -0
- package/dist/types/clientTypes.d.ts +1050 -0
- package/dist/types/clientTypes.js +10 -0
- package/dist/types/common.d.ts +123 -0
- package/dist/types/configTypes.d.ts +49 -0
- package/dist/types/configTypes.js +4 -0
- package/dist/types/conversation.d.ts +0 -5
- package/dist/types/evaluationTypes.d.ts +2 -2
- package/dist/types/fileTypes.d.ts +47 -0
- package/dist/types/generateTypes.d.ts +7 -3
- package/dist/types/guardrails.d.ts +2 -2
- package/dist/types/index.d.ts +4 -1
- package/dist/types/index.js +5 -0
- package/dist/types/middlewareTypes.d.ts +3 -3
- package/dist/types/modelTypes.d.ts +7 -97
- package/dist/types/modelTypes.js +3 -3
- package/dist/types/observability.d.ts +37 -0
- package/dist/types/providers.d.ts +107 -0
- package/dist/types/proxyTypes.d.ts +536 -0
- package/dist/types/proxyTypes.js +16 -0
- package/dist/types/ragTypes.d.ts +49 -1
- package/dist/types/streamTypes.d.ts +37 -13
- package/dist/types/subscriptionTypes.d.ts +77 -0
- package/dist/types/subscriptionTypes.js +2 -0
- package/dist/types/tools.d.ts +45 -1
- package/dist/types/typeAliases.d.ts +8 -0
- package/dist/types/typeAliases.js +1 -0
- package/dist/utils/async/retry.d.ts +4 -33
- package/dist/utils/asyncMutex.d.ts +14 -0
- package/dist/utils/asyncMutex.js +60 -0
- package/dist/utils/errorHandling.d.ts +2 -1
- package/dist/utils/errorHandling.js +14 -6
- package/dist/utils/fileDetector.d.ts +13 -1
- package/dist/utils/fileDetector.js +114 -32
- package/dist/utils/imageProcessor.js +7 -7
- package/dist/utils/json/safeParse.d.ts +1 -8
- package/dist/utils/mcpDefaults.d.ts +1 -1
- package/dist/utils/mcpDefaults.js +11 -2
- package/dist/utils/messageBuilder.d.ts +5 -5
- package/dist/utils/messageBuilder.js +106 -80
- package/dist/utils/modelChoices.d.ts +1 -8
- package/dist/utils/pdfProcessor.d.ts +1 -25
- package/dist/utils/pdfProcessor.js +5 -4
- package/dist/utils/pricing.js +28 -5
- package/dist/utils/rateLimiter.d.ts +1 -15
- package/dist/utils/redis.d.ts +1 -1
- package/dist/utils/redis.js +3 -3
- package/dist/utils/sanitizers/filename.d.ts +2 -22
- package/dist/utils/sanitizers/index.d.ts +4 -2
- package/dist/utils/sanitizers/svg.d.ts +1 -11
- package/dist/utils/schemaConversion.js +4 -1
- package/dist/utils/thinkingConfig.d.ts +1 -33
- package/dist/utils/tokenUtils.d.ts +1 -39
- package/dist/utils/videoAnalysisProcessor.d.ts +5 -5
- package/dist/utils/videoAnalysisProcessor.js +2 -2
- package/dist/workflow/config.d.ts +89 -1257
- package/dist/workflow/utils/workflowValidation.js +1 -1
- package/docs-site/mcp-server/index.js +2 -3
- package/package.json +138 -105
- package/dist/lib/memory/mem0Initializer.d.ts +0 -46
- package/dist/lib/memory/mem0Initializer.js +0 -85
- package/dist/memory/mem0Initializer.d.ts +0 -46
- package/dist/memory/mem0Initializer.js +0 -84
|
@@ -0,0 +1,775 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* SageMaker Language Model Implementation
|
|
3
|
+
*
|
|
4
|
+
* This module implements the LanguageModel interface for Amazon SageMaker
|
|
5
|
+
* integration with the Vercel AI SDK.
|
|
6
|
+
*/
|
|
7
|
+
import { randomUUID } from "crypto";
|
|
8
|
+
import { SageMakerRuntimeClient } from "./client.js";
|
|
9
|
+
import { handleSageMakerError } from "./errors.js";
|
|
10
|
+
import { estimateTokenUsage, createSageMakerStream } from "./streaming.js";
|
|
11
|
+
import { createAdaptiveSemaphore } from "./adaptive-semaphore.js";
|
|
12
|
+
import { logger } from "../../utils/logger.js";
|
|
13
|
+
/**
 * Parse a millisecond delay override taken from an environment variable.
 *
 * An unset or empty value, or one that `parseInt` cannot read as a base-10
 * integer, yields `fallbackMs`. Without this guard a value such as "fast"
 * would become NaN, propagate through the Math.min/Math.max clamping in
 * calculateAdaptiveDelay, and end up as the `setTimeout` delay.
 *
 * @param {string | undefined} rawValue - Raw environment variable value.
 * @param {number} fallbackMs - Delay to use when no usable override is present.
 * @returns {number} The parsed override, or `fallbackMs`.
 */
function parseDelayOverride(rawValue, fallbackMs) {
    if (!rawValue) {
        return fallbackMs;
    }
    const parsed = parseInt(rawValue, 10);
    return Number.isNaN(parsed) ? fallbackMs : parsed;
}
/**
 * Base synthetic streaming delay in milliseconds for simulating real-time response
 * Can be configured via SAGEMAKER_BASE_STREAMING_DELAY_MS environment variable
 * (defaults to 50 when unset or not a number)
 */
const BASE_SYNTHETIC_STREAMING_DELAY_MS = parseDelayOverride(process.env.SAGEMAKER_BASE_STREAMING_DELAY_MS, 50);
/**
 * Maximum synthetic streaming delay in milliseconds to prevent excessively slow streaming
 * Can be configured via SAGEMAKER_MAX_STREAMING_DELAY_MS environment variable
 * (defaults to 200 when unset or not a number)
 */
const MAX_SYNTHETIC_STREAMING_DELAY_MS = parseDelayOverride(process.env.SAGEMAKER_MAX_STREAMING_DELAY_MS, 200);
|
|
29
|
+
/**
 * Work out the pause (in milliseconds) to insert between synthetic stream chunks.
 *
 * The base delay is scaled by 1000 / textLength (text shorter than 100
 * characters is treated as 100), then clamped to the range
 * [10, MAX_SYNTHETIC_STREAMING_DELAY_MS]. When many chunks are pending the
 * clamped value is scaled down further:
 *   - more than 20 chunks: half the delay, never below 10ms
 *   - more than 10 chunks: 70% of the delay, never below 15ms
 *
 * @param {number} textLength - Length of the full text being streamed.
 * @param {number} chunkCount - Number of chunks the text will be emitted in.
 * @returns {number} Delay in milliseconds.
 */
function calculateAdaptiveDelay(textLength, chunkCount) {
    const effectiveLength = Math.max(textLength, 100);
    const scaledDelay = BASE_SYNTHETIC_STREAMING_DELAY_MS * (1000 / effectiveLength);
    const cappedDelay = Math.min(MAX_SYNTHETIC_STREAMING_DELAY_MS, scaledDelay);
    const clampedDelay = Math.max(10, cappedDelay);
    if (chunkCount > 20) {
        return Math.max(10, clampedDelay * 0.5);
    }
    if (chunkCount > 10) {
        return Math.max(15, clampedDelay * 0.7);
    }
    return clampedDelay;
}
|
|
46
|
+
/**
 * Yield `text` piece by piece with a pause between pieces, for synthetic
 * streaming of an already-complete response.
 *
 * The text is tokenised into whitespace-delimited words, each keeping the
 * whitespace that follows it (leading whitespace becomes its own token), so
 * concatenating every yielded chunk reproduces `text` exactly. Splitting on
 * whitespace and re-joining with single spaces would flatten newlines, tabs
 * and indentation in the streamed output.
 *
 * Each chunk holds about a tenth of the tokens (at least one). The pause
 * between chunks comes from calculateAdaptiveDelay; no pause precedes the
 * first chunk. Nothing is yielded for empty or missing text.
 *
 * @param {string} text - Complete text to emit.
 * @yields {string} Consecutive slices of `text`.
 */
async function* createTextChunkIterator(text) {
    if (!text) {
        return; // No text to emit
    }
    // Leading whitespace, then every word together with its trailing whitespace.
    const tokens = text.match(/^\s+|\S+\s*/g) ?? [];
    const chunkSize = Math.max(1, Math.floor(tokens.length / 10));
    const totalChunks = Math.ceil(tokens.length / chunkSize);
    // Calculate adaptive delay based on text size and chunk count
    const adaptiveDelay = calculateAdaptiveDelay(text.length, totalChunks);
    for (let i = 0; i < tokens.length; i += chunkSize) {
        // Pause between chunks only, never before the first one.
        if (i > 0) {
            await new Promise((resolve) => setTimeout(resolve, adaptiveDelay));
        }
        yield tokens.slice(i, i + chunkSize).join("");
    }
}
|
|
70
|
+
/**
 * Default concurrency settings for batch processing.
 * NOTE(review): the code that consumes these is outside this excerpt —
 * confirm how they are applied before changing the values.
 */
// Concurrency level to start from.
const DEFAULT_INITIAL_CONCURRENCY = 5;
// Upper bound on concurrency.
const DEFAULT_MAX_CONCURRENCY = 10;
// Lower bound on concurrency.
const DEFAULT_MIN_CONCURRENCY = 1;
|
|
76
|
+
/**
|
|
77
|
+
* SageMaker Language Model implementing LanguageModel interface
|
|
78
|
+
*
|
|
79
|
+
* Token Limit Behavior:
|
|
80
|
+
* - When maxTokens is undefined, SageMaker uses the model's default token limits
|
|
81
|
+
* - When maxTokens is specified, it sets max_new_tokens parameter explicitly
|
|
82
|
+
* - This aligns with the unlimited-by-default token policy across all providers
|
|
83
|
+
*/
|
|
84
|
+
export class SageMakerLanguageModel {
|
|
85
|
+
/**
|
|
86
|
+
* Specification version for the AI SDK LanguageModel interface.
|
|
87
|
+
* Uses "v2" for structural compatibility with AI SDK v6's `LanguageModelV2`.
|
|
88
|
+
* The AI SDK checks this field to determine which interface version to use.
|
|
89
|
+
*/
|
|
90
|
+
specificationVersion = "v2";
|
|
91
|
+
provider = "sagemaker";
|
|
92
|
+
modelId;
|
|
93
|
+
supportsStreaming = true;
|
|
94
|
+
defaultObjectGenerationMode = "json";
|
|
95
|
+
/**
|
|
96
|
+
* Supported URL patterns by media type.
|
|
97
|
+
* SageMaker endpoints do not natively download URLs, so this is empty.
|
|
98
|
+
* Required by the LanguageModelV2 interface.
|
|
99
|
+
*/
|
|
100
|
+
supportedUrls = {};
|
|
101
|
+
client;
|
|
102
|
+
config;
|
|
103
|
+
modelConfig;
|
|
104
|
+
constructor(modelId, config, modelConfig) {
|
|
105
|
+
this.modelId = modelId;
|
|
106
|
+
this.config = config;
|
|
107
|
+
this.modelConfig = modelConfig;
|
|
108
|
+
this.client = new SageMakerRuntimeClient(config);
|
|
109
|
+
logger.debug("SageMaker Language Model initialized", {
|
|
110
|
+
modelId: this.modelId,
|
|
111
|
+
endpointName: this.modelConfig.endpointName,
|
|
112
|
+
provider: this.provider,
|
|
113
|
+
specificationVersion: this.specificationVersion,
|
|
114
|
+
});
|
|
115
|
+
}
|
|
116
|
+
/**
|
|
117
|
+
* Generate text synchronously using SageMaker endpoint
|
|
118
|
+
*/
|
|
119
|
+
async doGenerate(options) {
|
|
120
|
+
const startTime = Date.now();
|
|
121
|
+
try {
|
|
122
|
+
const promptText = this.extractPromptText(options);
|
|
123
|
+
logger.debug("SageMaker doGenerate called", {
|
|
124
|
+
endpointName: this.modelConfig.endpointName,
|
|
125
|
+
promptLength: promptText.length,
|
|
126
|
+
maxTokens: options.maxTokens,
|
|
127
|
+
temperature: options.temperature,
|
|
128
|
+
});
|
|
129
|
+
// Convert AI SDK options to SageMaker request format
|
|
130
|
+
const sagemakerRequest = this.convertToSageMakerRequest(options);
|
|
131
|
+
// Invoke SageMaker endpoint
|
|
132
|
+
const response = await this.client.invokeEndpoint({
|
|
133
|
+
EndpointName: this.modelConfig.endpointName,
|
|
134
|
+
Body: JSON.stringify(sagemakerRequest),
|
|
135
|
+
ContentType: "application/json",
|
|
136
|
+
Accept: "application/json",
|
|
137
|
+
});
|
|
138
|
+
// Parse SageMaker response
|
|
139
|
+
const responseBody = JSON.parse(new TextDecoder().decode(response.Body));
|
|
140
|
+
const generatedText = this.extractTextFromResponse(responseBody);
|
|
141
|
+
// Extract tool calls if present (Phase 4 enhancement)
|
|
142
|
+
const toolCalls = this.extractToolCallsFromResponse(responseBody);
|
|
143
|
+
// Calculate token usage
|
|
144
|
+
const usage = estimateTokenUsage(promptText, generatedText);
|
|
145
|
+
// Determine finish reason based on response content
|
|
146
|
+
let finishReason = "stop";
|
|
147
|
+
if (toolCalls && toolCalls.length > 0) {
|
|
148
|
+
finishReason = "tool-calls";
|
|
149
|
+
}
|
|
150
|
+
else if (responseBody.finish_reason) {
|
|
151
|
+
finishReason = this.mapSageMakerFinishReason(responseBody.finish_reason);
|
|
152
|
+
}
|
|
153
|
+
const duration = Date.now() - startTime;
|
|
154
|
+
logger.debug("SageMaker doGenerate completed", {
|
|
155
|
+
duration,
|
|
156
|
+
outputLength: generatedText.length,
|
|
157
|
+
usage,
|
|
158
|
+
toolCallsCount: toolCalls?.length || 0,
|
|
159
|
+
finishReason,
|
|
160
|
+
});
|
|
161
|
+
const result = {
|
|
162
|
+
text: generatedText,
|
|
163
|
+
usage: {
|
|
164
|
+
inputTokens: usage.promptTokens,
|
|
165
|
+
outputTokens: usage.completionTokens,
|
|
166
|
+
totalTokens: usage.total,
|
|
167
|
+
},
|
|
168
|
+
finishReason,
|
|
169
|
+
rawCall: {
|
|
170
|
+
rawPrompt: options.prompt,
|
|
171
|
+
rawSettings: {
|
|
172
|
+
maxTokens: options.maxTokens,
|
|
173
|
+
temperature: options.temperature,
|
|
174
|
+
topP: options.topP,
|
|
175
|
+
endpointName: this.modelConfig.endpointName,
|
|
176
|
+
},
|
|
177
|
+
},
|
|
178
|
+
rawResponse: {
|
|
179
|
+
headers: {
|
|
180
|
+
"content-type": response.ContentType || "application/json",
|
|
181
|
+
"invoked-variant": response.InvokedProductionVariant || "",
|
|
182
|
+
},
|
|
183
|
+
},
|
|
184
|
+
request: {
|
|
185
|
+
body: JSON.stringify(sagemakerRequest),
|
|
186
|
+
},
|
|
187
|
+
};
|
|
188
|
+
// Add tool calls to result if present
|
|
189
|
+
if (toolCalls && toolCalls.length > 0) {
|
|
190
|
+
result.toolCalls = toolCalls;
|
|
191
|
+
}
|
|
192
|
+
// Add structured data if response format was specified (Phase 4)
|
|
193
|
+
const responseFormat = sagemakerRequest
|
|
194
|
+
.response_format;
|
|
195
|
+
if (responseFormat &&
|
|
196
|
+
(responseFormat.type === "json_object" ||
|
|
197
|
+
responseFormat.type === "json_schema")) {
|
|
198
|
+
try {
|
|
199
|
+
const parsedData = JSON.parse(generatedText);
|
|
200
|
+
result.object = parsedData;
|
|
201
|
+
logger.debug("Extracted structured data from response", {
|
|
202
|
+
responseFormat: responseFormat.type,
|
|
203
|
+
hasObject: !!result.object,
|
|
204
|
+
});
|
|
205
|
+
}
|
|
206
|
+
catch (parseError) {
|
|
207
|
+
logger.warn("Failed to parse structured response as JSON", {
|
|
208
|
+
error: parseError instanceof Error
|
|
209
|
+
? parseError.message
|
|
210
|
+
: String(parseError),
|
|
211
|
+
responseText: generatedText.substring(0, 200),
|
|
212
|
+
});
|
|
213
|
+
// Keep the text response as fallback
|
|
214
|
+
}
|
|
215
|
+
}
|
|
216
|
+
return result;
|
|
217
|
+
}
|
|
218
|
+
catch (error) {
|
|
219
|
+
const duration = Date.now() - startTime;
|
|
220
|
+
logger.error("SageMaker doGenerate failed", {
|
|
221
|
+
duration,
|
|
222
|
+
error: error instanceof Error ? error.message : String(error),
|
|
223
|
+
});
|
|
224
|
+
throw handleSageMakerError(error, this.modelConfig.endpointName);
|
|
225
|
+
}
|
|
226
|
+
}
|
|
227
|
+
/**
|
|
228
|
+
* Generate text with streaming using SageMaker endpoint
|
|
229
|
+
*/
|
|
230
|
+
async doStream(options) {
|
|
231
|
+
try {
|
|
232
|
+
const promptText = this.extractPromptText(options);
|
|
233
|
+
logger.debug("SageMaker doStream called", {
|
|
234
|
+
endpointName: this.modelConfig.endpointName,
|
|
235
|
+
promptLength: promptText.length,
|
|
236
|
+
});
|
|
237
|
+
// Phase 2: Full streaming implementation with automatic detection
|
|
238
|
+
const sagemakerRequest = this.convertToSageMakerRequest(options);
|
|
239
|
+
// Add streaming parameter if model supports it
|
|
240
|
+
const requestWithStreaming = {
|
|
241
|
+
...sagemakerRequest,
|
|
242
|
+
parameters: {
|
|
243
|
+
...(typeof sagemakerRequest.parameters === "object" &&
|
|
244
|
+
sagemakerRequest.parameters !== null
|
|
245
|
+
? sagemakerRequest.parameters
|
|
246
|
+
: {}),
|
|
247
|
+
stream: true, // Will be validated by detection system
|
|
248
|
+
},
|
|
249
|
+
};
|
|
250
|
+
logger.debug("Attempting streaming generation", {
|
|
251
|
+
endpointName: this.modelConfig.endpointName,
|
|
252
|
+
hasStreamingFlag: true,
|
|
253
|
+
});
|
|
254
|
+
try {
|
|
255
|
+
// First, try to invoke with streaming
|
|
256
|
+
const response = await this.client.invokeEndpointWithStreaming({
|
|
257
|
+
EndpointName: this.modelConfig.endpointName,
|
|
258
|
+
Body: JSON.stringify(requestWithStreaming),
|
|
259
|
+
ContentType: this.modelConfig.contentType || "application/json",
|
|
260
|
+
Accept: this.modelConfig.accept || "application/json",
|
|
261
|
+
});
|
|
262
|
+
// Create intelligent streaming response
|
|
263
|
+
const stream = await createSageMakerStream(response.Body, this.modelConfig.endpointName, this.config, {
|
|
264
|
+
prompt: promptText,
|
|
265
|
+
onChunk: (chunk) => {
|
|
266
|
+
logger.debug("Streaming chunk received", {
|
|
267
|
+
contentLength: chunk.content?.length || 0,
|
|
268
|
+
done: chunk.done,
|
|
269
|
+
});
|
|
270
|
+
},
|
|
271
|
+
onComplete: (usage) => {
|
|
272
|
+
logger.debug("Streaming completed", {
|
|
273
|
+
usage,
|
|
274
|
+
endpointName: this.modelConfig.endpointName,
|
|
275
|
+
});
|
|
276
|
+
},
|
|
277
|
+
onError: (error) => {
|
|
278
|
+
logger.error("Streaming error", {
|
|
279
|
+
error: error.message,
|
|
280
|
+
endpointName: this.modelConfig.endpointName,
|
|
281
|
+
});
|
|
282
|
+
},
|
|
283
|
+
});
|
|
284
|
+
return {
|
|
285
|
+
stream: stream,
|
|
286
|
+
rawCall: {
|
|
287
|
+
rawPrompt: sagemakerRequest,
|
|
288
|
+
rawSettings: this.modelConfig,
|
|
289
|
+
},
|
|
290
|
+
rawResponse: {
|
|
291
|
+
headers: {
|
|
292
|
+
"Content-Type": response.ContentType || "application/json",
|
|
293
|
+
"X-Invoked-Production-Variant": response.InvokedProductionVariant || "unknown",
|
|
294
|
+
},
|
|
295
|
+
},
|
|
296
|
+
};
|
|
297
|
+
}
|
|
298
|
+
catch (streamingError) {
|
|
299
|
+
logger.warn("Streaming failed, falling back to non-streaming", {
|
|
300
|
+
endpointName: this.modelConfig.endpointName,
|
|
301
|
+
error: streamingError instanceof Error
|
|
302
|
+
? streamingError.message
|
|
303
|
+
: String(streamingError),
|
|
304
|
+
});
|
|
305
|
+
// Fallback: Generate normally and create synthetic stream
|
|
306
|
+
const result = await this.doGenerate(options);
|
|
307
|
+
// Create synthetic stream from complete result using async iterator pattern
|
|
308
|
+
const syntheticStream = new ReadableStream({
|
|
309
|
+
async start(controller) {
|
|
310
|
+
try {
|
|
311
|
+
// Create async iterator for text chunks
|
|
312
|
+
const textChunks = createTextChunkIterator(result.text);
|
|
313
|
+
// Process chunks with async iterator pattern
|
|
314
|
+
for await (const deltaText of textChunks) {
|
|
315
|
+
controller.enqueue({
|
|
316
|
+
type: "text-delta",
|
|
317
|
+
textDelta: deltaText,
|
|
318
|
+
});
|
|
319
|
+
}
|
|
320
|
+
// Emit completion
|
|
321
|
+
controller.enqueue({
|
|
322
|
+
type: "finish",
|
|
323
|
+
finishReason: result.finishReason,
|
|
324
|
+
usage: result.usage,
|
|
325
|
+
});
|
|
326
|
+
controller.close();
|
|
327
|
+
}
|
|
328
|
+
catch (error) {
|
|
329
|
+
controller.error(error);
|
|
330
|
+
}
|
|
331
|
+
},
|
|
332
|
+
});
|
|
333
|
+
return {
|
|
334
|
+
stream: syntheticStream,
|
|
335
|
+
rawCall: result.rawCall,
|
|
336
|
+
rawResponse: result.rawResponse,
|
|
337
|
+
request: result.request,
|
|
338
|
+
warnings: [
|
|
339
|
+
...(result.warnings || []),
|
|
340
|
+
{
|
|
341
|
+
type: "other",
|
|
342
|
+
message: "Streaming not supported, using synthetic stream",
|
|
343
|
+
},
|
|
344
|
+
],
|
|
345
|
+
};
|
|
346
|
+
}
|
|
347
|
+
}
|
|
348
|
+
catch (error) {
|
|
349
|
+
logger.error("SageMaker doStream failed", {
|
|
350
|
+
error: error instanceof Error ? error.message : String(error),
|
|
351
|
+
});
|
|
352
|
+
throw handleSageMakerError(error, this.modelConfig.endpointName);
|
|
353
|
+
}
|
|
354
|
+
}
|
|
355
|
+
/**
|
|
356
|
+
* Convert AI SDK options to SageMaker request format
|
|
357
|
+
*/
|
|
358
|
+
convertToSageMakerRequest(options) {
|
|
359
|
+
const promptText = this.extractPromptText(options);
|
|
360
|
+
// Enhanced SageMaker request format with tool support (Phase 4)
|
|
361
|
+
const request = {
|
|
362
|
+
inputs: promptText,
|
|
363
|
+
parameters: {
|
|
364
|
+
// Only include max_new_tokens if explicitly specified; let SageMaker use model defaults otherwise
|
|
365
|
+
...(options.maxTokens !== undefined
|
|
366
|
+
? { max_new_tokens: options.maxTokens }
|
|
367
|
+
: {}),
|
|
368
|
+
temperature: options.temperature || 0.7,
|
|
369
|
+
top_p: options.topP || 0.9,
|
|
370
|
+
stop: options.stopSequences || [],
|
|
371
|
+
},
|
|
372
|
+
};
|
|
373
|
+
// Add tool support if tools are present
|
|
374
|
+
const tools = options.tools;
|
|
375
|
+
if (tools && Array.isArray(tools) && tools.length > 0) {
|
|
376
|
+
request.tools = this.convertToolsToSageMakerFormat(tools);
|
|
377
|
+
// Add tool choice if specified
|
|
378
|
+
const toolChoice = options.toolChoice;
|
|
379
|
+
if (toolChoice) {
|
|
380
|
+
request.tool_choice =
|
|
381
|
+
this.convertToolChoiceToSageMakerFormat(toolChoice);
|
|
382
|
+
}
|
|
383
|
+
logger.debug("Added tool support to SageMaker request", {
|
|
384
|
+
toolCount: tools.length,
|
|
385
|
+
toolChoice: toolChoice,
|
|
386
|
+
});
|
|
387
|
+
}
|
|
388
|
+
// Add structured output support (Phase 4)
|
|
389
|
+
const responseFormat = options
|
|
390
|
+
.responseFormat;
|
|
391
|
+
if (responseFormat) {
|
|
392
|
+
request.response_format =
|
|
393
|
+
this.convertResponseFormatToSageMakerFormat(responseFormat);
|
|
394
|
+
logger.debug("Added structured output support to SageMaker request", {
|
|
395
|
+
responseFormat: responseFormat.type,
|
|
396
|
+
});
|
|
397
|
+
}
|
|
398
|
+
logger.debug("Converted to SageMaker request format", {
|
|
399
|
+
inputLength: promptText.length,
|
|
400
|
+
parameters: request.parameters,
|
|
401
|
+
hasTools: !!request.tools,
|
|
402
|
+
});
|
|
403
|
+
return request;
|
|
404
|
+
}
|
|
405
|
+
/**
|
|
406
|
+
* Convert Vercel AI SDK tools to SageMaker format
|
|
407
|
+
*/
|
|
408
|
+
convertToolsToSageMakerFormat(tools) {
|
|
409
|
+
return tools.map((tool) => {
|
|
410
|
+
if (tool.type === "function") {
|
|
411
|
+
return {
|
|
412
|
+
type: "function",
|
|
413
|
+
function: {
|
|
414
|
+
name: tool.function.name,
|
|
415
|
+
description: tool.function.description || "",
|
|
416
|
+
parameters: tool.function.parameters || {},
|
|
417
|
+
},
|
|
418
|
+
};
|
|
419
|
+
}
|
|
420
|
+
return tool; // Pass through other tool types
|
|
421
|
+
});
|
|
422
|
+
}
|
|
423
|
+
/**
|
|
424
|
+
* Convert Vercel AI SDK tool choice to SageMaker format
|
|
425
|
+
*/
|
|
426
|
+
convertToolChoiceToSageMakerFormat(toolChoice) {
|
|
427
|
+
if (typeof toolChoice === "string") {
|
|
428
|
+
return toolChoice; // 'auto', 'none', etc.
|
|
429
|
+
}
|
|
430
|
+
if (toolChoice?.type === "function") {
|
|
431
|
+
return {
|
|
432
|
+
type: "function",
|
|
433
|
+
function: {
|
|
434
|
+
name: toolChoice.function.name,
|
|
435
|
+
},
|
|
436
|
+
};
|
|
437
|
+
}
|
|
438
|
+
return toolChoice;
|
|
439
|
+
}
|
|
440
|
+
/**
|
|
441
|
+
* Convert Vercel AI SDK response format to SageMaker format (Phase 4)
|
|
442
|
+
*/
|
|
443
|
+
convertResponseFormatToSageMakerFormat(responseFormat) {
|
|
444
|
+
if (responseFormat.type === "json_object") {
|
|
445
|
+
return {
|
|
446
|
+
type: "json_object",
|
|
447
|
+
schema: responseFormat.schema || undefined,
|
|
448
|
+
};
|
|
449
|
+
}
|
|
450
|
+
if (responseFormat.type === "json_schema") {
|
|
451
|
+
return {
|
|
452
|
+
type: "json_schema",
|
|
453
|
+
json_schema: {
|
|
454
|
+
name: responseFormat.json_schema?.name || "response",
|
|
455
|
+
description: responseFormat.json_schema?.description ||
|
|
456
|
+
"Generated response",
|
|
457
|
+
schema: responseFormat.json_schema?.schema || {},
|
|
458
|
+
},
|
|
459
|
+
};
|
|
460
|
+
}
|
|
461
|
+
// Default to text
|
|
462
|
+
return {
|
|
463
|
+
type: "text",
|
|
464
|
+
};
|
|
465
|
+
}
|
|
466
|
+
/**
|
|
467
|
+
* Extract text content from AI SDK prompt format
|
|
468
|
+
*/
|
|
469
|
+
extractPromptText(options) {
|
|
470
|
+
// Check for messages first (like Ollama)
|
|
471
|
+
const messages = options.messages;
|
|
472
|
+
if (messages && Array.isArray(messages)) {
|
|
473
|
+
return messages
|
|
474
|
+
.filter((msg) => msg.role && msg.content)
|
|
475
|
+
.map((msg) => {
|
|
476
|
+
if (typeof msg.content === "string") {
|
|
477
|
+
return `${msg.role}: ${msg.content}`;
|
|
478
|
+
}
|
|
479
|
+
return `${msg.role}: ${JSON.stringify(msg.content)}`;
|
|
480
|
+
})
|
|
481
|
+
.join("\n");
|
|
482
|
+
}
|
|
483
|
+
// Fallback to prompt property
|
|
484
|
+
const prompt = options.prompt;
|
|
485
|
+
if (typeof prompt === "string") {
|
|
486
|
+
return prompt;
|
|
487
|
+
}
|
|
488
|
+
if (Array.isArray(prompt)) {
|
|
489
|
+
return prompt
|
|
490
|
+
.filter((msg) => msg.role && msg.content)
|
|
491
|
+
.map((msg) => {
|
|
492
|
+
if (typeof msg.content === "string") {
|
|
493
|
+
return `${msg.role}: ${msg.content}`;
|
|
494
|
+
}
|
|
495
|
+
return `${msg.role}: ${JSON.stringify(msg.content)}`;
|
|
496
|
+
})
|
|
497
|
+
.join("\n");
|
|
498
|
+
}
|
|
499
|
+
return String(prompt);
|
|
500
|
+
}
|
|
501
|
+
/**
|
|
502
|
+
* Extract generated text from SageMaker response
|
|
503
|
+
*/
|
|
504
|
+
extractTextFromResponse(responseBody) {
|
|
505
|
+
// Handle common SageMaker response formats
|
|
506
|
+
if (typeof responseBody === "string") {
|
|
507
|
+
return responseBody;
|
|
508
|
+
}
|
|
509
|
+
if (responseBody.generated_text) {
|
|
510
|
+
return responseBody.generated_text;
|
|
511
|
+
}
|
|
512
|
+
if (responseBody.outputs) {
|
|
513
|
+
return responseBody.outputs;
|
|
514
|
+
}
|
|
515
|
+
if (responseBody.text) {
|
|
516
|
+
return responseBody.text;
|
|
517
|
+
}
|
|
518
|
+
if (Array.isArray(responseBody) && responseBody[0]?.generated_text) {
|
|
519
|
+
return responseBody[0].generated_text;
|
|
520
|
+
}
|
|
521
|
+
// Handle response with tool calls
|
|
522
|
+
if (responseBody.choices && Array.isArray(responseBody.choices)) {
|
|
523
|
+
const choice = responseBody.choices[0];
|
|
524
|
+
if (choice?.message?.content) {
|
|
525
|
+
return choice.message.content;
|
|
526
|
+
}
|
|
527
|
+
}
|
|
528
|
+
// Fallback: stringify the entire response
|
|
529
|
+
return JSON.stringify(responseBody);
|
|
530
|
+
}
|
|
531
|
+
/**
|
|
532
|
+
* Extract tool calls from SageMaker response (Phase 4)
|
|
533
|
+
*/
|
|
534
|
+
extractToolCallsFromResponse(responseBody) {
|
|
535
|
+
// Handle OpenAI-compatible format (common for many SageMaker models)
|
|
536
|
+
if (responseBody.choices && Array.isArray(responseBody.choices)) {
|
|
537
|
+
const choice = responseBody.choices[0];
|
|
538
|
+
if (choice?.message?.tool_calls) {
|
|
539
|
+
return choice.message.tool_calls.map((toolCall) => ({
|
|
540
|
+
type: "function",
|
|
541
|
+
id: String(toolCall.id || `call_${randomUUID()}`),
|
|
542
|
+
function: {
|
|
543
|
+
name: String(toolCall.function.name),
|
|
544
|
+
arguments: String(toolCall.function.arguments),
|
|
545
|
+
},
|
|
546
|
+
}));
|
|
547
|
+
}
|
|
548
|
+
}
|
|
549
|
+
// Handle custom SageMaker tool call format
|
|
550
|
+
if (responseBody.tool_calls && Array.isArray(responseBody.tool_calls)) {
|
|
551
|
+
return responseBody.tool_calls;
|
|
552
|
+
}
|
|
553
|
+
// Handle Anthropic-style tool use
|
|
554
|
+
if (responseBody.content && Array.isArray(responseBody.content)) {
|
|
555
|
+
const toolUses = responseBody.content.filter((item) => item.type === "tool_use");
|
|
556
|
+
if (toolUses.length > 0) {
|
|
557
|
+
return toolUses.map((toolUse) => ({
|
|
558
|
+
type: "function",
|
|
559
|
+
id: String(toolUse.id || `call_${randomUUID()}`),
|
|
560
|
+
function: {
|
|
561
|
+
name: String(toolUse.name),
|
|
562
|
+
arguments: JSON.stringify(toolUse.input || {}),
|
|
563
|
+
},
|
|
564
|
+
}));
|
|
565
|
+
}
|
|
566
|
+
}
|
|
567
|
+
return undefined;
|
|
568
|
+
}
|
|
569
|
+
/**
|
|
570
|
+
* Map SageMaker finish reason to standardized format
|
|
571
|
+
*/
|
|
572
|
+
mapSageMakerFinishReason(sagemakerReason) {
|
|
573
|
+
switch (sagemakerReason?.toLowerCase()) {
|
|
574
|
+
case "stop":
|
|
575
|
+
case "end_turn":
|
|
576
|
+
case "stop_sequence":
|
|
577
|
+
return "stop";
|
|
578
|
+
case "length":
|
|
579
|
+
case "max_tokens":
|
|
580
|
+
case "max_length":
|
|
581
|
+
return "length";
|
|
582
|
+
case "content_filter":
|
|
583
|
+
case "content_filtered":
|
|
584
|
+
return "content-filter";
|
|
585
|
+
case "tool_calls":
|
|
586
|
+
case "function_call":
|
|
587
|
+
return "tool-calls";
|
|
588
|
+
case "error":
|
|
589
|
+
return "error";
|
|
590
|
+
default:
|
|
591
|
+
return "unknown";
|
|
592
|
+
}
|
|
593
|
+
}
|
|
594
|
+
/**
|
|
595
|
+
* Get model configuration summary for debugging
|
|
596
|
+
*/
|
|
597
|
+
getModelInfo() {
|
|
598
|
+
return {
|
|
599
|
+
modelId: this.modelId,
|
|
600
|
+
provider: this.provider,
|
|
601
|
+
specificationVersion: this.specificationVersion,
|
|
602
|
+
endpointName: this.modelConfig.endpointName,
|
|
603
|
+
modelType: this.modelConfig.modelType,
|
|
604
|
+
region: this.config.region,
|
|
605
|
+
};
|
|
606
|
+
}
|
|
607
|
+
/**
|
|
608
|
+
* Test basic connectivity to the SageMaker endpoint
|
|
609
|
+
*/
|
|
610
|
+
async testConnectivity() {
|
|
611
|
+
try {
|
|
612
|
+
// Use the same pattern as Ollama - pass messages directly
|
|
613
|
+
const result = await this.doGenerate({
|
|
614
|
+
inputFormat: "messages",
|
|
615
|
+
mode: { type: "regular" },
|
|
616
|
+
prompt: [
|
|
617
|
+
{ role: "user", content: [{ type: "text", text: "Hello" }] },
|
|
618
|
+
],
|
|
619
|
+
maxTokens: 10,
|
|
620
|
+
});
|
|
621
|
+
return {
|
|
622
|
+
success: !!result.text,
|
|
623
|
+
};
|
|
624
|
+
}
|
|
625
|
+
catch (error) {
|
|
626
|
+
return {
|
|
627
|
+
success: false,
|
|
628
|
+
error: error instanceof Error ? error.message : String(error),
|
|
629
|
+
};
|
|
630
|
+
}
|
|
631
|
+
}
|
|
632
|
+
/**
|
|
633
|
+
* Batch inference support (Phase 4)
|
|
634
|
+
* Process multiple prompts in a single request for efficiency
|
|
635
|
+
*/
|
|
636
|
+
async doBatchGenerate(prompts, options) {
|
|
637
|
+
try {
|
|
638
|
+
logger.debug("SageMaker batch generate called", {
|
|
639
|
+
batchSize: prompts.length,
|
|
640
|
+
endpointName: this.modelConfig.endpointName,
|
|
641
|
+
});
|
|
642
|
+
// Advanced parallel processing with dynamic concurrency and error handling
|
|
643
|
+
const results = await this.processPromptsInParallel(prompts, options);
|
|
644
|
+
logger.debug("SageMaker batch generate completed", {
|
|
645
|
+
batchSize: prompts.length,
|
|
646
|
+
successCount: results.length,
|
|
647
|
+
});
|
|
648
|
+
return results;
|
|
649
|
+
}
|
|
650
|
+
catch (error) {
|
|
651
|
+
logger.error("SageMaker batch generate failed", {
|
|
652
|
+
error: error instanceof Error ? error.message : String(error),
|
|
653
|
+
batchSize: prompts.length,
|
|
654
|
+
});
|
|
655
|
+
throw handleSageMakerError(error, this.modelConfig.endpointName);
|
|
656
|
+
}
|
|
657
|
+
}
|
|
658
|
+
/**
|
|
659
|
+
* Process prompts in parallel with advanced concurrency control and error handling
|
|
660
|
+
*/
|
|
661
|
+
async processPromptsInParallel(prompts, options) {
|
|
662
|
+
// Dynamic concurrency based on batch size and endpoint capacity
|
|
663
|
+
const INITIAL_CONCURRENCY = Math.min(this.modelConfig.initialConcurrency ?? DEFAULT_INITIAL_CONCURRENCY, prompts.length);
|
|
664
|
+
const MAX_CONCURRENCY = this.modelConfig.maxConcurrency ?? DEFAULT_MAX_CONCURRENCY;
|
|
665
|
+
const MIN_CONCURRENCY = this.modelConfig.minConcurrency ?? DEFAULT_MIN_CONCURRENCY;
|
|
666
|
+
const results = new Array(prompts.length);
|
|
667
|
+
const errors = [];
|
|
668
|
+
// Use adaptive semaphore utility for concurrency control
|
|
669
|
+
const semaphore = createAdaptiveSemaphore(INITIAL_CONCURRENCY, MAX_CONCURRENCY, MIN_CONCURRENCY);
|
|
670
|
+
// Process each prompt with adaptive concurrency
|
|
671
|
+
const processPrompt = async (prompt, index) => {
|
|
672
|
+
await semaphore.acquire();
|
|
673
|
+
const startTime = Date.now();
|
|
674
|
+
try {
|
|
675
|
+
const result = await this.doGenerate({
|
|
676
|
+
inputFormat: "messages",
|
|
677
|
+
mode: { type: "regular" },
|
|
678
|
+
prompt: [
|
|
679
|
+
{
|
|
680
|
+
role: "user",
|
|
681
|
+
content: [{ type: "text", text: prompt }],
|
|
682
|
+
},
|
|
683
|
+
],
|
|
684
|
+
maxTokens: options?.maxTokens,
|
|
685
|
+
temperature: options?.temperature,
|
|
686
|
+
topP: options?.topP,
|
|
687
|
+
});
|
|
688
|
+
const duration = Date.now() - startTime;
|
|
689
|
+
results[index] = {
|
|
690
|
+
text: result.text || "",
|
|
691
|
+
usage: {
|
|
692
|
+
promptTokens: result.usage.inputTokens ?? 0,
|
|
693
|
+
completionTokens: result.usage.outputTokens ?? 0,
|
|
694
|
+
total: result.usage.totalTokens ??
|
|
695
|
+
(result.usage.inputTokens ?? 0) +
|
|
696
|
+
(result.usage.outputTokens ?? 0),
|
|
697
|
+
},
|
|
698
|
+
finishReason: result.finishReason,
|
|
699
|
+
index,
|
|
700
|
+
};
|
|
701
|
+
// Record successful completion for adaptive concurrency adjustment
|
|
702
|
+
semaphore.recordSuccess(duration);
|
|
703
|
+
}
|
|
704
|
+
catch (error) {
|
|
705
|
+
errors.push({
|
|
706
|
+
index,
|
|
707
|
+
error: error instanceof Error ? error : new Error(String(error)),
|
|
708
|
+
});
|
|
709
|
+
// Record error for adaptive concurrency adjustment
|
|
710
|
+
const duration = Date.now() - startTime;
|
|
711
|
+
semaphore.recordError(duration);
|
|
712
|
+
// Create error result
|
|
713
|
+
results[index] = {
|
|
714
|
+
text: "",
|
|
715
|
+
usage: { promptTokens: 0, completionTokens: 0, total: 0 },
|
|
716
|
+
finishReason: "error",
|
|
717
|
+
index,
|
|
718
|
+
};
|
|
719
|
+
}
|
|
720
|
+
finally {
|
|
721
|
+
semaphore.release();
|
|
722
|
+
}
|
|
723
|
+
};
|
|
724
|
+
// Start all requests with concurrency control
|
|
725
|
+
const allPromises = prompts.map((prompt, index) => processPrompt(prompt, index));
|
|
726
|
+
// Wait for all requests to complete
|
|
727
|
+
await Promise.all(allPromises);
|
|
728
|
+
// Log final statistics using semaphore metrics
|
|
729
|
+
const metrics = semaphore.getMetrics();
|
|
730
|
+
logger.debug("Parallel batch processing completed", {
|
|
731
|
+
totalPrompts: prompts.length,
|
|
732
|
+
successCount: metrics.completedCount,
|
|
733
|
+
errorCount: metrics.errorCount,
|
|
734
|
+
finalConcurrency: metrics.currentConcurrency,
|
|
735
|
+
errorRate: metrics.errorCount / prompts.length,
|
|
736
|
+
averageResponseTime: metrics.averageResponseTime,
|
|
737
|
+
});
|
|
738
|
+
// If we have too many errors, log them for debugging
|
|
739
|
+
if (errors.length > 0) {
|
|
740
|
+
logger.warn("Batch processing encountered errors", {
|
|
741
|
+
errorCount: errors.length,
|
|
742
|
+
sampleErrors: errors.slice(0, 3).map((e) => ({
|
|
743
|
+
index: e.index,
|
|
744
|
+
message: e.error.message,
|
|
745
|
+
})),
|
|
746
|
+
});
|
|
747
|
+
}
|
|
748
|
+
// Return results in original order (already sorted by index)
|
|
749
|
+
return results.map(({ text, usage, finishReason }) => ({
|
|
750
|
+
text,
|
|
751
|
+
usage,
|
|
752
|
+
finishReason,
|
|
753
|
+
}));
|
|
754
|
+
}
|
|
755
|
+
/**
|
|
756
|
+
* Enhanced model information with batch capabilities
|
|
757
|
+
*/
|
|
758
|
+
getModelCapabilities() {
|
|
759
|
+
return {
|
|
760
|
+
...this.getModelInfo(),
|
|
761
|
+
capabilities: {
|
|
762
|
+
streaming: true,
|
|
763
|
+
toolCalling: true,
|
|
764
|
+
structuredOutput: true,
|
|
765
|
+
batchInference: true,
|
|
766
|
+
supportedResponseFormats: ["text", "json_object", "json_schema"],
|
|
767
|
+
supportedToolTypes: ["function"],
|
|
768
|
+
maxBatchSize: 100, // Increased limit with parallel processing
|
|
769
|
+
adaptiveConcurrency: true,
|
|
770
|
+
errorRecovery: true,
|
|
771
|
+
},
|
|
772
|
+
};
|
|
773
|
+
}
|
|
774
|
+
}
|
|
775
|
+
export default SageMakerLanguageModel;
|