@juspay/neurolink 9.30.0 → 9.31.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +20 -0
- package/README.md +2 -3
- package/dist/adapters/providerImageAdapter.js +13 -22
- package/dist/adapters/video/videoAnalyzer.d.ts +4 -4
- package/dist/adapters/video/videoAnalyzer.js +3 -3
- package/dist/agent/directTools.d.ts +20 -289
- package/dist/agent/directTools.js +11 -10
- package/dist/auth/accountPool.d.ts +68 -0
- package/dist/auth/accountPool.js +178 -0
- package/dist/auth/anthropicOAuth.d.ts +15 -5
- package/dist/auth/anthropicOAuth.js +117 -57
- package/dist/auth/index.d.ts +7 -5
- package/dist/auth/index.js +6 -2
- package/dist/auth/tokenStore.d.ts +71 -27
- package/dist/auth/tokenStore.js +342 -64
- package/dist/cli/commands/auth.d.ts +39 -2
- package/dist/cli/commands/auth.js +585 -36
- package/dist/cli/commands/config.d.ts +47 -574
- package/dist/cli/commands/config.js +142 -24
- package/dist/cli/commands/docs.d.ts +1 -5
- package/dist/cli/commands/observability.d.ts +1 -17
- package/dist/cli/commands/ollama.js +1 -1
- package/dist/cli/commands/proxy.d.ts +20 -0
- package/dist/cli/commands/proxy.js +1254 -0
- package/dist/cli/commands/setup-anthropic.js +1 -1
- package/dist/cli/commands/setup-azure.js +1 -1
- package/dist/cli/commands/setup-bedrock.js +2 -2
- package/dist/cli/commands/setup-gcp.js +1 -1
- package/dist/cli/commands/setup-google-ai.js +1 -1
- package/dist/cli/commands/setup-huggingface.js +2 -2
- package/dist/cli/commands/setup-mistral.js +1 -1
- package/dist/cli/commands/setup-openai.js +1 -1
- package/dist/cli/commands/setup.js +3 -3
- package/dist/cli/commands/telemetry.d.ts +1 -22
- package/dist/cli/factories/authCommandFactory.d.ts +16 -11
- package/dist/cli/factories/authCommandFactory.js +96 -1
- package/dist/cli/factories/ollamaCommandFactory.js +1 -1
- package/dist/cli/factories/sagemakerCommandFactory.js +25 -6
- package/dist/cli/index.d.ts +0 -6
- package/dist/cli/index.js +5 -2
- package/dist/cli/loop/conversationSelector.js +7 -2
- package/dist/cli/parser.js +19 -1
- package/dist/cli/utils/envManager.js +2 -2
- package/dist/cli/utils/ollamaUtils.d.ts +1 -2
- package/dist/client/adapters/providerImageAdapter.js +588 -0
- package/dist/client/adapters/tts/googleTTSHandler.js +344 -0
- package/dist/client/adapters/video/directorPipeline.js +516 -0
- package/dist/client/adapters/video/ffmpegAdapter.js +206 -0
- package/dist/client/adapters/video/frameExtractor.js +143 -0
- package/dist/client/adapters/video/vertexVideoHandler.js +763 -0
- package/dist/client/adapters/video/videoAnalyzer.js +238 -0
- package/dist/client/adapters/video/videoMerger.js +171 -0
- package/dist/client/agent/directTools.js +840 -0
- package/dist/client/aiSdkAdapter.d.ts +196 -0
- package/dist/client/aiSdkAdapter.js +487 -0
- package/dist/client/auth/anthropicOAuth.js +974 -0
- package/dist/client/auth/tokenStore.js +799 -0
- package/dist/client/auth.d.ts +248 -0
- package/dist/client/auth.js +473 -0
- package/dist/client/client/aiSdkAdapter.js +487 -0
- package/dist/client/client/auth.js +473 -0
- package/dist/client/client/errors.js +552 -0
- package/dist/client/client/httpClient.js +837 -0
- package/dist/client/client/index.js +172 -0
- package/dist/client/client/interceptors.js +601 -0
- package/dist/client/client/reactHooks.js +1159 -0
- package/dist/client/client/sseClient.js +545 -0
- package/dist/client/client/streamingClient.js +917 -0
- package/dist/client/client/wsClient.js +369 -0
- package/dist/client/config/configManager.js +303 -0
- package/dist/client/config/conversationMemory.js +86 -0
- package/dist/client/config/taskClassificationConfig.js +148 -0
- package/dist/client/constants/contextWindows.js +295 -0
- package/dist/client/constants/enums.js +853 -0
- package/dist/client/constants/index.js +207 -0
- package/dist/client/constants/performance.js +389 -0
- package/dist/client/constants/retry.js +266 -0
- package/dist/client/constants/timeouts.js +182 -0
- package/dist/client/constants/tokens.js +380 -0
- package/dist/client/constants/videoErrors.js +46 -0
- package/dist/client/context/budgetChecker.js +98 -0
- package/dist/client/context/contextCompactor.js +205 -0
- package/dist/client/context/emergencyTruncation.js +88 -0
- package/dist/client/context/errorDetection.js +171 -0
- package/dist/client/context/errors.js +21 -0
- package/dist/client/context/fileTokenBudget.js +127 -0
- package/dist/client/context/prompts/summarizationPrompt.js +117 -0
- package/dist/client/context/stages/fileReadDeduplicator.js +66 -0
- package/dist/client/context/stages/slidingWindowTruncator.js +190 -0
- package/dist/client/context/stages/structuredSummarizer.js +99 -0
- package/dist/client/context/stages/toolOutputPruner.js +52 -0
- package/dist/client/context/summarizationEngine.js +136 -0
- package/dist/client/context/toolOutputLimits.js +78 -0
- package/dist/client/context/toolPairRepair.js +66 -0
- package/dist/client/core/analytics.js +88 -0
- package/dist/client/core/baseProvider.js +1385 -0
- package/dist/client/core/constants.js +140 -0
- package/dist/client/core/conversationMemoryFactory.js +141 -0
- package/dist/client/core/conversationMemoryInitializer.js +128 -0
- package/dist/client/core/conversationMemoryManager.js +344 -0
- package/dist/client/core/dynamicModels.js +358 -0
- package/dist/client/core/evaluation.js +309 -0
- package/dist/client/core/evaluationProviders.js +248 -0
- package/dist/client/core/factory.js +412 -0
- package/dist/client/core/infrastructure/baseError.js +22 -0
- package/dist/client/core/infrastructure/baseFactory.js +54 -0
- package/dist/client/core/infrastructure/baseRegistry.js +49 -0
- package/dist/client/core/infrastructure/index.js +5 -0
- package/dist/client/core/infrastructure/retry.js +20 -0
- package/dist/client/core/infrastructure/typedEventEmitter.js +23 -0
- package/dist/client/core/modelConfiguration.js +851 -0
- package/dist/client/core/modules/GenerationHandler.js +588 -0
- package/dist/client/core/modules/MessageBuilder.js +273 -0
- package/dist/client/core/modules/StreamHandler.js +185 -0
- package/dist/client/core/modules/TelemetryHandler.js +203 -0
- package/dist/client/core/modules/ToolsManager.js +499 -0
- package/dist/client/core/modules/Utilities.js +331 -0
- package/dist/client/core/redisConversationMemoryManager.js +1435 -0
- package/dist/client/core/streamAnalytics.js +131 -0
- package/dist/client/errors.d.ts +299 -0
- package/dist/client/errors.js +552 -0
- package/dist/client/evaluation/contextBuilder.js +134 -0
- package/dist/client/evaluation/index.js +61 -0
- package/dist/client/evaluation/prompts.js +73 -0
- package/dist/client/evaluation/ragasEvaluator.js +110 -0
- package/dist/client/evaluation/retryManager.js +78 -0
- package/dist/client/evaluation/scoring.js +61 -0
- package/dist/client/factories/providerFactory.js +166 -0
- package/dist/client/factories/providerRegistry.js +166 -0
- package/dist/client/features/ppt/constants.js +896 -0
- package/dist/client/features/ppt/contentPlanner.js +529 -0
- package/dist/client/features/ppt/presentationOrchestrator.js +236 -0
- package/dist/client/features/ppt/slideGenerator.js +532 -0
- package/dist/client/features/ppt/slideRenderers.js +2383 -0
- package/dist/client/features/ppt/slideTypeInference.js +405 -0
- package/dist/client/features/ppt/types.js +13 -0
- package/dist/client/features/ppt/utils.js +443 -0
- package/dist/client/files/fileReferenceRegistry.js +1543 -0
- package/dist/client/files/fileTools.js +450 -0
- package/dist/client/files/streamingReader.js +321 -0
- package/dist/client/files/types.js +23 -0
- package/dist/client/hitl/hitlErrors.js +54 -0
- package/dist/client/hitl/hitlManager.js +460 -0
- package/dist/client/httpClient.d.ts +297 -0
- package/dist/client/httpClient.js +837 -0
- package/dist/client/index.d.ts +111 -0
- package/dist/client/index.js +511 -0
- package/dist/client/interceptors.d.ts +283 -0
- package/dist/client/interceptors.js +601 -0
- package/dist/client/mcp/agentExposure.js +356 -0
- package/dist/client/mcp/auth/index.js +11 -0
- package/dist/client/mcp/auth/oauthClientProvider.js +325 -0
- package/dist/client/mcp/auth/tokenStorage.js +134 -0
- package/dist/client/mcp/batching/index.js +10 -0
- package/dist/client/mcp/batching/requestBatcher.js +441 -0
- package/dist/client/mcp/caching/index.js +10 -0
- package/dist/client/mcp/caching/toolCache.js +433 -0
- package/dist/client/mcp/elicitation/elicitationManager.js +376 -0
- package/dist/client/mcp/elicitation/index.js +11 -0
- package/dist/client/mcp/elicitation/types.js +10 -0
- package/dist/client/mcp/elicitationProtocol.js +375 -0
- package/dist/client/mcp/enhancedToolDiscovery.js +481 -0
- package/dist/client/mcp/externalServerManager.js +1478 -0
- package/dist/client/mcp/factory.js +161 -0
- package/dist/client/mcp/flexibleToolValidator.js +161 -0
- package/dist/client/mcp/httpRateLimiter.js +391 -0
- package/dist/client/mcp/httpRetryHandler.js +178 -0
- package/dist/client/mcp/index.js +74 -0
- package/dist/client/mcp/mcpCircuitBreaker.js +427 -0
- package/dist/client/mcp/mcpClientFactory.js +708 -0
- package/dist/client/mcp/mcpRegistryClient.js +488 -0
- package/dist/client/mcp/mcpServerBase.js +373 -0
- package/dist/client/mcp/multiServerManager.js +579 -0
- package/dist/client/mcp/registry.js +158 -0
- package/dist/client/mcp/routing/index.js +10 -0
- package/dist/client/mcp/routing/toolRouter.js +416 -0
- package/dist/client/mcp/serverCapabilities.js +502 -0
- package/dist/client/mcp/servers/agent/directToolsServer.js +150 -0
- package/dist/client/mcp/toolAnnotations.js +239 -0
- package/dist/client/mcp/toolConverter.js +258 -0
- package/dist/client/mcp/toolDiscoveryService.js +798 -0
- package/dist/client/mcp/toolIntegration.js +334 -0
- package/dist/client/mcp/toolRegistry.js +719 -0
- package/dist/client/memory/hippocampusInitializer.js +19 -0
- package/dist/client/memory/memoryRetrievalTools.js +166 -0
- package/dist/client/middleware/builtin/analytics.js +132 -0
- package/dist/client/middleware/builtin/autoEvaluation.js +203 -0
- package/dist/client/middleware/builtin/guardrails.js +109 -0
- package/dist/client/middleware/builtin/lifecycle.js +168 -0
- package/dist/client/middleware/factory.js +327 -0
- package/dist/client/middleware/registry.js +295 -0
- package/dist/client/middleware/utils/guardrailsUtils.js +396 -0
- package/dist/client/models/anthropicModels.js +527 -0
- package/dist/client/neurolink.js +8015 -0
- package/dist/client/observability/exporterRegistry.js +413 -0
- package/dist/client/observability/exporters/arizeExporter.js +138 -0
- package/dist/client/observability/exporters/baseExporter.js +190 -0
- package/dist/client/observability/exporters/braintrustExporter.js +154 -0
- package/dist/client/observability/exporters/datadogExporter.js +196 -0
- package/dist/client/observability/exporters/laminarExporter.js +302 -0
- package/dist/client/observability/exporters/langfuseExporter.js +209 -0
- package/dist/client/observability/exporters/langsmithExporter.js +143 -0
- package/dist/client/observability/exporters/otelExporter.js +164 -0
- package/dist/client/observability/exporters/posthogExporter.js +287 -0
- package/dist/client/observability/exporters/sentryExporter.js +165 -0
- package/dist/client/observability/index.js +31 -0
- package/dist/client/observability/metricsAggregator.js +556 -0
- package/dist/client/observability/otelBridge.js +131 -0
- package/dist/client/observability/retryPolicy.js +383 -0
- package/dist/client/observability/sampling/samplers.js +216 -0
- package/dist/client/observability/spanProcessor.js +303 -0
- package/dist/client/observability/tokenTracker.js +413 -0
- package/dist/client/observability/types/exporterTypes.js +5 -0
- package/dist/client/observability/types/index.js +4 -0
- package/dist/client/observability/types/spanTypes.js +92 -0
- package/dist/client/observability/utils/safeMetadata.js +25 -0
- package/dist/client/observability/utils/spanSerializer.js +292 -0
- package/dist/client/processors/archive/ArchiveProcessor.js +1308 -0
- package/dist/client/processors/base/BaseFileProcessor.js +614 -0
- package/dist/client/processors/base/types.js +82 -0
- package/dist/client/processors/config/fileTypes.js +520 -0
- package/dist/client/processors/config/index.js +92 -0
- package/dist/client/processors/config/languageMap.js +410 -0
- package/dist/client/processors/config/mimeTypes.js +363 -0
- package/dist/client/processors/config/sizeLimits.js +258 -0
- package/dist/client/processors/document/ExcelProcessor.js +590 -0
- package/dist/client/processors/document/OpenDocumentProcessor.js +212 -0
- package/dist/client/processors/document/PptxProcessor.js +157 -0
- package/dist/client/processors/document/RtfProcessor.js +361 -0
- package/dist/client/processors/document/WordProcessor.js +353 -0
- package/dist/client/processors/errors/FileErrorCode.js +255 -0
- package/dist/client/processors/errors/errorHelpers.js +386 -0
- package/dist/client/processors/errors/errorSerializer.js +507 -0
- package/dist/client/processors/errors/index.js +49 -0
- package/dist/client/processors/markup/SvgProcessor.js +240 -0
- package/dist/client/processors/media/AudioProcessor.js +707 -0
- package/dist/client/processors/media/VideoProcessor.js +1045 -0
- package/dist/client/providers/amazonBedrock.js +1512 -0
- package/dist/client/providers/amazonSagemaker.js +162 -0
- package/dist/client/providers/anthropic.js +831 -0
- package/dist/client/providers/azureOpenai.js +143 -0
- package/dist/client/providers/googleAiStudio.js +1200 -0
- package/dist/client/providers/googleNativeGemini3.js +543 -0
- package/dist/client/providers/googleVertex.js +2936 -0
- package/dist/client/providers/huggingFace.js +315 -0
- package/dist/client/providers/litellm.js +488 -0
- package/dist/client/providers/mistral.js +157 -0
- package/dist/client/providers/ollama.js +1579 -0
- package/dist/client/providers/openAI.js +627 -0
- package/dist/client/providers/openRouter.js +543 -0
- package/dist/client/providers/openaiCompatible.js +290 -0
- package/dist/client/providers/providerTypeUtils.js +46 -0
- package/dist/client/providers/sagemaker/adaptive-semaphore.js +215 -0
- package/dist/client/providers/sagemaker/client.js +472 -0
- package/dist/client/providers/sagemaker/config.js +317 -0
- package/dist/client/providers/sagemaker/detection.js +606 -0
- package/dist/client/providers/sagemaker/error-constants.js +227 -0
- package/dist/client/providers/sagemaker/errors.js +299 -0
- package/dist/client/providers/sagemaker/language-model.js +775 -0
- package/dist/client/providers/sagemaker/parsers.js +634 -0
- package/dist/client/providers/sagemaker/streaming.js +331 -0
- package/dist/client/providers/sagemaker/structured-parser.js +625 -0
- package/dist/client/proxy/accountQuota.js +162 -0
- package/dist/client/proxy/claudeFormat.js +595 -0
- package/dist/client/proxy/modelRouter.js +29 -0
- package/dist/client/proxy/oauthFetch.js +367 -0
- package/dist/client/proxy/proxyFetch.js +586 -0
- package/dist/client/proxy/requestLogger.js +207 -0
- package/dist/client/proxy/tokenRefresh.js +124 -0
- package/dist/client/proxy/usageStats.js +74 -0
- package/dist/client/proxy/utils/noProxyUtils.js +149 -0
- package/dist/client/rag/ChunkerFactory.js +320 -0
- package/dist/client/rag/ChunkerRegistry.js +421 -0
- package/dist/client/rag/chunkers/BaseChunker.js +143 -0
- package/dist/client/rag/chunkers/CharacterChunker.js +28 -0
- package/dist/client/rag/chunkers/HTMLChunker.js +38 -0
- package/dist/client/rag/chunkers/JSONChunker.js +68 -0
- package/dist/client/rag/chunkers/LaTeXChunker.js +63 -0
- package/dist/client/rag/chunkers/MarkdownChunker.js +306 -0
- package/dist/client/rag/chunkers/RecursiveChunker.js +139 -0
- package/dist/client/rag/chunkers/SemanticMarkdownChunker.js +138 -0
- package/dist/client/rag/chunkers/SentenceChunker.js +66 -0
- package/dist/client/rag/chunkers/TokenChunker.js +61 -0
- package/dist/client/rag/chunkers/index.js +15 -0
- package/dist/client/rag/chunking/characterChunker.js +142 -0
- package/dist/client/rag/chunking/chunkerRegistry.js +194 -0
- package/dist/client/rag/chunking/htmlChunker.js +247 -0
- package/dist/client/rag/chunking/index.js +17 -0
- package/dist/client/rag/chunking/jsonChunker.js +281 -0
- package/dist/client/rag/chunking/latexChunker.js +251 -0
- package/dist/client/rag/chunking/markdownChunker.js +373 -0
- package/dist/client/rag/chunking/recursiveChunker.js +148 -0
- package/dist/client/rag/chunking/semanticChunker.js +306 -0
- package/dist/client/rag/chunking/sentenceChunker.js +230 -0
- package/dist/client/rag/chunking/tokenChunker.js +183 -0
- package/dist/client/rag/document/MDocument.js +392 -0
- package/dist/client/rag/document/index.js +5 -0
- package/dist/client/rag/document/loaders.js +500 -0
- package/dist/client/rag/errors/RAGError.js +274 -0
- package/dist/client/rag/errors/index.js +6 -0
- package/dist/client/rag/graphRag/graphRAG.js +401 -0
- package/dist/client/rag/graphRag/index.js +4 -0
- package/dist/client/rag/index.js +141 -0
- package/dist/client/rag/metadata/MetadataExtractorFactory.js +418 -0
- package/dist/client/rag/metadata/MetadataExtractorRegistry.js +362 -0
- package/dist/client/rag/metadata/index.js +9 -0
- package/dist/client/rag/metadata/metadataExtractor.js +280 -0
- package/dist/client/rag/pipeline/RAGPipeline.js +436 -0
- package/dist/client/rag/pipeline/contextAssembly.js +341 -0
- package/dist/client/rag/pipeline/index.js +5 -0
- package/dist/client/rag/ragIntegration.js +321 -0
- package/dist/client/rag/reranker/RerankerFactory.js +430 -0
- package/dist/client/rag/reranker/RerankerRegistry.js +402 -0
- package/dist/client/rag/reranker/index.js +9 -0
- package/dist/client/rag/reranker/reranker.js +277 -0
- package/dist/client/rag/resilience/CircuitBreaker.js +431 -0
- package/dist/client/rag/resilience/RetryHandler.js +304 -0
- package/dist/client/rag/resilience/index.js +7 -0
- package/dist/client/rag/retrieval/hybridSearch.js +335 -0
- package/dist/client/rag/retrieval/index.js +5 -0
- package/dist/client/rag/retrieval/vectorQueryTool.js +307 -0
- package/dist/client/rag/types.js +8 -0
- package/dist/client/reactHooks.d.ts +239 -0
- package/dist/client/reactHooks.tsx +1483 -0
- package/dist/client/sdk/toolRegistration.js +377 -0
- package/dist/client/server/abstract/baseServerAdapter.js +575 -0
- package/dist/client/server/adapters/expressAdapter.js +486 -0
- package/dist/client/server/adapters/fastifyAdapter.js +472 -0
- package/dist/client/server/adapters/honoAdapter.js +632 -0
- package/dist/client/server/adapters/koaAdapter.js +510 -0
- package/dist/client/server/errors.js +486 -0
- package/dist/client/server/factory/serverAdapterFactory.js +160 -0
- package/dist/client/server/index.js +108 -0
- package/dist/client/server/middleware/abortSignal.js +111 -0
- package/dist/client/server/middleware/auth.js +388 -0
- package/dist/client/server/middleware/cache.js +359 -0
- package/dist/client/server/middleware/common.js +281 -0
- package/dist/client/server/middleware/deprecation.js +190 -0
- package/dist/client/server/middleware/mcpBodyAttachment.js +63 -0
- package/dist/client/server/middleware/rateLimit.js +227 -0
- package/dist/client/server/middleware/validation.js +388 -0
- package/dist/client/server/openapi/generator.js +398 -0
- package/dist/client/server/openapi/index.js +36 -0
- package/dist/client/server/openapi/schemas.js +695 -0
- package/dist/client/server/openapi/templates.js +374 -0
- package/dist/client/server/routes/agentRoutes.js +171 -0
- package/dist/client/server/routes/claudeProxyRoutes.js +1600 -0
- package/dist/client/server/routes/healthRoutes.js +187 -0
- package/dist/client/server/routes/index.js +57 -0
- package/dist/client/server/routes/mcpRoutes.js +342 -0
- package/dist/client/server/routes/memoryRoutes.js +350 -0
- package/dist/client/server/routes/openApiRoutes.js +126 -0
- package/dist/client/server/routes/toolRoutes.js +199 -0
- package/dist/client/server/streaming/dataStream.js +486 -0
- package/dist/client/server/streaming/index.js +11 -0
- package/dist/client/server/types.js +67 -0
- package/dist/client/server/utils/redaction.js +334 -0
- package/dist/client/server/utils/validation.js +243 -0
- package/dist/client/server/websocket/WebSocketHandler.js +383 -0
- package/dist/client/server/websocket/index.js +4 -0
- package/dist/client/services/server/ai/observability/instrumentation.js +808 -0
- package/dist/client/sseClient.d.ts +156 -0
- package/dist/client/sseClient.js +545 -0
- package/dist/client/streamingClient.d.ts +327 -0
- package/dist/client/streamingClient.js +917 -0
- package/dist/client/telemetry/attributes.js +100 -0
- package/dist/client/telemetry/index.js +26 -0
- package/dist/client/telemetry/telemetryService.js +308 -0
- package/dist/client/telemetry/tracers.js +17 -0
- package/dist/client/telemetry/withSpan.js +34 -0
- package/dist/client/types/actionTypes.js +6 -0
- package/dist/client/types/analytics.js +5 -0
- package/dist/client/types/authTypes.js +8 -0
- package/dist/client/types/circuitBreakerErrors.js +34 -0
- package/dist/client/types/cli.js +21 -0
- package/dist/client/types/clientTypes.js +10 -0
- package/dist/client/types/common.js +51 -0
- package/dist/client/types/configTypes.js +49 -0
- package/dist/client/types/content.js +19 -0
- package/dist/client/types/contextTypes.js +400 -0
- package/dist/client/types/conversation.js +47 -0
- package/dist/client/types/conversationMemoryInterface.js +6 -0
- package/dist/client/types/domainTypes.js +5 -0
- package/dist/client/types/errors.js +167 -0
- package/dist/client/types/evaluation.js +5 -0
- package/dist/client/types/evaluationProviders.js +5 -0
- package/dist/client/types/evaluationTypes.js +1 -0
- package/dist/client/types/externalMcp.js +6 -0
- package/dist/client/types/fileReferenceTypes.js +8 -0
- package/dist/client/types/fileTypes.js +4 -0
- package/dist/client/types/generateTypes.js +1 -0
- package/dist/client/types/guardrails.js +1 -0
- package/dist/client/types/hitlTypes.js +8 -0
- package/dist/client/types/index.js +57 -0
- package/dist/client/types/mcpTypes.js +5 -0
- package/dist/client/types/middlewareTypes.js +1 -0
- package/dist/client/types/modelTypes.js +30 -0
- package/dist/client/types/multimodal.js +135 -0
- package/dist/client/types/observability.js +6 -0
- package/dist/client/types/pptTypes.js +82 -0
- package/dist/client/types/providers.js +111 -0
- package/dist/client/types/proxyTypes.js +16 -0
- package/dist/client/types/ragTypes.js +7 -0
- package/dist/client/types/sdkTypes.js +8 -0
- package/dist/client/types/serviceTypes.js +5 -0
- package/dist/client/types/streamTypes.js +1 -0
- package/dist/client/types/subscriptionTypes.js +9 -0
- package/dist/client/types/taskClassificationTypes.js +5 -0
- package/dist/client/types/tools.js +24 -0
- package/dist/client/types/ttsTypes.js +57 -0
- package/dist/client/types/typeAliases.js +48 -0
- package/dist/client/types/utilities.js +4 -0
- package/dist/client/types/workflowTypes.js +30 -0
- package/dist/client/utils/async/withTimeout.js +98 -0
- package/dist/client/utils/asyncMutex.js +60 -0
- package/dist/client/utils/conversationMemory.js +431 -0
- package/dist/client/utils/csvProcessor.js +846 -0
- package/dist/client/utils/errorHandling.js +936 -0
- package/dist/client/utils/evaluationUtils.js +131 -0
- package/dist/client/utils/factoryProcessing.js +589 -0
- package/dist/client/utils/fileDetector.js +2161 -0
- package/dist/client/utils/imageCache.js +376 -0
- package/dist/client/utils/imageProcessor.js +704 -0
- package/dist/client/utils/logger.js +491 -0
- package/dist/client/utils/mcpDefaults.js +134 -0
- package/dist/client/utils/messageBuilder.js +1653 -0
- package/dist/client/utils/modelAliasResolver.js +54 -0
- package/dist/client/utils/modelDetection.js +80 -0
- package/dist/client/utils/modelRouter.js +292 -0
- package/dist/client/utils/multimodalOptionsBuilder.js +65 -0
- package/dist/client/utils/observabilityHelpers.js +47 -0
- package/dist/client/utils/parameterValidation.js +966 -0
- package/dist/client/utils/pdfProcessor.js +410 -0
- package/dist/client/utils/performance.js +222 -0
- package/dist/client/utils/pricing.js +340 -0
- package/dist/client/utils/promptRedaction.js +62 -0
- package/dist/client/utils/providerConfig.js +1009 -0
- package/dist/client/utils/providerHealth.js +1237 -0
- package/dist/client/utils/providerRetry.js +112 -0
- package/dist/client/utils/providerUtils.js +434 -0
- package/dist/client/utils/rateLimiter.js +200 -0
- package/dist/client/utils/redis.js +368 -0
- package/dist/client/utils/retryHandler.js +269 -0
- package/dist/client/utils/retryability.js +22 -0
- package/dist/client/utils/sanitizers/svg.js +481 -0
- package/dist/client/utils/schemaConversion.js +255 -0
- package/dist/client/utils/taskClassificationUtils.js +149 -0
- package/dist/client/utils/taskClassifier.js +94 -0
- package/dist/client/utils/thinkingConfig.js +104 -0
- package/dist/client/utils/timeout.js +359 -0
- package/dist/client/utils/tokenEstimation.js +142 -0
- package/dist/client/utils/tokenLimits.js +125 -0
- package/dist/client/utils/tokenUtils.js +239 -0
- package/dist/client/utils/toolUtils.js +75 -0
- package/dist/client/utils/transformationUtils.js +554 -0
- package/dist/client/utils/ttsProcessor.js +286 -0
- package/dist/client/utils/typeUtils.js +97 -0
- package/dist/client/utils/videoAnalysisProcessor.js +67 -0
- package/dist/client/workflow/config.js +398 -0
- package/dist/client/workflow/core/ensembleExecutor.js +407 -0
- package/dist/client/workflow/core/judgeScorer.js +544 -0
- package/dist/client/workflow/core/responseConditioner.js +225 -0
- package/dist/client/workflow/core/types/conditionerTypes.js +7 -0
- package/dist/client/workflow/core/types/ensembleTypes.js +7 -0
- package/dist/client/workflow/core/types/index.js +7 -0
- package/dist/client/workflow/core/types/judgeTypes.js +7 -0
- package/dist/client/workflow/core/types/layerTypes.js +7 -0
- package/dist/client/workflow/core/types/registryTypes.js +7 -0
- package/dist/client/workflow/core/workflowRegistry.js +304 -0
- package/dist/client/workflow/core/workflowRunner.js +586 -0
- package/dist/client/workflow/index.js +50 -0
- package/dist/client/workflow/types.js +9 -0
- package/dist/client/workflow/utils/types/index.js +7 -0
- package/dist/client/workflow/utils/workflowMetrics.js +311 -0
- package/dist/client/workflow/utils/workflowValidation.js +420 -0
- package/dist/client/workflow/workflows/adaptiveWorkflow.js +366 -0
- package/dist/client/workflow/workflows/consensusWorkflow.js +192 -0
- package/dist/client/workflow/workflows/fallbackWorkflow.js +225 -0
- package/dist/client/workflow/workflows/multiJudgeWorkflow.js +351 -0
- package/dist/client/wsClient.d.ts +130 -0
- package/dist/client/wsClient.js +369 -0
- package/dist/config/configManager.js +2 -2
- package/dist/constants/contextWindows.js +15 -13
- package/dist/constants/enums.d.ts +10 -16
- package/dist/constants/enums.js +12 -18
- package/dist/constants/index.d.ts +0 -10
- package/dist/constants/index.js +1 -1
- package/dist/constants/tokens.d.ts +29 -16
- package/dist/constants/tokens.js +23 -16
- package/dist/core/baseProvider.d.ts +5 -5
- package/dist/core/baseProvider.js +6 -6
- package/dist/core/constants.js +6 -1
- package/dist/core/dynamicModels.js +10 -6
- package/dist/core/evaluationProviders.js +1 -1
- package/dist/core/infrastructure/baseError.d.ts +1 -1
- package/dist/core/infrastructure/baseFactory.d.ts +1 -6
- package/dist/core/infrastructure/baseRegistry.d.ts +6 -5
- package/dist/core/infrastructure/index.d.ts +6 -4
- package/dist/core/infrastructure/index.js +2 -2
- package/dist/core/modelConfiguration.js +3 -1
- package/dist/core/modules/GenerationHandler.d.ts +3 -3
- package/dist/core/modules/GenerationHandler.js +49 -41
- package/dist/core/modules/MessageBuilder.d.ts +5 -5
- package/dist/core/modules/MessageBuilder.js +4 -6
- package/dist/core/modules/StreamHandler.js +26 -12
- package/dist/core/modules/TelemetryHandler.d.ts +4 -6
- package/dist/core/modules/TelemetryHandler.js +7 -6
- package/dist/core/modules/ToolsManager.d.ts +2 -12
- package/dist/core/modules/ToolsManager.js +20 -4
- package/dist/core/modules/Utilities.js +3 -1
- package/dist/core/redisConversationMemoryManager.js +3 -3
- package/dist/core/streamAnalytics.js +23 -9
- package/dist/evaluation/contextBuilder.d.ts +2 -2
- package/dist/evaluation/contextBuilder.js +2 -2
- package/dist/evaluation/index.d.ts +2 -2
- package/dist/evaluation/retryManager.js +1 -1
- package/dist/factories/providerFactory.js +2 -2
- package/dist/features/ppt/constants.js +1 -1
- package/dist/features/ppt/presentationOrchestrator.js +7 -3
- package/dist/features/ppt/slideGenerator.d.ts +2 -1
- package/dist/features/ppt/slideGenerator.js +6 -1
- package/dist/files/fileTools.d.ts +16 -247
- package/dist/files/fileTools.js +16 -15
- package/dist/index.d.ts +5 -3
- package/dist/index.js +20 -3
- package/dist/lib/adapters/providerImageAdapter.js +13 -22
- package/dist/lib/adapters/video/videoAnalyzer.d.ts +4 -4
- package/dist/lib/adapters/video/videoAnalyzer.js +3 -3
- package/dist/lib/agent/directTools.d.ts +20 -289
- package/dist/lib/agent/directTools.js +11 -10
- package/dist/lib/auth/accountPool.d.ts +68 -0
- package/dist/lib/auth/accountPool.js +179 -0
- package/dist/lib/auth/anthropicOAuth.d.ts +15 -5
- package/dist/lib/auth/anthropicOAuth.js +117 -57
- package/dist/lib/auth/index.d.ts +7 -5
- package/dist/lib/auth/index.js +6 -2
- package/dist/lib/auth/tokenStore.d.ts +71 -27
- package/dist/lib/auth/tokenStore.js +342 -64
- package/dist/lib/client/aiSdkAdapter.d.ts +196 -0
- package/dist/lib/client/aiSdkAdapter.js +488 -0
- package/dist/lib/client/auth.d.ts +248 -0
- package/dist/lib/client/auth.js +474 -0
- package/dist/lib/client/errors.d.ts +299 -0
- package/dist/lib/client/errors.js +553 -0
- package/dist/lib/client/httpClient.d.ts +297 -0
- package/dist/lib/client/httpClient.js +838 -0
- package/dist/lib/client/index.d.ts +111 -0
- package/dist/lib/client/index.js +173 -0
- package/dist/lib/client/interceptors.d.ts +283 -0
- package/dist/lib/client/interceptors.js +602 -0
- package/dist/lib/client/reactHooks.d.ts +239 -0
- package/dist/lib/client/reactHooks.js +1160 -0
- package/dist/lib/client/sseClient.d.ts +156 -0
- package/dist/lib/client/sseClient.js +546 -0
- package/dist/lib/client/streamingClient.d.ts +327 -0
- package/dist/lib/client/streamingClient.js +918 -0
- package/dist/lib/client/wsClient.d.ts +130 -0
- package/dist/lib/client/wsClient.js +370 -0
- package/dist/lib/config/configManager.js +2 -2
- package/dist/lib/constants/contextWindows.js +15 -13
- package/dist/lib/constants/enums.d.ts +10 -16
- package/dist/lib/constants/enums.js +12 -18
- package/dist/lib/constants/index.d.ts +0 -10
- package/dist/lib/constants/index.js +1 -1
- package/dist/lib/constants/tokens.d.ts +29 -16
- package/dist/lib/constants/tokens.js +23 -16
- package/dist/lib/core/baseProvider.d.ts +5 -5
- package/dist/lib/core/baseProvider.js +6 -6
- package/dist/lib/core/constants.js +6 -1
- package/dist/lib/core/dynamicModels.js +10 -6
- package/dist/lib/core/evaluationProviders.js +1 -1
- package/dist/lib/core/infrastructure/baseError.d.ts +1 -1
- package/dist/lib/core/infrastructure/baseFactory.d.ts +1 -6
- package/dist/lib/core/infrastructure/baseRegistry.d.ts +6 -5
- package/dist/lib/core/infrastructure/index.d.ts +6 -4
- package/dist/lib/core/infrastructure/index.js +2 -2
- package/dist/lib/core/modelConfiguration.js +3 -1
- package/dist/lib/core/modules/GenerationHandler.d.ts +3 -3
- package/dist/lib/core/modules/GenerationHandler.js +49 -41
- package/dist/lib/core/modules/MessageBuilder.d.ts +5 -5
- package/dist/lib/core/modules/MessageBuilder.js +4 -6
- package/dist/lib/core/modules/StreamHandler.js +26 -12
- package/dist/lib/core/modules/TelemetryHandler.d.ts +4 -6
- package/dist/lib/core/modules/TelemetryHandler.js +7 -6
- package/dist/lib/core/modules/ToolsManager.d.ts +2 -12
- package/dist/lib/core/modules/ToolsManager.js +20 -4
- package/dist/lib/core/modules/Utilities.js +3 -1
- package/dist/lib/core/redisConversationMemoryManager.js +3 -3
- package/dist/lib/core/streamAnalytics.js +23 -9
- package/dist/lib/evaluation/contextBuilder.d.ts +2 -2
- package/dist/lib/evaluation/contextBuilder.js +2 -2
- package/dist/lib/evaluation/index.d.ts +2 -2
- package/dist/lib/evaluation/retryManager.js +1 -1
- package/dist/lib/factories/providerFactory.js +2 -2
- package/dist/lib/features/ppt/constants.js +1 -1
- package/dist/lib/features/ppt/presentationOrchestrator.js +7 -3
- package/dist/lib/features/ppt/slideGenerator.d.ts +2 -1
- package/dist/lib/features/ppt/slideGenerator.js +6 -1
- package/dist/lib/files/fileTools.d.ts +16 -247
- package/dist/lib/files/fileTools.js +16 -15
- package/dist/lib/index.d.ts +5 -3
- package/dist/lib/index.js +20 -3
- package/dist/lib/mcp/batching/requestBatcher.js +1 -1
- package/dist/lib/mcp/externalServerManager.js +5 -2
- package/dist/lib/mcp/factory.js +1 -1
- package/dist/lib/mcp/index.d.ts +1 -1
- package/dist/lib/mcp/index.js +1 -1
- package/dist/lib/mcp/mcpCircuitBreaker.d.ts +1 -0
- package/dist/lib/mcp/mcpCircuitBreaker.js +30 -4
- package/dist/lib/mcp/mcpClientFactory.js +33 -4
- package/dist/lib/mcp/toolDiscoveryService.js +52 -5
- package/dist/lib/mcp/toolRegistry.js +7 -1
- package/dist/lib/memory/memoryRetrievalTools.d.ts +5 -89
- package/dist/lib/memory/memoryRetrievalTools.js +1 -1
- package/dist/lib/middleware/builtin/analytics.js +3 -0
- package/dist/lib/middleware/builtin/autoEvaluation.js +46 -24
- package/dist/lib/middleware/builtin/guardrails.js +4 -0
- package/dist/lib/middleware/builtin/lifecycle.js +10 -6
- package/dist/lib/middleware/factory.d.ts +3 -3
- package/dist/lib/middleware/factory.js +3 -2
- package/dist/lib/middleware/index.d.ts +1 -1
- package/dist/lib/middleware/registry.d.ts +2 -2
- package/dist/lib/middleware/registry.js +1 -0
- package/dist/lib/middleware/utils/guardrailsUtils.d.ts +5 -6
- package/dist/lib/middleware/utils/guardrailsUtils.js +15 -6
- package/dist/lib/neurolink.d.ts +9 -20
- package/dist/lib/neurolink.js +278 -186
- package/dist/lib/observability/retryPolicy.d.ts +2 -13
- package/dist/lib/observability/sampling/samplers.d.ts +2 -11
- package/dist/lib/observability/spanProcessor.d.ts +2 -14
- package/dist/lib/processors/base/BaseFileProcessor.js +1 -1
- package/dist/lib/processors/document/OpenDocumentProcessor.js +5 -3
- package/dist/lib/processors/media/VideoProcessor.js +157 -101
- package/dist/lib/providers/amazonBedrock.js +12 -5
- package/dist/lib/providers/amazonSagemaker.d.ts +5 -5
- package/dist/lib/providers/amazonSagemaker.js +6 -2
- package/dist/lib/providers/anthropic.d.ts +3 -3
- package/dist/lib/providers/anthropic.js +23 -192
- package/dist/lib/providers/anthropicBaseProvider.d.ts +4 -4
- package/dist/lib/providers/anthropicBaseProvider.js +24 -13
- package/dist/lib/providers/azureOpenai.d.ts +2 -2
- package/dist/lib/providers/azureOpenai.js +6 -6
- package/dist/lib/providers/googleAiStudio.d.ts +2 -2
- package/dist/lib/providers/googleAiStudio.js +15 -7
- package/dist/lib/providers/googleNativeGemini3.d.ts +3 -54
- package/dist/lib/providers/googleNativeGemini3.js +14 -10
- package/dist/lib/providers/googleVertex.d.ts +6 -6
- package/dist/lib/providers/googleVertex.js +32 -26
- package/dist/lib/providers/huggingFace.d.ts +4 -4
- package/dist/lib/providers/huggingFace.js +15 -5
- package/dist/lib/providers/litellm.d.ts +4 -4
- package/dist/lib/providers/litellm.js +54 -42
- package/dist/lib/providers/mistral.d.ts +2 -2
- package/dist/lib/providers/mistral.js +5 -4
- package/dist/lib/providers/ollama.d.ts +7 -4
- package/dist/lib/providers/ollama.js +30 -8
- package/dist/lib/providers/openAI.d.ts +2 -2
- package/dist/lib/providers/openAI.js +46 -21
- package/dist/lib/providers/openRouter.d.ts +4 -4
- package/dist/lib/providers/openRouter.js +63 -35
- package/dist/lib/providers/openaiCompatible.d.ts +2 -2
- package/dist/lib/providers/openaiCompatible.js +18 -9
- package/dist/lib/providers/providerTypeUtils.d.ts +28 -0
- package/dist/lib/providers/providerTypeUtils.js +47 -0
- package/dist/lib/providers/sagemaker/config.js +5 -5
- package/dist/lib/providers/sagemaker/language-model.d.ts +23 -13
- package/dist/lib/providers/sagemaker/language-model.js +20 -8
- package/dist/lib/proxy/accountQuota.d.ts +33 -0
- package/dist/lib/proxy/accountQuota.js +163 -0
- package/dist/lib/proxy/claudeFormat.d.ts +143 -0
- package/dist/lib/proxy/claudeFormat.js +596 -0
- package/dist/lib/proxy/cloaking/index.d.ts +44 -0
- package/dist/lib/proxy/cloaking/index.js +87 -0
- package/dist/lib/proxy/cloaking/plugins/headerScrubber.d.ts +9 -0
- package/dist/lib/proxy/cloaking/plugins/headerScrubber.js +87 -0
- package/dist/lib/proxy/cloaking/plugins/sessionIdentity.d.ts +15 -0
- package/dist/lib/proxy/cloaking/plugins/sessionIdentity.js +66 -0
- package/dist/lib/proxy/cloaking/plugins/systemPromptInjector.d.ts +11 -0
- package/dist/lib/proxy/cloaking/plugins/systemPromptInjector.js +84 -0
- package/dist/lib/proxy/cloaking/plugins/tlsFingerprint.d.ts +14 -0
- package/dist/lib/proxy/cloaking/plugins/tlsFingerprint.js +39 -0
- package/dist/lib/proxy/cloaking/plugins/wordObfuscator.d.ts +9 -0
- package/dist/lib/proxy/cloaking/plugins/wordObfuscator.js +122 -0
- package/dist/lib/proxy/cloaking/types.d.ts +1 -0
- package/dist/lib/proxy/cloaking/types.js +2 -0
- package/dist/lib/proxy/modelRouter.d.ts +10 -0
- package/dist/lib/proxy/modelRouter.js +30 -0
- package/dist/lib/proxy/oauthFetch.d.ts +36 -0
- package/dist/lib/proxy/oauthFetch.js +368 -0
- package/dist/lib/proxy/proxyConfig.d.ts +42 -0
- package/dist/lib/proxy/proxyConfig.js +500 -0
- package/dist/lib/proxy/proxyFetch.js +2 -1
- package/dist/lib/proxy/requestLogger.d.ts +50 -0
- package/dist/lib/proxy/requestLogger.js +208 -0
- package/dist/lib/proxy/tokenRefresh.d.ts +4 -0
- package/dist/lib/proxy/tokenRefresh.js +125 -0
- package/dist/lib/proxy/usageStats.d.ts +13 -0
- package/dist/lib/proxy/usageStats.js +75 -0
- package/dist/lib/rag/document/loaders.js +1 -1
- package/dist/lib/rag/pipeline/contextAssembly.d.ts +4 -7
- package/dist/lib/rag/ragIntegration.d.ts +2 -14
- package/dist/lib/rag/ragIntegration.js +1 -1
- package/dist/lib/rag/resilience/CircuitBreaker.d.ts +5 -44
- package/dist/lib/rag/resilience/RetryHandler.js +1 -1
- package/dist/lib/rag/retrieval/vectorQueryTool.d.ts +1 -9
- package/dist/lib/rag/retrieval/vectorQueryTool.js +1 -1
- package/dist/lib/sdk/toolRegistration.js +12 -1
- package/dist/lib/server/abstract/baseServerAdapter.js +2 -2
- package/dist/lib/server/adapters/honoAdapter.d.ts +6 -0
- package/dist/lib/server/adapters/honoAdapter.js +76 -10
- package/dist/lib/server/middleware/cache.js +3 -0
- package/dist/lib/server/routes/claudeProxyRoutes.d.ts +44 -0
- package/dist/lib/server/routes/claudeProxyRoutes.js +1601 -0
- package/dist/lib/server/routes/healthRoutes.js +18 -1
- package/dist/lib/server/routes/index.d.ts +7 -0
- package/dist/lib/server/routes/index.js +8 -0
- package/dist/lib/server/streaming/dataStream.d.ts +1 -5
- package/dist/lib/server/streaming/dataStream.js +3 -0
- package/dist/lib/server/utils/validation.d.ts +24 -124
- package/dist/lib/server/utils/validation.js +2 -2
- package/dist/lib/services/server/ai/observability/instrumentation.js +4 -0
- package/dist/lib/telemetry/attributes.d.ts +38 -0
- package/dist/lib/telemetry/attributes.js +40 -0
- package/dist/lib/telemetry/tracers.d.ts +1 -0
- package/dist/lib/telemetry/tracers.js +1 -0
- package/dist/lib/types/authTypes.d.ts +56 -0
- package/dist/lib/types/authTypes.js +9 -0
- package/dist/lib/types/circuitBreakerErrors.d.ts +30 -0
- package/dist/lib/types/circuitBreakerErrors.js +35 -0
- package/dist/lib/types/cli.d.ts +258 -0
- package/dist/lib/types/clientTypes.d.ts +1050 -0
- package/dist/lib/types/clientTypes.js +11 -0
- package/dist/lib/types/common.d.ts +123 -0
- package/dist/lib/types/configTypes.d.ts +49 -0
- package/dist/lib/types/configTypes.js +4 -0
- package/dist/lib/types/conversation.d.ts +0 -5
- package/dist/lib/types/evaluationTypes.d.ts +2 -2
- package/dist/lib/types/fileTypes.d.ts +47 -0
- package/dist/lib/types/generateTypes.d.ts +7 -3
- package/dist/lib/types/guardrails.d.ts +2 -2
- package/dist/lib/types/index.d.ts +4 -1
- package/dist/lib/types/index.js +5 -0
- package/dist/lib/types/middlewareTypes.d.ts +3 -3
- package/dist/lib/types/modelTypes.d.ts +7 -97
- package/dist/lib/types/modelTypes.js +3 -3
- package/dist/lib/types/observability.d.ts +37 -0
- package/dist/lib/types/providers.d.ts +107 -0
- package/dist/lib/types/proxyTypes.d.ts +536 -0
- package/dist/lib/types/proxyTypes.js +17 -0
- package/dist/lib/types/ragTypes.d.ts +49 -1
- package/dist/lib/types/streamTypes.d.ts +37 -13
- package/dist/lib/types/subscriptionTypes.d.ts +77 -0
- package/dist/lib/types/subscriptionTypes.js +2 -0
- package/dist/lib/types/tools.d.ts +45 -1
- package/dist/lib/types/typeAliases.d.ts +8 -0
- package/dist/lib/types/typeAliases.js +1 -0
- package/dist/lib/utils/async/retry.d.ts +4 -33
- package/dist/lib/utils/asyncMutex.d.ts +14 -0
- package/dist/lib/utils/asyncMutex.js +61 -0
- package/dist/lib/utils/errorHandling.d.ts +2 -1
- package/dist/lib/utils/errorHandling.js +14 -6
- package/dist/lib/utils/fileDetector.d.ts +13 -1
- package/dist/lib/utils/fileDetector.js +114 -32
- package/dist/lib/utils/imageProcessor.js +7 -7
- package/dist/lib/utils/json/safeParse.d.ts +1 -8
- package/dist/lib/utils/mcpDefaults.d.ts +1 -1
- package/dist/lib/utils/mcpDefaults.js +11 -2
- package/dist/lib/utils/messageBuilder.d.ts +5 -5
- package/dist/lib/utils/messageBuilder.js +106 -80
- package/dist/lib/utils/modelChoices.d.ts +1 -8
- package/dist/lib/utils/pdfProcessor.d.ts +1 -25
- package/dist/lib/utils/pdfProcessor.js +5 -4
- package/dist/lib/utils/pricing.js +28 -5
- package/dist/lib/utils/providerHealth.d.ts +1 -1
- package/dist/lib/utils/rateLimiter.d.ts +1 -15
- package/dist/lib/utils/redis.d.ts +1 -1
- package/dist/lib/utils/redis.js +3 -3
- package/dist/lib/utils/sanitizers/filename.d.ts +2 -22
- package/dist/lib/utils/sanitizers/index.d.ts +4 -2
- package/dist/lib/utils/sanitizers/svg.d.ts +1 -11
- package/dist/lib/utils/schemaConversion.js +4 -1
- package/dist/lib/utils/thinkingConfig.d.ts +1 -33
- package/dist/lib/utils/tokenUtils.d.ts +1 -39
- package/dist/lib/utils/videoAnalysisProcessor.d.ts +5 -5
- package/dist/lib/utils/videoAnalysisProcessor.js +2 -2
- package/dist/lib/workflow/config.d.ts +89 -1257
- package/dist/lib/workflow/utils/workflowValidation.js +1 -1
- package/dist/mcp/batching/requestBatcher.js +1 -1
- package/dist/mcp/externalServerManager.js +5 -2
- package/dist/mcp/factory.js +1 -1
- package/dist/mcp/index.d.ts +1 -1
- package/dist/mcp/index.js +1 -1
- package/dist/mcp/mcpCircuitBreaker.d.ts +1 -0
- package/dist/mcp/mcpCircuitBreaker.js +30 -4
- package/dist/mcp/mcpClientFactory.js +33 -4
- package/dist/mcp/toolDiscoveryService.js +52 -5
- package/dist/mcp/toolRegistry.js +7 -1
- package/dist/memory/memoryRetrievalTools.d.ts +5 -89
- package/dist/memory/memoryRetrievalTools.js +1 -1
- package/dist/middleware/builtin/analytics.js +3 -0
- package/dist/middleware/builtin/autoEvaluation.js +46 -24
- package/dist/middleware/builtin/guardrails.js +4 -0
- package/dist/middleware/builtin/lifecycle.js +10 -6
- package/dist/middleware/factory.d.ts +3 -3
- package/dist/middleware/factory.js +3 -2
- package/dist/middleware/index.d.ts +1 -1
- package/dist/middleware/registry.d.ts +2 -2
- package/dist/middleware/registry.js +1 -0
- package/dist/middleware/utils/guardrailsUtils.d.ts +5 -6
- package/dist/middleware/utils/guardrailsUtils.js +15 -6
- package/dist/neurolink.d.ts +9 -20
- package/dist/neurolink.js +278 -186
- package/dist/observability/retryPolicy.d.ts +2 -13
- package/dist/observability/sampling/samplers.d.ts +2 -11
- package/dist/observability/spanProcessor.d.ts +2 -14
- package/dist/processors/base/BaseFileProcessor.js +1 -1
- package/dist/processors/document/OpenDocumentProcessor.js +5 -3
- package/dist/processors/media/VideoProcessor.js +157 -101
- package/dist/providers/amazonBedrock.js +12 -5
- package/dist/providers/amazonSagemaker.d.ts +5 -5
- package/dist/providers/amazonSagemaker.js +6 -2
- package/dist/providers/anthropic.d.ts +3 -3
- package/dist/providers/anthropic.js +23 -192
- package/dist/providers/anthropicBaseProvider.d.ts +4 -4
- package/dist/providers/anthropicBaseProvider.js +24 -13
- package/dist/providers/azureOpenai.d.ts +2 -2
- package/dist/providers/azureOpenai.js +6 -6
- package/dist/providers/googleAiStudio.d.ts +2 -2
- package/dist/providers/googleAiStudio.js +15 -7
- package/dist/providers/googleNativeGemini3.d.ts +3 -54
- package/dist/providers/googleNativeGemini3.js +14 -10
- package/dist/providers/googleVertex.d.ts +6 -6
- package/dist/providers/googleVertex.js +32 -26
- package/dist/providers/huggingFace.d.ts +4 -4
- package/dist/providers/huggingFace.js +15 -5
- package/dist/providers/litellm.d.ts +4 -4
- package/dist/providers/litellm.js +54 -42
- package/dist/providers/mistral.d.ts +2 -2
- package/dist/providers/mistral.js +5 -4
- package/dist/providers/ollama.d.ts +7 -4
- package/dist/providers/ollama.js +30 -8
- package/dist/providers/openAI.d.ts +2 -2
- package/dist/providers/openAI.js +46 -21
- package/dist/providers/openRouter.d.ts +4 -4
- package/dist/providers/openRouter.js +63 -35
- package/dist/providers/openaiCompatible.d.ts +2 -2
- package/dist/providers/openaiCompatible.js +18 -9
- package/dist/providers/providerTypeUtils.d.ts +28 -0
- package/dist/providers/providerTypeUtils.js +46 -0
- package/dist/providers/sagemaker/config.js +5 -5
- package/dist/providers/sagemaker/language-model.d.ts +23 -13
- package/dist/providers/sagemaker/language-model.js +20 -8
- package/dist/proxy/accountQuota.d.ts +33 -0
- package/dist/proxy/accountQuota.js +162 -0
- package/dist/proxy/claudeFormat.d.ts +143 -0
- package/dist/proxy/claudeFormat.js +595 -0
- package/dist/proxy/cloaking/index.d.ts +44 -0
- package/dist/proxy/cloaking/index.js +86 -0
- package/dist/proxy/cloaking/plugins/headerScrubber.d.ts +9 -0
- package/dist/proxy/cloaking/plugins/headerScrubber.js +86 -0
- package/dist/proxy/cloaking/plugins/sessionIdentity.d.ts +15 -0
- package/dist/proxy/cloaking/plugins/sessionIdentity.js +65 -0
- package/dist/proxy/cloaking/plugins/systemPromptInjector.d.ts +11 -0
- package/dist/proxy/cloaking/plugins/systemPromptInjector.js +83 -0
- package/dist/proxy/cloaking/plugins/tlsFingerprint.d.ts +14 -0
- package/dist/proxy/cloaking/plugins/tlsFingerprint.js +38 -0
- package/dist/proxy/cloaking/plugins/wordObfuscator.d.ts +9 -0
- package/dist/proxy/cloaking/plugins/wordObfuscator.js +121 -0
- package/dist/proxy/cloaking/types.d.ts +1 -0
- package/dist/proxy/cloaking/types.js +1 -0
- package/dist/proxy/modelRouter.d.ts +10 -0
- package/dist/proxy/modelRouter.js +29 -0
- package/dist/proxy/oauthFetch.d.ts +36 -0
- package/dist/proxy/oauthFetch.js +367 -0
- package/dist/proxy/proxyConfig.d.ts +42 -0
- package/dist/proxy/proxyConfig.js +499 -0
- package/dist/proxy/proxyFetch.js +2 -1
- package/dist/proxy/requestLogger.d.ts +50 -0
- package/dist/proxy/requestLogger.js +207 -0
- package/dist/proxy/tokenRefresh.d.ts +4 -0
- package/dist/proxy/tokenRefresh.js +124 -0
- package/dist/proxy/usageStats.d.ts +13 -0
- package/dist/proxy/usageStats.js +74 -0
- package/dist/rag/document/loaders.js +1 -1
- package/dist/rag/pipeline/contextAssembly.d.ts +4 -7
- package/dist/rag/ragIntegration.d.ts +2 -14
- package/dist/rag/ragIntegration.js +1 -1
- package/dist/rag/resilience/CircuitBreaker.d.ts +5 -44
- package/dist/rag/resilience/RetryHandler.js +1 -1
- package/dist/rag/retrieval/vectorQueryTool.d.ts +1 -9
- package/dist/rag/retrieval/vectorQueryTool.js +1 -1
- package/dist/sdk/toolRegistration.js +12 -1
- package/dist/server/abstract/baseServerAdapter.js +2 -2
- package/dist/server/adapters/honoAdapter.d.ts +6 -0
- package/dist/server/adapters/honoAdapter.js +76 -10
- package/dist/server/middleware/cache.js +3 -0
- package/dist/server/routes/claudeProxyRoutes.d.ts +44 -0
- package/dist/server/routes/claudeProxyRoutes.js +1600 -0
- package/dist/server/routes/healthRoutes.js +18 -1
- package/dist/server/routes/index.d.ts +7 -0
- package/dist/server/routes/index.js +8 -0
- package/dist/server/streaming/dataStream.d.ts +1 -5
- package/dist/server/streaming/dataStream.js +3 -0
- package/dist/server/utils/validation.d.ts +24 -124
- package/dist/server/utils/validation.js +2 -2
- package/dist/services/server/ai/observability/instrumentation.js +4 -0
- package/dist/telemetry/attributes.d.ts +38 -0
- package/dist/telemetry/attributes.js +40 -0
- package/dist/telemetry/tracers.d.ts +1 -0
- package/dist/telemetry/tracers.js +1 -0
- package/dist/types/authTypes.d.ts +56 -0
- package/dist/types/authTypes.js +8 -0
- package/dist/types/circuitBreakerErrors.d.ts +30 -0
- package/dist/types/circuitBreakerErrors.js +34 -0
- package/dist/types/cli.d.ts +258 -0
- package/dist/types/clientTypes.d.ts +1050 -0
- package/dist/types/clientTypes.js +10 -0
- package/dist/types/common.d.ts +123 -0
- package/dist/types/configTypes.d.ts +49 -0
- package/dist/types/configTypes.js +4 -0
- package/dist/types/conversation.d.ts +0 -5
- package/dist/types/evaluationTypes.d.ts +2 -2
- package/dist/types/fileTypes.d.ts +47 -0
- package/dist/types/generateTypes.d.ts +7 -3
- package/dist/types/guardrails.d.ts +2 -2
- package/dist/types/index.d.ts +4 -1
- package/dist/types/index.js +5 -0
- package/dist/types/middlewareTypes.d.ts +3 -3
- package/dist/types/modelTypes.d.ts +7 -97
- package/dist/types/modelTypes.js +3 -3
- package/dist/types/observability.d.ts +37 -0
- package/dist/types/providers.d.ts +107 -0
- package/dist/types/proxyTypes.d.ts +536 -0
- package/dist/types/proxyTypes.js +16 -0
- package/dist/types/ragTypes.d.ts +49 -1
- package/dist/types/streamTypes.d.ts +37 -13
- package/dist/types/subscriptionTypes.d.ts +77 -0
- package/dist/types/subscriptionTypes.js +2 -0
- package/dist/types/tools.d.ts +45 -1
- package/dist/types/typeAliases.d.ts +8 -0
- package/dist/types/typeAliases.js +1 -0
- package/dist/utils/async/retry.d.ts +4 -33
- package/dist/utils/asyncMutex.d.ts +14 -0
- package/dist/utils/asyncMutex.js +60 -0
- package/dist/utils/errorHandling.d.ts +2 -1
- package/dist/utils/errorHandling.js +14 -6
- package/dist/utils/fileDetector.d.ts +13 -1
- package/dist/utils/fileDetector.js +114 -32
- package/dist/utils/imageProcessor.js +7 -7
- package/dist/utils/json/safeParse.d.ts +1 -8
- package/dist/utils/mcpDefaults.d.ts +1 -1
- package/dist/utils/mcpDefaults.js +11 -2
- package/dist/utils/messageBuilder.d.ts +5 -5
- package/dist/utils/messageBuilder.js +106 -80
- package/dist/utils/modelChoices.d.ts +1 -8
- package/dist/utils/pdfProcessor.d.ts +1 -25
- package/dist/utils/pdfProcessor.js +5 -4
- package/dist/utils/pricing.js +28 -5
- package/dist/utils/rateLimiter.d.ts +1 -15
- package/dist/utils/redis.d.ts +1 -1
- package/dist/utils/redis.js +3 -3
- package/dist/utils/sanitizers/filename.d.ts +2 -22
- package/dist/utils/sanitizers/index.d.ts +4 -2
- package/dist/utils/sanitizers/svg.d.ts +1 -11
- package/dist/utils/schemaConversion.js +4 -1
- package/dist/utils/thinkingConfig.d.ts +1 -33
- package/dist/utils/tokenUtils.d.ts +1 -39
- package/dist/utils/videoAnalysisProcessor.d.ts +5 -5
- package/dist/utils/videoAnalysisProcessor.js +2 -2
- package/dist/workflow/config.d.ts +89 -1257
- package/dist/workflow/utils/workflowValidation.js +1 -1
- package/docs-site/mcp-server/index.js +2 -3
- package/package.json +138 -105
- package/dist/lib/memory/mem0Initializer.d.ts +0 -46
- package/dist/lib/memory/mem0Initializer.js +0 -85
- package/dist/memory/mem0Initializer.d.ts +0 -46
- package/dist/memory/mem0Initializer.js +0 -84
|
@@ -0,0 +1,205 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* ContextCompactor
|
|
3
|
+
*
|
|
4
|
+
* Orchestrates multi-stage context reduction:
|
|
5
|
+
*
|
|
6
|
+
* Stage 1: Tool Output Pruning (cheapest -- no LLM call)
|
|
7
|
+
* Stage 2: File Read Deduplication (cheap -- no LLM call)
|
|
8
|
+
* Stage 3: LLM Summarization (expensive -- requires LLM call)
|
|
9
|
+
* Stage 4: Sliding Window Truncation (fallback -- no LLM call)
|
|
10
|
+
*/
|
|
11
|
+
import { estimateMessagesTokens } from "../utils/tokenEstimation.js";
|
|
12
|
+
import { logger } from "../utils/logger.js";
|
|
13
|
+
import { withTimeout } from "../utils/async/withTimeout.js";
|
|
14
|
+
import { SpanSerializer, SpanType, SpanStatus, } from "../observability/index.js";
|
|
15
|
+
import { getMetricsAggregator } from "../observability/index.js";
|
|
16
|
+
import { pruneToolOutputs } from "./stages/toolOutputPruner.js";
|
|
17
|
+
import { deduplicateFileReads } from "./stages/fileReadDeduplicator.js";
|
|
18
|
+
import { truncateWithSlidingWindow } from "./stages/slidingWindowTruncator.js";
|
|
19
|
+
import { summarizeMessages } from "./stages/structuredSummarizer.js";
|
|
20
|
+
/**
 * Defaults merged underneath the caller-supplied config in the
 * ContextCompactor constructor.
 */
const DEFAULT_CONFIG = {
    // Per-stage switches; every stage is enabled by default.
    enablePrune: true,
    enableDeduplicate: true,
    enableSummarize: true,
    enableTruncate: true,
    // Forwarded to pruneToolOutputs as protectTokens / minimumSavings / protectedTools.
    pruneProtectTokens: 40_000,
    pruneMinimumSavings: 20_000,
    pruneProtectedTools: ["skill"],
    // Provider and model handed to summarizeMessages (Stage 3).
    summarizationProvider: "vertex",
    summarizationModel: "gemini-2.5-flash",
    // Forwarded to summarizeMessages as keepRecentRatio.
    keepRecentRatio: 0.3,
    // Forwarded to truncateWithSlidingWindow as fraction.
    truncationFraction: 0.5,
    // Provider used for token estimation; "" is converted to undefined before use.
    provider: "",
};
/**
 * Runs the staged context-reduction pipeline (prune -> deduplicate ->
 * summarize -> truncate). A stage only runs when it is enabled and the
 * estimated token count still exceeds the target.
 */
export class ContextCompactor {
    config;
    /**
     * @param {object} [config] Partial settings; keys that are present
     *   override DEFAULT_CONFIG (shallow merge).
     */
    constructor(config) {
        this.config = { ...DEFAULT_CONFIG, ...config };
        // The spread above is shallow: without this copy every instance built
        // with the default list would share (and could mutate) the single
        // array stored in DEFAULT_CONFIG. A caller-supplied array is kept as-is.
        if (this.config.pruneProtectedTools === DEFAULT_CONFIG.pruneProtectedTools) {
            this.config.pruneProtectedTools = [...DEFAULT_CONFIG.pruneProtectedTools];
        }
    }
    /**
     * Run the multi-stage compaction pipeline until messages fit within budget.
     *
     * @param {Array} messages Conversation messages; the array itself is not
     *   modified (the pipeline works on a shallow copy).
     * @param {number} targetTokens Token budget the history should fit into.
     * @param {*} memoryConfig Passed through unchanged to summarizeMessages.
     * @param {string} [requestId] Included in every log entry for correlation.
     * @returns {Promise<{compacted: boolean, stagesUsed: string[], tokensBefore: number,
     *   tokensAfter: number, tokensSaved: number, messages: Array}>}
     * @throws Rethrows any error raised outside Stage 3 after recording an
     *   ERROR span. A Stage 3 (summarization) failure is logged, recorded on
     *   the span and then ignored so Stage 4 can still run.
     */
    async compact(messages, targetTokens, memoryConfig, requestId) {
        let span = SpanSerializer.createSpan(SpanType.CONTEXT_COMPACTION, "context.compact", {
            "context.operation": "compact",
            "context.targetTokens": targetTokens,
        });
        const spanStartTime = Date.now();
        try {
            const provider = this.config.provider || undefined;
            const tokensBefore = estimateMessagesTokens(messages, provider);
            const stagesUsed = [];
            let currentMessages = [...messages];
            // Running estimate for currentMessages. It is refreshed once after
            // every stage that runs, so guards and "before" values never have
            // to re-estimate an unchanged message list.
            let currentTokens = tokensBefore;
            logger.info("[Compaction] Starting", {
                requestId,
                estimatedTokens: tokensBefore,
                budgetTokens: targetTokens,
            });
            // Shared shape for the per-stage log entries.
            const logStage = (message, ran, stageTokensBefore, stageTokensAfter) => {
                logger.info(message, {
                    requestId,
                    ran,
                    tokensBefore: stageTokensBefore,
                    tokensAfter: stageTokensAfter,
                    saved: stageTokensBefore - stageTokensAfter,
                });
            };
            // Stage 1: Tool Output Pruning
            if (this.config.enablePrune && currentTokens > targetTokens) {
                const stageTokensBefore = currentTokens;
                const pruneResult = pruneToolOutputs(currentMessages, {
                    protectTokens: this.config.pruneProtectTokens,
                    minimumSavings: this.config.pruneMinimumSavings,
                    protectedTools: this.config.pruneProtectedTools,
                    provider,
                });
                if (pruneResult.pruned) {
                    currentMessages = pruneResult.messages;
                    stagesUsed.push("prune");
                }
                currentTokens = estimateMessagesTokens(currentMessages, provider);
                logStage("[Compaction] Stage 1 (prune)", pruneResult.pruned, stageTokensBefore, currentTokens);
            }
            // Stage 2: File Read Deduplication
            if (this.config.enableDeduplicate && currentTokens > targetTokens) {
                const stageTokensBefore = currentTokens;
                const dedupResult = deduplicateFileReads(currentMessages);
                if (dedupResult.deduplicated) {
                    currentMessages = dedupResult.messages;
                    stagesUsed.push("deduplicate");
                }
                currentTokens = estimateMessagesTokens(currentMessages, provider);
                logStage("[Compaction] Stage 2 (deduplicate)", dedupResult.deduplicated, stageTokensBefore, currentTokens);
            }
            // Stage 3: LLM Summarization
            if (this.config.enableSummarize && currentTokens > targetTokens) {
                const stageTokensBefore = currentTokens;
                try {
                    const summarizeResult = await withTimeout(summarizeMessages(currentMessages, {
                        provider: this.config.summarizationProvider,
                        model: this.config.summarizationModel,
                        keepRecentRatio: this.config.keepRecentRatio,
                        memoryConfig,
                        targetTokens,
                    }), 120_000, "LLM summarization timed out after 120s");
                    if (summarizeResult.summarized) {
                        currentMessages = summarizeResult.messages;
                        stagesUsed.push("summarize");
                    }
                    currentTokens = estimateMessagesTokens(currentMessages, provider);
                    logStage("[Compaction] Stage 3 (summarize)", summarizeResult.summarized, stageTokensBefore, currentTokens);
                }
                catch (error) {
                    const err = error instanceof Error ? error : new Error(String(error));
                    logger.warn("[Compaction] Stage 3 (summarize) FAILED", {
                        requestId,
                        error: err.message,
                        errorName: err.name,
                        tokensBefore: stageTokensBefore,
                        tokensAfter: stageTokensBefore,
                        saved: 0,
                    });
                    // Record failure on the compaction span for trace visibility
                    span = SpanSerializer.updateAttributes(span, {
                        "compaction.stage3.error": err.message,
                        "compaction.stage3.errorName": err.name,
                        "compaction.stage3.tokensBefore": stageTokensBefore,
                        "compaction.stage3_failed": true,
                    });
                    // Fall through to Stage 4 truncation as before
                }
            }
            // Stage 4: Sliding Window Truncation (fallback)
            if (this.config.enableTruncate && currentTokens > targetTokens) {
                const stageTokensBefore = currentTokens;
                const truncResult = truncateWithSlidingWindow(currentMessages, {
                    fraction: this.config.truncationFraction,
                    currentTokens: stageTokensBefore,
                    targetTokens: targetTokens,
                    provider: provider,
                    adaptiveBuffer: 0.15,
                    maxIterations: 3,
                });
                if (truncResult.truncated) {
                    currentMessages = truncResult.messages;
                    stagesUsed.push("truncate");
                }
                currentTokens = estimateMessagesTokens(currentMessages, provider);
                logStage("[Compaction] Stage 4 (truncate)", truncResult.truncated, stageTokensBefore, currentTokens);
            }
            const tokensAfter = currentTokens;
            logger.info("[Compaction] Complete", {
                requestId,
                tokensBefore,
                tokensAfter,
                totalSaved: tokensBefore - tokensAfter,
                stagesUsed,
                durationMs: Date.now() - spanStartTime,
            });
            const result = {
                compacted: stagesUsed.length > 0,
                stagesUsed,
                tokensBefore,
                tokensAfter,
                tokensSaved: tokensBefore - tokensAfter,
                messages: currentMessages,
            };
            span.durationMs = Date.now() - spanStartTime;
            const endedSpan = SpanSerializer.endSpan(SpanSerializer.updateAttributes(span, {
                "context.stage": stagesUsed.join(",") || "none",
                "context.tokensBefore": tokensBefore,
                "context.tokensAfter": tokensAfter,
                "context.tokensSaved": tokensBefore - tokensAfter,
            }), SpanStatus.OK);
            getMetricsAggregator().recordSpan(endedSpan);
            return result;
        }
        catch (error) {
            // Close the span as failed before propagating the original error.
            span.durationMs = Date.now() - spanStartTime;
            const endedSpan = SpanSerializer.endSpan(span, SpanStatus.ERROR);
            endedSpan.statusMessage =
                error instanceof Error ? error.message : String(error);
            getMetricsAggregator().recordSpan(endedSpan);
            throw error;
        }
    }
}
|
|
@@ -0,0 +1,88 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Emergency Content Truncation
|
|
3
|
+
*
|
|
4
|
+
* When message-level removal (sliding window) can't fit context into budget,
|
|
5
|
+
* this truncates the CONTENT of the longest messages as a last resort.
|
|
6
|
+
*/
|
|
7
|
+
import { estimateTokens, estimateMessagesTokens, truncateToTokenBudget, } from "../utils/tokenEstimation.js";
|
|
8
|
+
import { logger } from "../utils/logger.js";
|
|
9
|
+
/**
 * Emergency content truncation: shorten the content of the longest messages
 * so the conversation history fits within the available token budget.
 *
 * Strategy: visit messages from longest to shortest content and truncate each
 * one proportionally (plus a 5% safety margin) until enough tokens have been
 * saved. System messages, messages shorter than 200 characters and messages
 * whose content is not a string are left untouched. If the result still does
 * not fit, fall back to the newest non-system messages that fit.
 *
 * @param {Array<{role: string, content: *, metadata?: object}>} messages
 *   Conversation history; neither the array nor its elements are mutated.
 * @param {number} availableTokensForHistory Token allowance from which the
 *   breakdown entries below are subtracted to get the history budget.
 * @param {{systemPrompt: number, currentPrompt: number, toolDefinitions: number,
 *   fileAttachments: number}} breakdown Token counts reserved for non-history parts.
 * @param {string} [provider] Forwarded to the token-estimation helpers.
 * @returns {Array} `[]` when no budget is left for history, the original
 *   `messages` array when it already fits, otherwise a new array.
 */
export function emergencyContentTruncation(messages, availableTokensForHistory, breakdown, provider) {
    // Budget available for conversation history specifically
    const historyBudget = availableTokensForHistory -
        breakdown.systemPrompt -
        breakdown.currentPrompt -
        breakdown.toolDefinitions -
        breakdown.fileAttachments;
    if (historyBudget <= 0) {
        // No room for history: return empty to guarantee budget safety
        return [];
    }
    const currentHistoryTokens = estimateMessagesTokens(messages, provider);
    if (currentHistoryTokens <= historyBudget) {
        return messages; // Already fits
    }
    const result = [...messages];
    const reductionNeeded = currentHistoryTokens - historyBudget;
    const reductionRatio = reductionNeeded / currentHistoryTokens;
    // Messages may carry null/undefined or non-string content; treat that as
    // length 0 so it sorts last and is never truncated, instead of throwing
    // on `.length`.
    const textLength = (msg) => (typeof msg.content === "string" ? msg.content.length : 0);
    // Sort indices by content length descending (truncate biggest first)
    const sortedIndices = result
        .map((msg, idx) => ({ idx, len: textLength(msg) }))
        .sort((a, b) => b.len - a.len);
    let tokensSaved = 0;
    for (const { idx, len } of sortedIndices) {
        if (tokensSaved >= reductionNeeded) {
            break;
        }
        const msg = result[idx];
        // Don't truncate system messages or very short (or non-text) messages
        if (msg.role === "system" || len < 200) {
            continue;
        }
        const msgTokens = estimateTokens(msg.content, provider);
        // Shrink by the overall reduction ratio plus a 5% margin.
        const targetTokens = Math.floor(msgTokens * (1 - reductionRatio - 0.05));
        if (targetTokens < msgTokens && targetTokens > 50) {
            const truncated = truncateToTokenBudget(msg.content, targetTokens, provider);
            if (truncated.truncated) {
                const savedThisMsg = msgTokens - estimateTokens(truncated.text, provider);
                tokensSaved += savedThisMsg;
                // Replace with a copy so the caller's message object stays intact.
                result[idx] = {
                    ...msg,
                    content: truncated.text,
                    metadata: { ...msg.metadata, truncated: true },
                };
            }
        }
    }
    logger.info("[EmergencyTruncation] Content truncation complete", {
        tokensSaved,
        reductionNeeded,
        messagesModified: result.filter((m, i) => m !== messages[i]).length,
    });
    // Final safety check: guarantee returned history fits budget
    if (estimateMessagesTokens(result, provider) <= historyBudget) {
        return result;
    }
    // Hard fallback: keep newest non-system messages that fit
    const fallback = [];
    for (let i = result.length - 1; i >= 0; i--) {
        const msg = result[i];
        if (msg.role === "system") {
            continue;
        }
        fallback.unshift(msg);
        if (estimateMessagesTokens(fallback, provider) > historyBudget) {
            // The message just added overflowed the budget: drop it and stop.
            fallback.shift();
            break;
        }
    }
    return fallback;
}
|
|
@@ -0,0 +1,171 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Context Overflow Error Detection
|
|
3
|
+
*
|
|
4
|
+
* Cross-provider regex patterns to detect context window overflow errors.
|
|
5
|
+
* Modeled on Cline + pi-mono patterns.
|
|
6
|
+
*/
|
|
7
|
+
/**
 * Context-overflow error signatures, grouped by the provider that emits them.
 *
 * IMPORTANT: getContextOverflowProvider walks this list from top to bottom
 * and reports the first provider with a matching pattern, so the more
 * specific wordings must stay ahead of the generic ones. OpenAI's phrasing
 * (e.g., "This model's maximum context length is") is very specific, which
 * is why it leads the list.
 *
 * Each row below is `[provider, patterns]` and is expanded into a
 * `{ provider, patterns }` record.
 */
const OVERFLOW_PATTERNS = [
    [
        "openai",
        [
            /This model's maximum context length is/i,
            /tokens\. However, (?:your messages|you requested)/i,
            /reduce the length of the messages/i,
            /Please reduce the length/i,
        ],
    ],
    ["azure", [/content_length_exceeded/i]],
    [
        "google",
        [
            /RESOURCE_EXHAUSTED/i,
            /exceeds the maximum number of tokens/i,
            /content is too long/i,
            /request payload size exceeds/i,
            /input token limit/i,
        ],
    ],
    [
        "bedrock",
        [
            /ValidationException.*token/i,
            /Input is too long/i,
            /exceeds the model's maximum/i,
        ],
    ],
    ["mistral", [/context length exceeded/i, /maximum number of tokens/i]],
    ["openrouter", [/context_length_exceeded/i]],
    [
        "anthropic",
        [
            /prompt is too long/i,
            /input is too long/i,
            /too many tokens/i,
            /maximum context length/i,
        ],
    ],
].map(([provider, patterns]) => ({ provider, patterns }));
|
|
64
|
+
/**
 * Report whether an error matches the context-overflow signature of any
 * known provider.
 *
 * @param error - Anything accepted by extractErrorMessage
 * @returns true when at least one overflow pattern matches the error text;
 *   false when no text can be extracted or nothing matches
 */
export function isContextOverflowError(error) {
    const text = extractErrorMessage(error);
    if (!text) {
        return false;
    }
    for (const { patterns } of OVERFLOW_PATTERNS) {
        for (const pattern of patterns) {
            if (pattern.test(text)) {
                return true;
            }
        }
    }
    return false;
}
|
|
74
|
+
/**
 * Name the provider whose overflow signature matches the error.
 *
 * Providers are tried in OVERFLOW_PATTERNS order and the first one with a
 * matching pattern wins.
 *
 * @param error - Anything accepted by extractErrorMessage
 * @returns The matching provider name, or null when no text can be
 *   extracted or no pattern matches
 */
export function getContextOverflowProvider(error) {
    const text = extractErrorMessage(error);
    if (!text) {
        return null;
    }
    const firstHit = OVERFLOW_PATTERNS.find(({ patterns }) => patterns.some((pattern) => pattern.test(text)));
    return firstHit ? firstHit.provider : null;
}
|
|
89
|
+
/**
 * Extract actual and maximum token counts from a provider overflow error.
 *
 * Many providers include the actual/max token counts in their error messages:
 * - OpenAI: "This model's maximum context length is 128000 tokens. However, your messages resulted in 145000 tokens."
 * - OpenAI: "This model's maximum context length is 4097 tokens. However, you requested 4927 tokens (...)"
 * - Anthropic: "prompt is too long: 208310 tokens > 200000 maximum"
 * - Google: "exceeds the maximum number of tokens (180000 > 100000)"
 *
 * Numbers may contain thousands separators ("145,000"); these are stripped
 * before parsing.
 *
 * @param error - Anything accepted by extractErrorMessage
 * @returns `{ actualTokens, budgetTokens }` when a known format is found;
 *   null when no message can be extracted, the message is longer than 2000
 *   characters, or no format matches
 */
export function parseProviderOverflowDetails(error) {
    const message = extractErrorMessage(error);
    if (!message) {
        return null;
    }
    // Guard against excessively long inputs that could slow regex matching
    if (message.length > 2000) {
        return null;
    }
    // Captured groups always start with a digit, so parseInt cannot yield NaN.
    const toTokenCount = (digits) => Number.parseInt(digits.replace(/,/g, ""), 10);
    // OpenAI pattern: "resulted in X tokens" or "you requested X tokens",
    // together with "maximum context length is Y". Both wordings are already
    // recognised as overflow errors by OVERFLOW_PATTERNS.
    // Use single character-class number groups to prevent ReDoS (CodeQL: js/polynomial-redos)
    const openaiActual = message.match(/(?:resulted\s+in|you\s+requested)\s+(\d[\d,]{0,19})\s*tokens/i);
    const openaiMax = message.match(/maximum\s+context\s+length\s+is\s+(\d[\d,]{0,19})/i);
    if (openaiActual && openaiMax) {
        return {
            actualTokens: toTokenCount(openaiActual[1]),
            budgetTokens: toTokenCount(openaiMax[1]),
        };
    }
    // Anthropic pattern: "X tokens > Y ..." or "X tokens: Y"
    // Use single character-class number groups to prevent ReDoS (CodeQL: js/polynomial-redos)
    const anthropicMatch = message.match(/(\d[\d,]{0,19})\s*tokens?\s*[>:]\s*(\d[\d,]{0,19})/i);
    if (anthropicMatch) {
        return {
            actualTokens: toTokenCount(anthropicMatch[1]),
            budgetTokens: toTokenCount(anthropicMatch[2]),
        };
    }
    // Google pattern: "X > Y" or "X exceeds Y"
    // Use single character-class number groups to prevent ReDoS (CodeQL: js/polynomial-redos)
    const googleMatch = message.match(/(\d[\d,]{0,19})\s*(?:>|exceeds)\s*(\d[\d,]{0,19})/i);
    if (googleMatch) {
        return {
            actualTokens: toTokenCount(googleMatch[1]),
            budgetTokens: toTokenCount(googleMatch[2]),
        };
    }
    return null;
}
|
|
136
|
+
/** Maximum number of nested `cause` links followed; also stops cyclic cause chains. */
const MAX_ERROR_CAUSE_DEPTH = 5;
/**
 * Depth-limited worker behind extractErrorMessage.
 *
 * @param error - Value to inspect
 * @param remainingCauseDepth - How many further `cause` links may be followed
 * @returns The extracted text, or null when none is found
 */
function extractMessageWithinDepth(error, remainingCauseDepth) {
    if (!error) {
        return null;
    }
    if (typeof error === "string") {
        return error;
    }
    if (error instanceof Error) {
        const msg = error.message;
        const cause = error.cause;
        if (cause === undefined || cause === null || remainingCauseDepth <= 0) {
            return msg;
        }
        // The cause may itself be an Error, a string, or a plain error-shaped
        // object; resolve it with the same rules as a top-level value.
        const causeMessage = extractMessageWithinDepth(cause, remainingCauseDepth - 1);
        return causeMessage === null ? msg : `${msg} ${causeMessage}`;
    }
    if (typeof error === "object") {
        if (typeof error.message === "string") {
            return error.message;
        }
        if (typeof error.error === "string") {
            return error.error;
        }
        const nested = error.error;
        if (typeof nested === "object" && nested !== null && typeof nested.message === "string") {
            return nested.message;
        }
    }
    return null;
}
/**
 * Extract error message from various error formats.
 *
 * Supported shapes:
 * - a string (returned as-is)
 * - an Error: its message, followed by the text extracted from its `cause`
 *   (separated by one space) when the cause yields any; the cause may be an
 *   Error, a string, or a plain object in one of the shapes below, and
 *   nested causes are followed up to MAX_ERROR_CAUSE_DEPTH levels
 * - a plain object with a string `message`, a string `error`, or an `error`
 *   object carrying a string `message` (checked in that order)
 *
 * @param error - Value to inspect
 * @returns The extracted text, or null for falsy input and unrecognised shapes
 */
export function extractErrorMessage(error) {
    return extractMessageWithinDepth(error, MAX_ERROR_CAUSE_DEPTH);
}
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Context-specific error classes for budget and overflow scenarios.
|
|
3
|
+
*/
|
|
4
|
+
/**
 * Thrown when context exceeds model budget after all compaction stages,
 * preventing wasteful API calls to providers that will reject the request.
 *
 * The `details` argument is optional: when it is omitted (or null) the
 * diagnostic fields are left undefined instead of the constructor throwing
 * a TypeError that would hide the budget failure being reported.
 */
export class ContextBudgetExceededError extends Error {
    /** Copied from `details.estimatedTokens`. */
    estimatedTokens;
    /** Copied from `details.availableTokens`. */
    availableTokens;
    /** Copied from `details.stagesUsed`. */
    stagesUsed;
    /** Copied from `details.breakdown`. */
    breakdown;
    /**
     * @param message - Human-readable description of the failure
     * @param details - Optional diagnostics: `estimatedTokens`,
     *   `availableTokens`, `stagesUsed`, `breakdown`
     */
    constructor(message, details = {}) {
        super(message);
        this.name = "ContextBudgetExceededError";
        // `?? {}` additionally covers an explicit null.
        const { estimatedTokens, availableTokens, stagesUsed, breakdown } = details ?? {};
        this.estimatedTokens = estimatedTokens;
        this.availableTokens = availableTokens;
        this.stagesUsed = stagesUsed;
        this.breakdown = breakdown;
    }
}
|
|
@@ -0,0 +1,127 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* File Token Budget System
|
|
3
|
+
*
|
|
4
|
+
* Calculates how much of the remaining context window budget
|
|
5
|
+
* can be used for file reads. Implements fast-path for small files
|
|
6
|
+
* and preview mode for very large files.
|
|
7
|
+
*/
|
|
8
|
+
/** Fraction of the remaining context that file reads may consume */
export const FILE_READ_BUDGET_PERCENT = 0.6;
/** Size threshold (100KB): files smaller than this skip budget validation */
export const FILE_FAST_PATH_SIZE = 1024 * 100;
/** Size threshold (5MB): files larger than this are handled in preview-only mode */
export const FILE_PREVIEW_MODE_SIZE = 1024 * 1024 * 5;
/** Default number of characters kept for a preview */
export const FILE_PREVIEW_CHARS = 2000;
|
|
16
|
+
/**
 * Work out how many tokens may be spent on file content.
 *
 * The headroom is the context window minus what is already used and what
 * is reserved for output; FILE_READ_BUDGET_PERCENT of that headroom
 * (rounded down) is the file budget.
 *
 * @param contextWindow - Total context window for the model
 * @param currentTokens - Tokens already used (conversation + system prompt)
 * @param maxOutputTokens - Reserved output tokens
 * @returns Available tokens for file content; 0 when there is no headroom
 */
export function calculateFileTokenBudget(contextWindow, currentTokens, maxOutputTokens) {
    const headroom = contextWindow - currentTokens - maxOutputTokens;
    return headroom <= 0 ? 0 : Math.floor(headroom * FILE_READ_BUDGET_PERCENT);
}
|
|
31
|
+
/**
 * Decide how a file should be read, given its size and the token budget.
 *
 * - Larger than FILE_PREVIEW_MODE_SIZE: preview mode, limited to
 *   FILE_PREVIEW_CHARS characters.
 * - Smaller than FILE_FAST_PATH_SIZE, or estimated to fit the budget
 *   (rough estimate of 4 characters per token): no truncation.
 * - Otherwise: truncate to the budget converted back to characters, but
 *   never below FILE_PREVIEW_CHARS.
 *
 * @param fileSize - File size used for the estimate
 * @param budget - Token budget available for the file
 * @returns `{ shouldTruncate }`, plus `maxChars` and `previewMode` when
 *   truncation applies
 */
export function shouldTruncateFile(fileSize, budget) {
    if (fileSize > FILE_PREVIEW_MODE_SIZE) {
        return { shouldTruncate: true, maxChars: FILE_PREVIEW_CHARS, previewMode: true };
    }
    // Rough estimate: 4 characters per token.
    const tokenEstimate = Math.ceil(fileSize / 4);
    const isSmallFile = fileSize < FILE_FAST_PATH_SIZE;
    if (isSmallFile || tokenEstimate <= budget) {
        return { shouldTruncate: false };
    }
    // Convert the token budget back into characters.
    const budgetInChars = budget * 4;
    return {
        shouldTruncate: true,
        maxChars: Math.max(FILE_PREVIEW_CHARS, budgetInChars),
        previewMode: false,
    };
}
|
|
60
|
+
/**
 * Estimate how many tokens a file contributes after processing.
 *
 * The amount of text a file turns into depends heavily on its type: a
 * 50 MB video yields only ~200-500 tokens of metadata, whereas a 50 MB
 * text file yields ~12.5 M tokens. Applying the raw byte size to every
 * type would make the aggregate budget check wrongly exclude media files.
 *
 * @param sizeBytes Raw file size in bytes
 * @param fileType  Detected file type (e.g. "video", "audio", "image")
 * @returns Estimated token count after processing
 */
export function estimatePostProcessingTokens(sizeBytes, fileType) {
    // Types whose cost does not depend on the file size.
    const flatTokenCosts = new Map([
        // Media files produce only metadata text (~100-500 tokens)
        ["video", 500],
        ["audio", 300],
        // Images are sent as base64 — provider counts them as ~1500 tokens each
        ["image", 1500],
        // Archives produce a file listing (~500-2000 tokens)
        ["archive", 1000],
        // Unknown binary files produce metadata + extracted strings (~200-1000 tokens)
        ["unknown", 500],
    ]);
    if (flatTokenCosts.has(fileType)) {
        return flatTokenCosts.get(fileType);
    }
    if (fileType === "pdf") {
        // PDFs are sent natively on some providers; ~1 token per 100 bytes, capped
        return Math.min(Math.ceil(sizeBytes / 100), 50_000);
    }
    if (fileType === "xlsx" || fileType === "docx" || fileType === "pptx") {
        // Structured documents extract text — roughly 15% of raw size
        return Math.ceil((sizeBytes * 0.15) / 4);
    }
    if (fileType === "svg") {
        // SVG is sanitized markup — usually small
        return Math.ceil(sizeBytes / 4);
    }
    // CSV, text, code and every other type use the original formula:
    // base64-inflate then divide by 4
    return Math.ceil((sizeBytes * 1.33) / 4);
}
|
|
108
|
+
/**
 * Select which files fit into the aggregate token budget for file reads.
 *
 * The budget is FILE_READ_BUDGET_PERCENT of `availableTokens` (rounded
 * down). Files are admitted greedily from cheapest to most expensive,
 * where cost is the post-processing token estimate for the file's type
 * (ties are broken by raw size, smallest first). Ordering by token cost
 * rather than raw byte size keeps large but cheap files, such as videos
 * that only contribute metadata, from being pushed out by smaller text
 * files that cost far more tokens. A file that does not fit is skipped and
 * the remaining files are still considered.
 *
 * The input array is not modified.
 *
 * @param files - Entries with `name`, `sizeBytes` and `fileType`
 * @param availableTokens - Tokens currently available in the context
 * @returns `{ included, excluded, notices }`: the admitted files, the
 *   skipped files, and one human-readable notice per skipped file
 */
export function enforceAggregateFileBudget(files, availableTokens) {
    const tokenBudgetForFiles = Math.floor(availableTokens * FILE_READ_BUDGET_PERCENT);
    // Estimate once per file, then order by what is actually charged against the budget.
    const candidates = files
        .map((file) => ({
            file,
            estimatedTokens: estimatePostProcessingTokens(file.sizeBytes, file.fileType),
        }))
        .sort((a, b) => a.estimatedTokens - b.estimatedTokens || a.file.sizeBytes - b.file.sizeBytes);
    const included = [];
    const excluded = [];
    const notices = [];
    let usedTokens = 0;
    for (const { file, estimatedTokens } of candidates) {
        if (usedTokens + estimatedTokens <= tokenBudgetForFiles) {
            usedTokens += estimatedTokens;
            included.push(file);
        }
        else {
            excluded.push(file);
            notices.push(`Skipped "${file.name}" (${(file.sizeBytes / 1024).toFixed(0)} KB) — exceeds context budget`);
        }
    }
    return { included, excluded, notices };
}
|