@juspay/neurolink 9.32.0 → 9.32.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +6 -0
- package/dist/auth/anthropicOAuth.js +1 -1
- package/dist/cli/commands/proxy.js +18 -5
- package/dist/client/aiSdkAdapter.js +1 -1
- package/dist/client/index.js +137 -501
- package/dist/core/factory.js +0 -1
- package/dist/core/redisConversationMemoryManager.js +1 -1
- package/dist/features/ppt/slideGenerator.js +0 -1
- package/dist/features/ppt/utils.js +0 -1
- package/dist/lib/server/routes/claudeProxyRoutes.js +45 -9
- package/dist/mcp/elicitationProtocol.js +1 -1
- package/dist/mcp/servers/agent/directToolsServer.js +0 -1
- package/dist/providers/azureOpenai.js +1 -1
- package/dist/providers/huggingFace.js +0 -1
- package/dist/providers/openaiCompatible.js +0 -1
- package/dist/sdk/toolRegistration.js +0 -1
- package/dist/server/openapi/generator.js +1 -1
- package/dist/server/routes/claudeProxyRoutes.js +45 -9
- package/dist/types/configTypes.js +0 -5
- package/dist/types/modelTypes.js +0 -1
- package/dist/types/tools.js +0 -1
- package/dist/types/typeAliases.js +0 -1
- package/dist/types/utilities.js +1 -1
- package/dist/types/workflowTypes.js +0 -1
- package/dist/utils/providerRetry.js +0 -1
- package/dist/utils/providerUtils.js +0 -1
- package/package.json +2 -2
- package/dist/client/adapters/providerImageAdapter.js +0 -588
- package/dist/client/adapters/tts/googleTTSHandler.js +0 -344
- package/dist/client/adapters/video/directorPipeline.js +0 -516
- package/dist/client/adapters/video/ffmpegAdapter.js +0 -206
- package/dist/client/adapters/video/frameExtractor.js +0 -143
- package/dist/client/adapters/video/vertexVideoHandler.js +0 -763
- package/dist/client/adapters/video/videoAnalyzer.js +0 -238
- package/dist/client/adapters/video/videoMerger.js +0 -171
- package/dist/client/agent/directTools.js +0 -840
- package/dist/client/auth/AuthProviderFactory.js +0 -111
- package/dist/client/auth/AuthProviderRegistry.js +0 -190
- package/dist/client/auth/RequestContext.js +0 -78
- package/dist/client/auth/accountPool.js +0 -178
- package/dist/client/auth/anthropicOAuth.js +0 -974
- package/dist/client/auth/authContext.js +0 -314
- package/dist/client/auth/errors.js +0 -39
- package/dist/client/auth/index.js +0 -61
- package/dist/client/auth/middleware/AuthMiddleware.js +0 -519
- package/dist/client/auth/middleware/rateLimitByUser.js +0 -554
- package/dist/client/auth/providers/BaseAuthProvider.js +0 -723
- package/dist/client/auth/providers/CognitoProvider.js +0 -304
- package/dist/client/auth/providers/KeycloakProvider.js +0 -393
- package/dist/client/auth/providers/auth0.js +0 -274
- package/dist/client/auth/providers/betterAuth.js +0 -182
- package/dist/client/auth/providers/clerk.js +0 -317
- package/dist/client/auth/providers/custom.js +0 -112
- package/dist/client/auth/providers/firebase.js +0 -226
- package/dist/client/auth/providers/jwt.js +0 -212
- package/dist/client/auth/providers/oauth2.js +0 -303
- package/dist/client/auth/providers/supabase.js +0 -259
- package/dist/client/auth/providers/workos.js +0 -284
- package/dist/client/auth/serverBridge.js +0 -25
- package/dist/client/auth/sessionManager.js +0 -437
- package/dist/client/auth/tokenStore.js +0 -799
- package/dist/client/client/aiSdkAdapter.js +0 -487
- package/dist/client/client/auth.js +0 -473
- package/dist/client/client/errors.js +0 -552
- package/dist/client/client/httpClient.js +0 -837
- package/dist/client/client/index.js +0 -172
- package/dist/client/client/interceptors.js +0 -601
- package/dist/client/client/sseClient.js +0 -545
- package/dist/client/client/streamingClient.js +0 -917
- package/dist/client/client/wsClient.js +0 -369
- package/dist/client/config/configManager.js +0 -303
- package/dist/client/config/conversationMemory.js +0 -86
- package/dist/client/config/taskClassificationConfig.js +0 -148
- package/dist/client/constants/contextWindows.js +0 -295
- package/dist/client/constants/enums.js +0 -853
- package/dist/client/constants/index.js +0 -207
- package/dist/client/constants/performance.js +0 -389
- package/dist/client/constants/retry.js +0 -266
- package/dist/client/constants/timeouts.js +0 -182
- package/dist/client/constants/tokens.js +0 -380
- package/dist/client/constants/videoErrors.js +0 -46
- package/dist/client/context/budgetChecker.js +0 -98
- package/dist/client/context/contextCompactor.js +0 -205
- package/dist/client/context/emergencyTruncation.js +0 -88
- package/dist/client/context/errorDetection.js +0 -171
- package/dist/client/context/errors.js +0 -21
- package/dist/client/context/fileTokenBudget.js +0 -127
- package/dist/client/context/prompts/summarizationPrompt.js +0 -117
- package/dist/client/context/stages/fileReadDeduplicator.js +0 -66
- package/dist/client/context/stages/slidingWindowTruncator.js +0 -190
- package/dist/client/context/stages/structuredSummarizer.js +0 -99
- package/dist/client/context/stages/toolOutputPruner.js +0 -52
- package/dist/client/context/summarizationEngine.js +0 -136
- package/dist/client/context/toolOutputLimits.js +0 -78
- package/dist/client/context/toolPairRepair.js +0 -66
- package/dist/client/core/analytics.js +0 -88
- package/dist/client/core/baseProvider.js +0 -1385
- package/dist/client/core/constants.js +0 -140
- package/dist/client/core/conversationMemoryFactory.js +0 -141
- package/dist/client/core/conversationMemoryInitializer.js +0 -128
- package/dist/client/core/conversationMemoryManager.js +0 -344
- package/dist/client/core/dynamicModels.js +0 -358
- package/dist/client/core/evaluation.js +0 -309
- package/dist/client/core/evaluationProviders.js +0 -248
- package/dist/client/core/factory.js +0 -412
- package/dist/client/core/infrastructure/baseError.js +0 -22
- package/dist/client/core/infrastructure/baseFactory.js +0 -54
- package/dist/client/core/infrastructure/baseRegistry.js +0 -53
- package/dist/client/core/infrastructure/index.js +0 -5
- package/dist/client/core/infrastructure/retry.js +0 -20
- package/dist/client/core/infrastructure/typedEventEmitter.js +0 -23
- package/dist/client/core/modelConfiguration.js +0 -851
- package/dist/client/core/modules/GenerationHandler.js +0 -588
- package/dist/client/core/modules/MessageBuilder.js +0 -273
- package/dist/client/core/modules/StreamHandler.js +0 -185
- package/dist/client/core/modules/TelemetryHandler.js +0 -203
- package/dist/client/core/modules/ToolsManager.js +0 -499
- package/dist/client/core/modules/Utilities.js +0 -331
- package/dist/client/core/redisConversationMemoryManager.js +0 -1435
- package/dist/client/core/streamAnalytics.js +0 -131
- package/dist/client/evaluation/contextBuilder.js +0 -134
- package/dist/client/evaluation/index.js +0 -61
- package/dist/client/evaluation/prompts.js +0 -73
- package/dist/client/evaluation/ragasEvaluator.js +0 -110
- package/dist/client/evaluation/retryManager.js +0 -78
- package/dist/client/evaluation/scoring.js +0 -61
- package/dist/client/factories/providerFactory.js +0 -166
- package/dist/client/factories/providerRegistry.js +0 -166
- package/dist/client/features/ppt/constants.js +0 -896
- package/dist/client/features/ppt/contentPlanner.js +0 -529
- package/dist/client/features/ppt/presentationOrchestrator.js +0 -236
- package/dist/client/features/ppt/slideGenerator.js +0 -532
- package/dist/client/features/ppt/slideRenderers.js +0 -2383
- package/dist/client/features/ppt/slideTypeInference.js +0 -405
- package/dist/client/features/ppt/types.js +0 -13
- package/dist/client/features/ppt/utils.js +0 -443
- package/dist/client/files/fileReferenceRegistry.js +0 -1543
- package/dist/client/files/fileTools.js +0 -450
- package/dist/client/files/streamingReader.js +0 -321
- package/dist/client/files/types.js +0 -23
- package/dist/client/hitl/hitlErrors.js +0 -54
- package/dist/client/hitl/hitlManager.js +0 -460
- package/dist/client/mcp/agentExposure.js +0 -356
- package/dist/client/mcp/auth/index.js +0 -11
- package/dist/client/mcp/auth/oauthClientProvider.js +0 -325
- package/dist/client/mcp/auth/tokenStorage.js +0 -134
- package/dist/client/mcp/batching/index.js +0 -10
- package/dist/client/mcp/batching/requestBatcher.js +0 -441
- package/dist/client/mcp/caching/index.js +0 -10
- package/dist/client/mcp/caching/toolCache.js +0 -433
- package/dist/client/mcp/elicitation/elicitationManager.js +0 -376
- package/dist/client/mcp/elicitation/index.js +0 -11
- package/dist/client/mcp/elicitation/types.js +0 -10
- package/dist/client/mcp/elicitationProtocol.js +0 -375
- package/dist/client/mcp/enhancedToolDiscovery.js +0 -481
- package/dist/client/mcp/externalServerManager.js +0 -1478
- package/dist/client/mcp/factory.js +0 -161
- package/dist/client/mcp/flexibleToolValidator.js +0 -161
- package/dist/client/mcp/httpRateLimiter.js +0 -391
- package/dist/client/mcp/httpRetryHandler.js +0 -178
- package/dist/client/mcp/index.js +0 -74
- package/dist/client/mcp/mcpCircuitBreaker.js +0 -427
- package/dist/client/mcp/mcpClientFactory.js +0 -708
- package/dist/client/mcp/mcpRegistryClient.js +0 -488
- package/dist/client/mcp/mcpServerBase.js +0 -373
- package/dist/client/mcp/multiServerManager.js +0 -579
- package/dist/client/mcp/registry.js +0 -158
- package/dist/client/mcp/routing/index.js +0 -10
- package/dist/client/mcp/routing/toolRouter.js +0 -416
- package/dist/client/mcp/serverCapabilities.js +0 -502
- package/dist/client/mcp/servers/agent/directToolsServer.js +0 -150
- package/dist/client/mcp/toolAnnotations.js +0 -239
- package/dist/client/mcp/toolConverter.js +0 -258
- package/dist/client/mcp/toolDiscoveryService.js +0 -798
- package/dist/client/mcp/toolIntegration.js +0 -334
- package/dist/client/mcp/toolRegistry.js +0 -729
- package/dist/client/memory/hippocampusInitializer.js +0 -19
- package/dist/client/memory/memoryRetrievalTools.js +0 -166
- package/dist/client/middleware/builtin/analytics.js +0 -132
- package/dist/client/middleware/builtin/autoEvaluation.js +0 -203
- package/dist/client/middleware/builtin/guardrails.js +0 -109
- package/dist/client/middleware/builtin/lifecycle.js +0 -168
- package/dist/client/middleware/factory.js +0 -327
- package/dist/client/middleware/registry.js +0 -295
- package/dist/client/middleware/utils/guardrailsUtils.js +0 -396
- package/dist/client/models/anthropicModels.js +0 -527
- package/dist/client/neurolink.js +0 -8233
- package/dist/client/observability/exporterRegistry.js +0 -413
- package/dist/client/observability/exporters/arizeExporter.js +0 -138
- package/dist/client/observability/exporters/baseExporter.js +0 -190
- package/dist/client/observability/exporters/braintrustExporter.js +0 -154
- package/dist/client/observability/exporters/datadogExporter.js +0 -196
- package/dist/client/observability/exporters/laminarExporter.js +0 -302
- package/dist/client/observability/exporters/langfuseExporter.js +0 -209
- package/dist/client/observability/exporters/langsmithExporter.js +0 -143
- package/dist/client/observability/exporters/otelExporter.js +0 -164
- package/dist/client/observability/exporters/posthogExporter.js +0 -287
- package/dist/client/observability/exporters/sentryExporter.js +0 -165
- package/dist/client/observability/index.js +0 -31
- package/dist/client/observability/metricsAggregator.js +0 -556
- package/dist/client/observability/otelBridge.js +0 -131
- package/dist/client/observability/retryPolicy.js +0 -383
- package/dist/client/observability/sampling/samplers.js +0 -216
- package/dist/client/observability/spanProcessor.js +0 -303
- package/dist/client/observability/tokenTracker.js +0 -413
- package/dist/client/observability/types/exporterTypes.js +0 -5
- package/dist/client/observability/types/index.js +0 -4
- package/dist/client/observability/types/spanTypes.js +0 -92
- package/dist/client/observability/utils/safeMetadata.js +0 -25
- package/dist/client/observability/utils/spanSerializer.js +0 -292
- package/dist/client/processors/archive/ArchiveProcessor.js +0 -1308
- package/dist/client/processors/base/BaseFileProcessor.js +0 -614
- package/dist/client/processors/base/types.js +0 -82
- package/dist/client/processors/config/fileTypes.js +0 -520
- package/dist/client/processors/config/index.js +0 -92
- package/dist/client/processors/config/languageMap.js +0 -410
- package/dist/client/processors/config/mimeTypes.js +0 -363
- package/dist/client/processors/config/sizeLimits.js +0 -258
- package/dist/client/processors/document/ExcelProcessor.js +0 -590
- package/dist/client/processors/document/OpenDocumentProcessor.js +0 -212
- package/dist/client/processors/document/PptxProcessor.js +0 -157
- package/dist/client/processors/document/RtfProcessor.js +0 -361
- package/dist/client/processors/document/WordProcessor.js +0 -353
- package/dist/client/processors/errors/FileErrorCode.js +0 -255
- package/dist/client/processors/errors/errorHelpers.js +0 -386
- package/dist/client/processors/errors/errorSerializer.js +0 -507
- package/dist/client/processors/errors/index.js +0 -49
- package/dist/client/processors/markup/SvgProcessor.js +0 -240
- package/dist/client/processors/media/AudioProcessor.js +0 -707
- package/dist/client/processors/media/VideoProcessor.js +0 -1045
- package/dist/client/providers/amazonBedrock.js +0 -1512
- package/dist/client/providers/amazonSagemaker.js +0 -162
- package/dist/client/providers/anthropic.js +0 -831
- package/dist/client/providers/azureOpenai.js +0 -143
- package/dist/client/providers/googleAiStudio.js +0 -1200
- package/dist/client/providers/googleNativeGemini3.js +0 -543
- package/dist/client/providers/googleVertex.js +0 -2936
- package/dist/client/providers/huggingFace.js +0 -315
- package/dist/client/providers/litellm.js +0 -488
- package/dist/client/providers/mistral.js +0 -157
- package/dist/client/providers/ollama.js +0 -1579
- package/dist/client/providers/openAI.js +0 -627
- package/dist/client/providers/openRouter.js +0 -543
- package/dist/client/providers/openaiCompatible.js +0 -290
- package/dist/client/providers/providerTypeUtils.js +0 -46
- package/dist/client/providers/sagemaker/adaptive-semaphore.js +0 -215
- package/dist/client/providers/sagemaker/client.js +0 -472
- package/dist/client/providers/sagemaker/config.js +0 -317
- package/dist/client/providers/sagemaker/detection.js +0 -606
- package/dist/client/providers/sagemaker/error-constants.js +0 -227
- package/dist/client/providers/sagemaker/errors.js +0 -299
- package/dist/client/providers/sagemaker/language-model.js +0 -775
- package/dist/client/providers/sagemaker/parsers.js +0 -634
- package/dist/client/providers/sagemaker/streaming.js +0 -331
- package/dist/client/providers/sagemaker/structured-parser.js +0 -625
- package/dist/client/proxy/accountQuota.js +0 -162
- package/dist/client/proxy/claudeFormat.js +0 -595
- package/dist/client/proxy/modelRouter.js +0 -29
- package/dist/client/proxy/oauthFetch.js +0 -367
- package/dist/client/proxy/proxyFetch.js +0 -586
- package/dist/client/proxy/requestLogger.js +0 -207
- package/dist/client/proxy/tokenRefresh.js +0 -124
- package/dist/client/proxy/usageStats.js +0 -74
- package/dist/client/proxy/utils/noProxyUtils.js +0 -149
- package/dist/client/rag/ChunkerFactory.js +0 -320
- package/dist/client/rag/ChunkerRegistry.js +0 -421
- package/dist/client/rag/chunkers/BaseChunker.js +0 -143
- package/dist/client/rag/chunkers/CharacterChunker.js +0 -28
- package/dist/client/rag/chunkers/HTMLChunker.js +0 -38
- package/dist/client/rag/chunkers/JSONChunker.js +0 -68
- package/dist/client/rag/chunkers/LaTeXChunker.js +0 -63
- package/dist/client/rag/chunkers/MarkdownChunker.js +0 -306
- package/dist/client/rag/chunkers/RecursiveChunker.js +0 -139
- package/dist/client/rag/chunkers/SemanticMarkdownChunker.js +0 -138
- package/dist/client/rag/chunkers/SentenceChunker.js +0 -66
- package/dist/client/rag/chunkers/TokenChunker.js +0 -61
- package/dist/client/rag/chunkers/index.js +0 -15
- package/dist/client/rag/chunking/characterChunker.js +0 -142
- package/dist/client/rag/chunking/chunkerRegistry.js +0 -194
- package/dist/client/rag/chunking/htmlChunker.js +0 -247
- package/dist/client/rag/chunking/index.js +0 -17
- package/dist/client/rag/chunking/jsonChunker.js +0 -281
- package/dist/client/rag/chunking/latexChunker.js +0 -251
- package/dist/client/rag/chunking/markdownChunker.js +0 -373
- package/dist/client/rag/chunking/recursiveChunker.js +0 -148
- package/dist/client/rag/chunking/semanticChunker.js +0 -306
- package/dist/client/rag/chunking/sentenceChunker.js +0 -230
- package/dist/client/rag/chunking/tokenChunker.js +0 -183
- package/dist/client/rag/document/MDocument.js +0 -392
- package/dist/client/rag/document/index.js +0 -5
- package/dist/client/rag/document/loaders.js +0 -500
- package/dist/client/rag/errors/RAGError.js +0 -274
- package/dist/client/rag/errors/index.js +0 -6
- package/dist/client/rag/graphRag/graphRAG.js +0 -401
- package/dist/client/rag/graphRag/index.js +0 -4
- package/dist/client/rag/index.js +0 -141
- package/dist/client/rag/metadata/MetadataExtractorFactory.js +0 -418
- package/dist/client/rag/metadata/MetadataExtractorRegistry.js +0 -362
- package/dist/client/rag/metadata/index.js +0 -9
- package/dist/client/rag/metadata/metadataExtractor.js +0 -280
- package/dist/client/rag/pipeline/RAGPipeline.js +0 -436
- package/dist/client/rag/pipeline/contextAssembly.js +0 -341
- package/dist/client/rag/pipeline/index.js +0 -5
- package/dist/client/rag/ragIntegration.js +0 -321
- package/dist/client/rag/reranker/RerankerFactory.js +0 -430
- package/dist/client/rag/reranker/RerankerRegistry.js +0 -402
- package/dist/client/rag/reranker/index.js +0 -9
- package/dist/client/rag/reranker/reranker.js +0 -277
- package/dist/client/rag/resilience/CircuitBreaker.js +0 -431
- package/dist/client/rag/resilience/RetryHandler.js +0 -304
- package/dist/client/rag/resilience/index.js +0 -7
- package/dist/client/rag/retrieval/hybridSearch.js +0 -335
- package/dist/client/rag/retrieval/index.js +0 -5
- package/dist/client/rag/retrieval/vectorQueryTool.js +0 -307
- package/dist/client/rag/types.js +0 -8
- package/dist/client/sdk/toolRegistration.js +0 -377
- package/dist/client/server/abstract/baseServerAdapter.js +0 -575
- package/dist/client/server/adapters/expressAdapter.js +0 -486
- package/dist/client/server/adapters/fastifyAdapter.js +0 -472
- package/dist/client/server/adapters/honoAdapter.js +0 -632
- package/dist/client/server/adapters/koaAdapter.js +0 -510
- package/dist/client/server/errors.js +0 -486
- package/dist/client/server/factory/serverAdapterFactory.js +0 -160
- package/dist/client/server/index.js +0 -108
- package/dist/client/server/middleware/abortSignal.js +0 -111
- package/dist/client/server/middleware/auth.js +0 -388
- package/dist/client/server/middleware/cache.js +0 -359
- package/dist/client/server/middleware/common.js +0 -281
- package/dist/client/server/middleware/deprecation.js +0 -190
- package/dist/client/server/middleware/mcpBodyAttachment.js +0 -63
- package/dist/client/server/middleware/rateLimit.js +0 -227
- package/dist/client/server/middleware/validation.js +0 -388
- package/dist/client/server/openapi/generator.js +0 -398
- package/dist/client/server/openapi/index.js +0 -36
- package/dist/client/server/openapi/schemas.js +0 -695
- package/dist/client/server/openapi/templates.js +0 -374
- package/dist/client/server/routes/agentRoutes.js +0 -189
- package/dist/client/server/routes/claudeProxyRoutes.js +0 -1600
- package/dist/client/server/routes/healthRoutes.js +0 -187
- package/dist/client/server/routes/index.js +0 -57
- package/dist/client/server/routes/mcpRoutes.js +0 -342
- package/dist/client/server/routes/memoryRoutes.js +0 -350
- package/dist/client/server/routes/openApiRoutes.js +0 -126
- package/dist/client/server/routes/toolRoutes.js +0 -199
- package/dist/client/server/streaming/dataStream.js +0 -486
- package/dist/client/server/streaming/index.js +0 -11
- package/dist/client/server/types.js +0 -67
- package/dist/client/server/utils/redaction.js +0 -334
- package/dist/client/server/utils/validation.js +0 -243
- package/dist/client/server/websocket/WebSocketHandler.js +0 -383
- package/dist/client/server/websocket/index.js +0 -4
- package/dist/client/services/server/ai/observability/instrumentation.js +0 -808
- package/dist/client/telemetry/attributes.js +0 -100
- package/dist/client/telemetry/index.js +0 -26
- package/dist/client/telemetry/telemetryService.js +0 -308
- package/dist/client/telemetry/tracers.js +0 -17
- package/dist/client/telemetry/withSpan.js +0 -34
- package/dist/client/types/actionTypes.js +0 -6
- package/dist/client/types/analytics.js +0 -5
- package/dist/client/types/authTypes.js +0 -9
- package/dist/client/types/circuitBreakerErrors.js +0 -34
- package/dist/client/types/cli.js +0 -21
- package/dist/client/types/clientTypes.js +0 -10
- package/dist/client/types/common.js +0 -51
- package/dist/client/types/configTypes.js +0 -49
- package/dist/client/types/content.js +0 -19
- package/dist/client/types/contextTypes.js +0 -400
- package/dist/client/types/conversation.js +0 -47
- package/dist/client/types/conversationMemoryInterface.js +0 -6
- package/dist/client/types/domainTypes.js +0 -5
- package/dist/client/types/errors.js +0 -167
- package/dist/client/types/evaluation.js +0 -5
- package/dist/client/types/evaluationProviders.js +0 -5
- package/dist/client/types/evaluationTypes.js +0 -1
- package/dist/client/types/externalMcp.js +0 -6
- package/dist/client/types/fileReferenceTypes.js +0 -8
- package/dist/client/types/fileTypes.js +0 -4
- package/dist/client/types/generateTypes.js +0 -1
- package/dist/client/types/guardrails.js +0 -1
- package/dist/client/types/hitlTypes.js +0 -8
- package/dist/client/types/index.js +0 -57
- package/dist/client/types/mcpTypes.js +0 -5
- package/dist/client/types/middlewareTypes.js +0 -1
- package/dist/client/types/modelTypes.js +0 -30
- package/dist/client/types/multimodal.js +0 -135
- package/dist/client/types/observability.js +0 -6
- package/dist/client/types/pptTypes.js +0 -82
- package/dist/client/types/providers.js +0 -111
- package/dist/client/types/proxyTypes.js +0 -16
- package/dist/client/types/ragTypes.js +0 -7
- package/dist/client/types/sdkTypes.js +0 -8
- package/dist/client/types/serviceTypes.js +0 -5
- package/dist/client/types/streamTypes.js +0 -1
- package/dist/client/types/subscriptionTypes.js +0 -9
- package/dist/client/types/taskClassificationTypes.js +0 -5
- package/dist/client/types/tools.js +0 -24
- package/dist/client/types/ttsTypes.js +0 -57
- package/dist/client/types/typeAliases.js +0 -48
- package/dist/client/types/utilities.js +0 -4
- package/dist/client/types/workflowTypes.js +0 -30
- package/dist/client/utils/async/withTimeout.js +0 -98
- package/dist/client/utils/asyncMutex.js +0 -60
- package/dist/client/utils/conversationMemory.js +0 -431
- package/dist/client/utils/csvProcessor.js +0 -846
- package/dist/client/utils/errorHandling.js +0 -936
- package/dist/client/utils/evaluationUtils.js +0 -131
- package/dist/client/utils/factoryProcessing.js +0 -589
- package/dist/client/utils/fileDetector.js +0 -2161
- package/dist/client/utils/imageCache.js +0 -376
- package/dist/client/utils/imageProcessor.js +0 -704
- package/dist/client/utils/logger.js +0 -491
- package/dist/client/utils/mcpDefaults.js +0 -134
- package/dist/client/utils/messageBuilder.js +0 -1653
- package/dist/client/utils/modelAliasResolver.js +0 -54
- package/dist/client/utils/modelDetection.js +0 -80
- package/dist/client/utils/modelRouter.js +0 -292
- package/dist/client/utils/multimodalOptionsBuilder.js +0 -65
- package/dist/client/utils/observabilityHelpers.js +0 -47
- package/dist/client/utils/parameterValidation.js +0 -966
- package/dist/client/utils/pdfProcessor.js +0 -410
- package/dist/client/utils/performance.js +0 -222
- package/dist/client/utils/pricing.js +0 -340
- package/dist/client/utils/promptRedaction.js +0 -62
- package/dist/client/utils/providerConfig.js +0 -1009
- package/dist/client/utils/providerHealth.js +0 -1237
- package/dist/client/utils/providerRetry.js +0 -112
- package/dist/client/utils/providerUtils.js +0 -434
- package/dist/client/utils/rateLimiter.js +0 -200
- package/dist/client/utils/redis.js +0 -368
- package/dist/client/utils/retryHandler.js +0 -269
- package/dist/client/utils/retryability.js +0 -22
- package/dist/client/utils/sanitizers/svg.js +0 -481
- package/dist/client/utils/schemaConversion.js +0 -255
- package/dist/client/utils/taskClassificationUtils.js +0 -149
- package/dist/client/utils/taskClassifier.js +0 -94
- package/dist/client/utils/thinkingConfig.js +0 -104
- package/dist/client/utils/timeout.js +0 -359
- package/dist/client/utils/tokenEstimation.js +0 -142
- package/dist/client/utils/tokenLimits.js +0 -125
- package/dist/client/utils/tokenUtils.js +0 -239
- package/dist/client/utils/toolUtils.js +0 -75
- package/dist/client/utils/transformationUtils.js +0 -554
- package/dist/client/utils/ttsProcessor.js +0 -286
- package/dist/client/utils/typeUtils.js +0 -97
- package/dist/client/utils/videoAnalysisProcessor.js +0 -67
- package/dist/client/workflow/config.js +0 -398
- package/dist/client/workflow/core/ensembleExecutor.js +0 -407
- package/dist/client/workflow/core/judgeScorer.js +0 -544
- package/dist/client/workflow/core/responseConditioner.js +0 -225
- package/dist/client/workflow/core/types/conditionerTypes.js +0 -7
- package/dist/client/workflow/core/types/ensembleTypes.js +0 -7
- package/dist/client/workflow/core/types/index.js +0 -7
- package/dist/client/workflow/core/types/judgeTypes.js +0 -7
- package/dist/client/workflow/core/types/layerTypes.js +0 -7
- package/dist/client/workflow/core/types/registryTypes.js +0 -7
- package/dist/client/workflow/core/workflowRegistry.js +0 -304
- package/dist/client/workflow/core/workflowRunner.js +0 -586
- package/dist/client/workflow/index.js +0 -50
- package/dist/client/workflow/types.js +0 -9
- package/dist/client/workflow/utils/types/index.js +0 -7
- package/dist/client/workflow/utils/workflowMetrics.js +0 -311
- package/dist/client/workflow/utils/workflowValidation.js +0 -420
- package/dist/client/workflow/workflows/adaptiveWorkflow.js +0 -366
- package/dist/client/workflow/workflows/consensusWorkflow.js +0 -192
- package/dist/client/workflow/workflows/fallbackWorkflow.js +0 -225
- package/dist/client/workflow/workflows/multiJudgeWorkflow.js +0 -351
- /package/dist/client/{client/reactHooks.js → reactHooks.js} +0 -0
|
@@ -1,1653 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Message Builder Utility
|
|
3
|
-
* Centralized logic for building message arrays from TextGenerationOptions
|
|
4
|
-
* Enhanced with multimodal support for images
|
|
5
|
-
*/
|
|
6
|
-
import { existsSync, readFileSync, statSync } from "fs";
|
|
7
|
-
import { getGlobalDispatcher, interceptors, request } from "undici";
|
|
8
|
-
import { MultimodalLogger, ProviderImageAdapter, } from "../adapters/providerImageAdapter.js";
|
|
9
|
-
import { CONVERSATION_INSTRUCTIONS, STRUCTURED_OUTPUT_INSTRUCTIONS, } from "../config/conversationMemory.js";
|
|
10
|
-
import { getAvailableInputTokens } from "../constants/contextWindows.js";
|
|
11
|
-
import { enforceAggregateFileBudget, FILE_READ_BUDGET_PERCENT, } from "../context/fileTokenBudget.js";
|
|
12
|
-
import { SIZE_TIER_THRESHOLDS } from "../files/types.js";
|
|
13
|
-
import { tracers, ATTR, withSpan } from "../telemetry/index.js";
|
|
14
|
-
import { FileDetector } from "./fileDetector.js";
|
|
15
|
-
import { getImageCache } from "./imageCache.js";
|
|
16
|
-
import { logger } from "./logger.js";
|
|
17
|
-
import { PDFImageConverter, PDFProcessor } from "./pdfProcessor.js";
|
|
18
|
-
import { urlDownloadRateLimiter } from "./rateLimiter.js";
|
|
19
|
-
import { estimateTokens } from "./tokenEstimation.js";
|
|
20
|
-
// ---------------------------------------------------------------------------
|
|
21
|
-
// SDK-7: Lightweight file-type inference helpers for budget estimation
|
|
22
|
-
// These avoid calling the full FileDetector pipeline — they only need to
|
|
23
|
-
// classify files into broad categories (video, audio, image, etc.) so
|
|
24
|
-
// estimatePostProcessingTokens() can use type-aware estimates.
|
|
25
|
-
// ---------------------------------------------------------------------------
|
|
26
|
-
/**
 * Extension → file type mapping for budget estimation.
 *
 * Keys are lower-case file extensions without the leading dot; values are the
 * broad category the extension is classified under. Several extensions may
 * share one category (for example "xls" and "ods" both map to "xlsx").
 *
 * The table is frozen: it is a shared module-level constant, and an accidental
 * write would silently change how every later lookup classifies files.
 */
const EXTENSION_TYPE_MAP = Object.freeze({
    // Video
    mp4: "video",
    mkv: "video",
    mov: "video",
    avi: "video",
    webm: "video",
    wmv: "video",
    flv: "video",
    m4v: "video",
    // Audio
    mp3: "audio",
    wav: "audio",
    ogg: "audio",
    flac: "audio",
    m4a: "audio",
    aac: "audio",
    wma: "audio",
    opus: "audio",
    // Image
    jpg: "image",
    jpeg: "image",
    png: "image",
    gif: "image",
    webp: "image",
    bmp: "image",
    tiff: "image",
    tif: "image",
    avif: "image",
    // Archive
    zip: "archive",
    tar: "archive",
    gz: "archive",
    tgz: "archive",
    rar: "archive",
    "7z": "archive",
    jar: "archive",
    // Documents (spreadsheet, word-processor and presentation families)
    xlsx: "xlsx",
    xls: "xlsx",
    ods: "xlsx",
    docx: "docx",
    doc: "docx",
    odt: "docx",
    rtf: "docx",
    pptx: "pptx",
    ppt: "pptx",
    odp: "pptx",
    // PDF
    pdf: "pdf",
    // SVG
    svg: "svg",
    // CSV (tab-separated files share the same category)
    csv: "csv",
    tsv: "csv",
});
|
|
83
|
-
/**
 * Infer file type from the extension in a file path or URL.
 *
 * Anything from the first "?" or "#" onward is dropped, then the text after
 * the last "." is lower-cased and looked up in EXTENSION_TYPE_MAP.
 *
 * @param {string} filePath - File path or URL to inspect.
 * @returns {string | undefined} The mapped file type, or undefined when the
 *   input contains no "." or the extension is not a key of EXTENSION_TYPE_MAP.
 */
function inferFileTypeFromExtension(filePath) {
    // Strip query string / fragment for URLs
    const cleaned = filePath.split("?")[0].split("#")[0];
    const lastDot = cleaned.lastIndexOf(".");
    if (lastDot === -1) {
        return undefined;
    }
    const ext = cleaned.slice(lastDot + 1).toLowerCase();
    // Own-property check: a bare bracket lookup also resolves inherited
    // Object.prototype members, so "x.constructor" or "x.__proto__" would
    // yield a function/object instead of undefined.
    if (!Object.hasOwn(EXTENSION_TYPE_MAP, ext)) {
        return undefined;
    }
    return EXTENSION_TYPE_MAP[ext];
}
|
|
97
|
-
/**
 * Classify a Buffer by its leading magic bytes.
 * Only common binary formats are recognised; anything else (including every
 * plain-text format) yields undefined, as do buffers shorter than 4 bytes.
 */
function inferFileTypeFromBuffer(buf) {
    if (buf.length < 4) {
        return undefined;
    }
    // True when `bytes` appear in buf starting at `offset`.
    const hasBytes = (offset, bytes) => buf.length >= offset + bytes.length &&
        bytes.every((byte, i) => buf[offset + i] === byte);
    const RIFF = [0x52, 0x49, 0x46, 0x46];
    // Each row: [type, ...[offset, bytes]]; every part of a row must match.
    // Rows are tried top to bottom and the first full match wins.
    const signatures = [
        ["image", [0, [0x89, 0x50, 0x4e, 0x47]]], // PNG
        ["image", [0, [0xff, 0xd8, 0xff]]], // JPEG
        ["image", [0, [0x47, 0x49, 0x46]]], // GIF
        ["image", [0, RIFF], [8, [0x57, 0x45, 0x42, 0x50]]], // WebP (RIFF + WEBP)
        ["pdf", [0, [0x25, 0x50, 0x44, 0x46]]], // PDF
        ["video", [4, [0x66, 0x74, 0x79, 0x70]]], // MP4/MOV (ftyp at offset 4)
        ["video", [0, [0x1a, 0x45, 0xdf, 0xa3]]], // MKV/WebM (EBML)
        ["video", [0, RIFF], [8, [0x41, 0x56, 0x49, 0x20]]], // AVI (RIFF + AVI)
        ["audio", [0, RIFF], [8, [0x57, 0x41, 0x56, 0x45]]], // WAV (RIFF + WAVE)
        ["audio", [0, [0x49, 0x44, 0x33]]], // MP3 (ID3 tag)
        ["audio", [0, [0x66, 0x4c, 0x61, 0x43]]], // FLAC
        ["audio", [0, [0x4f, 0x67, 0x67, 0x53]]], // OGG
        // ZIP (also .xlsx, .docx, .pptx — but without extension we default to archive)
        ["archive", [0, [0x50, 0x4b, 0x03, 0x04]]],
        ["archive", [0, [0x1f, 0x8b]]], // GZIP
        ["archive", [0, [0x52, 0x61, 0x72, 0x21]]], // RAR
    ];
    for (const [type, ...parts] of signatures) {
        if (parts.every(([offset, bytes]) => hasBytes(offset, bytes))) {
            return type;
        }
    }
    return undefined;
}
|
|
216
|
-
/**
 * Type guard to check if an image input has alt text.
 *
 * An input qualifies when it is a non-null object that is not a Buffer and
 * that has a `data` property (own or inherited, since `in` is used).
 *
 * @param {unknown} image - Candidate image input.
 * @returns {boolean} True for the object form carrying `data`; false for
 *   null, Buffers, strings and other primitives.
 */
function isImageWithAltText(image) {
    return (typeof image === "object" &&
        // typeof null is "object"; without this guard the `in` check below
        // throws a TypeError for null inputs.
        image !== null &&
        !Buffer.isBuffer(image) &&
        "data" in image);
}
|
|
222
|
-
/**
 * Return the raw image payload of an image input: the `data` field for the
 * alt-text object form, otherwise the input itself.
 */
function extractImageData(image) {
    return isImageWithAltText(image) ? image.data : image;
}
|
|
231
|
-
/**
 * Return the `altText` of an image input in the alt-text object form;
 * undefined for every other input.
 */
function extractAltText(image) {
    return isImageWithAltText(image) ? image.altText : undefined;
}
|
|
240
|
-
/**
 * Type guard for message roles: accepts exactly the strings "user",
 * "assistant" and "system".
 */
function isValidRole(role) {
    const supportedRoles = ["user", "assistant", "system"];
    // includes() compares without coercion, so non-string values never match.
    return supportedRoles.includes(role);
}
|
|
247
|
-
/**
 * Type guard for content items.
 *
 * Accepted shapes:
 *  - text:  `text` is a string
 *  - image: `image` is a string and `mimeType` is absent or a string
 *  - file:  `data` is a Buffer and `mimeType` is a string
 * Everything else, including non-objects, is rejected.
 */
function isValidContentItem(item) {
    const isObject = Boolean(item) && typeof item === "object";
    if (!isObject) {
        return false;
    }
    switch (item.type) {
        case "text":
            return typeof item.text === "string";
        case "image":
            if (typeof item.image !== "string") {
                return false;
            }
            return item.mimeType === undefined || typeof item.mimeType === "string";
        case "file":
            if (!Buffer.isBuffer(item.data)) {
                return false;
            }
            return typeof item.mimeType === "string";
        default:
            return false;
    }
}
|
|
269
|
-
/**
 * Convert one content item into the AI SDK content shape.
 * Returns null for anything isValidContentItem rejects or that cannot be
 * mapped; `mimeType` is carried over as `mediaType`.
 */
function convertContentItem(item) {
    if (!isValidContentItem(item)) {
        return null;
    }
    switch (item.type) {
        case "text":
            return typeof item.text === "string"
                ? { type: "text", text: item.text }
                : null;
        case "image": {
            if (typeof item.image !== "string") {
                return null;
            }
            const converted = { type: "image", image: item.image };
            // mediaType is only attached for a truthy mimeType.
            if (item.mimeType) {
                converted.mediaType = item.mimeType;
            }
            return converted;
        }
        case "file":
            // A falsy mimeType (e.g. "") yields null here.
            return Buffer.isBuffer(item.data) && item.mimeType
                ? { type: "file", data: item.data, mediaType: item.mimeType }
                : null;
        default:
            return null;
    }
}
|
|
298
|
-
/**
 * Convert MultimodalChatMessage[] into ModelMessage[].
 *
 * Messages with an invalid role, with no convertible content parts, or with
 * content that is neither a string nor an array are logged and dropped.
 * Array content is kept as parts for user messages, flattened to a text
 * string for assistant messages, and reduced to the first text part for
 * system messages.
 */
export function convertToModelMessages(messages) {
    // Flatten converted parts into the single string an assistant turn carries.
    const joinAssistantText = (parts) => {
        const texts = parts.filter((part) => part.type === "text");
        if (texts.length === 1) {
            return texts[0].text;
        }
        // No text parts join to ""; several are separated by one space.
        return texts.map((part) => part.text).join(" ");
    };
    const convertOne = (msg) => {
        if (!isValidRole(msg.role)) {
            logger.warn("Invalid message role found, skipping", { role: msg.role });
            return null;
        }
        const { role, content } = msg;
        const isKnownRole = role === "system" || role === "user" || role === "assistant";
        // Plain string content passes straight through for all three roles.
        if (typeof content === "string" && isKnownRole) {
            return { role, content };
        }
        // Array content (multimodal) - only user messages keep the full parts.
        if (Array.isArray(content)) {
            const validContent = content.flatMap((part) => {
                const converted = convertContentItem(part);
                return converted === null ? [] : [converted];
            });
            if (validContent.length === 0) {
                logger.warn("No valid content items found in multimodal message, skipping");
                return null;
            }
            switch (role) {
                case "user":
                    return { role: "user", content: validContent };
                case "assistant":
                    // Non-text parts are discarded for assistant messages.
                    return { role: "assistant", content: joinAssistantText(validContent) };
                default: {
                    // System messages keep only their first text part.
                    const firstText = validContent.find((part) => part.type === "text");
                    return { role: "system", content: firstText?.text || "" };
                }
            }
        }
        logger.warn("Invalid message content type found, skipping", {
            contentType: typeof content,
        });
        return null;
    };
    return messages
        .map((msg) => convertOne(msg))
        .filter((converted) => converted !== null);
}
|
|
394
|
-
/**
 * Convert a ChatMessage into a ModelMessage.
 * Only user, assistant and system roles are kept; any other role (such as
 * tool_call / tool_result) yields null so the caller can skip it.
 */
function toModelMessage(message) {
    const { role, content } = message;
    switch (role) {
        case "user":
        case "assistant":
        case "system":
            return { role, content };
        default:
            return null;
    }
}
|
|
409
|
-
/**
 * Render CSV metadata as a single "**Metadata**: a | b | c" line.
 * Returns "" when none of the known fields contributes a segment.
 */
function formatCSVMetadata(metadata) {
    const { rowCount, columnCount, columnNames, hasEmptyColumns } = metadata;
    const segments = [
        ...(rowCount !== undefined ? [`${rowCount} data rows`] : []),
        ...(columnCount !== undefined ? [`${columnCount} columns`] : []),
        ...(columnNames && columnNames.length > 0
            ? [`Columns: [${columnNames.join(", ")}]`]
            : []),
        ...(hasEmptyColumns ? [`⚠️ Contains empty column names`] : []),
    ];
    return segments.length === 0 ? "" : `**Metadata**: ${segments.join(" | ")}`;
}
|
|
429
|
-
/**
 * Decide whether structured output mode applies: a schema must be present
 * and the requested output format must be "json" or "structured".
 */
function shouldUseStructuredOutput(options) {
    if (!options.schema) {
        return false;
    }
    const format = options.output?.format;
    return format === "json" || format === "structured";
}
|
|
438
|
-
/**
 * Emit a compact debug summary of a composed message array: message count,
 * per-role counts, total characters of string content, and a token estimate
 * of one token per four characters. Message content itself is never logged,
 * and nothing is computed unless debug logging is enabled.
 */
function logMessageComposition(messages, requestId) {
    const debugEnabled = logger.shouldLog("debug");
    if (!debugEnabled) {
        return;
    }
    const roles = {};
    let totalChars = 0;
    for (const { role, content } of messages) {
        roles[role] = (roles[role] || 0) + 1;
        // Only string content is measured; array content counts as 0 chars.
        if (typeof content === "string") {
            totalChars += content.length;
        }
    }
    const summary = {
        requestId,
        totalMessages: messages.length,
        roles,
        totalChars,
        estimatedTokens: Math.ceil(totalChars / 4),
    };
    logger.debug("[MessageBuilder] Composed", summary);
}
|
|
463
|
-
/**
 * Assemble the message array sent to an AI provider.
 *
 * Order of the result: an optional system message (system prompt plus
 * conversation / structured-output instructions), the conversation history
 * with unsupported roles filtered out, then the current user prompt.
 * Accepts both TextGenerationOptions (`prompt`) and StreamOptions
 * (`input.text`); CSV content found in `input.csvFiles` / `input.files` is
 * placed in front of the user prompt.
 */
export async function buildMessagesArray(options) {
    const messages = [];
    const history = options.conversationMessages;
    const hasConversationHistory = history && history.length > 0;
    // ── System prompt ────────────────────────────────────────────────
    let systemPrompt = options.systemPrompt?.trim() || "";
    const instructionSuffixes = [];
    if (hasConversationHistory) {
        instructionSuffixes.push(CONVERSATION_INSTRUCTIONS);
    }
    if (shouldUseStructuredOutput(options)) {
        instructionSuffixes.push(STRUCTURED_OUTPUT_INSTRUCTIONS);
    }
    for (const suffix of instructionSuffixes) {
        // Trim before each append, exactly as each step did on its own.
        systemPrompt = `${systemPrompt.trim()}${suffix}`;
    }
    const systemContent = systemPrompt.trim();
    if (systemContent) {
        messages.push({
            role: "system",
            content: systemContent,
            providerOptions: {
                anthropic: { cacheControl: { type: "ephemeral" } },
            },
        });
    }
    // ── Conversation history (tool messages are filtered out) ────────
    if (hasConversationHistory && options.conversationMessages) {
        for (const chatMessage of options.conversationMessages) {
            const coreMessage = toModelMessage(chatMessage);
            if (coreMessage) {
                messages.push(coreMessage);
            }
        }
    }
    // ── Current user prompt: `prompt` wins over `input.text` ─────────
    let currentPrompt;
    if ("prompt" in options && options.prompt) {
        currentPrompt = options.prompt;
    }
    else if ("input" in options && options.input?.text) {
        currentPrompt = options.input.text;
    }
    // ── CSV injection ────────────────────────────────────────────────
    if ("input" in options && options.input) {
        const input = options.input;
        const csvOptions = "csvOptions" in options ? options.csvOptions : undefined;
        let csvContent = "";
        // Heading plus optional metadata line shared by both CSV sources.
        const openCsvSection = (filename, result) => {
            const heading = `\n\n## CSV Data from "${filename}":\n`;
            if (!result.metadata) {
                return heading;
            }
            const metadataText = formatCSVMetadata(result.metadata);
            return metadataText ? heading + metadataText + `\n\n` : heading;
        };
        // Explicit csvFiles: a failure is reported inside the prompt.
        if (input.csvFiles && input.csvFiles.length > 0) {
            for (let i = 0; i < input.csvFiles.length; i++) {
                const csvFile = input.csvFiles[i];
                const filename = extractFilename(csvFile, i);
                const filePath = typeof csvFile === "string" ? csvFile : filename;
                try {
                    const result = await FileDetector.detectAndProcess(csvFile, {
                        allowedTypes: ["csv"],
                        csvOptions: csvOptions,
                    });
                    csvContent +=
                        openCsvSection(filename, result) +
                            buildCSVToolInstructions(filePath) +
                            result.content;
                    logger.info(`[CSV] ✅ Processed: ${filename}`, result.metadata);
                }
                catch (error) {
                    logger.error(`[CSV] ❌ Failed to process ${filename}:`, error);
                    csvContent += `\n\n## CSV Data Error: Failed to process "${filename}"\nReason: ${error instanceof Error ? error.message : "Unknown error"}`;
                }
            }
        }
        // Unified files: only CSV is picked up here; failures are skipped
        // with a debug log.
        if (input.files && input.files.length > 0) {
            for (const file of input.files) {
                const filename = extractFilename(file);
                try {
                    const result = await FileDetector.detectAndProcess(file, {
                        maxSize: 50 * 1024 * 1024,
                        allowedTypes: ["csv"],
                        csvOptions: csvOptions,
                    });
                    if (result.type === "csv") {
                        csvContent += openCsvSection(filename, result) + result.content;
                        logger.info(`[FileDetector] ✅ CSV: ${filename}`, result.metadata);
                    }
                }
                catch (error) {
                    logger.debug(`[FileDetector] Skipped ${filename}: ${error instanceof Error ? error.message : String(error)}`);
                }
            }
        }
        // CSV content goes in front of whatever prompt text exists.
        if (csvContent) {
            currentPrompt = csvContent + (currentPrompt || "");
        }
    }
    if (currentPrompt?.trim()) {
        messages.push({
            role: "user",
            content: currentPrompt.trim(),
        });
    }
    const reqId = options.context?.requestId;
    logMessageComposition(messages, reqId);
    return messages;
}
|
|
593
|
-
/**
 * Enforce the aggregate file budget on options.input.files.
 *
 * Each file is described by name, byte size and inferred type, and the list
 * is handed to enforceAggregateFileBudget together with the available input
 * tokens for the provider/model. When that call reports exclusions,
 * options.input.files is replaced by the included files only and the returned
 * notices are appended to options.input.text.
 *
 * @param {object} options - Request options; `options.input.files` and
 *   `options.input.text` are mutated in place.
 * @param {string} provider - Passed to getAvailableInputTokens.
 * @param {string} model - Passed to getAvailableInputTokens.
 * @returns {void}
 */
function enforceFileBudget(options, provider, model) {
    const files = options.input.files;
    if (!files || files.length === 0) {
        return;
    }
    const availableTokens = getAvailableInputTokens(provider, model);
    // Size and type of a single entry.
    const measure = (file) => {
        if (Buffer.isBuffer(file)) {
            return { sizeBytes: file.length, fileType: inferFileTypeFromBuffer(file) };
        }
        if (typeof file === "string") {
            let sizeBytes;
            if (existsSync(file)) {
                try {
                    sizeBytes = statSync(file).size;
                }
                catch {
                    // The path exists but could not be stat'ed: count it as empty.
                    sizeBytes = 0;
                }
            }
            else {
                // Not an existing path: sized by the string's own length.
                sizeBytes = file.length;
            }
            return { sizeBytes, fileType: inferFileTypeFromExtension(file) };
        }
        // Any other input shape contributes no size and no type.
        return { sizeBytes: 0, fileType: undefined };
    };
    const budgetFiles = files.map((file, idx) => ({
        name: typeof file === "string" ? file : `file-${idx}`,
        ...measure(file),
        originalIndex: idx,
    }));
    const budgetResult = enforceAggregateFileBudget(budgetFiles.map(({ name, sizeBytes, fileType }) => ({ name, sizeBytes, fileType })), availableTokens);
    if (budgetResult.excluded.length === 0) {
        return;
    }
    // Map every name to the queue of positions that carry it. Names are not
    // unique (the same string can be passed twice), so taking only the first
    // position per name would drop the later included duplicates.
    const positionsByName = new Map();
    for (const { name, originalIndex } of budgetFiles) {
        const queue = positionsByName.get(name);
        if (queue) {
            queue.push(originalIndex);
        }
        else {
            positionsByName.set(name, [originalIndex]);
        }
    }
    const includedIndices = new Set();
    for (const { name } of budgetResult.included) {
        const position = positionsByName.get(name)?.shift();
        if (position !== undefined) {
            includedIndices.add(position);
        }
    }
    options.input.files = options.input.files.filter((_file, idx) => includedIndices.has(idx));
    options.input.text =
        (options.input.text || "") + "\n\n" + budgetResult.notices.join("\n");
    logger.warn(`[FileDetector] Aggregate file budget enforcement: excluded ${budgetResult.excluded.length} file(s)`);
}
|
|
650
|
-
/**
 * Append a detected file result to options.input based on its type.
 *
 * - csv / svg / text and the titled types (archive, xlsx, docx, pptx,
 *   unknown) add a section to options.input.text
 * - image adds result.content to options.input.images
 * - pdf adds result.content to options.input.pdfFiles
 * - video / audio add a text section when content is present and add any
 *   result.images to options.input.images
 * Result types not listed above are ignored.
 *
 * @param {object} result - Detection result (`type`, `content`, and
 *   optionally `metadata`, `mimeType`, `images`).
 * @param {*} file - The original file input; passed to extractFilename.
 * @param {object} options - Request options; `options.input` is mutated.
 * @returns {void}
 */
function appendDetectedFileResult(result, file, options) {
    const filename = extractFilename(file);
    const { input } = options;
    // A missing input.text is treated as "" so the first appended section is
    // not prefixed with the literal string "undefined".
    const appendText = (chunk) => {
        input.text = (input.text ?? "") + chunk;
    };
    const appendImages = (images) => {
        input.images = [...(input.images || []), ...images];
    };
    // Types rendered as one titled section: type -> [title, log line].
    const titledSections = new Map([
        ["archive", ["Archive File", `[FileDetector] ✅ Archive: ${filename}`]],
        ["xlsx", ["Spreadsheet", `[FileDetector] ✅ Spreadsheet: ${filename}`]],
        ["docx", ["Document", `[FileDetector] ✅ Document: ${filename}`]],
        ["pptx", ["Presentation", `[FileDetector] ✅ Presentation: ${filename}`]],
        ["unknown", ["Attached File", `[FileDetector] ⚠️ Unknown format (metadata extracted): ${filename}`]],
    ]);
    const titled = titledSections.get(result.type);
    if (titled) {
        const [title, logLine] = titled;
        if (result.content) {
            appendText(`\n\n## ${title}: "${filename}"\n${result.content}\n`);
        }
        logger.info(logLine);
        return;
    }
    switch (result.type) {
        case "csv": {
            const filePath = typeof file === "string" ? file : filename;
            let csvSection = `\n\n## CSV Data from "${filename}":\n`;
            if (result.metadata) {
                const metadataText = formatCSVMetadata(result.metadata);
                if (metadataText) {
                    csvSection += metadataText + `\n\n`;
                }
            }
            csvSection += buildCSVToolInstructions(filePath);
            csvSection += result.content;
            appendText(csvSection);
            logger.info(`[FileDetector] ✅ CSV: ${filename}`);
            break;
        }
        case "svg":
            // SVG is passed along as fenced XML text, not as an image.
            appendText(`\n\n## SVG Content from "${filename}":\n\`\`\`xml\n${result.content}\n\`\`\`\n`);
            logger.info(`[FileDetector] ✅ SVG (as text): ${filename}`);
            break;
        case "image":
            appendImages([result.content]);
            logger.info(`[FileDetector] ✅ Image: ${result.mimeType}`);
            break;
        case "pdf":
            input.pdfFiles = [...(input.pdfFiles || []), result.content];
            logger.info(`[FileDetector] ✅ PDF: ${filename}`);
            break;
        case "video":
            if (result.content) {
                appendText(`\n\n## Video File: "${filename}"\n${result.content}\n`);
            }
            if (result.images && result.images.length > 0) {
                appendImages(result.images);
                logger.info(`[FileDetector] Added ${result.images.length} video keyframes as images`);
            }
            logger.info(`[FileDetector] ✅ Video: ${filename}`);
            break;
        case "audio":
            if (result.content) {
                appendText(`\n\n## Audio File: "${filename}"\n${result.content}\n`);
            }
            if (result.images && result.images.length > 0) {
                appendImages(result.images);
                logger.info(`[FileDetector] Added audio cover art as image`);
            }
            logger.info(`[FileDetector] ✅ Audio: ${filename}`);
            break;
        case "text": {
            if (result.content) {
                const langHint = getLanguageHint(result.mimeType, filename);
                const MAX_TEXT_FILE_CHARS = 200_000;
                let fileContent = result.content;
                let truncated = false;
                if (fileContent.length > MAX_TEXT_FILE_CHARS) {
                    // Keep the first 75% and the last 25% of the allowance
                    // and mark what was cut from the middle.
                    const headChars = Math.floor(MAX_TEXT_FILE_CHARS * 0.75);
                    const tailChars = Math.floor(MAX_TEXT_FILE_CHARS * 0.25);
                    const omittedChars = fileContent.length - headChars - tailChars;
                    fileContent =
                        fileContent.slice(0, headChars) +
                            `\n\n... [${omittedChars.toLocaleString()} characters omitted — file truncated to fit context window] ...\n\n` +
                            fileContent.slice(-tailChars);
                    truncated = true;
                }
                // With a language hint the content is fenced; otherwise raw.
                const textSection = langHint
                    ? `\n\n## File: "${filename}"\n\`\`\`${langHint}\n${fileContent}\n\`\`\`\n`
                    : `\n\n## File: "${filename}"\n${fileContent}\n`;
                appendText(textSection);
                if (truncated) {
                    logger.warn(`[FileDetector] Large text file "${filename}" truncated from ${result.content.length.toLocaleString()} to ${MAX_TEXT_FILE_CHARS.toLocaleString()} chars`);
                }
            }
            logger.info(`[FileDetector] ✅ Text: ${filename}`);
            break;
        }
        default:
            // Unrecognised result types are left untouched.
            break;
    }
}
|
|
769
|
-
/**
 * Process options.input.files with type auto-detection inside a tracing span.
 *
 * For every file: when a file registry is present and the file is larger
 * than SIZE_TIER_THRESHOLDS.TINY_MAX, registration is attempted first; a
 * successful registration defers processing. Otherwise the file is run
 * through FileDetector and the result is appended to options.input. A
 * failure on one file is logged and the loop continues. After the loop,
 * previews and extracted images of registered files are injected.
 */
async function processUnifiedFilesArray(options, maxSize, provider) {
    const initialFiles = options.input.files;
    if (!initialFiles || initialFiles.length === 0) {
        return;
    }
    const totalFiles = initialFiles.length;
    const spanConfig = {
        name: "neurolink.file.process_all",
        tracer: tracers.file,
        attributes: {
            [ATTR.FILE_TOTAL_COUNT]: totalFiles,
            [ATTR.NL_PROVIDER]: provider,
        },
    };
    return withSpan(spanConfig, async (span) => {
        logger.info(`[NEUROLINK] Processing ${totalFiles} file(s) with auto-detection`);
        options.input.text = options.input.text || "";
        const fileRegistry = options.fileRegistry;
        let includedCount = 0;
        // Lazy registration path; resolves to true when processing was deferred.
        const registerLazily = async (file, fileIdx, filename) => {
            const fileSize = fileRegistry ? getFileSize(file) : 0;
            if (!fileRegistry || !(fileSize > SIZE_TIER_THRESHOLDS.TINY_MAX)) {
                return false;
            }
            const registered = await tryRegisterFileReference(file, fileSize, fileRegistry, fileIdx);
            if (!registered) {
                return false;
            }
            logger.info(`[NEUROLINK] File lazily registered: ${filename} (${fileSize} bytes) — deferred processing`);
            return true;
        };
        // Full processing path: detect the type and extract the content.
        const detect = (file) => {
            // The size cap passed on is never below 100 MiB.
            const genericFileMaxSize = Math.max(maxSize, 100 * 1024 * 1024);
            const rawFileInput = isFileWithMetadata(file) ? file.buffer : file;
            return FileDetector.detectAndProcess(rawFileInput, {
                maxSize: genericFileMaxSize,
                allowedTypes: [
                    "csv",
                    "image",
                    "pdf",
                    "svg",
                    "video",
                    "audio",
                    "archive",
                    "xlsx",
                    "docx",
                    "pptx",
                    "text",
                    "unknown",
                ],
                csvOptions: options.csvOptions,
                provider: provider,
            });
        };
        for (let fileIdx = 0; fileIdx < options.input.files.length; fileIdx++) {
            const file = options.input.files[fileIdx];
            const filename = extractFilename(file, fileIdx);
            try {
                if (await registerLazily(file, fileIdx, filename)) {
                    includedCount++;
                    continue;
                }
                const result = await detect(file);
                appendDetectedFileResult(result, file, options);
                includedCount++;
                // Log what content type was added to the message
                const contentType = result.type === "image" ? "image" : "text";
                logger.info(`[NEUROLINK] File added to message: ${filename} as ${contentType} (type: ${result.type})`);
            }
            catch (error) {
                const errMsg = error instanceof Error ? error.message : String(error);
                logger.error(`[NEUROLINK] File skipped/failed: ${filename} — reason: ${errMsg}`);
            }
        }
        span.setAttribute(ATTR.FILE_INCLUDED_COUNT, includedCount);
        // Inject previews and extracted images for registered files.
        if (fileRegistry && fileRegistry.size > 0) {
            const previewText = await fileRegistry.generatePromptPreview();
            if (previewText) {
                options.input.text = (options.input.text || "") + previewText;
                logger.info(`[FileDetector] Injected previews for ${fileRegistry.size} lazily-registered file(s)`);
            }
            for (const ref of fileRegistry.list()) {
                const extracted = ref.extractedImages;
                if (!extracted || extracted.length === 0) {
                    continue;
                }
                options.input.images = [...(options.input.images || []), ...extracted];
                logger.info(`[FileDetector] Injected ${extracted.length} extracted images from "${ref.filename}"`);
            }
        }
        logger.info(`[NEUROLINK] File processing complete: ${includedCount}/${totalFiles} files included in message`);
    });
}
|
|
859
|
-
/**
 * Process the explicit options.input.csvFiles array and append one section
 * per file to options.input.text. A file that fails to process gets an
 * error section instead, and processing continues with the next file.
 */
async function processExplicitCsvFiles(options) {
    const { input } = options;
    if (!input.csvFiles || input.csvFiles.length === 0) {
        return;
    }
    logger.info(`[CSV] Processing ${input.csvFiles.length} explicit CSV file(s)`);
    input.text = input.text || "";
    for (let i = 0; i < input.csvFiles.length; i++) {
        const csvFile = input.csvFiles[i];
        try {
            const result = await FileDetector.detectAndProcess(csvFile, {
                allowedTypes: ["csv"],
                csvOptions: options.csvOptions,
            });
            const filename = extractFilename(csvFile, i);
            const filePath = typeof csvFile === "string" ? csvFile : filename;
            const heading = `\n\n## CSV Data from "${filename}":\n`;
            const metadataText = result.metadata
                ? formatCSVMetadata(result.metadata)
                : "";
            const metadataBlock = metadataText ? metadataText + `\n\n` : "";
            // Section layout: heading, metadata line, tool instructions, data.
            input.text +=
                heading +
                    metadataBlock +
                    buildCSVToolInstructions(filePath) +
                    result.content;
            logger.info(`[CSV] ✅ Processed: ${filename}`);
        }
        catch (error) {
            logger.error(`[CSV] ❌ Failed:`, error);
            const filename = extractFilename(csvFile, i);
            const reason = error instanceof Error ? error.message : "Unknown error";
            input.text += `\n\n## CSV Data Error: Failed to process "${filename}"`;
            input.text += `\nReason: ${reason}`;
        }
    }
}
|
|
897
|
-
/**
 * Keep the accumulated options.input.text within its share of the available
 * input tokens, then log a token usage breakdown.
 *
 * The text budget is availableTokens * FILE_READ_BUDGET_PERCENT. Text over
 * budget is cut to roughly four characters per budget token, keeping the
 * first 75% and the last 25% around a truncation marker. Does nothing when
 * options.input.text is empty.
 */
function enforcePostProcessingBudget(options, provider, model) {
    const { input } = options;
    if (!input.text) {
        return;
    }
    const availableTokens = getAvailableInputTokens(provider, model);
    const textTokenBudget = Math.floor(availableTokens * FILE_READ_BUDGET_PERCENT);
    const actualTextTokens = estimateTokens(input.text, provider);
    const maxChars = textTokenBudget * 4;
    const overBudget = actualTextTokens > textTokenBudget &&
        textTokenBudget > 0 &&
        input.text.length > maxChars;
    if (overBudget) {
        const headChars = Math.floor(maxChars * 0.75);
        const tailChars = Math.floor(maxChars * 0.25);
        const truncatedTokens = actualTextTokens - textTokenBudget;
        const marker = `\n\n[... ${truncatedTokens.toLocaleString()} tokens of file content truncated to fit context window ...]\n\n`;
        input.text = input.text.slice(0, headChars) + marker + input.text.slice(-tailChars);
        logger.warn(`[FileDetector] Post-processing budget enforcement: truncated ~${truncatedTokens.toLocaleString()} tokens of file content to fit ${textTokenBudget.toLocaleString()} token budget`);
    }
    // Token usage breakdown logging
    const textTokens = estimateTokens(input.text, provider);
    const directImages = input.images?.length ?? 0;
    const contentImages = input.content?.filter((c) => c.type === "image").length ?? 0;
    const imageCount = directImages + contentImages;
    // Each image is counted as a flat 1500 tokens.
    const imageTokens = imageCount * 1500;
    const totalContentTokens = textTokens + imageTokens;
    const contextWindow = getAvailableInputTokens(provider, model);
    const utilization = contextWindow > 0
        ? ((totalContentTokens / contextWindow) * 100).toFixed(1)
        : "N/A";
    const breakdown = [
        `text=${textTokens.toLocaleString()} tokens`,
        `images=${imageCount} (~${imageTokens.toLocaleString()} tokens)`,
        `total=${totalContentTokens.toLocaleString()} tokens`,
        `budget=${contextWindow.toLocaleString()} tokens`,
        `utilization=${utilization}%`,
    ];
    logger.info(`[TokenUsage] Content breakdown: ${breakdown.join(", ")}`);
}
|
|
935
|
-
/**
 * Run every entry of `options.input.pdfFiles` through
 * `FileDetector.detectAndProcess` (restricted to the "pdf" type) and collect
 * the results whose content is a Buffer.
 *
 * @param options - Generation options; only `options.input.pdfFiles` is read.
 * @param maxSize - Maximum accepted file size, forwarded to the detector.
 * @param provider - Provider identifier, forwarded to the detector and used in logs.
 * @returns Array of `{ buffer, filename, pageCount }` entries (empty when no PDFs were supplied).
 * @throws Re-throws any error raised while processing a file, after logging it.
 */
async function processExplicitPdfFiles(options, maxSize, provider) {
    const queued = [];
    const explicitPdfs = options.input.pdfFiles;
    if (!explicitPdfs || explicitPdfs.length === 0) {
        return queued;
    }
    logger.info(`[PDF] Processing ${explicitPdfs.length} explicit PDF file(s) for ${provider}`);
    for (let position = 0; position < explicitPdfs.length; position += 1) {
        const pdfFile = explicitPdfs[position];
        const filename = extractFilename(pdfFile, position);
        try {
            const detection = await FileDetector.detectAndProcess(pdfFile, {
                maxSize,
                allowedTypes: ["pdf"],
                provider,
            });
            // Results whose content is not a Buffer are not queued.
            if (!Buffer.isBuffer(detection.content)) {
                continue;
            }
            const estimatedPages = detection.metadata?.estimatedPages;
            queued.push({
                buffer: detection.content,
                filename,
                pageCount: estimatedPages ?? null,
            });
            logger.info(`[PDF] ✅ Queued for multimodal: ${filename} (${estimatedPages ?? "unknown"} pages)`);
        }
        catch (error) {
            logger.error(`[PDF] ❌ Failed to process ${filename}:`, error);
            throw error;
        }
    }
    return queued;
}
|
|
969
|
-
/**
 * Assemble the system prompt used for multimodal requests.
 *
 * Starts from the trimmed `options.systemPrompt`, then appends, in order:
 * the conversation instructions (when history is present), the structured
 * output instructions (when `shouldUseStructuredOutput(options)` is true) and
 * a file-handling notice (when CSV or PDF files are part of the request).
 *
 * @param options - Generation options (`systemPrompt`, `conversationHistory`, `input.csvFiles`, `input.files`).
 * @param hasPDFFiles - Whether PDF files were queued for this request.
 * @returns The assembled prompt; may be an empty string.
 */
function buildMultimodalSystemPrompt(options, hasPDFFiles) {
    let prompt = options.systemPrompt?.trim() || "";
    const history = options.conversationHistory;
    if (history && history.length > 0) {
        prompt = `${prompt.trim()}${CONVERSATION_INSTRUCTIONS}`;
    }
    if (shouldUseStructuredOutput(options)) {
        prompt = `${prompt.trim()}${STRUCTURED_OUTPUT_INSTRUCTIONS}`;
    }
    const { csvFiles, files } = options.input;
    // In the unified `files` array only string entries ending in ".csv" count as CSVs.
    const isCsvPath = (entry) => typeof entry === "string" ? entry.toLowerCase().endsWith(".csv") : false;
    const hasCSVFiles = (csvFiles && csvFiles.length > 0) || (files && files.some(isCsvPath));
    if (!hasCSVFiles && !hasPDFFiles) {
        return prompt;
    }
    const fileTypes = [];
    if (hasPDFFiles) {
        fileTypes.push("PDFs");
    }
    if (hasCSVFiles) {
        fileTypes.push("CSVs");
    }
    const notice = [
        "IMPORTANT FILE HANDLING INSTRUCTIONS:",
        `- File content (${fileTypes.join(", ")}, images) is already processed and included in this message`,
        "- DO NOT use GitHub tools (get_file_contents, search_code, etc.) for local files - they only work for remote repository files",
        "- Analyze the provided file content directly without attempting to fetch or read files using tools",
        "- GitHub MCP tools are ONLY for remote repository operations, not local filesystem access",
        "- Use the file content shown in this message for your analysis",
    ].join("\n");
    return `${prompt}\n\n${notice}`;
}
|
|
1002
|
-
/**
 * Build the message array for a request that may carry images and/or PDFs.
 *
 * Pipeline, in order: aggregate file budget enforcement, unified `files`
 * processing, explicit CSV processing, post-processing text budget
 * enforcement, explicit PDF processing. If neither images nor PDFs remain,
 * the file arrays on `options.input` are emptied and the standard message
 * builder is used. Otherwise the provider must support vision, and the
 * result is: system message (if non-empty), filtered conversation history,
 * then one user message with the multimodal content.
 *
 * @param options - Generation options; `options.input` is mutated by the processing steps.
 * @param provider - Provider identifier.
 * @param model - Model identifier.
 * @returns Array of `{ role, content, providerOptions? }` messages.
 * @throws If the provider/model does not support vision, or if any processing/conversion step fails.
 */
export async function buildMultimodalMessagesArray(options, provider, model) {
    // Provider-specific PDF size limit in bytes, falling back to 10 MB when no config is returned.
    const providerPdfConfig = PDFProcessor.getProviderConfig(provider);
    const maxSize = providerPdfConfig
        ? providerPdfConfig.maxSizeMB * 1024 * 1024
        : 10 * 1024 * 1024;
    enforceFileBudget(options, provider, model);
    await processUnifiedFilesArray(options, maxSize, provider);
    await processExplicitCsvFiles(options);
    enforcePostProcessingBudget(options, provider, model);
    const pdfFiles = await processExplicitPdfFiles(options, maxSize, provider);
    const input = options.input;
    const hasImages = (input.images && input.images.length > 0) ||
        (input.content && input.content.some((part) => part.type === "image"));
    const hasPDFs = pdfFiles.length > 0;
    if (!hasImages && !hasPDFs) {
        // Text-only path: empty the file arrays before delegating to the standard builder.
        for (const key of ["csvFiles", "pdfFiles", "files"]) {
            if (input[key]) {
                input[key] = [];
            }
        }
        const standardMessages = await buildMessagesArray(options);
        return standardMessages.map((msg) => {
            const carriedOptions = msg.providerOptions;
            return {
                role: msg.role,
                content: msg.content,
                ...(carriedOptions && { providerOptions: carriedOptions }),
            };
        });
    }
    if (!ProviderImageAdapter.supportsVision(provider, model)) {
        throw new Error(`Provider ${provider} with model ${model} does not support vision processing. ` +
            `Supported providers: ${ProviderImageAdapter.getVisionProviders().join(", ")}`);
    }
    const messages = [];
    const systemPrompt = buildMultimodalSystemPrompt(options, hasPDFs);
    if (systemPrompt.trim()) {
        messages.push({
            role: "system",
            content: systemPrompt.trim(),
            providerOptions: {
                anthropic: { cacheControl: { type: "ephemeral" } },
            },
        });
    }
    // Only user/assistant/system history entries are forwarded; other roles
    // (such as tool_call and tool_result) are dropped.
    const forwardableRoles = ["user", "assistant", "system"];
    const history = options.conversationHistory;
    if (history && history.length > 0) {
        for (const entry of history) {
            if (!forwardableRoles.includes(entry.role)) {
                continue;
            }
            const providerOptions = entry.providerOptions;
            messages.push({
                role: entry.role,
                content: entry.content,
                ...(providerOptions && { providerOptions }),
            });
        }
    }
    try {
        let userContent;
        if (input.content && input.content.length > 0) {
            // Advanced content array takes precedence over the simple images/PDF inputs.
            userContent = await convertContentToProviderFormat(input.content, provider, model);
        }
        else if ((input.images && input.images.length > 0) || hasPDFs) {
            userContent = await convertMultimodalToProviderFormat(input.text, input.images || [], pdfFiles, provider, model);
        }
        else {
            userContent = input.text;
        }
        // String and structured content are pushed the same way.
        messages.push({ role: "user", content: userContent });
        const reqId = options.context?.requestId;
        logMessageComposition(messages, reqId);
        return messages;
    }
    catch (error) {
        MultimodalLogger.logError("MULTIMODAL_BUILD", error, {
            provider,
            model,
            hasImages,
            imageCount: options.input.images?.length || 0,
        });
        throw error;
    }
}
|
|
1123
|
-
/**
 * Convert the advanced `content` array into the shape sent to the provider.
 *
 * Uses the first element of type "text" as the prompt text and the `data` of
 * every element of type "image" as the image list.
 *
 * @param content - Array of content parts (`{ type: "text", text }` / `{ type: "image", data }`).
 * @param provider - Provider identifier, forwarded to the image converter.
 * @param _model - Model identifier, forwarded to the image converter.
 * @returns The plain text when there are no images, otherwise the result of `convertSimpleImagesToProviderFormat`.
 * @throws Error when `content` has no text element.
 */
async function convertContentToProviderFormat(content, provider, _model) {
    const firstText = content.find((part) => part.type === "text");
    if (!firstText) {
        throw new Error("Multimodal content must include at least one text element");
    }
    const imagePayloads = content
        .filter((part) => part.type === "image")
        .map((part) => part.data);
    if (imagePayloads.length === 0) {
        return firstText.text;
    }
    return await convertSimpleImagesToProviderFormat(firstText.text, imagePayloads, provider, _model);
}
|
|
1139
|
-
/**
 * Check whether a value is an http(s) URL string.
 *
 * The scheme is matched case-insensitively ("HTTPS://…" is a URL too), and
 * non-string input yields `false` instead of throwing.
 *
 * @param input - Value to test.
 * @returns {boolean} `true` when `input` is a string starting with `http://` or `https://`.
 */
function isInternetUrl(input) {
    return typeof input === "string" && /^https?:\/\//i.test(input);
}
|
|
1145
|
-
/**
 * Download an image from a URL and return it as a base64 data URI.
 *
 * The image cache is consulted first; only cache misses go through the
 * download rate limiter. Redirects are followed (up to 5). The response must
 * have status 200 and an `image/*` content type, and the body is limited to
 * 10 MB. The limit is enforced both from the declared Content-Length and
 * while streaming, so an oversized body is never fully buffered in memory.
 *
 * @param url - http(s) URL of the image.
 * @returns {Promise<string>} Data URI of the form `data:<mime>;base64,<payload>`.
 * @throws Error wrapping the underlying failure (original error attached as `cause`).
 */
async function downloadImageFromUrl(url) {
    // Check cache first (before rate limiting)
    const cache = getImageCache();
    const cached = cache.get(url);
    if (cached) {
        logger.debug("Using cached image for URL", { url: url.substring(0, 50) });
        return cached.dataUri;
    }
    // Apply rate limiting only if cache missed
    await urlDownloadRateLimiter.acquire();
    const maxSize = 10 * 1024 * 1024; // 10MB
    try {
        const response = await request(url, {
            dispatcher: getGlobalDispatcher().compose(interceptors.redirect({ maxRedirections: 5 })),
            method: "GET",
            headersTimeout: 10000, // 10 second timeout for headers
            bodyTimeout: 30000, // 30 second timeout for body
        });
        // A response we reject early still has an unread body; drain it so it
        // is not left pending. Cleanup is best-effort: the rejection reason
        // below is the error that matters to the caller.
        const discardBody = async () => {
            try {
                await response.body.dump();
            }
            catch {
                // Ignored on purpose — see comment above.
            }
        };
        if (response.statusCode !== 200) {
            await discardBody();
            throw new Error(`HTTP ${response.statusCode}: Failed to download image from ${url}`);
        }
        // Header values may be arrays; use the first value and drop parameters
        // such as "; charset=binary" so the resulting data URI stays in the
        // plain `data:<mime>;base64,` form.
        const rawContentType = response.headers["content-type"];
        const headerValue = Array.isArray(rawContentType) ? rawContentType[0] : rawContentType;
        const contentType = (headerValue || "image/jpeg").split(";")[0].trim().toLowerCase();
        if (!contentType.startsWith("image/")) {
            await discardBody();
            throw new Error(`URL does not point to an image. Content-Type: ${contentType}`);
        }
        // Reject early when the server already declares an oversized body.
        const declaredLength = Number(response.headers["content-length"]);
        if (Number.isFinite(declaredLength) && declaredLength > maxSize) {
            await discardBody();
            throw new Error(`Image too large: ${declaredLength} bytes (max: ${maxSize} bytes)`);
        }
        // Stream the body, aborting as soon as the limit is exceeded.
        const chunks = [];
        let receivedBytes = 0;
        for await (const chunk of response.body) {
            receivedBytes += chunk.length;
            if (receivedBytes > maxSize) {
                throw new Error(`Image too large: ${receivedBytes} bytes (max: ${maxSize} bytes)`);
            }
            chunks.push(chunk);
        }
        const buffer = Buffer.concat(chunks);
        const dataUri = `data:${contentType};base64,${buffer.toString("base64")}`;
        // Store in cache for future use
        cache.set(url, dataUri, contentType, buffer);
        return dataUri;
    }
    catch (error) {
        MultimodalLogger.logError("URL_DOWNLOAD_FAILED", error, { url });
        throw new Error(`Failed to download image from ${url}: ${error instanceof Error ? error.message : String(error)}`, { cause: error });
    }
}
|
|
1199
|
-
/**
 * Pick an image MIME type from a file path's extension.
 * Unrecognized extensions are reported as JPEG.
 */
function imageMimeTypeForPath(filePath) {
    const ext = filePath.toLowerCase().split(".").pop();
    switch (ext) {
        case "png":
            return "image/png";
        case "gif":
            return "image/gif";
        case "webp":
            return "image/webp";
        case "bmp":
            return "image/bmp";
        case "tiff":
        case "tif":
            return "image/tiff";
        default:
            return "image/jpeg";
    }
}
/**
 * Turn one resolved image input (Buffer, data URI or local file path) into an
 * `{ type: "image", image, mimeType }` part carrying raw base64.
 *
 * The `image` field must be raw base64 — NOT a `data:` URI string. The AI SDK
 * calls `new URL(image)` on string values; a data URI is a valid URL, so the
 * SDK would try to "download" it and fail its URL scheme validation.
 */
function toInlineImagePart(image, index) {
    let imageData;
    let mimeType = "image/jpeg"; // Default mime type
    if (typeof image !== "string") {
        // Buffer - convert to raw base64
        imageData = image.toString("base64");
    }
    else if (image.startsWith("data:")) {
        // Accept optional parameters before ";base64" and payloads containing
        // line breaks; both are legal and previously fell through unparsed.
        const match = image.match(/^data:([^;,]+)(?:;[^,]*)?;base64,([\s\S]+)$/);
        if (match) {
            mimeType = match[1];
            imageData = match[2];
        }
        else {
            // Not a base64 data URI; passed through unchanged.
            imageData = image;
        }
    }
    else {
        // File path string - read and convert to base64
        try {
            if (!existsSync(image)) {
                throw new Error(`Image file not found: ${image}`);
            }
            imageData = readFileSync(image).toString("base64");
            mimeType = imageMimeTypeForPath(image);
        }
        catch (error) {
            MultimodalLogger.logError("FILE_PATH_CONVERSION", error, {
                index,
                filePath: image,
            });
            throw new Error(`Failed to convert file path to base64: ${image}. ${error}`, { cause: error });
        }
    }
    return { type: "image", image: imageData, mimeType };
}
/**
 * Convert a prompt plus a list of images into Vercel AI SDK content parts.
 *
 * - The image count is validated against the provider limit first.
 * - Alt texts are collected up front and appended to the prompt text as
 *   "[Image N: …]" entries, where N is the image's position in `images`.
 * - Images are emitted in the order they were supplied. http(s) URLs are
 *   downloaded in place; a failed download is logged and that image is
 *   skipped, the remaining images are still processed.
 * - Local files, Buffers and data URIs are converted to raw base64.
 *
 * @param text - Prompt text.
 * @param images - Image inputs (anything `extractImageData` / `extractAltText` understand).
 * @param provider - Provider identifier (validation and error logging).
 * @param _model - Model identifier (validation).
 * @returns Array starting with one text part followed by the image parts.
 * @throws If validation fails or a non-URL image cannot be converted.
 */
async function convertSimpleImagesToProviderFormat(text, images, provider, _model) {
    ProviderImageAdapter.validateImageCount(images.length, provider, _model);
    const altTextDescriptions = images
        .map((image, idx) => {
        const altText = extractAltText(image);
        return altText ? `[Image ${idx + 1}: ${altText}]` : null;
    })
        .filter(Boolean);
    // Alt text is appended to the prompt because the content parts built here
    // have no dedicated alt-text field.
    const enhancedText = altTextDescriptions.length > 0
        ? `${text}\n\nImage descriptions for context: ${altTextDescriptions.join(" ")}`
        : text;
    const content = [{ type: "text", text: enhancedText }];
    // Walk the images in their original order so the emitted image sequence
    // lines up with the "[Image N: …]" numbering above.
    for (const [index, image] of images.entries()) {
        let imageData = extractImageData(image);
        if (typeof imageData === "string" && isInternetUrl(imageData)) {
            const url = imageData;
            try {
                imageData = await downloadImageFromUrl(url);
            }
            catch (error) {
                MultimodalLogger.logError("URL_DOWNLOAD_FAILED_SKIPPING", error, { url });
                // Continue processing other images even if one URL fails
                logger.warn(`Failed to download image from ${url}, skipping: ${error instanceof Error ? error.message : String(error)}`);
                continue;
            }
        }
        try {
            content.push(toInlineImagePart(imageData, index));
        }
        catch (error) {
            MultimodalLogger.logError("ADD_IMAGE_TO_CONTENT", error, {
                index,
                provider,
            });
            throw error;
        }
    }
    return content;
}
|
|
1350
|
-
/**
 * Convert prompt text, images and PDFs into one array of content parts.
 *
 * Images go through `convertSimpleImagesToProviderFormat`. Its image parts
 * are appended as-is, and the alt-text context it generates is appended to
 * the prompt text instead of being thrown away. PDFs are added as native
 * `file` parts when `PDFProcessor.supportsNativePDF(provider)` is true;
 * otherwise each PDF is rendered to PNG page images (at most 20 pages) and
 * those are added as image parts.
 *
 * @param text - Prompt text.
 * @param images - Image inputs (may be empty).
 * @param pdfFiles - Entries of `{ buffer, filename }` queued for this request.
 * @param provider - Provider identifier.
 * @param model - Model identifier.
 * @returns Content parts: one text part, then images, then PDF parts.
 * @throws Error when a PDF cannot be converted to images (original error attached as `cause`).
 */
async function convertMultimodalToProviderFormat(text, images, pdfFiles, provider, model) {
    const textPart = { type: "text", text };
    const content = [textPart];
    // Add images if present
    if (images.length > 0) {
        const imageContent = await convertSimpleImagesToProviderFormat("", images, provider, model);
        if (Array.isArray(imageContent)) {
            for (const item of imageContent) {
                if (item.type !== "text") {
                    content.push(item);
                }
                else if (typeof item.text === "string" && item.text.trim() !== "") {
                    // The converter was given an empty prompt, so any text it
                    // returns is the alt-text context for the images; keep it.
                    textPart.text = `${text ?? ""}${item.text}`;
                }
            }
        }
    }
    if (PDFProcessor.supportsNativePDF(provider)) {
        // Add PDFs using the Vercel AI SDK file part format
        for (const pdf of pdfFiles) {
            logger.info(`[PDF] ✅ Added to content (native PDF format): ${pdf.filename}`);
            content.push({
                type: "file",
                data: pdf.buffer,
                mediaType: "application/pdf",
            });
        }
        return content;
    }
    // Provider doesn't support native PDF - convert PDF pages to images
    logger.info(`[PDF→Image] Provider ${provider} doesn't support native PDF. Converting ${pdfFiles.length} PDF(s) to images...`);
    for (const pdf of pdfFiles) {
        try {
            const conversionResult = await PDFImageConverter.convertToImages(pdf.buffer, {
                scale: 2.0, // High quality for OCR/analysis
                maxPages: 20, // Limit pages to prevent token overflow
            });
            logger.info(`[PDF→Image] ✅ Converted ${pdf.filename}: ${conversionResult.pageCount} page(s) → images`);
            // Each page is added as an image part; the converter's output is
            // passed through unchanged (presumably raw base64 — confirm against PDFImageConverter).
            conversionResult.images.forEach((base64Image, pageIndex) => {
                content.push({
                    type: "image",
                    image: base64Image,
                    mimeType: "image/png",
                });
                logger.debug(`[PDF→Image] Added page ${pageIndex + 1}/${conversionResult.pageCount} of ${pdf.filename}`);
            });
            // Log any warnings from conversion
            if (conversionResult.warnings) {
                for (const warning of conversionResult.warnings) {
                    logger.warn(`[PDF→Image] ${warning}`);
                }
            }
        }
        catch (error) {
            const errorMessage = error instanceof Error ? error.message : String(error);
            logger.error(`[PDF→Image] ❌ Failed to convert ${pdf.filename}: ${errorMessage}`);
            // Re-throw so the user knows PDF processing failed
            throw new Error(`PDF to image conversion failed for ${pdf.filename}: ${errorMessage}. ` +
                `Provider ${provider} doesn't support native PDFs and image conversion failed.`, { cause: error });
        }
    }
    return content;
}
|
|
1419
|
-
/**
 * Type guard for FileWithMetadata objects.
 *
 * A value qualifies when it is a non-null object that is not itself a Buffer
 * and has both a `buffer` and a `filename` property.
 *
 * @param file - Any file input (Buffer, string, metadata object, or nullish).
 * @returns {boolean} `true` only for objects carrying `buffer` and `filename`.
 */
function isFileWithMetadata(file) {
    return (typeof file === "object" &&
        // typeof null is "object"; without this guard the `in` checks below throw.
        file !== null &&
        !Buffer.isBuffer(file) &&
        "buffer" in file &&
        "filename" in file);
}
|
|
1428
|
-
/**
 * Extract a display filename from a file input.
 *
 * - FileWithMetadata objects: their `filename`.
 * - http(s) URLs: the last segment of the URL path.
 * - Other strings: the last path segment, accepting both "/" and "\"
 *   separators so Windows-style paths yield just the file name.
 * - Anything else (e.g. Buffers), or when no name can be derived:
 *   the generic `file-<index + 1>`.
 *
 * @param file - File input (FileWithMetadata, string path/URL, Buffer, ...).
 * @param index - Zero-based position of the file, used for the generic name.
 * @returns {string} The derived or generic filename.
 */
function extractFilename(file, index = 0) {
    const genericName = `file-${index + 1}`;
    if (isFileWithMetadata(file)) {
        return file.filename;
    }
    if (typeof file !== "string") {
        return genericName;
    }
    // Require a real http(s):// prefix: a bare "http" prefix also matches
    // local names such as "http_logs.csv", which then failed URL parsing.
    if (/^https?:\/\//i.test(file)) {
        try {
            return new URL(file).pathname.split("/").pop() || genericName;
        }
        catch {
            return genericName;
        }
    }
    // Split on either separator; splitting on "/" first made the "\" fallback
    // unreachable for any path that does not end in "/".
    return file.split(/[\\/]/).pop() || genericName;
}
|
|
1450
|
-
/**
 * Report the size of a file input in bytes.
 *
 * - FileWithMetadata: length of its `buffer`.
 * - Buffer: its length.
 * - String naming an existing path: the size reported by `statSync`
 *   (0 if the stat call fails).
 * - Any other string (URL, data URI, ...): the string length, as a rough estimate.
 * - Everything else: 0.
 *
 * @param file - File input.
 * @returns {number} Size in bytes, or an estimate as described above.
 */
function getFileSize(file) {
    if (isFileWithMetadata(file)) {
        return file.buffer.length;
    }
    if (Buffer.isBuffer(file)) {
        return file.length;
    }
    if (typeof file !== "string") {
        return 0;
    }
    if (!existsSync(file)) {
        // Not a local path: fall back to the string length as a rough estimate.
        return file.length;
    }
    try {
        return statSync(file).size;
    }
    catch {
        return 0;
    }
}
|
|
1475
|
-
/**
 * Obtain a Buffer for a file input.
 *
 * - FileWithMetadata: its `buffer` property.
 * - Buffer: returned unchanged.
 * - String naming an existing path: the file contents (null if reading fails).
 * - Anything else, including URLs and data URIs: null.
 *
 * @param file - File input.
 * @returns {Promise<Buffer|null>} The buffer, or null when none can be produced locally.
 */
async function getFileBuffer(file) {
    if (isFileWithMetadata(file)) {
        return file.buffer;
    }
    if (Buffer.isBuffer(file)) {
        return file;
    }
    const isExistingPath = typeof file === "string" && existsSync(file);
    if (!isExistingPath) {
        // URLs and data URIs would need a download first, so they are not handled here.
        return null;
    }
    try {
        return readFileSync(file);
    }
    catch {
        return null;
    }
}
|
|
1500
|
-
/**
 * Classify where a file input comes from.
 *
 * @param file - File input.
 * @returns {"datauri"|"url"|"path"|"buffer"} "datauri" for strings starting
 *   with `data:`, "url" for strings starting with `http://` or `https://`,
 *   "path" for strings naming an existing filesystem entry, and "buffer" for
 *   everything else (FileWithMetadata, Buffers, and unrecognized input).
 */
function getFileSource(file) {
    if (isFileWithMetadata(file) || Buffer.isBuffer(file)) {
        return "buffer";
    }
    if (typeof file !== "string") {
        return "buffer";
    }
    if (file.startsWith("data:")) {
        return "datauri";
    }
    const looksLikeUrl = file.startsWith("http://") || file.startsWith("https://");
    if (looksLikeUrl) {
        return "url";
    }
    // Strings that match nothing above also fall back to "buffer".
    return existsSync(file) ? "path" : "buffer";
}
|
|
1523
|
-
/**
 * Attempt to register a file with the given registry so it can be processed
 * lazily instead of up front.
 *
 * @param file - File input to register.
 * @param fileSize - Size in bytes; only used for the log message.
 * @param registry - Object exposing `register(buffer, source, { filename })`.
 * @param index - Zero-based position of the file, used when a generic filename is needed.
 * @returns {Promise<boolean>} `true` when the file was registered; `false` when
 *   no buffer could be obtained or registration threw (the caller should then
 *   fall through to full processing).
 */
async function tryRegisterFileReference(file, fileSize, registry, index = 0) {
    try {
        const contents = await getFileBuffer(file);
        if (!contents) {
            return false;
        }
        const filename = extractFilename(file, index);
        await registry.register(contents, getFileSource(file), { filename });
        const sizeInKb = (fileSize / 1024).toFixed(0);
        logger.info(`[FileDetector] Registered "${filename}" (${sizeInKb} KB) ` +
            `as lazy reference — skipping upfront processing`);
        return true;
    }
    catch (regError) {
        const reason = regError instanceof Error ? regError.message : String(regError);
        logger.warn(`[FileDetector] Failed to register file as reference, falling back to full processing: ${reason}`);
        return false;
    }
}
|
|
1545
|
-
/**
 * Get a language hint for code fencing based on MIME type or filename extension.
 *
 * The MIME type is tried first (lower-cased, parameters after ";" ignored);
 * if it is not recognized, the text after the last "." of the filename is
 * used. Lookups only consider the tables' own entries, so names that happen
 * to exist on `Object.prototype` (e.g. a file called "constructor") are not
 * mistaken for languages. Missing `mimeType` / `filename` values are treated
 * as empty strings.
 *
 * @param mimeType - MIME type of the file, possibly with parameters.
 * @param filename - File name or path.
 * @returns {string|null} Language identifier for markdown code blocks, or null for generic text.
 */
function getLanguageHint(mimeType, filename) {
    // Try MIME type first
    const mimeMap = {
        "text/javascript": "javascript",
        "text/typescript": "typescript",
        "text/x-python": "python",
        "text/x-java-source": "java",
        "text/x-go": "go",
        "text/x-rustsrc": "rust",
        "text/x-ruby": "ruby",
        "text/x-php": "php",
        "text/x-c": "c",
        "text/x-c++": "cpp",
        "text/x-csharp": "csharp",
        "text/x-swift": "swift",
        "text/x-kotlin": "kotlin",
        "text/x-scala": "scala",
        "text/x-shellscript": "bash",
        "text/x-powershell": "powershell",
        "text/x-sql": "sql",
        "text/x-r": "r",
        "text/x-lua": "lua",
        "text/x-perl": "perl",
        "text/x-dart": "dart",
        "text/x-elixir": "elixir",
        "text/x-erlang": "erlang",
        "text/x-haskell": "haskell",
        "text/x-clojure": "clojure",
        "text/x-lisp": "lisp",
        "text/html": "html",
        "text/css": "css",
        "text/markdown": "markdown",
        "application/json": "json",
        "application/xml": "xml",
        "text/xml": "xml",
        "application/yaml": "yaml",
        "application/x-yaml": "yaml",
    };
    const normalizedMime = String(mimeType ?? "").toLowerCase().split(";")[0].trim();
    // Object.hasOwn keeps inherited keys ("constructor", "__proto__", ...) out of the lookup.
    if (Object.hasOwn(mimeMap, normalizedMime)) {
        return mimeMap[normalizedMime];
    }
    // Fallback: try extension from filename
    const ext = String(filename ?? "").split(".").pop()?.toLowerCase();
    if (!ext) {
        return null;
    }
    const extMap = {
        js: "javascript",
        mjs: "javascript",
        cjs: "javascript",
        jsx: "javascript",
        ts: "typescript",
        tsx: "typescript",
        py: "python",
        java: "java",
        go: "go",
        rs: "rust",
        rb: "ruby",
        php: "php",
        c: "c",
        cpp: "cpp",
        cc: "cpp",
        h: "c",
        hpp: "cpp",
        cs: "csharp",
        swift: "swift",
        kt: "kotlin",
        kts: "kotlin",
        scala: "scala",
        sh: "bash",
        bash: "bash",
        zsh: "bash",
        ps1: "powershell",
        sql: "sql",
        r: "r",
        lua: "lua",
        pl: "perl",
        perl: "perl",
        dart: "dart",
        ex: "elixir",
        exs: "elixir",
        erl: "erlang",
        hs: "haskell",
        clj: "clojure",
        lisp: "lisp",
        vim: "vim",
        html: "html",
        htm: "html",
        css: "css",
        md: "markdown",
        markdown: "markdown",
        json: "json",
        xml: "xml",
        yaml: "yaml",
        yml: "yaml",
        toml: "toml",
        ini: "ini",
        cfg: "ini",
    };
    return Object.hasOwn(extMap, ext) ? extMap[ext] : null;
}
|
|
1651
|
-
/**
 * Build the note appended to a CSV section telling the model that it may use
 * the `analyzeCSV` tool on the full file.
 *
 * @param filePath - Value inserted verbatim as the tool's `filePath` argument in the text.
 * @returns {string} The instruction text, starting with one newline and ending with a blank line.
 */
function buildCSVToolInstructions(filePath) {
    const note = `**NOTE**: You can perform calculations directly on the CSV data shown above. For advanced operations on the full file (counting by column, grouping, etc.), you may optionally use the analyzeCSV tool with filePath="${filePath}".`;
    const example = `Example: analyzeCSV(filePath="${filePath}", operation="count_by_column", column="merchant_id")`;
    return `\n${note}\n\n${example}\n\n`;
}
|