@juspay/neurolink 9.32.0 → 9.33.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (475) hide show
  1. package/CHANGELOG.md +12 -0
  2. package/dist/auth/anthropicOAuth.js +1 -1
  3. package/dist/cli/commands/proxy.js +18 -5
  4. package/dist/client/aiSdkAdapter.js +1 -1
  5. package/dist/client/index.js +137 -501
  6. package/dist/core/factory.js +0 -1
  7. package/dist/core/redisConversationMemoryManager.js +1 -1
  8. package/dist/features/ppt/slideGenerator.js +0 -1
  9. package/dist/features/ppt/utils.js +0 -1
  10. package/dist/lib/neurolink.d.ts +10 -0
  11. package/dist/lib/neurolink.js +41 -7
  12. package/dist/lib/server/routes/claudeProxyRoutes.js +45 -9
  13. package/dist/lib/types/generateTypes.d.ts +16 -0
  14. package/dist/lib/types/streamTypes.d.ts +15 -0
  15. package/dist/mcp/elicitationProtocol.js +1 -1
  16. package/dist/mcp/servers/agent/directToolsServer.js +0 -1
  17. package/dist/neurolink.d.ts +10 -0
  18. package/dist/neurolink.js +41 -7
  19. package/dist/providers/azureOpenai.js +1 -1
  20. package/dist/providers/huggingFace.js +0 -1
  21. package/dist/providers/openaiCompatible.js +0 -1
  22. package/dist/sdk/toolRegistration.js +0 -1
  23. package/dist/server/openapi/generator.js +1 -1
  24. package/dist/server/routes/claudeProxyRoutes.js +45 -9
  25. package/dist/types/configTypes.js +0 -5
  26. package/dist/types/generateTypes.d.ts +16 -0
  27. package/dist/types/modelTypes.js +0 -1
  28. package/dist/types/streamTypes.d.ts +15 -0
  29. package/dist/types/tools.js +0 -1
  30. package/dist/types/typeAliases.js +0 -1
  31. package/dist/types/utilities.js +1 -1
  32. package/dist/types/workflowTypes.js +0 -1
  33. package/dist/utils/providerRetry.js +0 -1
  34. package/dist/utils/providerUtils.js +0 -1
  35. package/package.json +2 -2
  36. package/dist/client/adapters/providerImageAdapter.js +0 -588
  37. package/dist/client/adapters/tts/googleTTSHandler.js +0 -344
  38. package/dist/client/adapters/video/directorPipeline.js +0 -516
  39. package/dist/client/adapters/video/ffmpegAdapter.js +0 -206
  40. package/dist/client/adapters/video/frameExtractor.js +0 -143
  41. package/dist/client/adapters/video/vertexVideoHandler.js +0 -763
  42. package/dist/client/adapters/video/videoAnalyzer.js +0 -238
  43. package/dist/client/adapters/video/videoMerger.js +0 -171
  44. package/dist/client/agent/directTools.js +0 -840
  45. package/dist/client/auth/AuthProviderFactory.js +0 -111
  46. package/dist/client/auth/AuthProviderRegistry.js +0 -190
  47. package/dist/client/auth/RequestContext.js +0 -78
  48. package/dist/client/auth/accountPool.js +0 -178
  49. package/dist/client/auth/anthropicOAuth.js +0 -974
  50. package/dist/client/auth/authContext.js +0 -314
  51. package/dist/client/auth/errors.js +0 -39
  52. package/dist/client/auth/index.js +0 -61
  53. package/dist/client/auth/middleware/AuthMiddleware.js +0 -519
  54. package/dist/client/auth/middleware/rateLimitByUser.js +0 -554
  55. package/dist/client/auth/providers/BaseAuthProvider.js +0 -723
  56. package/dist/client/auth/providers/CognitoProvider.js +0 -304
  57. package/dist/client/auth/providers/KeycloakProvider.js +0 -393
  58. package/dist/client/auth/providers/auth0.js +0 -274
  59. package/dist/client/auth/providers/betterAuth.js +0 -182
  60. package/dist/client/auth/providers/clerk.js +0 -317
  61. package/dist/client/auth/providers/custom.js +0 -112
  62. package/dist/client/auth/providers/firebase.js +0 -226
  63. package/dist/client/auth/providers/jwt.js +0 -212
  64. package/dist/client/auth/providers/oauth2.js +0 -303
  65. package/dist/client/auth/providers/supabase.js +0 -259
  66. package/dist/client/auth/providers/workos.js +0 -284
  67. package/dist/client/auth/serverBridge.js +0 -25
  68. package/dist/client/auth/sessionManager.js +0 -437
  69. package/dist/client/auth/tokenStore.js +0 -799
  70. package/dist/client/client/aiSdkAdapter.js +0 -487
  71. package/dist/client/client/auth.js +0 -473
  72. package/dist/client/client/errors.js +0 -552
  73. package/dist/client/client/httpClient.js +0 -837
  74. package/dist/client/client/index.js +0 -172
  75. package/dist/client/client/interceptors.js +0 -601
  76. package/dist/client/client/sseClient.js +0 -545
  77. package/dist/client/client/streamingClient.js +0 -917
  78. package/dist/client/client/wsClient.js +0 -369
  79. package/dist/client/config/configManager.js +0 -303
  80. package/dist/client/config/conversationMemory.js +0 -86
  81. package/dist/client/config/taskClassificationConfig.js +0 -148
  82. package/dist/client/constants/contextWindows.js +0 -295
  83. package/dist/client/constants/enums.js +0 -853
  84. package/dist/client/constants/index.js +0 -207
  85. package/dist/client/constants/performance.js +0 -389
  86. package/dist/client/constants/retry.js +0 -266
  87. package/dist/client/constants/timeouts.js +0 -182
  88. package/dist/client/constants/tokens.js +0 -380
  89. package/dist/client/constants/videoErrors.js +0 -46
  90. package/dist/client/context/budgetChecker.js +0 -98
  91. package/dist/client/context/contextCompactor.js +0 -205
  92. package/dist/client/context/emergencyTruncation.js +0 -88
  93. package/dist/client/context/errorDetection.js +0 -171
  94. package/dist/client/context/errors.js +0 -21
  95. package/dist/client/context/fileTokenBudget.js +0 -127
  96. package/dist/client/context/prompts/summarizationPrompt.js +0 -117
  97. package/dist/client/context/stages/fileReadDeduplicator.js +0 -66
  98. package/dist/client/context/stages/slidingWindowTruncator.js +0 -190
  99. package/dist/client/context/stages/structuredSummarizer.js +0 -99
  100. package/dist/client/context/stages/toolOutputPruner.js +0 -52
  101. package/dist/client/context/summarizationEngine.js +0 -136
  102. package/dist/client/context/toolOutputLimits.js +0 -78
  103. package/dist/client/context/toolPairRepair.js +0 -66
  104. package/dist/client/core/analytics.js +0 -88
  105. package/dist/client/core/baseProvider.js +0 -1385
  106. package/dist/client/core/constants.js +0 -140
  107. package/dist/client/core/conversationMemoryFactory.js +0 -141
  108. package/dist/client/core/conversationMemoryInitializer.js +0 -128
  109. package/dist/client/core/conversationMemoryManager.js +0 -344
  110. package/dist/client/core/dynamicModels.js +0 -358
  111. package/dist/client/core/evaluation.js +0 -309
  112. package/dist/client/core/evaluationProviders.js +0 -248
  113. package/dist/client/core/factory.js +0 -412
  114. package/dist/client/core/infrastructure/baseError.js +0 -22
  115. package/dist/client/core/infrastructure/baseFactory.js +0 -54
  116. package/dist/client/core/infrastructure/baseRegistry.js +0 -53
  117. package/dist/client/core/infrastructure/index.js +0 -5
  118. package/dist/client/core/infrastructure/retry.js +0 -20
  119. package/dist/client/core/infrastructure/typedEventEmitter.js +0 -23
  120. package/dist/client/core/modelConfiguration.js +0 -851
  121. package/dist/client/core/modules/GenerationHandler.js +0 -588
  122. package/dist/client/core/modules/MessageBuilder.js +0 -273
  123. package/dist/client/core/modules/StreamHandler.js +0 -185
  124. package/dist/client/core/modules/TelemetryHandler.js +0 -203
  125. package/dist/client/core/modules/ToolsManager.js +0 -499
  126. package/dist/client/core/modules/Utilities.js +0 -331
  127. package/dist/client/core/redisConversationMemoryManager.js +0 -1435
  128. package/dist/client/core/streamAnalytics.js +0 -131
  129. package/dist/client/evaluation/contextBuilder.js +0 -134
  130. package/dist/client/evaluation/index.js +0 -61
  131. package/dist/client/evaluation/prompts.js +0 -73
  132. package/dist/client/evaluation/ragasEvaluator.js +0 -110
  133. package/dist/client/evaluation/retryManager.js +0 -78
  134. package/dist/client/evaluation/scoring.js +0 -61
  135. package/dist/client/factories/providerFactory.js +0 -166
  136. package/dist/client/factories/providerRegistry.js +0 -166
  137. package/dist/client/features/ppt/constants.js +0 -896
  138. package/dist/client/features/ppt/contentPlanner.js +0 -529
  139. package/dist/client/features/ppt/presentationOrchestrator.js +0 -236
  140. package/dist/client/features/ppt/slideGenerator.js +0 -532
  141. package/dist/client/features/ppt/slideRenderers.js +0 -2383
  142. package/dist/client/features/ppt/slideTypeInference.js +0 -405
  143. package/dist/client/features/ppt/types.js +0 -13
  144. package/dist/client/features/ppt/utils.js +0 -443
  145. package/dist/client/files/fileReferenceRegistry.js +0 -1543
  146. package/dist/client/files/fileTools.js +0 -450
  147. package/dist/client/files/streamingReader.js +0 -321
  148. package/dist/client/files/types.js +0 -23
  149. package/dist/client/hitl/hitlErrors.js +0 -54
  150. package/dist/client/hitl/hitlManager.js +0 -460
  151. package/dist/client/mcp/agentExposure.js +0 -356
  152. package/dist/client/mcp/auth/index.js +0 -11
  153. package/dist/client/mcp/auth/oauthClientProvider.js +0 -325
  154. package/dist/client/mcp/auth/tokenStorage.js +0 -134
  155. package/dist/client/mcp/batching/index.js +0 -10
  156. package/dist/client/mcp/batching/requestBatcher.js +0 -441
  157. package/dist/client/mcp/caching/index.js +0 -10
  158. package/dist/client/mcp/caching/toolCache.js +0 -433
  159. package/dist/client/mcp/elicitation/elicitationManager.js +0 -376
  160. package/dist/client/mcp/elicitation/index.js +0 -11
  161. package/dist/client/mcp/elicitation/types.js +0 -10
  162. package/dist/client/mcp/elicitationProtocol.js +0 -375
  163. package/dist/client/mcp/enhancedToolDiscovery.js +0 -481
  164. package/dist/client/mcp/externalServerManager.js +0 -1478
  165. package/dist/client/mcp/factory.js +0 -161
  166. package/dist/client/mcp/flexibleToolValidator.js +0 -161
  167. package/dist/client/mcp/httpRateLimiter.js +0 -391
  168. package/dist/client/mcp/httpRetryHandler.js +0 -178
  169. package/dist/client/mcp/index.js +0 -74
  170. package/dist/client/mcp/mcpCircuitBreaker.js +0 -427
  171. package/dist/client/mcp/mcpClientFactory.js +0 -708
  172. package/dist/client/mcp/mcpRegistryClient.js +0 -488
  173. package/dist/client/mcp/mcpServerBase.js +0 -373
  174. package/dist/client/mcp/multiServerManager.js +0 -579
  175. package/dist/client/mcp/registry.js +0 -158
  176. package/dist/client/mcp/routing/index.js +0 -10
  177. package/dist/client/mcp/routing/toolRouter.js +0 -416
  178. package/dist/client/mcp/serverCapabilities.js +0 -502
  179. package/dist/client/mcp/servers/agent/directToolsServer.js +0 -150
  180. package/dist/client/mcp/toolAnnotations.js +0 -239
  181. package/dist/client/mcp/toolConverter.js +0 -258
  182. package/dist/client/mcp/toolDiscoveryService.js +0 -798
  183. package/dist/client/mcp/toolIntegration.js +0 -334
  184. package/dist/client/mcp/toolRegistry.js +0 -729
  185. package/dist/client/memory/hippocampusInitializer.js +0 -19
  186. package/dist/client/memory/memoryRetrievalTools.js +0 -166
  187. package/dist/client/middleware/builtin/analytics.js +0 -132
  188. package/dist/client/middleware/builtin/autoEvaluation.js +0 -203
  189. package/dist/client/middleware/builtin/guardrails.js +0 -109
  190. package/dist/client/middleware/builtin/lifecycle.js +0 -168
  191. package/dist/client/middleware/factory.js +0 -327
  192. package/dist/client/middleware/registry.js +0 -295
  193. package/dist/client/middleware/utils/guardrailsUtils.js +0 -396
  194. package/dist/client/models/anthropicModels.js +0 -527
  195. package/dist/client/neurolink.js +0 -8233
  196. package/dist/client/observability/exporterRegistry.js +0 -413
  197. package/dist/client/observability/exporters/arizeExporter.js +0 -138
  198. package/dist/client/observability/exporters/baseExporter.js +0 -190
  199. package/dist/client/observability/exporters/braintrustExporter.js +0 -154
  200. package/dist/client/observability/exporters/datadogExporter.js +0 -196
  201. package/dist/client/observability/exporters/laminarExporter.js +0 -302
  202. package/dist/client/observability/exporters/langfuseExporter.js +0 -209
  203. package/dist/client/observability/exporters/langsmithExporter.js +0 -143
  204. package/dist/client/observability/exporters/otelExporter.js +0 -164
  205. package/dist/client/observability/exporters/posthogExporter.js +0 -287
  206. package/dist/client/observability/exporters/sentryExporter.js +0 -165
  207. package/dist/client/observability/index.js +0 -31
  208. package/dist/client/observability/metricsAggregator.js +0 -556
  209. package/dist/client/observability/otelBridge.js +0 -131
  210. package/dist/client/observability/retryPolicy.js +0 -383
  211. package/dist/client/observability/sampling/samplers.js +0 -216
  212. package/dist/client/observability/spanProcessor.js +0 -303
  213. package/dist/client/observability/tokenTracker.js +0 -413
  214. package/dist/client/observability/types/exporterTypes.js +0 -5
  215. package/dist/client/observability/types/index.js +0 -4
  216. package/dist/client/observability/types/spanTypes.js +0 -92
  217. package/dist/client/observability/utils/safeMetadata.js +0 -25
  218. package/dist/client/observability/utils/spanSerializer.js +0 -292
  219. package/dist/client/processors/archive/ArchiveProcessor.js +0 -1308
  220. package/dist/client/processors/base/BaseFileProcessor.js +0 -614
  221. package/dist/client/processors/base/types.js +0 -82
  222. package/dist/client/processors/config/fileTypes.js +0 -520
  223. package/dist/client/processors/config/index.js +0 -92
  224. package/dist/client/processors/config/languageMap.js +0 -410
  225. package/dist/client/processors/config/mimeTypes.js +0 -363
  226. package/dist/client/processors/config/sizeLimits.js +0 -258
  227. package/dist/client/processors/document/ExcelProcessor.js +0 -590
  228. package/dist/client/processors/document/OpenDocumentProcessor.js +0 -212
  229. package/dist/client/processors/document/PptxProcessor.js +0 -157
  230. package/dist/client/processors/document/RtfProcessor.js +0 -361
  231. package/dist/client/processors/document/WordProcessor.js +0 -353
  232. package/dist/client/processors/errors/FileErrorCode.js +0 -255
  233. package/dist/client/processors/errors/errorHelpers.js +0 -386
  234. package/dist/client/processors/errors/errorSerializer.js +0 -507
  235. package/dist/client/processors/errors/index.js +0 -49
  236. package/dist/client/processors/markup/SvgProcessor.js +0 -240
  237. package/dist/client/processors/media/AudioProcessor.js +0 -707
  238. package/dist/client/processors/media/VideoProcessor.js +0 -1045
  239. package/dist/client/providers/amazonBedrock.js +0 -1512
  240. package/dist/client/providers/amazonSagemaker.js +0 -162
  241. package/dist/client/providers/anthropic.js +0 -831
  242. package/dist/client/providers/azureOpenai.js +0 -143
  243. package/dist/client/providers/googleAiStudio.js +0 -1200
  244. package/dist/client/providers/googleNativeGemini3.js +0 -543
  245. package/dist/client/providers/googleVertex.js +0 -2936
  246. package/dist/client/providers/huggingFace.js +0 -315
  247. package/dist/client/providers/litellm.js +0 -488
  248. package/dist/client/providers/mistral.js +0 -157
  249. package/dist/client/providers/ollama.js +0 -1579
  250. package/dist/client/providers/openAI.js +0 -627
  251. package/dist/client/providers/openRouter.js +0 -543
  252. package/dist/client/providers/openaiCompatible.js +0 -290
  253. package/dist/client/providers/providerTypeUtils.js +0 -46
  254. package/dist/client/providers/sagemaker/adaptive-semaphore.js +0 -215
  255. package/dist/client/providers/sagemaker/client.js +0 -472
  256. package/dist/client/providers/sagemaker/config.js +0 -317
  257. package/dist/client/providers/sagemaker/detection.js +0 -606
  258. package/dist/client/providers/sagemaker/error-constants.js +0 -227
  259. package/dist/client/providers/sagemaker/errors.js +0 -299
  260. package/dist/client/providers/sagemaker/language-model.js +0 -775
  261. package/dist/client/providers/sagemaker/parsers.js +0 -634
  262. package/dist/client/providers/sagemaker/streaming.js +0 -331
  263. package/dist/client/providers/sagemaker/structured-parser.js +0 -625
  264. package/dist/client/proxy/accountQuota.js +0 -162
  265. package/dist/client/proxy/claudeFormat.js +0 -595
  266. package/dist/client/proxy/modelRouter.js +0 -29
  267. package/dist/client/proxy/oauthFetch.js +0 -367
  268. package/dist/client/proxy/proxyFetch.js +0 -586
  269. package/dist/client/proxy/requestLogger.js +0 -207
  270. package/dist/client/proxy/tokenRefresh.js +0 -124
  271. package/dist/client/proxy/usageStats.js +0 -74
  272. package/dist/client/proxy/utils/noProxyUtils.js +0 -149
  273. package/dist/client/rag/ChunkerFactory.js +0 -320
  274. package/dist/client/rag/ChunkerRegistry.js +0 -421
  275. package/dist/client/rag/chunkers/BaseChunker.js +0 -143
  276. package/dist/client/rag/chunkers/CharacterChunker.js +0 -28
  277. package/dist/client/rag/chunkers/HTMLChunker.js +0 -38
  278. package/dist/client/rag/chunkers/JSONChunker.js +0 -68
  279. package/dist/client/rag/chunkers/LaTeXChunker.js +0 -63
  280. package/dist/client/rag/chunkers/MarkdownChunker.js +0 -306
  281. package/dist/client/rag/chunkers/RecursiveChunker.js +0 -139
  282. package/dist/client/rag/chunkers/SemanticMarkdownChunker.js +0 -138
  283. package/dist/client/rag/chunkers/SentenceChunker.js +0 -66
  284. package/dist/client/rag/chunkers/TokenChunker.js +0 -61
  285. package/dist/client/rag/chunkers/index.js +0 -15
  286. package/dist/client/rag/chunking/characterChunker.js +0 -142
  287. package/dist/client/rag/chunking/chunkerRegistry.js +0 -194
  288. package/dist/client/rag/chunking/htmlChunker.js +0 -247
  289. package/dist/client/rag/chunking/index.js +0 -17
  290. package/dist/client/rag/chunking/jsonChunker.js +0 -281
  291. package/dist/client/rag/chunking/latexChunker.js +0 -251
  292. package/dist/client/rag/chunking/markdownChunker.js +0 -373
  293. package/dist/client/rag/chunking/recursiveChunker.js +0 -148
  294. package/dist/client/rag/chunking/semanticChunker.js +0 -306
  295. package/dist/client/rag/chunking/sentenceChunker.js +0 -230
  296. package/dist/client/rag/chunking/tokenChunker.js +0 -183
  297. package/dist/client/rag/document/MDocument.js +0 -392
  298. package/dist/client/rag/document/index.js +0 -5
  299. package/dist/client/rag/document/loaders.js +0 -500
  300. package/dist/client/rag/errors/RAGError.js +0 -274
  301. package/dist/client/rag/errors/index.js +0 -6
  302. package/dist/client/rag/graphRag/graphRAG.js +0 -401
  303. package/dist/client/rag/graphRag/index.js +0 -4
  304. package/dist/client/rag/index.js +0 -141
  305. package/dist/client/rag/metadata/MetadataExtractorFactory.js +0 -418
  306. package/dist/client/rag/metadata/MetadataExtractorRegistry.js +0 -362
  307. package/dist/client/rag/metadata/index.js +0 -9
  308. package/dist/client/rag/metadata/metadataExtractor.js +0 -280
  309. package/dist/client/rag/pipeline/RAGPipeline.js +0 -436
  310. package/dist/client/rag/pipeline/contextAssembly.js +0 -341
  311. package/dist/client/rag/pipeline/index.js +0 -5
  312. package/dist/client/rag/ragIntegration.js +0 -321
  313. package/dist/client/rag/reranker/RerankerFactory.js +0 -430
  314. package/dist/client/rag/reranker/RerankerRegistry.js +0 -402
  315. package/dist/client/rag/reranker/index.js +0 -9
  316. package/dist/client/rag/reranker/reranker.js +0 -277
  317. package/dist/client/rag/resilience/CircuitBreaker.js +0 -431
  318. package/dist/client/rag/resilience/RetryHandler.js +0 -304
  319. package/dist/client/rag/resilience/index.js +0 -7
  320. package/dist/client/rag/retrieval/hybridSearch.js +0 -335
  321. package/dist/client/rag/retrieval/index.js +0 -5
  322. package/dist/client/rag/retrieval/vectorQueryTool.js +0 -307
  323. package/dist/client/rag/types.js +0 -8
  324. package/dist/client/sdk/toolRegistration.js +0 -377
  325. package/dist/client/server/abstract/baseServerAdapter.js +0 -575
  326. package/dist/client/server/adapters/expressAdapter.js +0 -486
  327. package/dist/client/server/adapters/fastifyAdapter.js +0 -472
  328. package/dist/client/server/adapters/honoAdapter.js +0 -632
  329. package/dist/client/server/adapters/koaAdapter.js +0 -510
  330. package/dist/client/server/errors.js +0 -486
  331. package/dist/client/server/factory/serverAdapterFactory.js +0 -160
  332. package/dist/client/server/index.js +0 -108
  333. package/dist/client/server/middleware/abortSignal.js +0 -111
  334. package/dist/client/server/middleware/auth.js +0 -388
  335. package/dist/client/server/middleware/cache.js +0 -359
  336. package/dist/client/server/middleware/common.js +0 -281
  337. package/dist/client/server/middleware/deprecation.js +0 -190
  338. package/dist/client/server/middleware/mcpBodyAttachment.js +0 -63
  339. package/dist/client/server/middleware/rateLimit.js +0 -227
  340. package/dist/client/server/middleware/validation.js +0 -388
  341. package/dist/client/server/openapi/generator.js +0 -398
  342. package/dist/client/server/openapi/index.js +0 -36
  343. package/dist/client/server/openapi/schemas.js +0 -695
  344. package/dist/client/server/openapi/templates.js +0 -374
  345. package/dist/client/server/routes/agentRoutes.js +0 -189
  346. package/dist/client/server/routes/claudeProxyRoutes.js +0 -1600
  347. package/dist/client/server/routes/healthRoutes.js +0 -187
  348. package/dist/client/server/routes/index.js +0 -57
  349. package/dist/client/server/routes/mcpRoutes.js +0 -342
  350. package/dist/client/server/routes/memoryRoutes.js +0 -350
  351. package/dist/client/server/routes/openApiRoutes.js +0 -126
  352. package/dist/client/server/routes/toolRoutes.js +0 -199
  353. package/dist/client/server/streaming/dataStream.js +0 -486
  354. package/dist/client/server/streaming/index.js +0 -11
  355. package/dist/client/server/types.js +0 -67
  356. package/dist/client/server/utils/redaction.js +0 -334
  357. package/dist/client/server/utils/validation.js +0 -243
  358. package/dist/client/server/websocket/WebSocketHandler.js +0 -383
  359. package/dist/client/server/websocket/index.js +0 -4
  360. package/dist/client/services/server/ai/observability/instrumentation.js +0 -808
  361. package/dist/client/telemetry/attributes.js +0 -100
  362. package/dist/client/telemetry/index.js +0 -26
  363. package/dist/client/telemetry/telemetryService.js +0 -308
  364. package/dist/client/telemetry/tracers.js +0 -17
  365. package/dist/client/telemetry/withSpan.js +0 -34
  366. package/dist/client/types/actionTypes.js +0 -6
  367. package/dist/client/types/analytics.js +0 -5
  368. package/dist/client/types/authTypes.js +0 -9
  369. package/dist/client/types/circuitBreakerErrors.js +0 -34
  370. package/dist/client/types/cli.js +0 -21
  371. package/dist/client/types/clientTypes.js +0 -10
  372. package/dist/client/types/common.js +0 -51
  373. package/dist/client/types/configTypes.js +0 -49
  374. package/dist/client/types/content.js +0 -19
  375. package/dist/client/types/contextTypes.js +0 -400
  376. package/dist/client/types/conversation.js +0 -47
  377. package/dist/client/types/conversationMemoryInterface.js +0 -6
  378. package/dist/client/types/domainTypes.js +0 -5
  379. package/dist/client/types/errors.js +0 -167
  380. package/dist/client/types/evaluation.js +0 -5
  381. package/dist/client/types/evaluationProviders.js +0 -5
  382. package/dist/client/types/evaluationTypes.js +0 -1
  383. package/dist/client/types/externalMcp.js +0 -6
  384. package/dist/client/types/fileReferenceTypes.js +0 -8
  385. package/dist/client/types/fileTypes.js +0 -4
  386. package/dist/client/types/generateTypes.js +0 -1
  387. package/dist/client/types/guardrails.js +0 -1
  388. package/dist/client/types/hitlTypes.js +0 -8
  389. package/dist/client/types/index.js +0 -57
  390. package/dist/client/types/mcpTypes.js +0 -5
  391. package/dist/client/types/middlewareTypes.js +0 -1
  392. package/dist/client/types/modelTypes.js +0 -30
  393. package/dist/client/types/multimodal.js +0 -135
  394. package/dist/client/types/observability.js +0 -6
  395. package/dist/client/types/pptTypes.js +0 -82
  396. package/dist/client/types/providers.js +0 -111
  397. package/dist/client/types/proxyTypes.js +0 -16
  398. package/dist/client/types/ragTypes.js +0 -7
  399. package/dist/client/types/sdkTypes.js +0 -8
  400. package/dist/client/types/serviceTypes.js +0 -5
  401. package/dist/client/types/streamTypes.js +0 -1
  402. package/dist/client/types/subscriptionTypes.js +0 -9
  403. package/dist/client/types/taskClassificationTypes.js +0 -5
  404. package/dist/client/types/tools.js +0 -24
  405. package/dist/client/types/ttsTypes.js +0 -57
  406. package/dist/client/types/typeAliases.js +0 -48
  407. package/dist/client/types/utilities.js +0 -4
  408. package/dist/client/types/workflowTypes.js +0 -30
  409. package/dist/client/utils/async/withTimeout.js +0 -98
  410. package/dist/client/utils/asyncMutex.js +0 -60
  411. package/dist/client/utils/conversationMemory.js +0 -431
  412. package/dist/client/utils/csvProcessor.js +0 -846
  413. package/dist/client/utils/errorHandling.js +0 -936
  414. package/dist/client/utils/evaluationUtils.js +0 -131
  415. package/dist/client/utils/factoryProcessing.js +0 -589
  416. package/dist/client/utils/fileDetector.js +0 -2161
  417. package/dist/client/utils/imageCache.js +0 -376
  418. package/dist/client/utils/imageProcessor.js +0 -704
  419. package/dist/client/utils/logger.js +0 -491
  420. package/dist/client/utils/mcpDefaults.js +0 -134
  421. package/dist/client/utils/messageBuilder.js +0 -1653
  422. package/dist/client/utils/modelAliasResolver.js +0 -54
  423. package/dist/client/utils/modelDetection.js +0 -80
  424. package/dist/client/utils/modelRouter.js +0 -292
  425. package/dist/client/utils/multimodalOptionsBuilder.js +0 -65
  426. package/dist/client/utils/observabilityHelpers.js +0 -47
  427. package/dist/client/utils/parameterValidation.js +0 -966
  428. package/dist/client/utils/pdfProcessor.js +0 -410
  429. package/dist/client/utils/performance.js +0 -222
  430. package/dist/client/utils/pricing.js +0 -340
  431. package/dist/client/utils/promptRedaction.js +0 -62
  432. package/dist/client/utils/providerConfig.js +0 -1009
  433. package/dist/client/utils/providerHealth.js +0 -1237
  434. package/dist/client/utils/providerRetry.js +0 -112
  435. package/dist/client/utils/providerUtils.js +0 -434
  436. package/dist/client/utils/rateLimiter.js +0 -200
  437. package/dist/client/utils/redis.js +0 -368
  438. package/dist/client/utils/retryHandler.js +0 -269
  439. package/dist/client/utils/retryability.js +0 -22
  440. package/dist/client/utils/sanitizers/svg.js +0 -481
  441. package/dist/client/utils/schemaConversion.js +0 -255
  442. package/dist/client/utils/taskClassificationUtils.js +0 -149
  443. package/dist/client/utils/taskClassifier.js +0 -94
  444. package/dist/client/utils/thinkingConfig.js +0 -104
  445. package/dist/client/utils/timeout.js +0 -359
  446. package/dist/client/utils/tokenEstimation.js +0 -142
  447. package/dist/client/utils/tokenLimits.js +0 -125
  448. package/dist/client/utils/tokenUtils.js +0 -239
  449. package/dist/client/utils/toolUtils.js +0 -75
  450. package/dist/client/utils/transformationUtils.js +0 -554
  451. package/dist/client/utils/ttsProcessor.js +0 -286
  452. package/dist/client/utils/typeUtils.js +0 -97
  453. package/dist/client/utils/videoAnalysisProcessor.js +0 -67
  454. package/dist/client/workflow/config.js +0 -398
  455. package/dist/client/workflow/core/ensembleExecutor.js +0 -407
  456. package/dist/client/workflow/core/judgeScorer.js +0 -544
  457. package/dist/client/workflow/core/responseConditioner.js +0 -225
  458. package/dist/client/workflow/core/types/conditionerTypes.js +0 -7
  459. package/dist/client/workflow/core/types/ensembleTypes.js +0 -7
  460. package/dist/client/workflow/core/types/index.js +0 -7
  461. package/dist/client/workflow/core/types/judgeTypes.js +0 -7
  462. package/dist/client/workflow/core/types/layerTypes.js +0 -7
  463. package/dist/client/workflow/core/types/registryTypes.js +0 -7
  464. package/dist/client/workflow/core/workflowRegistry.js +0 -304
  465. package/dist/client/workflow/core/workflowRunner.js +0 -586
  466. package/dist/client/workflow/index.js +0 -50
  467. package/dist/client/workflow/types.js +0 -9
  468. package/dist/client/workflow/utils/types/index.js +0 -7
  469. package/dist/client/workflow/utils/workflowMetrics.js +0 -311
  470. package/dist/client/workflow/utils/workflowValidation.js +0 -420
  471. package/dist/client/workflow/workflows/adaptiveWorkflow.js +0 -366
  472. package/dist/client/workflow/workflows/consensusWorkflow.js +0 -192
  473. package/dist/client/workflow/workflows/fallbackWorkflow.js +0 -225
  474. package/dist/client/workflow/workflows/multiJudgeWorkflow.js +0 -351
  475. /package/dist/client/{client/reactHooks.js → reactHooks.js} +0 -0
@@ -1,1653 +0,0 @@
1
- /**
2
- * Message Builder Utility
3
- * Centralized logic for building message arrays from TextGenerationOptions
4
- * Enhanced with multimodal support for images
5
- */
6
- import { existsSync, readFileSync, statSync } from "fs";
7
- import { getGlobalDispatcher, interceptors, request } from "undici";
8
- import { MultimodalLogger, ProviderImageAdapter, } from "../adapters/providerImageAdapter.js";
9
- import { CONVERSATION_INSTRUCTIONS, STRUCTURED_OUTPUT_INSTRUCTIONS, } from "../config/conversationMemory.js";
10
- import { getAvailableInputTokens } from "../constants/contextWindows.js";
11
- import { enforceAggregateFileBudget, FILE_READ_BUDGET_PERCENT, } from "../context/fileTokenBudget.js";
12
- import { SIZE_TIER_THRESHOLDS } from "../files/types.js";
13
- import { tracers, ATTR, withSpan } from "../telemetry/index.js";
14
- import { FileDetector } from "./fileDetector.js";
15
- import { getImageCache } from "./imageCache.js";
16
- import { logger } from "./logger.js";
17
- import { PDFImageConverter, PDFProcessor } from "./pdfProcessor.js";
18
- import { urlDownloadRateLimiter } from "./rateLimiter.js";
19
- import { estimateTokens } from "./tokenEstimation.js";
20
- // ---------------------------------------------------------------------------
21
- // SDK-7: Lightweight file-type inference helpers for budget estimation
22
- // These avoid calling the full FileDetector pipeline — they only need to
23
- // classify files into broad categories (video, audio, image, etc.) so
24
- // estimatePostProcessingTokens() can use type-aware estimates.
25
- // ---------------------------------------------------------------------------
26
/**
 * Extension → file type mapping for budget estimation.
 * Keys are lower-case extensions without the leading dot; values are the
 * broad category names used by the budget estimator.
 */
const EXTENSION_TYPE_MAP = {
  // Video
  mp4: "video",
  mkv: "video",
  mov: "video",
  avi: "video",
  webm: "video",
  wmv: "video",
  flv: "video",
  m4v: "video",
  // Audio
  mp3: "audio",
  wav: "audio",
  ogg: "audio",
  flac: "audio",
  m4a: "audio",
  aac: "audio",
  wma: "audio",
  opus: "audio",
  // Image
  jpg: "image",
  jpeg: "image",
  png: "image",
  gif: "image",
  webp: "image",
  bmp: "image",
  tiff: "image",
  tif: "image",
  avif: "image",
  // Archive
  zip: "archive",
  tar: "archive",
  gz: "archive",
  tgz: "archive",
  rar: "archive",
  "7z": "archive",
  jar: "archive",
  // Documents
  xlsx: "xlsx",
  xls: "xlsx",
  ods: "xlsx",
  docx: "docx",
  doc: "docx",
  odt: "docx",
  rtf: "docx",
  pptx: "pptx",
  ppt: "pptx",
  odp: "pptx",
  // PDF
  pdf: "pdf",
  // SVG
  svg: "svg",
  // CSV
  csv: "csv",
  tsv: "csv",
};
/**
 * Infer file type from the extension of a file path or URL.
 *
 * @param {string} filePath - File path or URL; any query string or fragment is ignored.
 * @returns {string|undefined} The mapped category, or undefined when there is
 *   no extension or the extension is not in EXTENSION_TYPE_MAP.
 */
function inferFileTypeFromExtension(filePath) {
  // Strip query string / fragment for URLs
  const cleaned = filePath.split("?")[0].split("#")[0];
  const lastDot = cleaned.lastIndexOf(".");
  if (lastDot === -1) {
    return undefined;
  }
  const ext = cleaned.slice(lastDot + 1).toLowerCase();
  // Own-property check: a plain object lookup would otherwise return inherited
  // members (e.g. for "file.constructor" or "file.toString") instead of undefined.
  return Object.prototype.hasOwnProperty.call(EXTENSION_TYPE_MAP, ext)
    ? EXTENSION_TYPE_MAP[ext]
    : undefined;
}
97
/**
 * Classify a Buffer by its leading magic bytes.
 * Only a handful of common binary formats are recognised; anything else
 * (including text) yields undefined. Buffers shorter than 4 bytes are never
 * classified.
 *
 * @param {Buffer} buf - Raw file bytes.
 * @returns {string|undefined} "image", "pdf", "video", "audio", "archive", or undefined.
 */
function inferFileTypeFromBuffer(buf) {
  if (buf.length < 4) {
    return undefined;
  }
  const RIFF = [0x52, 0x49, 0x46, 0x46];
  // Ordered table: the first signature whose every [offset, bytes] part
  // matches decides the type.
  const signatures = [
    { type: "image", parts: [[0, [0x89, 0x50, 0x4e, 0x47]]] }, // PNG
    { type: "image", parts: [[0, [0xff, 0xd8, 0xff]]] }, // JPEG
    { type: "image", parts: [[0, [0x47, 0x49, 0x46]]] }, // GIF
    { type: "image", parts: [[0, RIFF], [8, [0x57, 0x45, 0x42, 0x50]]] }, // WebP (RIFF + WEBP)
    { type: "pdf", parts: [[0, [0x25, 0x50, 0x44, 0x46]]] }, // PDF
    { type: "video", parts: [[4, [0x66, 0x74, 0x79, 0x70]]] }, // MP4/MOV (ftyp at offset 4)
    { type: "video", parts: [[0, [0x1a, 0x45, 0xdf, 0xa3]]] }, // MKV/WebM (EBML)
    { type: "video", parts: [[0, RIFF], [8, [0x41, 0x56, 0x49, 0x20]]] }, // AVI (RIFF + AVI)
    { type: "audio", parts: [[0, RIFF], [8, [0x57, 0x41, 0x56, 0x45]]] }, // WAV (RIFF + WAVE)
    { type: "audio", parts: [[0, [0x49, 0x44, 0x33]]] }, // MP3 (ID3 tag)
    { type: "audio", parts: [[0, [0x66, 0x4c, 0x61, 0x43]]] }, // FLAC
    { type: "audio", parts: [[0, [0x4f, 0x67, 0x67, 0x53]]] }, // OGG
    // ZIP (also .xlsx, .docx, .pptx — without an extension these count as archive)
    { type: "archive", parts: [[0, [0x50, 0x4b, 0x03, 0x04]]] },
    { type: "archive", parts: [[0, [0x1f, 0x8b]]] }, // GZIP
    { type: "archive", parts: [[0, [0x52, 0x61, 0x72, 0x21]]] }, // RAR
  ];
  const partMatches = ([offset, bytes]) =>
    buf.length >= offset + bytes.length &&
    bytes.every((byte, i) => buf[offset + i] === byte);
  const match = signatures.find(({ parts }) => parts.every(partMatches));
  return match?.type;
}
216
/**
 * Type guard: true when an image input is the object form that carries a
 * `data` property (the form that may also carry alt text), as opposed to a
 * raw Buffer or string.
 *
 * @param {unknown} image - Image input in any supported form.
 * @returns {boolean} Whether `image` is a non-null, non-Buffer object with a `data` key.
 */
function isImageWithAltText(image) {
  return (
    typeof image === "object" &&
    // typeof null is "object"; without this guard `"data" in null` throws.
    image !== null &&
    !Buffer.isBuffer(image) &&
    "data" in image
  );
}
222
/**
 * Return the raw image payload from an image input.
 * Object inputs recognised by isImageWithAltText are unwrapped to their
 * `data` property; every other input is returned unchanged.
 */
function extractImageData(image) {
  return isImageWithAltText(image) ? image.data : image;
}
231
/**
 * Return the alt text attached to an image input.
 * Only object inputs recognised by isImageWithAltText can carry alt text;
 * for any other input the result is undefined.
 */
function extractAltText(image) {
  return isImageWithAltText(image) ? image.altText : undefined;
}
240
/**
 * Type guard for message roles.
 * Accepts exactly the strings "user", "assistant" and "system".
 */
function isValidRole(role) {
  const acceptedRoles = ["user", "assistant", "system"];
  // includes() compares strictly, so non-string values never match.
  return acceptedRoles.includes(role);
}
247
/**
 * Type guard for a single content item of a multimodal message.
 *
 * Accepted shapes:
 *  - text:  `text` is a string
 *  - image: `image` is a string and `mimeType` is absent or a string
 *  - file:  `data` is a Buffer and `mimeType` is a string
 * Anything else (including non-objects) is rejected.
 */
function isValidContentItem(item) {
  if (!item || typeof item !== "object") {
    return false;
  }
  switch (item.type) {
    case "text":
      return typeof item.text === "string";
    case "image": {
      const mimeTypeOk =
        item.mimeType === undefined || typeof item.mimeType === "string";
      return typeof item.image === "string" && mimeTypeOk;
    }
    case "file":
      return Buffer.isBuffer(item.data) && typeof item.mimeType === "string";
    default:
      return false;
  }
}
269
/**
 * Convert one content item into the AI SDK content-part shape.
 * Returns null for anything isValidContentItem rejects, and for file items
 * whose mimeType is an empty string.
 * `mimeType` is emitted as `mediaType` on image and file parts.
 */
function convertContentItem(item) {
  if (!isValidContentItem(item)) {
    return null;
  }
  switch (item.type) {
    case "text":
      return typeof item.text === "string"
        ? { type: "text", text: item.text }
        : null;
    case "image": {
      if (typeof item.image !== "string") {
        return null;
      }
      const imagePart = { type: "image", image: item.image };
      // mediaType is only attached when a non-empty mimeType was supplied.
      if (item.mimeType) {
        imagePart.mediaType = item.mimeType;
      }
      return imagePart;
    }
    case "file":
      return Buffer.isBuffer(item.data) && item.mimeType
        ? { type: "file", data: item.data, mediaType: item.mimeType }
        : null;
    default:
      return null;
  }
}
298
/**
 * Convert MultimodalChatMessage[] into ModelMessage[].
 *
 * Messages are dropped (with a warning) when the role is not
 * user/assistant/system, when content is neither a string nor an array, or
 * when an array content has no valid items.
 *
 * Array content is reduced per role:
 *  - user: all valid parts are kept
 *  - assistant: text parts only, joined with a single space ("" when none)
 *  - system: the first text part only ("" when none)
 */
export function convertToModelMessages(messages) {
  const convertMessage = (msg) => {
    const { role, content } = msg;
    if (!isValidRole(role)) {
      logger.warn("Invalid message role found, skipping", { role });
      return null;
    }
    // Plain string content passes through unchanged for every valid role.
    if (typeof content === "string") {
      return { role, content };
    }
    if (!Array.isArray(content)) {
      logger.warn("Invalid message content type found, skipping", {
        contentType: typeof content,
      });
      return null;
    }
    const parts = content
      .map(convertContentItem)
      .filter((part) => part !== null);
    if (parts.length === 0) {
      logger.warn("No valid content items found in multimodal message, skipping");
      return null;
    }
    if (role === "user") {
      return { role: "user", content: parts };
    }
    if (role === "assistant") {
      // join() yields "" for no text parts and the bare text for exactly one.
      const texts = parts
        .filter((part) => part.type === "text")
        .map((part) => part.text);
      return { role: "assistant", content: texts.join(" ") };
    }
    // System messages keep only the first text part.
    const firstText = parts.find((part) => part.type === "text")?.text || "";
    return { role: "system", content: firstText };
  };
  return messages.map(convertMessage).filter((msg) => msg !== null);
}
394
/**
 * Convert a ChatMessage into a ModelMessage.
 * Only user, assistant and system roles are carried over; any other role
 * (e.g. tool_call / tool_result) yields null so the caller can drop it.
 */
function toModelMessage(message) {
  const { role } = message;
  switch (role) {
    case "user":
    case "assistant":
    case "system":
      return { role, content: message.content };
    default:
      return null;
  }
}
409
/**
 * Render CSV metadata as a single "**Metadata**: a | b | c" line.
 * Each piece appears only when its field is present: row count, column
 * count, column names, and an empty-column-name warning.
 * Returns "" when nothing is available.
 */
function formatCSVMetadata(metadata) {
  const { rowCount, columnCount, columnNames, hasEmptyColumns } = metadata;
  const hasColumnNames = Boolean(columnNames && columnNames.length > 0);
  const segments = [
    rowCount !== undefined ? `${rowCount} data rows` : null,
    columnCount !== undefined ? `${columnCount} columns` : null,
    hasColumnNames ? `Columns: [${columnNames.join(", ")}]` : null,
    hasEmptyColumns ? `⚠️ Contains empty column names` : null,
  ].filter((segment) => segment !== null);
  if (segments.length === 0) {
    return "";
  }
  return `**Metadata**: ${segments.join(" | ")}`;
}
429
/**
 * Decide whether structured output mode applies.
 * It applies only when a schema is supplied AND the requested output format
 * is "json" or "structured".
 */
function shouldUseStructuredOutput(options) {
  if (!options.schema) {
    return false;
  }
  const format = options.output?.format;
  return format === "json" || format === "structured";
}
438
/**
 * Emit a compact debug summary of a composed message array.
 * Reports the message count, a per-role tally, total characters and a
 * chars/4 token estimate. Message content itself is never logged, and only
 * string content contributes to the character total. Does nothing unless
 * debug logging is enabled.
 */
function logMessageComposition(messages, requestId) {
  if (!logger.shouldLog("debug")) {
    return;
  }
  const roles = {};
  let totalChars = 0;
  for (const { role, content } of messages) {
    roles[role] = (roles[role] || 0) + 1;
    if (typeof content === "string") {
      totalChars += content.length;
    }
  }
  const estimatedTokens = Math.ceil(totalChars / 4);
  logger.debug("[MessageBuilder] Composed", {
    requestId,
    totalMessages: messages.length,
    roles,
    totalChars,
    estimatedTokens,
  });
}
463
/**
 * Assemble the message array sent to an AI provider.
 *
 * Order of the result: optional system message, prior conversation messages
 * (roles other than user/assistant/system are dropped), then the current
 * user prompt. Works with both `options.prompt` and `options.input.text`.
 *
 * When `options.input` is present, CSV data from `input.csvFiles` and from
 * CSV entries auto-detected in `input.files` is rendered as text and
 * prepended to the user prompt.
 */
export async function buildMessagesArray(options) {
  const messages = [];
  const history = options.conversationMessages;
  const hasConversationHistory = history && history.length > 0;

  // System prompt: base text plus optional instruction suffixes.
  let systemPrompt = options.systemPrompt?.trim() || "";
  if (hasConversationHistory) {
    systemPrompt = `${systemPrompt.trim()}${CONVERSATION_INSTRUCTIONS}`;
  }
  if (shouldUseStructuredOutput(options)) {
    systemPrompt = `${systemPrompt.trim()}${STRUCTURED_OUTPUT_INSTRUCTIONS}`;
  }
  const finalSystemPrompt = systemPrompt.trim();
  if (finalSystemPrompt) {
    messages.push({
      role: "system",
      content: finalSystemPrompt,
      providerOptions: {
        anthropic: { cacheControl: { type: "ephemeral" } },
      },
    });
  }

  // Conversation history; toModelMessage returns null for unsupported roles.
  if (hasConversationHistory && history) {
    for (const chatMessage of history) {
      const modelMessage = toModelMessage(chatMessage);
      if (modelMessage) {
        messages.push(modelMessage);
      }
    }
  }

  // Current prompt: TextGenerationOptions use `prompt`, StreamOptions use `input.text`.
  let currentPrompt;
  if ("prompt" in options && options.prompt) {
    currentPrompt = options.prompt;
  } else if ("input" in options && options.input?.text) {
    currentPrompt = options.input.text;
  }

  if ("input" in options && options.input) {
    const { csvFiles, files } = options.input;
    const csvOptions = "csvOptions" in options ? options.csvOptions : undefined;
    let csvContent = "";

    // Renders one CSV section; tool instructions are added only when a path is given.
    const renderCsvSection = (filename, result, toolFilePath) => {
      let section = `\n\n## CSV Data from "${filename}":\n`;
      if (result.metadata) {
        const metadataText = formatCSVMetadata(result.metadata);
        if (metadataText) {
          section += metadataText + `\n\n`;
        }
      }
      if (toolFilePath !== undefined) {
        section += buildCSVToolInstructions(toolFilePath);
      }
      return section + result.content;
    };

    // Explicit csvFiles: failures are reported inline in the prompt.
    if (csvFiles && csvFiles.length > 0) {
      for (const [index, csvFile] of csvFiles.entries()) {
        const filename = extractFilename(csvFile, index);
        const filePath = typeof csvFile === "string" ? csvFile : filename;
        try {
          const result = await FileDetector.detectAndProcess(csvFile, {
            allowedTypes: ["csv"],
            csvOptions: csvOptions,
          });
          csvContent += renderCsvSection(filename, result, filePath);
          logger.info(`[CSV] ✅ Processed: ${filename}`, result.metadata);
        } catch (error) {
          logger.error(`[CSV] ❌ Failed to process ${filename}:`, error);
          csvContent += `\n\n## CSV Data Error: Failed to process "${filename}"\nReason: ${error instanceof Error ? error.message : "Unknown error"}`;
        }
      }
    }

    // Unified files: only CSVs are picked up here; everything else is skipped quietly.
    if (files && files.length > 0) {
      for (const file of files) {
        const filename = extractFilename(file);
        try {
          const result = await FileDetector.detectAndProcess(file, {
            maxSize: 50 * 1024 * 1024,
            allowedTypes: ["csv"],
            csvOptions: csvOptions,
          });
          if (result.type === "csv") {
            csvContent += renderCsvSection(filename, result, undefined);
            logger.info(`[FileDetector] ✅ CSV: ${filename}`, result.metadata);
          }
        } catch (error) {
          logger.debug(`[FileDetector] Skipped ${filename}: ${error instanceof Error ? error.message : String(error)}`);
        }
      }
    }

    if (csvContent) {
      currentPrompt = csvContent + (currentPrompt || "");
    }
  }

  if (currentPrompt?.trim()) {
    messages.push({
      role: "user",
      content: currentPrompt.trim(),
    });
  }

  const reqId = options.context?.requestId;
  logMessageComposition(messages, reqId);
  return messages;
}
593
/**
 * Enforce the aggregate file budget, dropping files that would not fit the
 * available input tokens for the given provider/model.
 *
 * Mutates `options.input.files` (excluded files removed) and
 * `options.input.text` (exclusion notices appended) when anything is excluded.
 *
 * @param {object} options - Request options; reads and writes `options.input`.
 * @param {string} provider - Provider passed to getAvailableInputTokens.
 * @param {string} model - Model passed to getAvailableInputTokens.
 * @returns {void}
 */
function enforceFileBudget(options, provider, model) {
  const files = options.input.files;
  if (!files || files.length === 0) {
    return;
  }
  const availableTokens = getAvailableInputTokens(provider, model);
  const budgetFiles = files.map((file, idx) => {
    let sizeBytes = 0;
    let fileType;
    if (Buffer.isBuffer(file)) {
      sizeBytes = file.length;
      fileType = inferFileTypeFromBuffer(file);
    } else if (typeof file === "string") {
      if (existsSync(file)) {
        try {
          sizeBytes = statSync(file).size;
        } catch {
          // File vanished or is unreadable between the check and the stat.
          sizeBytes = 0;
        }
      } else {
        // Not a path on disk: fall back to the string's own length.
        sizeBytes = file.length;
      }
      fileType = inferFileTypeFromExtension(file);
    }
    // NOTE(review): inputs that are neither Buffer nor string are counted as
    // 0 bytes here — confirm that is intended for object-form file inputs.
    return {
      name: typeof file === "string" ? file : `file-${idx}`,
      sizeBytes,
      fileType,
    };
  });

  // Remember which original indices carry each name. The same path may be
  // listed more than once, so each name maps to a queue of indices.
  const indicesByName = new Map();
  budgetFiles.forEach(({ name }, idx) => {
    const queue = indicesByName.get(name);
    if (queue) {
      queue.push(idx);
    } else {
      indicesByName.set(name, [idx]);
    }
  });

  const budgetResult = enforceAggregateFileBudget(budgetFiles.map((f) => ({
    name: f.name,
    sizeBytes: f.sizeBytes,
    fileType: f.fileType,
  })), availableTokens);
  if (budgetResult.excluded.length === 0) {
    return;
  }

  // Each included entry consumes one index for its name, so duplicates that
  // fit the budget are all kept instead of collapsing onto the first match.
  const includedIndices = new Set();
  for (const { name } of budgetResult.included) {
    const nextIndex = indicesByName.get(name)?.shift();
    if (nextIndex !== undefined) {
      includedIndices.add(nextIndex);
    }
  }
  options.input.files = files.filter((_file, idx) => includedIndices.has(idx));
  options.input.text =
    (options.input.text || "") + "\n\n" + budgetResult.notices.join("\n");
  logger.warn(`[FileDetector] Aggregate file budget enforcement: excluded ${budgetResult.excluded.length} file(s)`);
}
650
/**
 * Fold one detected file result into `options.input`, based on `result.type`.
 *
 *  - csv / svg / text / archive / xlsx / docx / pptx / unknown: appended to `input.text`
 *  - image: content pushed onto `input.images`
 *  - pdf: content pushed onto `input.pdfFiles`
 *  - video / audio: content appended to `input.text`, any `result.images`
 *    pushed onto `input.images`
 *
 * Text files longer than 200,000 characters are truncated to a 75% head and
 * 25% tail with an omission marker in between. Unrecognised types are ignored.
 */
function appendDetectedFileResult(result, file, options) {
  const filename = extractFilename(file);
  const input = options.input;
  const appendText = (section) => {
    input.text += section;
  };
  const appendImages = (images) => {
    input.images = [...(input.images || []), ...images];
  };
  // Shared shape for types rendered as `## <heading>: "<filename>"` + content.
  const appendTitledContent = (heading) => {
    if (result.content) {
      appendText(`\n\n## ${heading}: "${filename}"\n${result.content}\n`);
    }
  };
  const hasImages = () => Boolean(result.images && result.images.length > 0);

  switch (result.type) {
    case "csv": {
      const filePath = typeof file === "string" ? file : filename;
      let csvSection = `\n\n## CSV Data from "${filename}":\n`;
      if (result.metadata) {
        const metadataText = formatCSVMetadata(result.metadata);
        if (metadataText) {
          csvSection += metadataText + `\n\n`;
        }
      }
      csvSection += buildCSVToolInstructions(filePath);
      csvSection += result.content;
      appendText(csvSection);
      logger.info(`[FileDetector] ✅ CSV: ${filename}`);
      break;
    }
    case "svg":
      appendText(`\n\n## SVG Content from "${filename}":\n\`\`\`xml\n${result.content}\n\`\`\`\n`);
      logger.info(`[FileDetector] ✅ SVG (as text): ${filename}`);
      break;
    case "image":
      input.images = [...(input.images || []), result.content];
      logger.info(`[FileDetector] ✅ Image: ${result.mimeType}`);
      break;
    case "pdf":
      input.pdfFiles = [...(input.pdfFiles || []), result.content];
      logger.info(`[FileDetector] ✅ PDF: ${filename}`);
      break;
    case "video":
      appendTitledContent("Video File");
      if (hasImages()) {
        appendImages(result.images);
        logger.info(`[FileDetector] Added ${result.images.length} video keyframes as images`);
      }
      logger.info(`[FileDetector] ✅ Video: ${filename}`);
      break;
    case "audio":
      appendTitledContent("Audio File");
      if (hasImages()) {
        appendImages(result.images);
        logger.info(`[FileDetector] Added audio cover art as image`);
      }
      logger.info(`[FileDetector] ✅ Audio: ${filename}`);
      break;
    case "archive":
      appendTitledContent("Archive File");
      logger.info(`[FileDetector] ✅ Archive: ${filename}`);
      break;
    case "xlsx":
      appendTitledContent("Spreadsheet");
      logger.info(`[FileDetector] ✅ Spreadsheet: ${filename}`);
      break;
    case "docx":
      appendTitledContent("Document");
      logger.info(`[FileDetector] ✅ Document: ${filename}`);
      break;
    case "pptx":
      appendTitledContent("Presentation");
      logger.info(`[FileDetector] ✅ Presentation: ${filename}`);
      break;
    case "text": {
      if (result.content) {
        const langHint = getLanguageHint(result.mimeType, filename);
        const MAX_TEXT_FILE_CHARS = 200_000;
        const fullText = result.content;
        const truncated = fullText.length > MAX_TEXT_FILE_CHARS;
        let fileContent = fullText;
        if (truncated) {
          const headChars = Math.floor(MAX_TEXT_FILE_CHARS * 0.75);
          const tailChars = Math.floor(MAX_TEXT_FILE_CHARS * 0.25);
          const omittedChars = fullText.length - headChars - tailChars;
          fileContent = [
            fullText.slice(0, headChars),
            `\n\n... [${omittedChars.toLocaleString()} characters omitted — file truncated to fit context window] ...\n\n`,
            fullText.slice(-tailChars),
          ].join("");
        }
        // A language hint wraps the content in a fenced code block.
        appendText(langHint
          ? `\n\n## File: "${filename}"\n\`\`\`${langHint}\n${fileContent}\n\`\`\`\n`
          : `\n\n## File: "${filename}"\n${fileContent}\n`);
        if (truncated) {
          logger.warn(`[FileDetector] Large text file "${filename}" truncated from ${fullText.length.toLocaleString()} to ${MAX_TEXT_FILE_CHARS.toLocaleString()} chars`);
        }
      }
      logger.info(`[FileDetector] ✅ Text: ${filename}`);
      break;
    }
    case "unknown":
      appendTitledContent("Attached File");
      logger.info(`[FileDetector] ⚠️ Unknown format (metadata extracted): ${filename}`);
      break;
    default:
      break;
  }
}
769
/**
 * Process `options.input.files` with type auto-detection, inside a
 * "neurolink.file.process_all" span.
 *
 * Per file: when a file registry is supplied and the file is larger than
 * SIZE_TIER_THRESHOLDS.TINY_MAX, registration as a lazy reference is tried
 * first; otherwise (or when registration is declined) the file is fully
 * processed and folded into `options.input`. A failing file is logged and
 * skipped without aborting the rest.
 *
 * Afterwards, previews and extracted images of registered files are
 * injected into `options.input`.
 */
async function processUnifiedFilesArray(options, maxSize, provider) {
  const files = options.input.files;
  if (!files || files.length === 0) {
    return;
  }
  const totalFiles = files.length;
  const spanConfig = {
    name: "neurolink.file.process_all",
    tracer: tracers.file,
    attributes: {
      [ATTR.FILE_TOTAL_COUNT]: totalFiles,
      [ATTR.NL_PROVIDER]: provider,
    },
  };
  const detectableTypes = [
    "csv",
    "image",
    "pdf",
    "svg",
    "video",
    "audio",
    "archive",
    "xlsx",
    "docx",
    "pptx",
    "text",
    "unknown",
  ];
  return withSpan(spanConfig, async (span) => {
    logger.info(`[NEUROLINK] Processing ${totalFiles} file(s) with auto-detection`);
    options.input.text = options.input.text || "";
    const fileRegistry = options.fileRegistry;
    // Generic files are allowed at least 100 MB regardless of the caller's limit.
    const genericFileMaxSize = Math.max(maxSize, 100 * 1024 * 1024);
    let includedCount = 0;

    for (const [fileIdx, file] of files.entries()) {
      const filename = extractFilename(file, fileIdx);
      try {
        // Lazy path: register a reference instead of processing now.
        const fileSize = fileRegistry ? getFileSize(file) : 0;
        if (fileRegistry && fileSize > SIZE_TIER_THRESHOLDS.TINY_MAX) {
          const registered = await tryRegisterFileReference(file, fileSize, fileRegistry, fileIdx);
          if (registered) {
            logger.info(`[NEUROLINK] File lazily registered: ${filename} (${fileSize} bytes) — deferred processing`);
            includedCount++;
            continue;
          }
        }
        // Full path: detect, process, and merge into the input right away.
        const rawFileInput = isFileWithMetadata(file) ? file.buffer : file;
        const result = await FileDetector.detectAndProcess(rawFileInput, {
          maxSize: genericFileMaxSize,
          allowedTypes: detectableTypes,
          csvOptions: options.csvOptions,
          provider: provider,
        });
        appendDetectedFileResult(result, file, options);
        includedCount++;
        const contentType = result.type === "image" ? "image" : "text";
        logger.info(`[NEUROLINK] File added to message: ${filename} as ${contentType} (type: ${result.type})`);
      } catch (error) {
        const errMsg = error instanceof Error ? error.message : String(error);
        logger.error(`[NEUROLINK] File skipped/failed: ${filename} — reason: ${errMsg}`);
      }
    }
    span.setAttribute(ATTR.FILE_INCLUDED_COUNT, includedCount);

    // Surface whatever the registry holds: prompt previews, then extracted images.
    if (fileRegistry && fileRegistry.size > 0) {
      const previewText = await fileRegistry.generatePromptPreview();
      if (previewText) {
        options.input.text = (options.input.text || "") + previewText;
        logger.info(`[FileDetector] Injected previews for ${fileRegistry.size} lazily-registered file(s)`);
      }
      for (const ref of fileRegistry.list()) {
        const extracted = ref.extractedImages;
        if (extracted && extracted.length > 0) {
          options.input.images = [...(options.input.images || []), ...extracted];
          logger.info(`[FileDetector] Injected ${extracted.length} extracted images from "${ref.filename}"`);
        }
      }
    }
    logger.info(`[NEUROLINK] File processing complete: ${includedCount}/${totalFiles} files included in message`);
  });
}
859
/**
 * Process `options.input.csvFiles` and append each rendered CSV section to
 * `options.input.text`.
 * A file that fails to process contributes an inline error section instead,
 * so the remaining files are still handled.
 */
async function processExplicitCsvFiles(options) {
  const csvFiles = options.input.csvFiles;
  if (!csvFiles || csvFiles.length === 0) {
    return;
  }
  logger.info(`[CSV] Processing ${csvFiles.length} explicit CSV file(s)`);
  options.input.text = options.input.text || "";
  for (const [index, csvFile] of csvFiles.entries()) {
    try {
      const result = await FileDetector.detectAndProcess(csvFile, {
        allowedTypes: ["csv"],
        csvOptions: options.csvOptions,
      });
      const filename = extractFilename(csvFile, index);
      const filePath = typeof csvFile === "string" ? csvFile : filename;
      const pieces = [`\n\n## CSV Data from "${filename}":\n`];
      if (result.metadata) {
        const metadataText = formatCSVMetadata(result.metadata);
        if (metadataText) {
          pieces.push(metadataText + `\n\n`);
        }
      }
      pieces.push(buildCSVToolInstructions(filePath));
      // Concatenate with + so content is stringified the same way as a += chain.
      const csvSection = pieces.reduce((acc, piece) => acc + piece, "") + result.content;
      options.input.text += csvSection;
      logger.info(`[CSV] ✅ Processed: ${filename}`);
    } catch (error) {
      logger.error(`[CSV] ❌ Failed:`, error);
      const filename = extractFilename(csvFile, index);
      const reason = error instanceof Error ? error.message : "Unknown error";
      options.input.text += `\n\n## CSV Data Error: Failed to process "${filename}"`;
      options.input.text += `\nReason: ${reason}`;
    }
  }
}
897
/**
 * Keep the accumulated `options.input.text` within the file-read share of
 * the available input tokens, then log a token usage breakdown.
 *
 * When the estimated tokens exceed the budget and the text is longer than
 * budget * 4 characters, the text is cut to a 75% head and 25% tail around a
 * truncation marker. Images are counted at a flat 1500 tokens each for the
 * log line. Does nothing when there is no text.
 */
function enforcePostProcessingBudget(options, provider, model) {
  const input = options.input;
  if (!input.text) {
    return;
  }
  const availableTokens = getAvailableInputTokens(provider, model);
  const textTokenBudget = Math.floor(availableTokens * FILE_READ_BUDGET_PERCENT);
  const actualTextTokens = estimateTokens(input.text, provider);
  const overBudget = actualTextTokens > textTokenBudget && textTokenBudget > 0;
  if (overBudget) {
    const maxChars = textTokenBudget * 4;
    if (input.text.length > maxChars) {
      const headChars = Math.floor(maxChars * 0.75);
      const tailChars = Math.floor(maxChars * 0.25);
      const head = input.text.slice(0, headChars);
      const tail = input.text.slice(-tailChars);
      const truncatedTokens = actualTextTokens - textTokenBudget;
      input.text = [
        head,
        `\n\n[... ${truncatedTokens.toLocaleString()} tokens of file content truncated to fit context window ...]\n\n`,
        tail,
      ].join("");
      logger.warn(`[FileDetector] Post-processing budget enforcement: truncated ~${truncatedTokens.toLocaleString()} tokens of file content to fit ${textTokenBudget.toLocaleString()} token budget`);
    }
  }

  // Usage breakdown, measured on the (possibly truncated) text.
  const textTokens = estimateTokens(input.text, provider);
  const explicitImages = input.images?.length ?? 0;
  const contentImages = input.content?.filter((c) => c.type === "image").length ?? 0;
  const imageCount = explicitImages + contentImages;
  const imageTokens = imageCount * 1500;
  const totalContentTokens = textTokens + imageTokens;
  const contextWindow = getAvailableInputTokens(provider, model);
  const utilization = contextWindow > 0
    ? ((totalContentTokens / contextWindow) * 100).toFixed(1)
    : "N/A";
  const breakdown = [
    `text=${textTokens.toLocaleString()} tokens`,
    `images=${imageCount} (~${imageTokens.toLocaleString()} tokens)`,
    `total=${totalContentTokens.toLocaleString()} tokens`,
    `budget=${contextWindow.toLocaleString()} tokens`,
    `utilization=${utilization}%`,
  ].join(", ");
  logger.info(`[TokenUsage] Content breakdown: ${breakdown}`);
}
935
/**
 * Run every entry of `options.input.pdfFiles` through the file detector and
 * collect the ones that come back as Buffers for multimodal delivery.
 *
 * @param options  Request options carrying `input.pdfFiles`.
 * @param maxSize  Maximum accepted file size in bytes, forwarded to the detector.
 * @param provider Provider identifier, forwarded to the detector.
 * @returns Array of `{ buffer, filename, pageCount }` entries (empty when no
 *          PDFs were supplied).
 * @throws Re-throws any detector failure after logging it.
 */
async function processExplicitPdfFiles(options, maxSize, provider) {
  const requestedPdfs = options.input.pdfFiles;
  if (!requestedPdfs || requestedPdfs.length === 0) {
    return [];
  }

  logger.info(`[PDF] Processing ${requestedPdfs.length} explicit PDF file(s) for ${provider}`);

  const queued = [];
  for (const [position, source] of requestedPdfs.entries()) {
    const filename = extractFilename(source, position);
    let detected;
    try {
      detected = await FileDetector.detectAndProcess(source, {
        maxSize,
        allowedTypes: ["pdf"],
        provider,
      });
    } catch (error) {
      logger.error(`[PDF] ❌ Failed to process ${filename}:`, error);
      throw error;
    }

    // Only binary results are forwarded; anything else is skipped.
    if (!Buffer.isBuffer(detected.content)) {
      continue;
    }
    const estimatedPages = detected.metadata?.estimatedPages;
    queued.push({
      buffer: detected.content,
      filename,
      pageCount: estimatedPages ?? null,
    });
    logger.info(`[PDF] ✅ Queued for multimodal: ${filename} (${estimatedPages ?? "unknown"} pages)`);
  }
  return queued;
}
969
/**
 * Assemble the system prompt used for multimodal requests.
 *
 * Starts from the trimmed `options.systemPrompt`, then appends (in order):
 * the conversation instructions when history is present, the structured
 * output instructions when `shouldUseStructuredOutput(options)` is truthy,
 * and a file-handling notice when CSV or PDF files are part of the request.
 *
 * @param options     Request options (system prompt, history, input files).
 * @param hasPDFFiles Whether PDF files were queued for this request.
 * @returns The assembled system prompt (possibly an empty string).
 */
function buildMultimodalSystemPrompt(options, hasPDFFiles) {
  const sections = [options.systemPrompt?.trim() || ""];
  const currentPrompt = () => sections.join("");

  const history = options.conversationHistory;
  if (history && history.length > 0) {
    sections.splice(0, sections.length, currentPrompt().trim(), CONVERSATION_INSTRUCTIONS);
  }
  if (shouldUseStructuredOutput(options)) {
    sections.splice(0, sections.length, currentPrompt().trim(), STRUCTURED_OUTPUT_INSTRUCTIONS);
  }

  const { csvFiles, files } = options.input;
  const looksLikeCsvPath = (entry) =>
    typeof entry === "string" ? entry.toLowerCase().endsWith(".csv") : false;
  const hasCSVFiles =
    (csvFiles && csvFiles.length > 0) || (files && files.some(looksLikeCsvPath));

  if (!hasCSVFiles && !hasPDFFiles) {
    return `${currentPrompt()}`;
  }

  const fileTypes = [hasPDFFiles && "PDFs", hasCSVFiles && "CSVs"].filter(Boolean);
  const notice = [
    "IMPORTANT FILE HANDLING INSTRUCTIONS:",
    `- File content (${fileTypes.join(", ")}, images) is already processed and included in this message`,
    "- DO NOT use GitHub tools (get_file_contents, search_code, etc.) for local files - they only work for remote repository files",
    "- Analyze the provided file content directly without attempting to fetch or read files using tools",
    "- GitHub MCP tools are ONLY for remote repository operations, not local filesystem access",
    "- Use the file content shown in this message for your analysis",
  ].join("\n");

  return `${currentPrompt()}\n\n${notice}`;
}
1002
/**
 * Build the message array for a request that may carry images, PDFs, CSVs or
 * auto-detected files.
 *
 * Processing order: aggregate file budget, unified `files` array, explicit
 * CSV files, post-processing text budget, explicit PDF files. When the
 * request ends up with neither images nor PDFs, the file arrays on
 * `options.input` are emptied and the standard text message builder is used.
 * Otherwise the provider must support vision, and the result is
 * system prompt + filtered conversation history + one user message.
 *
 * @param options  Request options; `options.input` is mutated by the file
 *                 processing steps.
 * @param provider Provider identifier.
 * @param model    Model identifier.
 * @returns Array of `{ role, content, providerOptions? }` messages.
 * @throws Error when images/PDFs are present but the provider/model has no
 *         vision support; re-throws file-processing and conversion failures.
 */
export async function buildMultimodalMessagesArray(options, provider, model) {
  // Compute provider-specific max PDF size once for consistent validation
  const pdfConfig = PDFProcessor.getProviderConfig(provider);
  let maxSize;
  if (pdfConfig) {
    maxSize = pdfConfig.maxSizeMB * 1024 * 1024;
  } else {
    maxSize = 10 * 1024 * 1024;
  }

  // File pipeline: the order of these steps is significant
  enforceFileBudget(options, provider, model);
  await processUnifiedFilesArray(options, maxSize, provider);
  await processExplicitCsvFiles(options);
  enforcePostProcessingBudget(options, provider, model);
  const pdfFiles = await processExplicitPdfFiles(options, maxSize, provider);

  // Check if this is a multimodal request
  const hasImages =
    (options.input.images && options.input.images.length > 0) ||
    (options.input.content &&
      options.input.content.some((part) => part.type === "image"));
  const hasPDFs = pdfFiles.length > 0;

  // Text-only path: clear the file arrays and delegate to the standard builder
  if (!hasImages && !hasPDFs) {
    for (const key of ["csvFiles", "pdfFiles", "files"]) {
      if (options.input[key]) {
        options.input[key] = [];
      }
    }
    const standardMessages = await buildMessagesArray(options);
    return standardMessages.map(({ role, content, providerOptions }) =>
      providerOptions ? { role, content, providerOptions } : { role, content },
    );
  }

  // Validate provider supports vision
  if (!ProviderImageAdapter.supportsVision(provider, model)) {
    const visionProviders = ProviderImageAdapter.getVisionProviders().join(", ");
    throw new Error(
      `Provider ${provider} with model ${model} does not support vision processing. Supported providers: ${visionProviders}`,
    );
  }

  const messages = [];

  // System message (marked for Anthropic ephemeral caching)
  const systemPrompt = buildMultimodalSystemPrompt(options, pdfFiles.length > 0);
  if (systemPrompt.trim()) {
    messages.push({
      role: "system",
      content: systemPrompt.trim(),
      providerOptions: {
        anthropic: { cacheControl: { type: "ephemeral" } },
      },
    });
  }

  // Conversation history: tool_call / tool_result roles are dropped, only
  // user/assistant/system entries are forwarded
  const forwardedRoles = new Set(["user", "assistant", "system"]);
  const history = options.conversationHistory;
  if (history && history.length > 0) {
    for (const entry of history) {
      if (!forwardedRoles.has(entry.role)) {
        continue;
      }
      const providerOptions = entry.providerOptions;
      messages.push(
        providerOptions
          ? { role: entry.role, content: entry.content, providerOptions }
          : { role: entry.role, content: entry.content },
      );
    }
  }

  // Current user turn
  try {
    const { input } = options;
    const usesAdvancedContent = input.content && input.content.length > 0;
    const usesSimpleMedia =
      (input.images && input.images.length > 0) || pdfFiles.length > 0;

    let userContent;
    if (usesAdvancedContent) {
      userContent = await convertContentToProviderFormat(input.content, provider, model);
    } else if (usesSimpleMedia) {
      userContent = await convertMultimodalToProviderFormat(
        input.text,
        input.images || [],
        pdfFiles,
        provider,
        model,
      );
    } else {
      userContent = input.text;
    }

    messages.push({ role: "user", content: userContent });
    logMessageComposition(messages, options.context?.requestId);
    return messages;
  } catch (error) {
    MultimodalLogger.logError("MULTIMODAL_BUILD", error, {
      provider,
      model,
      hasImages,
      imageCount: options.input.images?.length || 0,
    });
    throw error;
  }
}
1123
/**
 * Convert the advanced `content` array into the provider message format.
 *
 * Uses the first `text` element as the prompt. With no `image` elements the
 * plain text string is returned; otherwise the image `data` values are handed
 * to `convertSimpleImagesToProviderFormat` together with that text.
 *
 * @throws Error when the array contains no `text` element.
 */
async function convertContentToProviderFormat(content, provider, _model) {
  let promptPart;
  const imageParts = [];
  for (const part of content) {
    if (part.type === "text") {
      promptPart ??= part;
    } else if (part.type === "image") {
      imageParts.push(part);
    }
  }

  if (!promptPart) {
    throw new Error("Multimodal content must include at least one text element");
  }
  if (imageParts.length === 0) {
    return promptPart.text;
  }

  // Extract images as Buffer | string array
  const payloads = imageParts.map(({ data }) => data);
  const converted = await convertSimpleImagesToProviderFormat(promptPart.text, payloads, provider, _model);
  return converted;
}
1139
/**
 * Report whether a string begins with an `http://` or `https://` prefix.
 */
function isInternetUrl(input) {
  const webSchemes = ["http://", "https://"];
  return webSchemes.some((scheme) => input.startsWith(scheme));
}
1145
/**
 * Download an image from a URL and return it as a base64 data URI.
 *
 * - Looks the URL up in the image cache first; cache hits skip the rate
 *   limiter and the network entirely.
 * - On a cache miss, waits on `urlDownloadRateLimiter` and issues a GET that
 *   follows up to 5 redirects (10s header timeout, 30s body timeout).
 * - Rejects non-200 responses and non-`image/*` content types.
 * - Enforces a 10MB size cap *while streaming*: an oversized `content-length`
 *   is rejected before any body bytes are read, and the read loop aborts as
 *   soon as the received byte count crosses the cap, so an oversized response
 *   is never buffered in full.
 *
 * @param url Absolute http(s) URL of the image.
 * @returns `data:<content-type>;base64,<payload>` string.
 * @throws Error wrapping the underlying failure (available as `cause`).
 */
async function downloadImageFromUrl(url) {
  // Check cache first (before rate limiting)
  const cache = getImageCache();
  const cached = cache.get(url);
  if (cached) {
    logger.debug("Using cached image for URL", { url: url.substring(0, 50) });
    return cached.dataUri;
  }

  // Apply rate limiting only if cache missed
  await urlDownloadRateLimiter.acquire();

  const maxSize = 10 * 1024 * 1024; // 10MB
  try {
    const response = await request(url, {
      dispatcher: getGlobalDispatcher().compose(interceptors.redirect({ maxRedirections: 5 })),
      method: "GET",
      headersTimeout: 10000, // 10 second timeout for headers
      bodyTimeout: 30000, // 30 second timeout for body
    });
    if (response.statusCode !== 200) {
      throw new Error(`HTTP ${response.statusCode}: Failed to download image from ${url}`);
    }

    // A header may arrive as a string or as an array of strings; use the first value
    const rawContentType = response.headers["content-type"];
    const contentType =
      (Array.isArray(rawContentType) ? rawContentType[0] : rawContentType) || "image/jpeg";
    if (!contentType.startsWith("image/")) {
      throw new Error(`URL does not point to an image. Content-Type: ${contentType}`);
    }

    // Fail fast when the server already declares an oversized payload
    const declaredLength = Number(response.headers["content-length"]);
    if (Number.isFinite(declaredLength) && declaredLength > maxSize) {
      throw new Error(`Image too large: ${declaredLength} bytes (max: ${maxSize} bytes)`);
    }

    // Read the body, aborting as soon as the cap is exceeded. Throwing out of
    // the `for await` loop ends the iteration, so no further chunks are pulled.
    const chunks = [];
    let receivedBytes = 0;
    for await (const chunk of response.body) {
      receivedBytes += chunk.length;
      if (receivedBytes > maxSize) {
        throw new Error(`Image too large: more than ${maxSize} bytes received (max: ${maxSize} bytes)`);
      }
      chunks.push(chunk);
    }
    const buffer = Buffer.concat(chunks, receivedBytes);

    // Convert to base64 data URI
    const dataUri = `data:${contentType};base64,${buffer.toString("base64")}`;

    // Store in cache for future use
    cache.set(url, dataUri, contentType, buffer);
    return dataUri;
  } catch (error) {
    MultimodalLogger.logError("URL_DOWNLOAD_FAILED", error, { url });
    throw new Error(
      `Failed to download image from ${url}: ${error instanceof Error ? error.message : String(error)}`,
      { cause: error },
    );
  }
}
1199
/** MIME types recognised from a local image file's extension (anything else is treated as JPEG). */
const IMAGE_MIME_TYPE_BY_EXTENSION = new Map([
  ["png", "image/png"],
  ["gif", "image/gif"],
  ["webp", "image/webp"],
  ["bmp", "image/bmp"],
  ["tiff", "image/tiff"],
  ["tif", "image/tiff"],
]);

/**
 * Turn one already-local image payload (Buffer, data URI or file path) into a
 * Vercel AI SDK image part.
 *
 * The `image` field is always raw base64, never a `data:` URI string: the AI
 * SDK v6 download pipeline calls `new URL(image)` on strings, a data URI parses
 * as a URL, and the SDK's download validation then rejects the `data:` scheme.
 *
 * @param image Buffer, `data:` URI string, or local file path.
 * @param index Position of the image in the caller's list (for error logging).
 * @throws Error when a file path does not exist or cannot be read.
 */
function toInlineImagePart(image, index) {
  const defaultMimeType = "image/jpeg";

  if (typeof image !== "string") {
    // Buffer - convert to raw base64
    return { type: "image", image: image.toString("base64"), mimeType: defaultMimeType };
  }

  if (image.startsWith("data:")) {
    // Data URI (including downloaded URLs) - extract mime type and raw base64.
    // URIs that are not in `;base64,` form are passed through unchanged.
    const match = image.match(/^data:([^;]+);base64,(.+)$/);
    return match
      ? { type: "image", image: match[2], mimeType: match[1] }
      : { type: "image", image, mimeType: defaultMimeType };
  }

  // File path string - read and convert to base64
  try {
    if (!existsSync(image)) {
      throw new Error(`Image file not found: ${image}`);
    }
    const extension = image.toLowerCase().split(".").pop();
    return {
      type: "image",
      image: readFileSync(image).toString("base64"),
      mimeType: IMAGE_MIME_TYPE_BY_EXTENSION.get(extension) ?? defaultMimeType,
    };
  } catch (error) {
    MultimodalLogger.logError("FILE_PATH_CONVERSION", error, {
      index,
      filePath: image,
    });
    throw new Error(`Failed to convert file path to base64: ${image}. ${error}`, { cause: error });
  }
}

/**
 * Convert the simple images format to Vercel AI SDK content parts.
 *
 * - URLs are downloaded and inlined as base64.
 * - Local file paths are read and inlined as base64.
 * - Buffers and data URIs are inlined directly.
 * - Alt text is appended to the prompt text as `[Image N: …]` context, because
 *   the image parts themselves carry no alt-text field.
 *
 * Images are emitted in the order the caller supplied them, so the image
 * parts line up with the `[Image N: …]` numbering. (Previously every URL
 * image was moved behind all non-URL images, which broke that correspondence
 * for mixed inputs.) A URL that fails to download is logged and skipped;
 * alt-text numbers are computed up front and are not renumbered afterwards.
 *
 * @param text     Prompt text for the leading text part.
 * @param images   Image inputs as accepted by `extractImageData` / `extractAltText`.
 * @param provider Provider identifier (image-count validation, logging).
 * @param _model   Model identifier (image-count validation).
 * @returns Array starting with one text part followed by the image parts.
 * @throws Error from image-count validation or from a failed local conversion.
 */
async function convertSimpleImagesToProviderFormat(text, images, provider, _model) {
  // Validate image count against provider-specific limits before processing
  ProviderImageAdapter.validateImageCount(images.length, provider, _model);

  // Alt-text numbering is fixed before any download happens
  const altTextDescriptions = images
    .map((image, idx) => {
      const altText = extractAltText(image);
      return altText ? `[Image ${idx + 1}: ${altText}]` : null;
    })
    .filter(Boolean);
  const enhancedText =
    altTextDescriptions.length > 0
      ? `${text}\n\nImage descriptions for context: ${altTextDescriptions.join(" ")}`
      : text;

  const content = [{ type: "text", text: enhancedText }];

  for (const [index, image] of images.entries()) {
    let imageData = extractImageData(image);

    if (typeof imageData === "string" && isInternetUrl(imageData)) {
      const url = imageData;
      try {
        // Downloads stay sequential; each one yields a data URI
        imageData = await downloadImageFromUrl(url);
      } catch (error) {
        MultimodalLogger.logError("URL_DOWNLOAD_FAILED_SKIPPING", error, { url });
        // Continue processing other images even if one URL fails
        logger.warn(`Failed to download image from ${url}, skipping: ${error instanceof Error ? error.message : String(error)}`);
        continue;
      }
    }

    try {
      content.push(toInlineImagePart(imageData, index));
    } catch (error) {
      MultimodalLogger.logError("ADD_IMAGE_TO_CONTENT", error, {
        index,
        provider,
      });
      throw error;
    }
  }

  return content;
}
1350
/**
 * Convert multimodal content (text + images + PDFs) to provider format.
 *
 * - Images are converted through `convertSimpleImagesToProviderFormat`. The
 *   prompt text is passed along so that any alt-text context the converter
 *   appends ends up in the text part. (Previously an empty string was passed
 *   and the converter's text part was discarded, so alt text supplied with
 *   `images` never reached the model on this path.) When the converter adds
 *   nothing, the original `text` value is kept untouched.
 * - PDFs are attached as `file` parts when `PDFProcessor.supportsNativePDF`
 *   reports native support; otherwise each PDF is rendered to page images
 *   (scale 2.0, at most 20 pages) and attached as PNG image parts.
 *
 * @param text     Prompt text.
 * @param images   Image inputs (may be empty).
 * @param pdfFiles Entries of `{ buffer, filename, ... }` (may be empty).
 * @param provider Provider identifier.
 * @param model    Model identifier.
 * @returns Array of content parts, text part first.
 * @throws Error when PDF-to-image conversion fails (original error as `cause`).
 */
async function convertMultimodalToProviderFormat(text, images, pdfFiles, provider, model) {
  const content = [{ type: "text", text }];

  // Add images if present
  if (images.length > 0) {
    const promptText = text ?? "";
    const imageContent = await convertSimpleImagesToProviderFormat(promptText, images, provider, model);
    if (Array.isArray(imageContent)) {
      for (const part of imageContent) {
        if (part.type !== "text") {
          content.push(part);
        } else if (part.text !== promptText) {
          // The converter enriched the prompt (alt-text context) - keep it
          content[0] = { type: "text", text: part.text };
        }
      }
    }
  }

  if (PDFProcessor.supportsNativePDF(provider)) {
    // Add PDFs using Vercel AI SDK standard format (works for providers with native PDF support)
    for (const pdf of pdfFiles) {
      logger.info(`[PDF] ✅ Added to content (native PDF format): ${pdf.filename}`);
      content.push({
        type: "file",
        data: pdf.buffer,
        mediaType: "application/pdf",
      });
    }
    return content;
  }

  // Provider doesn't support native PDF - convert PDF pages to images
  logger.info(`[PDF→Image] Provider ${provider} doesn't support native PDF. Converting ${pdfFiles.length} PDF(s) to images...`);
  for (const pdf of pdfFiles) {
    try {
      const conversionResult = await PDFImageConverter.convertToImages(pdf.buffer, {
        scale: 2.0, // High quality for OCR/analysis
        maxPages: 20, // Limit pages to prevent token overflow
      });
      logger.info(`[PDF→Image] ✅ Converted ${pdf.filename}: ${conversionResult.pageCount} page(s) → images`);

      // Add each page as an image part (raw base64, not a data: URI)
      conversionResult.images.forEach((base64Image, pageIndex) => {
        content.push({
          type: "image",
          image: base64Image,
          mimeType: "image/png",
        });
        logger.debug(`[PDF→Image] Added page ${pageIndex + 1}/${conversionResult.pageCount} of ${pdf.filename}`);
      });

      // Log any warnings from conversion
      if (conversionResult.warnings) {
        conversionResult.warnings.forEach((warning) => {
          logger.warn(`[PDF→Image] ${warning}`);
        });
      }
    } catch (error) {
      const errorMessage = error instanceof Error ? error.message : String(error);
      logger.error(`[PDF→Image] ❌ Failed to convert ${pdf.filename}: ${errorMessage}`);
      // Re-throw so the user knows PDF processing failed
      throw new Error(
        `PDF to image conversion failed for ${pdf.filename}: ${errorMessage}. ` +
          `Provider ${provider} doesn't support native PDFs and image conversion failed.`,
        { cause: error },
      );
    }
  }
  return content;
}
1419
/**
 * Type guard for FileWithMetadata objects: a non-null, non-Buffer object that
 * has both a `buffer` and a `filename` property.
 *
 * `null` is rejected explicitly: `typeof null` is `"object"`, and applying the
 * `in` operator to `null` would otherwise throw a TypeError.
 *
 * @param file Any file input (string, Buffer, object, null, ...).
 * @returns `true` only for objects shaped like `{ buffer, filename }`.
 */
function isFileWithMetadata(file) {
  return (
    typeof file === "object" &&
    file !== null &&
    !Buffer.isBuffer(file) &&
    "buffer" in file &&
    "filename" in file
  );
}
1428
/**
 * Extract a display filename from a file input.
 *
 * - FileWithMetadata objects: their `filename` property.
 * - `http://` / `https://` URLs: the last path segment (query string and
 *   fragment excluded), or the generic name when the path ends in `/` or the
 *   URL cannot be parsed.
 * - Other strings: the last path segment, splitting on both `/` and `\` so
 *   Windows paths yield the bare filename. (The previous `split("/")`-first
 *   logic returned the entire Windows path, because the first split already
 *   produced a non-empty result and the backslash fallback never ran.)
 * - Anything else (e.g. Buffers): the generic name.
 *
 * Only strings with a real `http(s)://` prefix are treated as URLs, so local
 * names that merely begin with "http" (e.g. `httpd.conf`) keep their name.
 *
 * @param file  File input (string path/URL, Buffer, or FileWithMetadata).
 * @param index Zero-based position used for the generic `file-<n>` name.
 * @returns The extracted filename, or `file-<index + 1>`.
 */
function extractFilename(file, index = 0) {
  const genericName = `file-${index + 1}`;

  if (isFileWithMetadata(file)) {
    return file.filename;
  }
  if (typeof file !== "string") {
    return genericName;
  }

  if (/^https?:\/\//i.test(file)) {
    try {
      return new URL(file).pathname.split("/").pop() || genericName;
    } catch {
      return genericName;
    }
  }

  return file.split(/[\\/]/).pop() || genericName;
}
1450
/**
 * Report the size of a file input.
 *
 * - FileWithMetadata: length of its `buffer`.
 * - Buffer: its length.
 * - String naming an existing path: the size reported by `statSync`
 *   (0 when the stat call fails).
 * - Any other string (URLs, data URIs, missing paths): the string length,
 *   used as a rough estimate.
 * - Everything else: 0.
 */
function getFileSize(file) {
  if (isFileWithMetadata(file)) {
    return file.buffer.length;
  }
  if (Buffer.isBuffer(file)) {
    return file.length;
  }
  if (typeof file !== "string") {
    return 0;
  }
  if (!existsSync(file)) {
    // Not on disk: fall back to the string length as an estimate
    return file.length;
  }
  try {
    const { size } = statSync(file);
    return size;
  } catch {
    return 0;
  }
}
1475
/**
 * Resolve a file input to a Buffer.
 *
 * - FileWithMetadata: its `buffer` property.
 * - Buffer: returned as-is.
 * - String naming an existing path: the file contents (null when the read fails).
 * - Anything else (URLs, data URIs, missing paths): null, since those cannot
 *   be lazily registered without downloading first.
 */
async function getFileBuffer(file) {
  if (isFileWithMetadata(file)) {
    return file.buffer;
  }
  if (Buffer.isBuffer(file)) {
    return file;
  }

  const isExistingPath = typeof file === "string" && existsSync(file);
  if (!isExistingPath) {
    return null;
  }

  let contents = null;
  try {
    contents = readFileSync(file);
  } catch {
    contents = null;
  }
  return contents;
}
1500
/**
 * Classify where a file input comes from.
 *
 * Returns `"datauri"` for `data:` strings, `"url"` for `http://` / `https://`
 * strings, `"path"` for strings naming an existing file, and `"buffer"` for
 * everything else (Buffers, FileWithMetadata objects, unknown strings and
 * non-string values).
 */
function getFileSource(file) {
  const isInMemory = isFileWithMetadata(file) || Buffer.isBuffer(file);
  if (isInMemory || typeof file !== "string") {
    return "buffer";
  }
  if (file.startsWith("data:")) {
    return "datauri";
  }
  if (/^https?:\/\//.test(file)) {
    return "url";
  }
  return existsSync(file) ? "path" : "buffer";
}
1523
/**
 * Attempt to hand a file to the FileReferenceRegistry for lazy processing.
 *
 * @param file     File input to register.
 * @param fileSize Size in bytes, used only for the log message.
 * @param registry Registry exposing an async `register(buffer, source, meta)`.
 * @param index    Position of the file, used for the generic filename.
 * @returns `true` when the file was registered; `false` when no buffer could
 *          be obtained or registration threw (the caller should then fall
 *          through to full processing).
 */
async function tryRegisterFileReference(file, fileSize, registry, index = 0) {
  let registeredName;
  try {
    const contents = await getFileBuffer(file);
    if (!contents) {
      return false;
    }
    registeredName = extractFilename(file, index);
    await registry.register(contents, getFileSource(file), { filename: registeredName });
  } catch (regError) {
    const reason = regError instanceof Error ? regError.message : String(regError);
    logger.warn(`[FileDetector] Failed to register file as reference, falling back to full processing: ${reason}`);
    return false;
  }

  try {
    const sizeKb = (fileSize / 1024).toFixed(0);
    logger.info(`[FileDetector] Registered "${registeredName}" (${sizeKb} KB) as lazy reference — skipping upfront processing`);
    return true;
  } catch (regError) {
    // Mirrors the single original try/catch: a failure while logging is also
    // reported as a fallback to full processing.
    const reason = regError instanceof Error ? regError.message : String(regError);
    logger.warn(`[FileDetector] Failed to register file as reference, falling back to full processing: ${reason}`);
    return false;
  }
}
1545
/** Markdown code-fence language keyed by (lower-cased, parameter-free) MIME type. */
const LANGUAGE_HINT_BY_MIME_TYPE = new Map([
  ["text/javascript", "javascript"],
  ["text/typescript", "typescript"],
  ["text/x-python", "python"],
  ["text/x-java-source", "java"],
  ["text/x-go", "go"],
  ["text/x-rustsrc", "rust"],
  ["text/x-ruby", "ruby"],
  ["text/x-php", "php"],
  ["text/x-c", "c"],
  ["text/x-c++", "cpp"],
  ["text/x-csharp", "csharp"],
  ["text/x-swift", "swift"],
  ["text/x-kotlin", "kotlin"],
  ["text/x-scala", "scala"],
  ["text/x-shellscript", "bash"],
  ["text/x-powershell", "powershell"],
  ["text/x-sql", "sql"],
  ["text/x-r", "r"],
  ["text/x-lua", "lua"],
  ["text/x-perl", "perl"],
  ["text/x-dart", "dart"],
  ["text/x-elixir", "elixir"],
  ["text/x-erlang", "erlang"],
  ["text/x-haskell", "haskell"],
  ["text/x-clojure", "clojure"],
  ["text/x-lisp", "lisp"],
  ["text/html", "html"],
  ["text/css", "css"],
  ["text/markdown", "markdown"],
  ["application/json", "json"],
  ["application/xml", "xml"],
  ["text/xml", "xml"],
  ["application/yaml", "yaml"],
  ["application/x-yaml", "yaml"],
]);

/** Markdown code-fence language keyed by lower-cased filename extension. */
const LANGUAGE_HINT_BY_EXTENSION = new Map([
  ["js", "javascript"],
  ["mjs", "javascript"],
  ["cjs", "javascript"],
  ["jsx", "javascript"],
  ["ts", "typescript"],
  ["tsx", "typescript"],
  ["py", "python"],
  ["java", "java"],
  ["go", "go"],
  ["rs", "rust"],
  ["rb", "ruby"],
  ["php", "php"],
  ["c", "c"],
  ["cpp", "cpp"],
  ["cc", "cpp"],
  ["h", "c"],
  ["hpp", "cpp"],
  ["cs", "csharp"],
  ["swift", "swift"],
  ["kt", "kotlin"],
  ["kts", "kotlin"],
  ["scala", "scala"],
  ["sh", "bash"],
  ["bash", "bash"],
  ["zsh", "bash"],
  ["ps1", "powershell"],
  ["sql", "sql"],
  ["r", "r"],
  ["lua", "lua"],
  ["pl", "perl"],
  ["perl", "perl"],
  ["dart", "dart"],
  ["ex", "elixir"],
  ["exs", "elixir"],
  ["erl", "erlang"],
  ["hs", "haskell"],
  ["clj", "clojure"],
  ["lisp", "lisp"],
  ["vim", "vim"],
  ["html", "html"],
  ["htm", "html"],
  ["css", "css"],
  ["md", "markdown"],
  ["markdown", "markdown"],
  ["json", "json"],
  ["xml", "xml"],
  ["yaml", "yaml"],
  ["yml", "yaml"],
  ["toml", "toml"],
  ["ini", "ini"],
  ["cfg", "ini"],
]);

/**
 * Get a language hint for code fencing based on MIME type or filename extension.
 *
 * The MIME type is tried first (case-insensitive, parameters such as
 * `; charset=utf-8` ignored); the filename extension is the fallback.
 *
 * Differences from the earlier inline-object implementation:
 * - the lookup tables are built once instead of on every call;
 * - lookups go through `Map`, so names inherited from `Object.prototype`
 *   (e.g. a file called `x.constructor`) no longer yield a non-string result;
 * - a filename without a dot has no extension and produces no hint (a file
 *   literally named `go` or `json` is not assumed to be that language);
 * - a missing MIME type or filename is treated as an empty string rather than
 *   throwing.
 *
 * @param mimeType MIME type string, possibly with parameters.
 * @param filename File name or path used for the extension fallback.
 * @returns Language identifier for a markdown code block, or `null`.
 */
function getLanguageHint(mimeType, filename) {
  // Try MIME type first
  const normalizedMime = String(mimeType ?? "").toLowerCase().split(";")[0].trim();
  const fromMime = LANGUAGE_HINT_BY_MIME_TYPE.get(normalizedMime);
  if (fromMime) {
    return fromMime;
  }

  // Fallback: try extension from filename
  const name = String(filename ?? "");
  const lastDot = name.lastIndexOf(".");
  if (lastDot === -1) {
    return null;
  }
  const extension = name.slice(lastDot + 1).toLowerCase();
  return LANGUAGE_HINT_BY_EXTENSION.get(extension) ?? null;
}
1651
/**
 * Build the note appended to a CSV section that tells the model it may use
 * the `analyzeCSV` tool against the given file path.
 *
 * @param filePath Path interpolated verbatim into the instructions.
 * @returns Instruction text with a leading newline and two trailing newlines.
 */
function buildCSVToolInstructions(filePath) {
  const note = `**NOTE**: You can perform calculations directly on the CSV data shown above. For advanced operations on the full file (counting by column, grouping, etc.), you may optionally use the analyzeCSV tool with filePath="${filePath}".`;
  const example = `Example: analyzeCSV(filePath="${filePath}", operation="count_by_column", column="merchant_id")`;
  return `\n${note}\n\n${example}\n\n`;
}