@juspay/neurolink 9.32.0 → 9.33.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (475)
  1. package/CHANGELOG.md +12 -0
  2. package/dist/auth/anthropicOAuth.js +1 -1
  3. package/dist/cli/commands/proxy.js +18 -5
  4. package/dist/client/aiSdkAdapter.js +1 -1
  5. package/dist/client/index.js +137 -501
  6. package/dist/core/factory.js +0 -1
  7. package/dist/core/redisConversationMemoryManager.js +1 -1
  8. package/dist/features/ppt/slideGenerator.js +0 -1
  9. package/dist/features/ppt/utils.js +0 -1
  10. package/dist/lib/neurolink.d.ts +10 -0
  11. package/dist/lib/neurolink.js +41 -7
  12. package/dist/lib/server/routes/claudeProxyRoutes.js +45 -9
  13. package/dist/lib/types/generateTypes.d.ts +16 -0
  14. package/dist/lib/types/streamTypes.d.ts +15 -0
  15. package/dist/mcp/elicitationProtocol.js +1 -1
  16. package/dist/mcp/servers/agent/directToolsServer.js +0 -1
  17. package/dist/neurolink.d.ts +10 -0
  18. package/dist/neurolink.js +41 -7
  19. package/dist/providers/azureOpenai.js +1 -1
  20. package/dist/providers/huggingFace.js +0 -1
  21. package/dist/providers/openaiCompatible.js +0 -1
  22. package/dist/sdk/toolRegistration.js +0 -1
  23. package/dist/server/openapi/generator.js +1 -1
  24. package/dist/server/routes/claudeProxyRoutes.js +45 -9
  25. package/dist/types/configTypes.js +0 -5
  26. package/dist/types/generateTypes.d.ts +16 -0
  27. package/dist/types/modelTypes.js +0 -1
  28. package/dist/types/streamTypes.d.ts +15 -0
  29. package/dist/types/tools.js +0 -1
  30. package/dist/types/typeAliases.js +0 -1
  31. package/dist/types/utilities.js +1 -1
  32. package/dist/types/workflowTypes.js +0 -1
  33. package/dist/utils/providerRetry.js +0 -1
  34. package/dist/utils/providerUtils.js +0 -1
  35. package/package.json +2 -2
  36. package/dist/client/adapters/providerImageAdapter.js +0 -588
  37. package/dist/client/adapters/tts/googleTTSHandler.js +0 -344
  38. package/dist/client/adapters/video/directorPipeline.js +0 -516
  39. package/dist/client/adapters/video/ffmpegAdapter.js +0 -206
  40. package/dist/client/adapters/video/frameExtractor.js +0 -143
  41. package/dist/client/adapters/video/vertexVideoHandler.js +0 -763
  42. package/dist/client/adapters/video/videoAnalyzer.js +0 -238
  43. package/dist/client/adapters/video/videoMerger.js +0 -171
  44. package/dist/client/agent/directTools.js +0 -840
  45. package/dist/client/auth/AuthProviderFactory.js +0 -111
  46. package/dist/client/auth/AuthProviderRegistry.js +0 -190
  47. package/dist/client/auth/RequestContext.js +0 -78
  48. package/dist/client/auth/accountPool.js +0 -178
  49. package/dist/client/auth/anthropicOAuth.js +0 -974
  50. package/dist/client/auth/authContext.js +0 -314
  51. package/dist/client/auth/errors.js +0 -39
  52. package/dist/client/auth/index.js +0 -61
  53. package/dist/client/auth/middleware/AuthMiddleware.js +0 -519
  54. package/dist/client/auth/middleware/rateLimitByUser.js +0 -554
  55. package/dist/client/auth/providers/BaseAuthProvider.js +0 -723
  56. package/dist/client/auth/providers/CognitoProvider.js +0 -304
  57. package/dist/client/auth/providers/KeycloakProvider.js +0 -393
  58. package/dist/client/auth/providers/auth0.js +0 -274
  59. package/dist/client/auth/providers/betterAuth.js +0 -182
  60. package/dist/client/auth/providers/clerk.js +0 -317
  61. package/dist/client/auth/providers/custom.js +0 -112
  62. package/dist/client/auth/providers/firebase.js +0 -226
  63. package/dist/client/auth/providers/jwt.js +0 -212
  64. package/dist/client/auth/providers/oauth2.js +0 -303
  65. package/dist/client/auth/providers/supabase.js +0 -259
  66. package/dist/client/auth/providers/workos.js +0 -284
  67. package/dist/client/auth/serverBridge.js +0 -25
  68. package/dist/client/auth/sessionManager.js +0 -437
  69. package/dist/client/auth/tokenStore.js +0 -799
  70. package/dist/client/client/aiSdkAdapter.js +0 -487
  71. package/dist/client/client/auth.js +0 -473
  72. package/dist/client/client/errors.js +0 -552
  73. package/dist/client/client/httpClient.js +0 -837
  74. package/dist/client/client/index.js +0 -172
  75. package/dist/client/client/interceptors.js +0 -601
  76. package/dist/client/client/sseClient.js +0 -545
  77. package/dist/client/client/streamingClient.js +0 -917
  78. package/dist/client/client/wsClient.js +0 -369
  79. package/dist/client/config/configManager.js +0 -303
  80. package/dist/client/config/conversationMemory.js +0 -86
  81. package/dist/client/config/taskClassificationConfig.js +0 -148
  82. package/dist/client/constants/contextWindows.js +0 -295
  83. package/dist/client/constants/enums.js +0 -853
  84. package/dist/client/constants/index.js +0 -207
  85. package/dist/client/constants/performance.js +0 -389
  86. package/dist/client/constants/retry.js +0 -266
  87. package/dist/client/constants/timeouts.js +0 -182
  88. package/dist/client/constants/tokens.js +0 -380
  89. package/dist/client/constants/videoErrors.js +0 -46
  90. package/dist/client/context/budgetChecker.js +0 -98
  91. package/dist/client/context/contextCompactor.js +0 -205
  92. package/dist/client/context/emergencyTruncation.js +0 -88
  93. package/dist/client/context/errorDetection.js +0 -171
  94. package/dist/client/context/errors.js +0 -21
  95. package/dist/client/context/fileTokenBudget.js +0 -127
  96. package/dist/client/context/prompts/summarizationPrompt.js +0 -117
  97. package/dist/client/context/stages/fileReadDeduplicator.js +0 -66
  98. package/dist/client/context/stages/slidingWindowTruncator.js +0 -190
  99. package/dist/client/context/stages/structuredSummarizer.js +0 -99
  100. package/dist/client/context/stages/toolOutputPruner.js +0 -52
  101. package/dist/client/context/summarizationEngine.js +0 -136
  102. package/dist/client/context/toolOutputLimits.js +0 -78
  103. package/dist/client/context/toolPairRepair.js +0 -66
  104. package/dist/client/core/analytics.js +0 -88
  105. package/dist/client/core/baseProvider.js +0 -1385
  106. package/dist/client/core/constants.js +0 -140
  107. package/dist/client/core/conversationMemoryFactory.js +0 -141
  108. package/dist/client/core/conversationMemoryInitializer.js +0 -128
  109. package/dist/client/core/conversationMemoryManager.js +0 -344
  110. package/dist/client/core/dynamicModels.js +0 -358
  111. package/dist/client/core/evaluation.js +0 -309
  112. package/dist/client/core/evaluationProviders.js +0 -248
  113. package/dist/client/core/factory.js +0 -412
  114. package/dist/client/core/infrastructure/baseError.js +0 -22
  115. package/dist/client/core/infrastructure/baseFactory.js +0 -54
  116. package/dist/client/core/infrastructure/baseRegistry.js +0 -53
  117. package/dist/client/core/infrastructure/index.js +0 -5
  118. package/dist/client/core/infrastructure/retry.js +0 -20
  119. package/dist/client/core/infrastructure/typedEventEmitter.js +0 -23
  120. package/dist/client/core/modelConfiguration.js +0 -851
  121. package/dist/client/core/modules/GenerationHandler.js +0 -588
  122. package/dist/client/core/modules/MessageBuilder.js +0 -273
  123. package/dist/client/core/modules/StreamHandler.js +0 -185
  124. package/dist/client/core/modules/TelemetryHandler.js +0 -203
  125. package/dist/client/core/modules/ToolsManager.js +0 -499
  126. package/dist/client/core/modules/Utilities.js +0 -331
  127. package/dist/client/core/redisConversationMemoryManager.js +0 -1435
  128. package/dist/client/core/streamAnalytics.js +0 -131
  129. package/dist/client/evaluation/contextBuilder.js +0 -134
  130. package/dist/client/evaluation/index.js +0 -61
  131. package/dist/client/evaluation/prompts.js +0 -73
  132. package/dist/client/evaluation/ragasEvaluator.js +0 -110
  133. package/dist/client/evaluation/retryManager.js +0 -78
  134. package/dist/client/evaluation/scoring.js +0 -61
  135. package/dist/client/factories/providerFactory.js +0 -166
  136. package/dist/client/factories/providerRegistry.js +0 -166
  137. package/dist/client/features/ppt/constants.js +0 -896
  138. package/dist/client/features/ppt/contentPlanner.js +0 -529
  139. package/dist/client/features/ppt/presentationOrchestrator.js +0 -236
  140. package/dist/client/features/ppt/slideGenerator.js +0 -532
  141. package/dist/client/features/ppt/slideRenderers.js +0 -2383
  142. package/dist/client/features/ppt/slideTypeInference.js +0 -405
  143. package/dist/client/features/ppt/types.js +0 -13
  144. package/dist/client/features/ppt/utils.js +0 -443
  145. package/dist/client/files/fileReferenceRegistry.js +0 -1543
  146. package/dist/client/files/fileTools.js +0 -450
  147. package/dist/client/files/streamingReader.js +0 -321
  148. package/dist/client/files/types.js +0 -23
  149. package/dist/client/hitl/hitlErrors.js +0 -54
  150. package/dist/client/hitl/hitlManager.js +0 -460
  151. package/dist/client/mcp/agentExposure.js +0 -356
  152. package/dist/client/mcp/auth/index.js +0 -11
  153. package/dist/client/mcp/auth/oauthClientProvider.js +0 -325
  154. package/dist/client/mcp/auth/tokenStorage.js +0 -134
  155. package/dist/client/mcp/batching/index.js +0 -10
  156. package/dist/client/mcp/batching/requestBatcher.js +0 -441
  157. package/dist/client/mcp/caching/index.js +0 -10
  158. package/dist/client/mcp/caching/toolCache.js +0 -433
  159. package/dist/client/mcp/elicitation/elicitationManager.js +0 -376
  160. package/dist/client/mcp/elicitation/index.js +0 -11
  161. package/dist/client/mcp/elicitation/types.js +0 -10
  162. package/dist/client/mcp/elicitationProtocol.js +0 -375
  163. package/dist/client/mcp/enhancedToolDiscovery.js +0 -481
  164. package/dist/client/mcp/externalServerManager.js +0 -1478
  165. package/dist/client/mcp/factory.js +0 -161
  166. package/dist/client/mcp/flexibleToolValidator.js +0 -161
  167. package/dist/client/mcp/httpRateLimiter.js +0 -391
  168. package/dist/client/mcp/httpRetryHandler.js +0 -178
  169. package/dist/client/mcp/index.js +0 -74
  170. package/dist/client/mcp/mcpCircuitBreaker.js +0 -427
  171. package/dist/client/mcp/mcpClientFactory.js +0 -708
  172. package/dist/client/mcp/mcpRegistryClient.js +0 -488
  173. package/dist/client/mcp/mcpServerBase.js +0 -373
  174. package/dist/client/mcp/multiServerManager.js +0 -579
  175. package/dist/client/mcp/registry.js +0 -158
  176. package/dist/client/mcp/routing/index.js +0 -10
  177. package/dist/client/mcp/routing/toolRouter.js +0 -416
  178. package/dist/client/mcp/serverCapabilities.js +0 -502
  179. package/dist/client/mcp/servers/agent/directToolsServer.js +0 -150
  180. package/dist/client/mcp/toolAnnotations.js +0 -239
  181. package/dist/client/mcp/toolConverter.js +0 -258
  182. package/dist/client/mcp/toolDiscoveryService.js +0 -798
  183. package/dist/client/mcp/toolIntegration.js +0 -334
  184. package/dist/client/mcp/toolRegistry.js +0 -729
  185. package/dist/client/memory/hippocampusInitializer.js +0 -19
  186. package/dist/client/memory/memoryRetrievalTools.js +0 -166
  187. package/dist/client/middleware/builtin/analytics.js +0 -132
  188. package/dist/client/middleware/builtin/autoEvaluation.js +0 -203
  189. package/dist/client/middleware/builtin/guardrails.js +0 -109
  190. package/dist/client/middleware/builtin/lifecycle.js +0 -168
  191. package/dist/client/middleware/factory.js +0 -327
  192. package/dist/client/middleware/registry.js +0 -295
  193. package/dist/client/middleware/utils/guardrailsUtils.js +0 -396
  194. package/dist/client/models/anthropicModels.js +0 -527
  195. package/dist/client/neurolink.js +0 -8233
  196. package/dist/client/observability/exporterRegistry.js +0 -413
  197. package/dist/client/observability/exporters/arizeExporter.js +0 -138
  198. package/dist/client/observability/exporters/baseExporter.js +0 -190
  199. package/dist/client/observability/exporters/braintrustExporter.js +0 -154
  200. package/dist/client/observability/exporters/datadogExporter.js +0 -196
  201. package/dist/client/observability/exporters/laminarExporter.js +0 -302
  202. package/dist/client/observability/exporters/langfuseExporter.js +0 -209
  203. package/dist/client/observability/exporters/langsmithExporter.js +0 -143
  204. package/dist/client/observability/exporters/otelExporter.js +0 -164
  205. package/dist/client/observability/exporters/posthogExporter.js +0 -287
  206. package/dist/client/observability/exporters/sentryExporter.js +0 -165
  207. package/dist/client/observability/index.js +0 -31
  208. package/dist/client/observability/metricsAggregator.js +0 -556
  209. package/dist/client/observability/otelBridge.js +0 -131
  210. package/dist/client/observability/retryPolicy.js +0 -383
  211. package/dist/client/observability/sampling/samplers.js +0 -216
  212. package/dist/client/observability/spanProcessor.js +0 -303
  213. package/dist/client/observability/tokenTracker.js +0 -413
  214. package/dist/client/observability/types/exporterTypes.js +0 -5
  215. package/dist/client/observability/types/index.js +0 -4
  216. package/dist/client/observability/types/spanTypes.js +0 -92
  217. package/dist/client/observability/utils/safeMetadata.js +0 -25
  218. package/dist/client/observability/utils/spanSerializer.js +0 -292
  219. package/dist/client/processors/archive/ArchiveProcessor.js +0 -1308
  220. package/dist/client/processors/base/BaseFileProcessor.js +0 -614
  221. package/dist/client/processors/base/types.js +0 -82
  222. package/dist/client/processors/config/fileTypes.js +0 -520
  223. package/dist/client/processors/config/index.js +0 -92
  224. package/dist/client/processors/config/languageMap.js +0 -410
  225. package/dist/client/processors/config/mimeTypes.js +0 -363
  226. package/dist/client/processors/config/sizeLimits.js +0 -258
  227. package/dist/client/processors/document/ExcelProcessor.js +0 -590
  228. package/dist/client/processors/document/OpenDocumentProcessor.js +0 -212
  229. package/dist/client/processors/document/PptxProcessor.js +0 -157
  230. package/dist/client/processors/document/RtfProcessor.js +0 -361
  231. package/dist/client/processors/document/WordProcessor.js +0 -353
  232. package/dist/client/processors/errors/FileErrorCode.js +0 -255
  233. package/dist/client/processors/errors/errorHelpers.js +0 -386
  234. package/dist/client/processors/errors/errorSerializer.js +0 -507
  235. package/dist/client/processors/errors/index.js +0 -49
  236. package/dist/client/processors/markup/SvgProcessor.js +0 -240
  237. package/dist/client/processors/media/AudioProcessor.js +0 -707
  238. package/dist/client/processors/media/VideoProcessor.js +0 -1045
  239. package/dist/client/providers/amazonBedrock.js +0 -1512
  240. package/dist/client/providers/amazonSagemaker.js +0 -162
  241. package/dist/client/providers/anthropic.js +0 -831
  242. package/dist/client/providers/azureOpenai.js +0 -143
  243. package/dist/client/providers/googleAiStudio.js +0 -1200
  244. package/dist/client/providers/googleNativeGemini3.js +0 -543
  245. package/dist/client/providers/googleVertex.js +0 -2936
  246. package/dist/client/providers/huggingFace.js +0 -315
  247. package/dist/client/providers/litellm.js +0 -488
  248. package/dist/client/providers/mistral.js +0 -157
  249. package/dist/client/providers/ollama.js +0 -1579
  250. package/dist/client/providers/openAI.js +0 -627
  251. package/dist/client/providers/openRouter.js +0 -543
  252. package/dist/client/providers/openaiCompatible.js +0 -290
  253. package/dist/client/providers/providerTypeUtils.js +0 -46
  254. package/dist/client/providers/sagemaker/adaptive-semaphore.js +0 -215
  255. package/dist/client/providers/sagemaker/client.js +0 -472
  256. package/dist/client/providers/sagemaker/config.js +0 -317
  257. package/dist/client/providers/sagemaker/detection.js +0 -606
  258. package/dist/client/providers/sagemaker/error-constants.js +0 -227
  259. package/dist/client/providers/sagemaker/errors.js +0 -299
  260. package/dist/client/providers/sagemaker/language-model.js +0 -775
  261. package/dist/client/providers/sagemaker/parsers.js +0 -634
  262. package/dist/client/providers/sagemaker/streaming.js +0 -331
  263. package/dist/client/providers/sagemaker/structured-parser.js +0 -625
  264. package/dist/client/proxy/accountQuota.js +0 -162
  265. package/dist/client/proxy/claudeFormat.js +0 -595
  266. package/dist/client/proxy/modelRouter.js +0 -29
  267. package/dist/client/proxy/oauthFetch.js +0 -367
  268. package/dist/client/proxy/proxyFetch.js +0 -586
  269. package/dist/client/proxy/requestLogger.js +0 -207
  270. package/dist/client/proxy/tokenRefresh.js +0 -124
  271. package/dist/client/proxy/usageStats.js +0 -74
  272. package/dist/client/proxy/utils/noProxyUtils.js +0 -149
  273. package/dist/client/rag/ChunkerFactory.js +0 -320
  274. package/dist/client/rag/ChunkerRegistry.js +0 -421
  275. package/dist/client/rag/chunkers/BaseChunker.js +0 -143
  276. package/dist/client/rag/chunkers/CharacterChunker.js +0 -28
  277. package/dist/client/rag/chunkers/HTMLChunker.js +0 -38
  278. package/dist/client/rag/chunkers/JSONChunker.js +0 -68
  279. package/dist/client/rag/chunkers/LaTeXChunker.js +0 -63
  280. package/dist/client/rag/chunkers/MarkdownChunker.js +0 -306
  281. package/dist/client/rag/chunkers/RecursiveChunker.js +0 -139
  282. package/dist/client/rag/chunkers/SemanticMarkdownChunker.js +0 -138
  283. package/dist/client/rag/chunkers/SentenceChunker.js +0 -66
  284. package/dist/client/rag/chunkers/TokenChunker.js +0 -61
  285. package/dist/client/rag/chunkers/index.js +0 -15
  286. package/dist/client/rag/chunking/characterChunker.js +0 -142
  287. package/dist/client/rag/chunking/chunkerRegistry.js +0 -194
  288. package/dist/client/rag/chunking/htmlChunker.js +0 -247
  289. package/dist/client/rag/chunking/index.js +0 -17
  290. package/dist/client/rag/chunking/jsonChunker.js +0 -281
  291. package/dist/client/rag/chunking/latexChunker.js +0 -251
  292. package/dist/client/rag/chunking/markdownChunker.js +0 -373
  293. package/dist/client/rag/chunking/recursiveChunker.js +0 -148
  294. package/dist/client/rag/chunking/semanticChunker.js +0 -306
  295. package/dist/client/rag/chunking/sentenceChunker.js +0 -230
  296. package/dist/client/rag/chunking/tokenChunker.js +0 -183
  297. package/dist/client/rag/document/MDocument.js +0 -392
  298. package/dist/client/rag/document/index.js +0 -5
  299. package/dist/client/rag/document/loaders.js +0 -500
  300. package/dist/client/rag/errors/RAGError.js +0 -274
  301. package/dist/client/rag/errors/index.js +0 -6
  302. package/dist/client/rag/graphRag/graphRAG.js +0 -401
  303. package/dist/client/rag/graphRag/index.js +0 -4
  304. package/dist/client/rag/index.js +0 -141
  305. package/dist/client/rag/metadata/MetadataExtractorFactory.js +0 -418
  306. package/dist/client/rag/metadata/MetadataExtractorRegistry.js +0 -362
  307. package/dist/client/rag/metadata/index.js +0 -9
  308. package/dist/client/rag/metadata/metadataExtractor.js +0 -280
  309. package/dist/client/rag/pipeline/RAGPipeline.js +0 -436
  310. package/dist/client/rag/pipeline/contextAssembly.js +0 -341
  311. package/dist/client/rag/pipeline/index.js +0 -5
  312. package/dist/client/rag/ragIntegration.js +0 -321
  313. package/dist/client/rag/reranker/RerankerFactory.js +0 -430
  314. package/dist/client/rag/reranker/RerankerRegistry.js +0 -402
  315. package/dist/client/rag/reranker/index.js +0 -9
  316. package/dist/client/rag/reranker/reranker.js +0 -277
  317. package/dist/client/rag/resilience/CircuitBreaker.js +0 -431
  318. package/dist/client/rag/resilience/RetryHandler.js +0 -304
  319. package/dist/client/rag/resilience/index.js +0 -7
  320. package/dist/client/rag/retrieval/hybridSearch.js +0 -335
  321. package/dist/client/rag/retrieval/index.js +0 -5
  322. package/dist/client/rag/retrieval/vectorQueryTool.js +0 -307
  323. package/dist/client/rag/types.js +0 -8
  324. package/dist/client/sdk/toolRegistration.js +0 -377
  325. package/dist/client/server/abstract/baseServerAdapter.js +0 -575
  326. package/dist/client/server/adapters/expressAdapter.js +0 -486
  327. package/dist/client/server/adapters/fastifyAdapter.js +0 -472
  328. package/dist/client/server/adapters/honoAdapter.js +0 -632
  329. package/dist/client/server/adapters/koaAdapter.js +0 -510
  330. package/dist/client/server/errors.js +0 -486
  331. package/dist/client/server/factory/serverAdapterFactory.js +0 -160
  332. package/dist/client/server/index.js +0 -108
  333. package/dist/client/server/middleware/abortSignal.js +0 -111
  334. package/dist/client/server/middleware/auth.js +0 -388
  335. package/dist/client/server/middleware/cache.js +0 -359
  336. package/dist/client/server/middleware/common.js +0 -281
  337. package/dist/client/server/middleware/deprecation.js +0 -190
  338. package/dist/client/server/middleware/mcpBodyAttachment.js +0 -63
  339. package/dist/client/server/middleware/rateLimit.js +0 -227
  340. package/dist/client/server/middleware/validation.js +0 -388
  341. package/dist/client/server/openapi/generator.js +0 -398
  342. package/dist/client/server/openapi/index.js +0 -36
  343. package/dist/client/server/openapi/schemas.js +0 -695
  344. package/dist/client/server/openapi/templates.js +0 -374
  345. package/dist/client/server/routes/agentRoutes.js +0 -189
  346. package/dist/client/server/routes/claudeProxyRoutes.js +0 -1600
  347. package/dist/client/server/routes/healthRoutes.js +0 -187
  348. package/dist/client/server/routes/index.js +0 -57
  349. package/dist/client/server/routes/mcpRoutes.js +0 -342
  350. package/dist/client/server/routes/memoryRoutes.js +0 -350
  351. package/dist/client/server/routes/openApiRoutes.js +0 -126
  352. package/dist/client/server/routes/toolRoutes.js +0 -199
  353. package/dist/client/server/streaming/dataStream.js +0 -486
  354. package/dist/client/server/streaming/index.js +0 -11
  355. package/dist/client/server/types.js +0 -67
  356. package/dist/client/server/utils/redaction.js +0 -334
  357. package/dist/client/server/utils/validation.js +0 -243
  358. package/dist/client/server/websocket/WebSocketHandler.js +0 -383
  359. package/dist/client/server/websocket/index.js +0 -4
  360. package/dist/client/services/server/ai/observability/instrumentation.js +0 -808
  361. package/dist/client/telemetry/attributes.js +0 -100
  362. package/dist/client/telemetry/index.js +0 -26
  363. package/dist/client/telemetry/telemetryService.js +0 -308
  364. package/dist/client/telemetry/tracers.js +0 -17
  365. package/dist/client/telemetry/withSpan.js +0 -34
  366. package/dist/client/types/actionTypes.js +0 -6
  367. package/dist/client/types/analytics.js +0 -5
  368. package/dist/client/types/authTypes.js +0 -9
  369. package/dist/client/types/circuitBreakerErrors.js +0 -34
  370. package/dist/client/types/cli.js +0 -21
  371. package/dist/client/types/clientTypes.js +0 -10
  372. package/dist/client/types/common.js +0 -51
  373. package/dist/client/types/configTypes.js +0 -49
  374. package/dist/client/types/content.js +0 -19
  375. package/dist/client/types/contextTypes.js +0 -400
  376. package/dist/client/types/conversation.js +0 -47
  377. package/dist/client/types/conversationMemoryInterface.js +0 -6
  378. package/dist/client/types/domainTypes.js +0 -5
  379. package/dist/client/types/errors.js +0 -167
  380. package/dist/client/types/evaluation.js +0 -5
  381. package/dist/client/types/evaluationProviders.js +0 -5
  382. package/dist/client/types/evaluationTypes.js +0 -1
  383. package/dist/client/types/externalMcp.js +0 -6
  384. package/dist/client/types/fileReferenceTypes.js +0 -8
  385. package/dist/client/types/fileTypes.js +0 -4
  386. package/dist/client/types/generateTypes.js +0 -1
  387. package/dist/client/types/guardrails.js +0 -1
  388. package/dist/client/types/hitlTypes.js +0 -8
  389. package/dist/client/types/index.js +0 -57
  390. package/dist/client/types/mcpTypes.js +0 -5
  391. package/dist/client/types/middlewareTypes.js +0 -1
  392. package/dist/client/types/modelTypes.js +0 -30
  393. package/dist/client/types/multimodal.js +0 -135
  394. package/dist/client/types/observability.js +0 -6
  395. package/dist/client/types/pptTypes.js +0 -82
  396. package/dist/client/types/providers.js +0 -111
  397. package/dist/client/types/proxyTypes.js +0 -16
  398. package/dist/client/types/ragTypes.js +0 -7
  399. package/dist/client/types/sdkTypes.js +0 -8
  400. package/dist/client/types/serviceTypes.js +0 -5
  401. package/dist/client/types/streamTypes.js +0 -1
  402. package/dist/client/types/subscriptionTypes.js +0 -9
  403. package/dist/client/types/taskClassificationTypes.js +0 -5
  404. package/dist/client/types/tools.js +0 -24
  405. package/dist/client/types/ttsTypes.js +0 -57
  406. package/dist/client/types/typeAliases.js +0 -48
  407. package/dist/client/types/utilities.js +0 -4
  408. package/dist/client/types/workflowTypes.js +0 -30
  409. package/dist/client/utils/async/withTimeout.js +0 -98
  410. package/dist/client/utils/asyncMutex.js +0 -60
  411. package/dist/client/utils/conversationMemory.js +0 -431
  412. package/dist/client/utils/csvProcessor.js +0 -846
  413. package/dist/client/utils/errorHandling.js +0 -936
  414. package/dist/client/utils/evaluationUtils.js +0 -131
  415. package/dist/client/utils/factoryProcessing.js +0 -589
  416. package/dist/client/utils/fileDetector.js +0 -2161
  417. package/dist/client/utils/imageCache.js +0 -376
  418. package/dist/client/utils/imageProcessor.js +0 -704
  419. package/dist/client/utils/logger.js +0 -491
  420. package/dist/client/utils/mcpDefaults.js +0 -134
  421. package/dist/client/utils/messageBuilder.js +0 -1653
  422. package/dist/client/utils/modelAliasResolver.js +0 -54
  423. package/dist/client/utils/modelDetection.js +0 -80
  424. package/dist/client/utils/modelRouter.js +0 -292
  425. package/dist/client/utils/multimodalOptionsBuilder.js +0 -65
  426. package/dist/client/utils/observabilityHelpers.js +0 -47
  427. package/dist/client/utils/parameterValidation.js +0 -966
  428. package/dist/client/utils/pdfProcessor.js +0 -410
  429. package/dist/client/utils/performance.js +0 -222
  430. package/dist/client/utils/pricing.js +0 -340
  431. package/dist/client/utils/promptRedaction.js +0 -62
  432. package/dist/client/utils/providerConfig.js +0 -1009
  433. package/dist/client/utils/providerHealth.js +0 -1237
  434. package/dist/client/utils/providerRetry.js +0 -112
  435. package/dist/client/utils/providerUtils.js +0 -434
  436. package/dist/client/utils/rateLimiter.js +0 -200
  437. package/dist/client/utils/redis.js +0 -368
  438. package/dist/client/utils/retryHandler.js +0 -269
  439. package/dist/client/utils/retryability.js +0 -22
  440. package/dist/client/utils/sanitizers/svg.js +0 -481
  441. package/dist/client/utils/schemaConversion.js +0 -255
  442. package/dist/client/utils/taskClassificationUtils.js +0 -149
  443. package/dist/client/utils/taskClassifier.js +0 -94
  444. package/dist/client/utils/thinkingConfig.js +0 -104
  445. package/dist/client/utils/timeout.js +0 -359
  446. package/dist/client/utils/tokenEstimation.js +0 -142
  447. package/dist/client/utils/tokenLimits.js +0 -125
  448. package/dist/client/utils/tokenUtils.js +0 -239
  449. package/dist/client/utils/toolUtils.js +0 -75
  450. package/dist/client/utils/transformationUtils.js +0 -554
  451. package/dist/client/utils/ttsProcessor.js +0 -286
  452. package/dist/client/utils/typeUtils.js +0 -97
  453. package/dist/client/utils/videoAnalysisProcessor.js +0 -67
  454. package/dist/client/workflow/config.js +0 -398
  455. package/dist/client/workflow/core/ensembleExecutor.js +0 -407
  456. package/dist/client/workflow/core/judgeScorer.js +0 -544
  457. package/dist/client/workflow/core/responseConditioner.js +0 -225
  458. package/dist/client/workflow/core/types/conditionerTypes.js +0 -7
  459. package/dist/client/workflow/core/types/ensembleTypes.js +0 -7
  460. package/dist/client/workflow/core/types/index.js +0 -7
  461. package/dist/client/workflow/core/types/judgeTypes.js +0 -7
  462. package/dist/client/workflow/core/types/layerTypes.js +0 -7
  463. package/dist/client/workflow/core/types/registryTypes.js +0 -7
  464. package/dist/client/workflow/core/workflowRegistry.js +0 -304
  465. package/dist/client/workflow/core/workflowRunner.js +0 -586
  466. package/dist/client/workflow/index.js +0 -50
  467. package/dist/client/workflow/types.js +0 -9
  468. package/dist/client/workflow/utils/types/index.js +0 -7
  469. package/dist/client/workflow/utils/workflowMetrics.js +0 -311
  470. package/dist/client/workflow/utils/workflowValidation.js +0 -420
  471. package/dist/client/workflow/workflows/adaptiveWorkflow.js +0 -366
  472. package/dist/client/workflow/workflows/consensusWorkflow.js +0 -192
  473. package/dist/client/workflow/workflows/fallbackWorkflow.js +0 -225
  474. package/dist/client/workflow/workflows/multiJudgeWorkflow.js +0 -351
  475. package/dist/client/{client/reactHooks.js → reactHooks.js} +0 -0
@@ -1,775 +0,0 @@
1
- /**
2
- * SageMaker Language Model Implementation
3
- *
4
- * This module implements the LanguageModel interface for Amazon SageMaker
5
- * integration with the Vercel AI SDK.
6
- */
7
- import { randomUUID } from "crypto";
8
- import { SageMakerRuntimeClient } from "./client.js";
9
- import { handleSageMakerError } from "./errors.js";
10
- import { estimateTokenUsage, createSageMakerStream } from "./streaming.js";
11
- import { createAdaptiveSemaphore } from "./adaptive-semaphore.js";
12
- import { logger } from "../../utils/logger.js";
13
- /**
14
- * Base synthetic streaming delay in milliseconds for simulating real-time response
15
- * Can be configured via SAGEMAKER_BASE_STREAMING_DELAY_MS environment variable
16
- */
17
- const BASE_SYNTHETIC_STREAMING_DELAY_MS = process.env
18
- .SAGEMAKER_BASE_STREAMING_DELAY_MS
19
- ? parseInt(process.env.SAGEMAKER_BASE_STREAMING_DELAY_MS, 10)
20
- : 50;
21
- /**
22
- * Maximum synthetic streaming delay in milliseconds to prevent excessively slow streaming
23
- * Can be configured via SAGEMAKER_MAX_STREAMING_DELAY_MS environment variable
24
- */
25
- const MAX_SYNTHETIC_STREAMING_DELAY_MS = process.env
26
- .SAGEMAKER_MAX_STREAMING_DELAY_MS
27
- ? parseInt(process.env.SAGEMAKER_MAX_STREAMING_DELAY_MS, 10)
28
- : 200;
29
- /**
30
- * Calculate adaptive delay based on text size to avoid slow streaming for large texts
31
- * Smaller texts get longer delays for realistic feel, larger texts get shorter delays for performance
32
- */
33
- function calculateAdaptiveDelay(textLength, chunkCount) {
34
- // Base calculation: smaller delay for larger texts
35
- const adaptiveDelay = Math.max(10, // Minimum 10ms delay
36
- Math.min(MAX_SYNTHETIC_STREAMING_DELAY_MS, BASE_SYNTHETIC_STREAMING_DELAY_MS * (1000 / Math.max(textLength, 100))));
37
- // Further reduce delay if there are many chunks to process
38
- if (chunkCount > 20) {
39
- return Math.max(10, adaptiveDelay * 0.5); // Half delay for many chunks
40
- }
41
- else if (chunkCount > 10) {
42
- return Math.max(15, adaptiveDelay * 0.7); // Reduced delay for moderate chunks
43
- }
44
- return adaptiveDelay;
45
- }
46
- /**
47
- * Create an async iterator for text chunks with adaptive delay between chunks
48
- * Used for synthetic streaming simulation with performance optimization for large texts
49
- */
50
- async function* createTextChunkIterator(text) {
51
- if (!text) {
52
- return; // No text to emit
53
- }
54
- const words = text.split(/\s+/);
55
- const chunkSize = Math.max(1, Math.floor(words.length / 10));
56
- const totalChunks = Math.ceil(words.length / chunkSize);
57
- // Calculate adaptive delay based on text size and chunk count
58
- const adaptiveDelay = calculateAdaptiveDelay(text.length, totalChunks);
59
- for (let i = 0; i < words.length; i += chunkSize) {
60
- const chunk = words.slice(i, i + chunkSize).join(" ");
61
- const deltaText = i === 0 ? chunk : " " + chunk;
62
- // Add adaptive delay between chunks for realistic streaming simulation
63
- // Delay is shorter for larger texts to improve performance
64
- if (i > 0) {
65
- await new Promise((resolve) => setTimeout(resolve, adaptiveDelay));
66
- }
67
- yield deltaText;
68
- }
69
- }
70
- /**
71
- * Batch processing concurrency constants
72
- */
73
- const DEFAULT_INITIAL_CONCURRENCY = 5;
74
- const DEFAULT_MAX_CONCURRENCY = 10;
75
- const DEFAULT_MIN_CONCURRENCY = 1;
76
- /**
77
- * SageMaker Language Model implementing LanguageModel interface
78
- *
79
- * Token Limit Behavior:
80
- * - When maxTokens is undefined, SageMaker uses the model's default token limits
81
- * - When maxTokens is specified, it sets max_new_tokens parameter explicitly
82
- * - This aligns with the unlimited-by-default token policy across all providers
83
- */
84
- export class SageMakerLanguageModel {
85
- /**
86
- * Specification version for the AI SDK LanguageModel interface.
87
- * Uses "v2" for structural compatibility with AI SDK v6's `LanguageModelV2`.
88
- * The AI SDK checks this field to determine which interface version to use.
89
- */
90
- specificationVersion = "v2";
91
- provider = "sagemaker";
92
- modelId;
93
- supportsStreaming = true;
94
- defaultObjectGenerationMode = "json";
95
- /**
96
- * Supported URL patterns by media type.
97
- * SageMaker endpoints do not natively download URLs, so this is empty.
98
- * Required by the LanguageModelV2 interface.
99
- */
100
- supportedUrls = {};
101
- client;
102
- config;
103
- modelConfig;
104
- constructor(modelId, config, modelConfig) {
105
- this.modelId = modelId;
106
- this.config = config;
107
- this.modelConfig = modelConfig;
108
- this.client = new SageMakerRuntimeClient(config);
109
- logger.debug("SageMaker Language Model initialized", {
110
- modelId: this.modelId,
111
- endpointName: this.modelConfig.endpointName,
112
- provider: this.provider,
113
- specificationVersion: this.specificationVersion,
114
- });
115
- }
116
- /**
117
- * Generate text synchronously using SageMaker endpoint
118
- */
119
- async doGenerate(options) {
120
- const startTime = Date.now();
121
- try {
122
- const promptText = this.extractPromptText(options);
123
- logger.debug("SageMaker doGenerate called", {
124
- endpointName: this.modelConfig.endpointName,
125
- promptLength: promptText.length,
126
- maxTokens: options.maxTokens,
127
- temperature: options.temperature,
128
- });
129
- // Convert AI SDK options to SageMaker request format
130
- const sagemakerRequest = this.convertToSageMakerRequest(options);
131
- // Invoke SageMaker endpoint
132
- const response = await this.client.invokeEndpoint({
133
- EndpointName: this.modelConfig.endpointName,
134
- Body: JSON.stringify(sagemakerRequest),
135
- ContentType: "application/json",
136
- Accept: "application/json",
137
- });
138
- // Parse SageMaker response
139
- const responseBody = JSON.parse(new TextDecoder().decode(response.Body));
140
- const generatedText = this.extractTextFromResponse(responseBody);
141
- // Extract tool calls if present (Phase 4 enhancement)
142
- const toolCalls = this.extractToolCallsFromResponse(responseBody);
143
- // Calculate token usage
144
- const usage = estimateTokenUsage(promptText, generatedText);
145
- // Determine finish reason based on response content
146
- let finishReason = "stop";
147
- if (toolCalls && toolCalls.length > 0) {
148
- finishReason = "tool-calls";
149
- }
150
- else if (responseBody.finish_reason) {
151
- finishReason = this.mapSageMakerFinishReason(responseBody.finish_reason);
152
- }
153
- const duration = Date.now() - startTime;
154
- logger.debug("SageMaker doGenerate completed", {
155
- duration,
156
- outputLength: generatedText.length,
157
- usage,
158
- toolCallsCount: toolCalls?.length || 0,
159
- finishReason,
160
- });
161
- const result = {
162
- text: generatedText,
163
- usage: {
164
- inputTokens: usage.promptTokens,
165
- outputTokens: usage.completionTokens,
166
- totalTokens: usage.total,
167
- },
168
- finishReason,
169
- rawCall: {
170
- rawPrompt: options.prompt,
171
- rawSettings: {
172
- maxTokens: options.maxTokens,
173
- temperature: options.temperature,
174
- topP: options.topP,
175
- endpointName: this.modelConfig.endpointName,
176
- },
177
- },
178
- rawResponse: {
179
- headers: {
180
- "content-type": response.ContentType || "application/json",
181
- "invoked-variant": response.InvokedProductionVariant || "",
182
- },
183
- },
184
- request: {
185
- body: JSON.stringify(sagemakerRequest),
186
- },
187
- };
188
- // Add tool calls to result if present
189
- if (toolCalls && toolCalls.length > 0) {
190
- result.toolCalls = toolCalls;
191
- }
192
- // Add structured data if response format was specified (Phase 4)
193
- const responseFormat = sagemakerRequest
194
- .response_format;
195
- if (responseFormat &&
196
- (responseFormat.type === "json_object" ||
197
- responseFormat.type === "json_schema")) {
198
- try {
199
- const parsedData = JSON.parse(generatedText);
200
- result.object = parsedData;
201
- logger.debug("Extracted structured data from response", {
202
- responseFormat: responseFormat.type,
203
- hasObject: !!result.object,
204
- });
205
- }
206
- catch (parseError) {
207
- logger.warn("Failed to parse structured response as JSON", {
208
- error: parseError instanceof Error
209
- ? parseError.message
210
- : String(parseError),
211
- responseText: generatedText.substring(0, 200),
212
- });
213
- // Keep the text response as fallback
214
- }
215
- }
216
- return result;
217
- }
218
- catch (error) {
219
- const duration = Date.now() - startTime;
220
- logger.error("SageMaker doGenerate failed", {
221
- duration,
222
- error: error instanceof Error ? error.message : String(error),
223
- });
224
- throw handleSageMakerError(error, this.modelConfig.endpointName);
225
- }
226
- }
227
- /**
228
- * Generate text with streaming using SageMaker endpoint
229
- */
230
- async doStream(options) {
231
- try {
232
- const promptText = this.extractPromptText(options);
233
- logger.debug("SageMaker doStream called", {
234
- endpointName: this.modelConfig.endpointName,
235
- promptLength: promptText.length,
236
- });
237
- // Phase 2: Full streaming implementation with automatic detection
238
- const sagemakerRequest = this.convertToSageMakerRequest(options);
239
- // Add streaming parameter if model supports it
240
- const requestWithStreaming = {
241
- ...sagemakerRequest,
242
- parameters: {
243
- ...(typeof sagemakerRequest.parameters === "object" &&
244
- sagemakerRequest.parameters !== null
245
- ? sagemakerRequest.parameters
246
- : {}),
247
- stream: true, // Will be validated by detection system
248
- },
249
- };
250
- logger.debug("Attempting streaming generation", {
251
- endpointName: this.modelConfig.endpointName,
252
- hasStreamingFlag: true,
253
- });
254
- try {
255
- // First, try to invoke with streaming
256
- const response = await this.client.invokeEndpointWithStreaming({
257
- EndpointName: this.modelConfig.endpointName,
258
- Body: JSON.stringify(requestWithStreaming),
259
- ContentType: this.modelConfig.contentType || "application/json",
260
- Accept: this.modelConfig.accept || "application/json",
261
- });
262
- // Create intelligent streaming response
263
- const stream = await createSageMakerStream(response.Body, this.modelConfig.endpointName, this.config, {
264
- prompt: promptText,
265
- onChunk: (chunk) => {
266
- logger.debug("Streaming chunk received", {
267
- contentLength: chunk.content?.length || 0,
268
- done: chunk.done,
269
- });
270
- },
271
- onComplete: (usage) => {
272
- logger.debug("Streaming completed", {
273
- usage,
274
- endpointName: this.modelConfig.endpointName,
275
- });
276
- },
277
- onError: (error) => {
278
- logger.error("Streaming error", {
279
- error: error.message,
280
- endpointName: this.modelConfig.endpointName,
281
- });
282
- },
283
- });
284
- return {
285
- stream: stream,
286
- rawCall: {
287
- rawPrompt: sagemakerRequest,
288
- rawSettings: this.modelConfig,
289
- },
290
- rawResponse: {
291
- headers: {
292
- "Content-Type": response.ContentType || "application/json",
293
- "X-Invoked-Production-Variant": response.InvokedProductionVariant || "unknown",
294
- },
295
- },
296
- };
297
- }
298
- catch (streamingError) {
299
- logger.warn("Streaming failed, falling back to non-streaming", {
300
- endpointName: this.modelConfig.endpointName,
301
- error: streamingError instanceof Error
302
- ? streamingError.message
303
- : String(streamingError),
304
- });
305
- // Fallback: Generate normally and create synthetic stream
306
- const result = await this.doGenerate(options);
307
- // Create synthetic stream from complete result using async iterator pattern
308
- const syntheticStream = new ReadableStream({
309
- async start(controller) {
310
- try {
311
- // Create async iterator for text chunks
312
- const textChunks = createTextChunkIterator(result.text);
313
- // Process chunks with async iterator pattern
314
- for await (const deltaText of textChunks) {
315
- controller.enqueue({
316
- type: "text-delta",
317
- textDelta: deltaText,
318
- });
319
- }
320
- // Emit completion
321
- controller.enqueue({
322
- type: "finish",
323
- finishReason: result.finishReason,
324
- usage: result.usage,
325
- });
326
- controller.close();
327
- }
328
- catch (error) {
329
- controller.error(error);
330
- }
331
- },
332
- });
333
- return {
334
- stream: syntheticStream,
335
- rawCall: result.rawCall,
336
- rawResponse: result.rawResponse,
337
- request: result.request,
338
- warnings: [
339
- ...(result.warnings || []),
340
- {
341
- type: "other",
342
- message: "Streaming not supported, using synthetic stream",
343
- },
344
- ],
345
- };
346
- }
347
- }
348
- catch (error) {
349
- logger.error("SageMaker doStream failed", {
350
- error: error instanceof Error ? error.message : String(error),
351
- });
352
- throw handleSageMakerError(error, this.modelConfig.endpointName);
353
- }
354
- }
355
- /**
356
- * Convert AI SDK options to SageMaker request format
357
- */
358
- convertToSageMakerRequest(options) {
359
- const promptText = this.extractPromptText(options);
360
- // Enhanced SageMaker request format with tool support (Phase 4)
361
- const request = {
362
- inputs: promptText,
363
- parameters: {
364
- // Only include max_new_tokens if explicitly specified; let SageMaker use model defaults otherwise
365
- ...(options.maxTokens !== undefined
366
- ? { max_new_tokens: options.maxTokens }
367
- : {}),
368
- temperature: options.temperature || 0.7,
369
- top_p: options.topP || 0.9,
370
- stop: options.stopSequences || [],
371
- },
372
- };
373
- // Add tool support if tools are present
374
- const tools = options.tools;
375
- if (tools && Array.isArray(tools) && tools.length > 0) {
376
- request.tools = this.convertToolsToSageMakerFormat(tools);
377
- // Add tool choice if specified
378
- const toolChoice = options.toolChoice;
379
- if (toolChoice) {
380
- request.tool_choice =
381
- this.convertToolChoiceToSageMakerFormat(toolChoice);
382
- }
383
- logger.debug("Added tool support to SageMaker request", {
384
- toolCount: tools.length,
385
- toolChoice: toolChoice,
386
- });
387
- }
388
- // Add structured output support (Phase 4)
389
- const responseFormat = options
390
- .responseFormat;
391
- if (responseFormat) {
392
- request.response_format =
393
- this.convertResponseFormatToSageMakerFormat(responseFormat);
394
- logger.debug("Added structured output support to SageMaker request", {
395
- responseFormat: responseFormat.type,
396
- });
397
- }
398
- logger.debug("Converted to SageMaker request format", {
399
- inputLength: promptText.length,
400
- parameters: request.parameters,
401
- hasTools: !!request.tools,
402
- });
403
- return request;
404
- }
405
- /**
406
- * Convert Vercel AI SDK tools to SageMaker format
407
- */
408
- convertToolsToSageMakerFormat(tools) {
409
- return tools.map((tool) => {
410
- if (tool.type === "function") {
411
- return {
412
- type: "function",
413
- function: {
414
- name: tool.function.name,
415
- description: tool.function.description || "",
416
- parameters: tool.function.parameters || {},
417
- },
418
- };
419
- }
420
- return tool; // Pass through other tool types
421
- });
422
- }
423
- /**
424
- * Convert Vercel AI SDK tool choice to SageMaker format
425
- */
426
- convertToolChoiceToSageMakerFormat(toolChoice) {
427
- if (typeof toolChoice === "string") {
428
- return toolChoice; // 'auto', 'none', etc.
429
- }
430
- if (toolChoice?.type === "function") {
431
- return {
432
- type: "function",
433
- function: {
434
- name: toolChoice.function.name,
435
- },
436
- };
437
- }
438
- return toolChoice;
439
- }
440
- /**
441
- * Convert Vercel AI SDK response format to SageMaker format (Phase 4)
442
- */
443
- convertResponseFormatToSageMakerFormat(responseFormat) {
444
- if (responseFormat.type === "json_object") {
445
- return {
446
- type: "json_object",
447
- schema: responseFormat.schema || undefined,
448
- };
449
- }
450
- if (responseFormat.type === "json_schema") {
451
- return {
452
- type: "json_schema",
453
- json_schema: {
454
- name: responseFormat.json_schema?.name || "response",
455
- description: responseFormat.json_schema?.description ||
456
- "Generated response",
457
- schema: responseFormat.json_schema?.schema || {},
458
- },
459
- };
460
- }
461
- // Default to text
462
- return {
463
- type: "text",
464
- };
465
- }
466
- /**
467
- * Extract text content from AI SDK prompt format
468
- */
469
- extractPromptText(options) {
470
- // Check for messages first (like Ollama)
471
- const messages = options.messages;
472
- if (messages && Array.isArray(messages)) {
473
- return messages
474
- .filter((msg) => msg.role && msg.content)
475
- .map((msg) => {
476
- if (typeof msg.content === "string") {
477
- return `${msg.role}: ${msg.content}`;
478
- }
479
- return `${msg.role}: ${JSON.stringify(msg.content)}`;
480
- })
481
- .join("\n");
482
- }
483
- // Fallback to prompt property
484
- const prompt = options.prompt;
485
- if (typeof prompt === "string") {
486
- return prompt;
487
- }
488
- if (Array.isArray(prompt)) {
489
- return prompt
490
- .filter((msg) => msg.role && msg.content)
491
- .map((msg) => {
492
- if (typeof msg.content === "string") {
493
- return `${msg.role}: ${msg.content}`;
494
- }
495
- return `${msg.role}: ${JSON.stringify(msg.content)}`;
496
- })
497
- .join("\n");
498
- }
499
- return String(prompt);
500
- }
501
- /**
502
- * Extract generated text from SageMaker response
503
- */
504
- extractTextFromResponse(responseBody) {
505
- // Handle common SageMaker response formats
506
- if (typeof responseBody === "string") {
507
- return responseBody;
508
- }
509
- if (responseBody.generated_text) {
510
- return responseBody.generated_text;
511
- }
512
- if (responseBody.outputs) {
513
- return responseBody.outputs;
514
- }
515
- if (responseBody.text) {
516
- return responseBody.text;
517
- }
518
- if (Array.isArray(responseBody) && responseBody[0]?.generated_text) {
519
- return responseBody[0].generated_text;
520
- }
521
- // Handle response with tool calls
522
- if (responseBody.choices && Array.isArray(responseBody.choices)) {
523
- const choice = responseBody.choices[0];
524
- if (choice?.message?.content) {
525
- return choice.message.content;
526
- }
527
- }
528
- // Fallback: stringify the entire response
529
- return JSON.stringify(responseBody);
530
- }
531
- /**
532
- * Extract tool calls from SageMaker response (Phase 4)
533
- */
534
- extractToolCallsFromResponse(responseBody) {
535
- // Handle OpenAI-compatible format (common for many SageMaker models)
536
- if (responseBody.choices && Array.isArray(responseBody.choices)) {
537
- const choice = responseBody.choices[0];
538
- if (choice?.message?.tool_calls) {
539
- return choice.message.tool_calls.map((toolCall) => ({
540
- type: "function",
541
- id: String(toolCall.id || `call_${randomUUID()}`),
542
- function: {
543
- name: String(toolCall.function.name),
544
- arguments: String(toolCall.function.arguments),
545
- },
546
- }));
547
- }
548
- }
549
- // Handle custom SageMaker tool call format
550
- if (responseBody.tool_calls && Array.isArray(responseBody.tool_calls)) {
551
- return responseBody.tool_calls;
552
- }
553
- // Handle Anthropic-style tool use
554
- if (responseBody.content && Array.isArray(responseBody.content)) {
555
- const toolUses = responseBody.content.filter((item) => item.type === "tool_use");
556
- if (toolUses.length > 0) {
557
- return toolUses.map((toolUse) => ({
558
- type: "function",
559
- id: String(toolUse.id || `call_${randomUUID()}`),
560
- function: {
561
- name: String(toolUse.name),
562
- arguments: JSON.stringify(toolUse.input || {}),
563
- },
564
- }));
565
- }
566
- }
567
- return undefined;
568
- }
569
- /**
570
- * Map SageMaker finish reason to standardized format
571
- */
572
- mapSageMakerFinishReason(sagemakerReason) {
573
- switch (sagemakerReason?.toLowerCase()) {
574
- case "stop":
575
- case "end_turn":
576
- case "stop_sequence":
577
- return "stop";
578
- case "length":
579
- case "max_tokens":
580
- case "max_length":
581
- return "length";
582
- case "content_filter":
583
- case "content_filtered":
584
- return "content-filter";
585
- case "tool_calls":
586
- case "function_call":
587
- return "tool-calls";
588
- case "error":
589
- return "error";
590
- default:
591
- return "unknown";
592
- }
593
- }
594
- /**
595
- * Get model configuration summary for debugging
596
- */
597
- getModelInfo() {
598
- return {
599
- modelId: this.modelId,
600
- provider: this.provider,
601
- specificationVersion: this.specificationVersion,
602
- endpointName: this.modelConfig.endpointName,
603
- modelType: this.modelConfig.modelType,
604
- region: this.config.region,
605
- };
606
- }
607
- /**
608
- * Test basic connectivity to the SageMaker endpoint
609
- */
610
- async testConnectivity() {
611
- try {
612
- // Use the same pattern as Ollama - pass messages directly
613
- const result = await this.doGenerate({
614
- inputFormat: "messages",
615
- mode: { type: "regular" },
616
- prompt: [
617
- { role: "user", content: [{ type: "text", text: "Hello" }] },
618
- ],
619
- maxTokens: 10,
620
- });
621
- return {
622
- success: !!result.text,
623
- };
624
- }
625
- catch (error) {
626
- return {
627
- success: false,
628
- error: error instanceof Error ? error.message : String(error),
629
- };
630
- }
631
- }
632
- /**
633
- * Batch inference support (Phase 4)
634
- * Process multiple prompts in a single request for efficiency
635
- */
636
- async doBatchGenerate(prompts, options) {
637
- try {
638
- logger.debug("SageMaker batch generate called", {
639
- batchSize: prompts.length,
640
- endpointName: this.modelConfig.endpointName,
641
- });
642
- // Advanced parallel processing with dynamic concurrency and error handling
643
- const results = await this.processPromptsInParallel(prompts, options);
644
- logger.debug("SageMaker batch generate completed", {
645
- batchSize: prompts.length,
646
- successCount: results.length,
647
- });
648
- return results;
649
- }
650
- catch (error) {
651
- logger.error("SageMaker batch generate failed", {
652
- error: error instanceof Error ? error.message : String(error),
653
- batchSize: prompts.length,
654
- });
655
- throw handleSageMakerError(error, this.modelConfig.endpointName);
656
- }
657
- }
658
- /**
659
- * Process prompts in parallel with advanced concurrency control and error handling
660
- */
661
- async processPromptsInParallel(prompts, options) {
662
- // Dynamic concurrency based on batch size and endpoint capacity
663
- const INITIAL_CONCURRENCY = Math.min(this.modelConfig.initialConcurrency ?? DEFAULT_INITIAL_CONCURRENCY, prompts.length);
664
- const MAX_CONCURRENCY = this.modelConfig.maxConcurrency ?? DEFAULT_MAX_CONCURRENCY;
665
- const MIN_CONCURRENCY = this.modelConfig.minConcurrency ?? DEFAULT_MIN_CONCURRENCY;
666
- const results = new Array(prompts.length);
667
- const errors = [];
668
- // Use adaptive semaphore utility for concurrency control
669
- const semaphore = createAdaptiveSemaphore(INITIAL_CONCURRENCY, MAX_CONCURRENCY, MIN_CONCURRENCY);
670
- // Process each prompt with adaptive concurrency
671
- const processPrompt = async (prompt, index) => {
672
- await semaphore.acquire();
673
- const startTime = Date.now();
674
- try {
675
- const result = await this.doGenerate({
676
- inputFormat: "messages",
677
- mode: { type: "regular" },
678
- prompt: [
679
- {
680
- role: "user",
681
- content: [{ type: "text", text: prompt }],
682
- },
683
- ],
684
- maxTokens: options?.maxTokens,
685
- temperature: options?.temperature,
686
- topP: options?.topP,
687
- });
688
- const duration = Date.now() - startTime;
689
- results[index] = {
690
- text: result.text || "",
691
- usage: {
692
- promptTokens: result.usage.inputTokens ?? 0,
693
- completionTokens: result.usage.outputTokens ?? 0,
694
- total: result.usage.totalTokens ??
695
- (result.usage.inputTokens ?? 0) +
696
- (result.usage.outputTokens ?? 0),
697
- },
698
- finishReason: result.finishReason,
699
- index,
700
- };
701
- // Record successful completion for adaptive concurrency adjustment
702
- semaphore.recordSuccess(duration);
703
- }
704
- catch (error) {
705
- errors.push({
706
- index,
707
- error: error instanceof Error ? error : new Error(String(error)),
708
- });
709
- // Record error for adaptive concurrency adjustment
710
- const duration = Date.now() - startTime;
711
- semaphore.recordError(duration);
712
- // Create error result
713
- results[index] = {
714
- text: "",
715
- usage: { promptTokens: 0, completionTokens: 0, total: 0 },
716
- finishReason: "error",
717
- index,
718
- };
719
- }
720
- finally {
721
- semaphore.release();
722
- }
723
- };
724
- // Start all requests with concurrency control
725
- const allPromises = prompts.map((prompt, index) => processPrompt(prompt, index));
726
- // Wait for all requests to complete
727
- await Promise.all(allPromises);
728
- // Log final statistics using semaphore metrics
729
- const metrics = semaphore.getMetrics();
730
- logger.debug("Parallel batch processing completed", {
731
- totalPrompts: prompts.length,
732
- successCount: metrics.completedCount,
733
- errorCount: metrics.errorCount,
734
- finalConcurrency: metrics.currentConcurrency,
735
- errorRate: metrics.errorCount / prompts.length,
736
- averageResponseTime: metrics.averageResponseTime,
737
- });
738
- // If we have too many errors, log them for debugging
739
- if (errors.length > 0) {
740
- logger.warn("Batch processing encountered errors", {
741
- errorCount: errors.length,
742
- sampleErrors: errors.slice(0, 3).map((e) => ({
743
- index: e.index,
744
- message: e.error.message,
745
- })),
746
- });
747
- }
748
- // Return results in original order (already sorted by index)
749
- return results.map(({ text, usage, finishReason }) => ({
750
- text,
751
- usage,
752
- finishReason,
753
- }));
754
- }
755
- /**
756
- * Enhanced model information with batch capabilities
757
- */
758
- getModelCapabilities() {
759
- return {
760
- ...this.getModelInfo(),
761
- capabilities: {
762
- streaming: true,
763
- toolCalling: true,
764
- structuredOutput: true,
765
- batchInference: true,
766
- supportedResponseFormats: ["text", "json_object", "json_schema"],
767
- supportedToolTypes: ["function"],
768
- maxBatchSize: 100, // Increased limit with parallel processing
769
- adaptiveConcurrency: true,
770
- errorRecovery: true,
771
- },
772
- };
773
- }
774
- }
775
- export default SageMakerLanguageModel;