modelfusion 0.0.44

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (405)
  1. package/LICENSE +21 -0
  2. package/README.md +429 -0
  3. package/composed-function/index.cjs +22 -0
  4. package/composed-function/index.d.ts +6 -0
  5. package/composed-function/index.js +6 -0
  6. package/composed-function/summarize/SummarizationFunction.cjs +2 -0
  7. package/composed-function/summarize/SummarizationFunction.d.ts +4 -0
  8. package/composed-function/summarize/SummarizationFunction.js +1 -0
  9. package/composed-function/summarize/summarizeRecursively.cjs +19 -0
  10. package/composed-function/summarize/summarizeRecursively.d.ts +11 -0
  11. package/composed-function/summarize/summarizeRecursively.js +15 -0
  12. package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.cjs +29 -0
  13. package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.d.ts +24 -0
  14. package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.js +25 -0
  15. package/composed-function/use-tool/NoSuchToolError.cjs +17 -0
  16. package/composed-function/use-tool/NoSuchToolError.d.ts +4 -0
  17. package/composed-function/use-tool/NoSuchToolError.js +13 -0
  18. package/composed-function/use-tool/Tool.cjs +43 -0
  19. package/composed-function/use-tool/Tool.d.ts +15 -0
  20. package/composed-function/use-tool/Tool.js +39 -0
  21. package/composed-function/use-tool/useTool.cjs +59 -0
  22. package/composed-function/use-tool/useTool.d.ts +36 -0
  23. package/composed-function/use-tool/useTool.js +54 -0
  24. package/cost/Cost.cjs +38 -0
  25. package/cost/Cost.d.ts +16 -0
  26. package/cost/Cost.js +34 -0
  27. package/cost/CostCalculator.cjs +2 -0
  28. package/cost/CostCalculator.d.ts +8 -0
  29. package/cost/CostCalculator.js +1 -0
  30. package/cost/calculateCost.cjs +28 -0
  31. package/cost/calculateCost.d.ts +7 -0
  32. package/cost/calculateCost.js +24 -0
  33. package/cost/index.cjs +19 -0
  34. package/cost/index.d.ts +3 -0
  35. package/cost/index.js +3 -0
  36. package/index.cjs +25 -0
  37. package/index.d.ts +9 -0
  38. package/index.js +9 -0
  39. package/model-function/AbstractModel.cjs +22 -0
  40. package/model-function/AbstractModel.d.ts +12 -0
  41. package/model-function/AbstractModel.js +18 -0
  42. package/model-function/FunctionOptions.cjs +2 -0
  43. package/model-function/FunctionOptions.d.ts +6 -0
  44. package/model-function/FunctionOptions.js +1 -0
  45. package/model-function/Model.cjs +2 -0
  46. package/model-function/Model.d.ts +23 -0
  47. package/model-function/Model.js +1 -0
  48. package/model-function/ModelCallEvent.cjs +2 -0
  49. package/model-function/ModelCallEvent.d.ts +18 -0
  50. package/model-function/ModelCallEvent.js +1 -0
  51. package/model-function/ModelCallEventSource.cjs +42 -0
  52. package/model-function/ModelCallEventSource.d.ts +13 -0
  53. package/model-function/ModelCallEventSource.js +38 -0
  54. package/model-function/ModelCallObserver.cjs +2 -0
  55. package/model-function/ModelCallObserver.d.ts +5 -0
  56. package/model-function/ModelCallObserver.js +1 -0
  57. package/model-function/ModelInformation.cjs +2 -0
  58. package/model-function/ModelInformation.d.ts +4 -0
  59. package/model-function/ModelInformation.js +1 -0
  60. package/model-function/SuccessfulModelCall.cjs +22 -0
  61. package/model-function/SuccessfulModelCall.d.ts +9 -0
  62. package/model-function/SuccessfulModelCall.js +18 -0
  63. package/model-function/embed-text/TextEmbeddingEvent.cjs +2 -0
  64. package/model-function/embed-text/TextEmbeddingEvent.d.ts +23 -0
  65. package/model-function/embed-text/TextEmbeddingEvent.js +1 -0
  66. package/model-function/embed-text/TextEmbeddingModel.cjs +2 -0
  67. package/model-function/embed-text/TextEmbeddingModel.d.ts +18 -0
  68. package/model-function/embed-text/TextEmbeddingModel.js +1 -0
  69. package/model-function/embed-text/embedText.cjs +90 -0
  70. package/model-function/embed-text/embedText.d.ts +33 -0
  71. package/model-function/embed-text/embedText.js +85 -0
  72. package/model-function/executeCall.cjs +60 -0
  73. package/model-function/executeCall.d.ts +27 -0
  74. package/model-function/executeCall.js +56 -0
  75. package/model-function/generate-image/ImageGenerationEvent.cjs +2 -0
  76. package/model-function/generate-image/ImageGenerationEvent.d.ts +22 -0
  77. package/model-function/generate-image/ImageGenerationEvent.js +1 -0
  78. package/model-function/generate-image/ImageGenerationModel.cjs +2 -0
  79. package/model-function/generate-image/ImageGenerationModel.d.ts +8 -0
  80. package/model-function/generate-image/ImageGenerationModel.js +1 -0
  81. package/model-function/generate-image/generateImage.cjs +63 -0
  82. package/model-function/generate-image/generateImage.d.ts +23 -0
  83. package/model-function/generate-image/generateImage.js +59 -0
  84. package/model-function/generate-json/GenerateJsonModel.cjs +2 -0
  85. package/model-function/generate-json/GenerateJsonModel.d.ts +10 -0
  86. package/model-function/generate-json/GenerateJsonModel.js +1 -0
  87. package/model-function/generate-json/GenerateJsonOrTextModel.cjs +2 -0
  88. package/model-function/generate-json/GenerateJsonOrTextModel.d.ts +18 -0
  89. package/model-function/generate-json/GenerateJsonOrTextModel.js +1 -0
  90. package/model-function/generate-json/JsonGenerationEvent.cjs +2 -0
  91. package/model-function/generate-json/JsonGenerationEvent.d.ts +22 -0
  92. package/model-function/generate-json/JsonGenerationEvent.js +1 -0
  93. package/model-function/generate-json/NoSuchSchemaError.cjs +17 -0
  94. package/model-function/generate-json/NoSuchSchemaError.d.ts +4 -0
  95. package/model-function/generate-json/NoSuchSchemaError.js +13 -0
  96. package/model-function/generate-json/SchemaDefinition.cjs +2 -0
  97. package/model-function/generate-json/SchemaDefinition.d.ts +6 -0
  98. package/model-function/generate-json/SchemaDefinition.js +1 -0
  99. package/model-function/generate-json/SchemaValidationError.cjs +36 -0
  100. package/model-function/generate-json/SchemaValidationError.d.ts +11 -0
  101. package/model-function/generate-json/SchemaValidationError.js +32 -0
  102. package/model-function/generate-json/generateJson.cjs +61 -0
  103. package/model-function/generate-json/generateJson.d.ts +9 -0
  104. package/model-function/generate-json/generateJson.js +57 -0
  105. package/model-function/generate-json/generateJsonOrText.cjs +74 -0
  106. package/model-function/generate-json/generateJsonOrText.d.ts +25 -0
  107. package/model-function/generate-json/generateJsonOrText.js +70 -0
  108. package/model-function/generate-text/AsyncQueue.cjs +66 -0
  109. package/model-function/generate-text/AsyncQueue.d.ts +17 -0
  110. package/model-function/generate-text/AsyncQueue.js +62 -0
  111. package/model-function/generate-text/DeltaEvent.cjs +2 -0
  112. package/model-function/generate-text/DeltaEvent.d.ts +7 -0
  113. package/model-function/generate-text/DeltaEvent.js +1 -0
  114. package/model-function/generate-text/TextDeltaEventSource.cjs +54 -0
  115. package/model-function/generate-text/TextDeltaEventSource.d.ts +5 -0
  116. package/model-function/generate-text/TextDeltaEventSource.js +46 -0
  117. package/model-function/generate-text/TextGenerationEvent.cjs +2 -0
  118. package/model-function/generate-text/TextGenerationEvent.d.ts +22 -0
  119. package/model-function/generate-text/TextGenerationEvent.js +1 -0
  120. package/model-function/generate-text/TextGenerationModel.cjs +2 -0
  121. package/model-function/generate-text/TextGenerationModel.d.ts +42 -0
  122. package/model-function/generate-text/TextGenerationModel.js +1 -0
  123. package/model-function/generate-text/TextStreamingEvent.cjs +2 -0
  124. package/model-function/generate-text/TextStreamingEvent.d.ts +22 -0
  125. package/model-function/generate-text/TextStreamingEvent.js +1 -0
  126. package/model-function/generate-text/extractTextDeltas.cjs +23 -0
  127. package/model-function/generate-text/extractTextDeltas.d.ts +7 -0
  128. package/model-function/generate-text/extractTextDeltas.js +19 -0
  129. package/model-function/generate-text/generateText.cjs +67 -0
  130. package/model-function/generate-text/generateText.d.ts +20 -0
  131. package/model-function/generate-text/generateText.js +63 -0
  132. package/model-function/generate-text/parseEventSourceReadableStream.cjs +30 -0
  133. package/model-function/generate-text/parseEventSourceReadableStream.d.ts +8 -0
  134. package/model-function/generate-text/parseEventSourceReadableStream.js +26 -0
  135. package/model-function/generate-text/streamText.cjs +115 -0
  136. package/model-function/generate-text/streamText.d.ts +11 -0
  137. package/model-function/generate-text/streamText.js +111 -0
  138. package/model-function/index.cjs +47 -0
  139. package/model-function/index.d.ts +31 -0
  140. package/model-function/index.js +31 -0
  141. package/model-function/tokenize-text/Tokenizer.cjs +2 -0
  142. package/model-function/tokenize-text/Tokenizer.d.ts +19 -0
  143. package/model-function/tokenize-text/Tokenizer.js +1 -0
  144. package/model-function/tokenize-text/countTokens.cjs +10 -0
  145. package/model-function/tokenize-text/countTokens.d.ts +5 -0
  146. package/model-function/tokenize-text/countTokens.js +6 -0
  147. package/model-function/transcribe-audio/TranscriptionEvent.cjs +2 -0
  148. package/model-function/transcribe-audio/TranscriptionEvent.d.ts +22 -0
  149. package/model-function/transcribe-audio/TranscriptionEvent.js +1 -0
  150. package/model-function/transcribe-audio/TranscriptionModel.cjs +2 -0
  151. package/model-function/transcribe-audio/TranscriptionModel.d.ts +8 -0
  152. package/model-function/transcribe-audio/TranscriptionModel.js +1 -0
  153. package/model-function/transcribe-audio/transcribe.cjs +62 -0
  154. package/model-function/transcribe-audio/transcribe.d.ts +22 -0
  155. package/model-function/transcribe-audio/transcribe.js +58 -0
  156. package/model-provider/automatic1111/Automatic1111Error.cjs +39 -0
  157. package/model-provider/automatic1111/Automatic1111Error.d.ts +31 -0
  158. package/model-provider/automatic1111/Automatic1111Error.js +31 -0
  159. package/model-provider/automatic1111/Automatic1111ImageGenerationModel.cjs +76 -0
  160. package/model-provider/automatic1111/Automatic1111ImageGenerationModel.d.ts +54 -0
  161. package/model-provider/automatic1111/Automatic1111ImageGenerationModel.js +72 -0
  162. package/model-provider/automatic1111/index.cjs +20 -0
  163. package/model-provider/automatic1111/index.d.ts +2 -0
  164. package/model-provider/automatic1111/index.js +2 -0
  165. package/model-provider/cohere/CohereError.cjs +36 -0
  166. package/model-provider/cohere/CohereError.d.ts +22 -0
  167. package/model-provider/cohere/CohereError.js +28 -0
  168. package/model-provider/cohere/CohereTextEmbeddingModel.cjs +172 -0
  169. package/model-provider/cohere/CohereTextEmbeddingModel.d.ts +119 -0
  170. package/model-provider/cohere/CohereTextEmbeddingModel.js +165 -0
  171. package/model-provider/cohere/CohereTextGenerationModel.cjs +283 -0
  172. package/model-provider/cohere/CohereTextGenerationModel.d.ts +203 -0
  173. package/model-provider/cohere/CohereTextGenerationModel.js +276 -0
  174. package/model-provider/cohere/CohereTokenizer.cjs +136 -0
  175. package/model-provider/cohere/CohereTokenizer.d.ts +118 -0
  176. package/model-provider/cohere/CohereTokenizer.js +129 -0
  177. package/model-provider/cohere/index.cjs +22 -0
  178. package/model-provider/cohere/index.d.ts +4 -0
  179. package/model-provider/cohere/index.js +4 -0
  180. package/model-provider/huggingface/HuggingFaceError.cjs +52 -0
  181. package/model-provider/huggingface/HuggingFaceError.d.ts +22 -0
  182. package/model-provider/huggingface/HuggingFaceError.js +44 -0
  183. package/model-provider/huggingface/HuggingFaceTextGenerationModel.cjs +174 -0
  184. package/model-provider/huggingface/HuggingFaceTextGenerationModel.d.ts +75 -0
  185. package/model-provider/huggingface/HuggingFaceTextGenerationModel.js +167 -0
  186. package/model-provider/huggingface/index.cjs +20 -0
  187. package/model-provider/huggingface/index.d.ts +2 -0
  188. package/model-provider/huggingface/index.js +2 -0
  189. package/model-provider/index.cjs +22 -0
  190. package/model-provider/index.d.ts +6 -0
  191. package/model-provider/index.js +6 -0
  192. package/model-provider/llamacpp/LlamaCppError.cjs +52 -0
  193. package/model-provider/llamacpp/LlamaCppError.d.ts +22 -0
  194. package/model-provider/llamacpp/LlamaCppError.js +44 -0
  195. package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.cjs +96 -0
  196. package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.d.ts +40 -0
  197. package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.js +89 -0
  198. package/model-provider/llamacpp/LlamaCppTextGenerationModel.cjs +245 -0
  199. package/model-provider/llamacpp/LlamaCppTextGenerationModel.d.ts +399 -0
  200. package/model-provider/llamacpp/LlamaCppTextGenerationModel.js +238 -0
  201. package/model-provider/llamacpp/LlamaCppTokenizer.cjs +64 -0
  202. package/model-provider/llamacpp/LlamaCppTokenizer.d.ts +38 -0
  203. package/model-provider/llamacpp/LlamaCppTokenizer.js +57 -0
  204. package/model-provider/llamacpp/index.cjs +22 -0
  205. package/model-provider/llamacpp/index.d.ts +4 -0
  206. package/model-provider/llamacpp/index.js +4 -0
  207. package/model-provider/openai/OpenAICostCalculator.cjs +71 -0
  208. package/model-provider/openai/OpenAICostCalculator.d.ts +6 -0
  209. package/model-provider/openai/OpenAICostCalculator.js +67 -0
  210. package/model-provider/openai/OpenAIError.cjs +50 -0
  211. package/model-provider/openai/OpenAIError.d.ts +47 -0
  212. package/model-provider/openai/OpenAIError.js +42 -0
  213. package/model-provider/openai/OpenAIImageGenerationModel.cjs +124 -0
  214. package/model-provider/openai/OpenAIImageGenerationModel.d.ts +113 -0
  215. package/model-provider/openai/OpenAIImageGenerationModel.js +119 -0
  216. package/model-provider/openai/OpenAIModelSettings.cjs +2 -0
  217. package/model-provider/openai/OpenAIModelSettings.d.ts +8 -0
  218. package/model-provider/openai/OpenAIModelSettings.js +1 -0
  219. package/model-provider/openai/OpenAITextEmbeddingModel.cjs +171 -0
  220. package/model-provider/openai/OpenAITextEmbeddingModel.d.ts +122 -0
  221. package/model-provider/openai/OpenAITextEmbeddingModel.js +162 -0
  222. package/model-provider/openai/OpenAITextGenerationModel.cjs +326 -0
  223. package/model-provider/openai/OpenAITextGenerationModel.d.ts +254 -0
  224. package/model-provider/openai/OpenAITextGenerationModel.js +317 -0
  225. package/model-provider/openai/OpenAITranscriptionModel.cjs +195 -0
  226. package/model-provider/openai/OpenAITranscriptionModel.d.ts +196 -0
  227. package/model-provider/openai/OpenAITranscriptionModel.js +187 -0
  228. package/model-provider/openai/TikTokenTokenizer.cjs +86 -0
  229. package/model-provider/openai/TikTokenTokenizer.d.ts +35 -0
  230. package/model-provider/openai/TikTokenTokenizer.js +82 -0
  231. package/model-provider/openai/chat/OpenAIChatMessage.cjs +24 -0
  232. package/model-provider/openai/chat/OpenAIChatMessage.d.ts +26 -0
  233. package/model-provider/openai/chat/OpenAIChatMessage.js +21 -0
  234. package/model-provider/openai/chat/OpenAIChatModel.cjs +288 -0
  235. package/model-provider/openai/chat/OpenAIChatModel.d.ts +344 -0
  236. package/model-provider/openai/chat/OpenAIChatModel.js +279 -0
  237. package/model-provider/openai/chat/OpenAIChatPrompt.cjs +143 -0
  238. package/model-provider/openai/chat/OpenAIChatPrompt.d.ts +108 -0
  239. package/model-provider/openai/chat/OpenAIChatPrompt.js +135 -0
  240. package/model-provider/openai/chat/OpenAIChatStreamIterable.cjs +112 -0
  241. package/model-provider/openai/chat/OpenAIChatStreamIterable.d.ts +19 -0
  242. package/model-provider/openai/chat/OpenAIChatStreamIterable.js +105 -0
  243. package/model-provider/openai/chat/countOpenAIChatMessageTokens.cjs +28 -0
  244. package/model-provider/openai/chat/countOpenAIChatMessageTokens.d.ts +20 -0
  245. package/model-provider/openai/chat/countOpenAIChatMessageTokens.js +23 -0
  246. package/model-provider/openai/index.cjs +31 -0
  247. package/model-provider/openai/index.d.ts +13 -0
  248. package/model-provider/openai/index.js +12 -0
  249. package/model-provider/stability/StabilityError.cjs +36 -0
  250. package/model-provider/stability/StabilityError.d.ts +22 -0
  251. package/model-provider/stability/StabilityError.js +28 -0
  252. package/model-provider/stability/StabilityImageGenerationModel.cjs +133 -0
  253. package/model-provider/stability/StabilityImageGenerationModel.d.ts +95 -0
  254. package/model-provider/stability/StabilityImageGenerationModel.js +129 -0
  255. package/model-provider/stability/index.cjs +20 -0
  256. package/model-provider/stability/index.d.ts +2 -0
  257. package/model-provider/stability/index.js +2 -0
  258. package/package.json +87 -0
  259. package/prompt/InstructionPrompt.cjs +2 -0
  260. package/prompt/InstructionPrompt.d.ts +7 -0
  261. package/prompt/InstructionPrompt.js +1 -0
  262. package/prompt/Llama2PromptMapping.cjs +56 -0
  263. package/prompt/Llama2PromptMapping.d.ts +10 -0
  264. package/prompt/Llama2PromptMapping.js +51 -0
  265. package/prompt/OpenAIChatPromptMapping.cjs +62 -0
  266. package/prompt/OpenAIChatPromptMapping.d.ts +6 -0
  267. package/prompt/OpenAIChatPromptMapping.js +57 -0
  268. package/prompt/PromptMapping.cjs +2 -0
  269. package/prompt/PromptMapping.d.ts +7 -0
  270. package/prompt/PromptMapping.js +1 -0
  271. package/prompt/PromptMappingTextGenerationModel.cjs +88 -0
  272. package/prompt/PromptMappingTextGenerationModel.d.ts +26 -0
  273. package/prompt/PromptMappingTextGenerationModel.js +84 -0
  274. package/prompt/TextPromptMapping.cjs +50 -0
  275. package/prompt/TextPromptMapping.d.ts +14 -0
  276. package/prompt/TextPromptMapping.js +45 -0
  277. package/prompt/chat/ChatPrompt.cjs +2 -0
  278. package/prompt/chat/ChatPrompt.d.ts +33 -0
  279. package/prompt/chat/ChatPrompt.js +1 -0
  280. package/prompt/chat/trimChatPrompt.cjs +50 -0
  281. package/prompt/chat/trimChatPrompt.d.ts +19 -0
  282. package/prompt/chat/trimChatPrompt.js +46 -0
  283. package/prompt/chat/validateChatPrompt.cjs +36 -0
  284. package/prompt/chat/validateChatPrompt.d.ts +8 -0
  285. package/prompt/chat/validateChatPrompt.js +31 -0
  286. package/prompt/index.cjs +25 -0
  287. package/prompt/index.d.ts +9 -0
  288. package/prompt/index.js +9 -0
  289. package/run/ConsoleLogger.cjs +12 -0
  290. package/run/ConsoleLogger.d.ts +6 -0
  291. package/run/ConsoleLogger.js +8 -0
  292. package/run/DefaultRun.cjs +78 -0
  293. package/run/DefaultRun.d.ts +24 -0
  294. package/run/DefaultRun.js +74 -0
  295. package/run/IdMetadata.cjs +2 -0
  296. package/run/IdMetadata.d.ts +7 -0
  297. package/run/IdMetadata.js +1 -0
  298. package/run/Run.cjs +2 -0
  299. package/run/Run.d.ts +27 -0
  300. package/run/Run.js +1 -0
  301. package/run/RunFunction.cjs +2 -0
  302. package/run/RunFunction.d.ts +13 -0
  303. package/run/RunFunction.js +1 -0
  304. package/run/Vector.cjs +2 -0
  305. package/run/Vector.d.ts +5 -0
  306. package/run/Vector.js +1 -0
  307. package/run/index.cjs +22 -0
  308. package/run/index.d.ts +6 -0
  309. package/run/index.js +6 -0
  310. package/text-chunk/TextChunk.cjs +2 -0
  311. package/text-chunk/TextChunk.d.ts +3 -0
  312. package/text-chunk/TextChunk.js +1 -0
  313. package/text-chunk/index.cjs +22 -0
  314. package/text-chunk/index.d.ts +6 -0
  315. package/text-chunk/index.js +6 -0
  316. package/text-chunk/retrieve-text-chunks/TextChunkRetriever.cjs +2 -0
  317. package/text-chunk/retrieve-text-chunks/TextChunkRetriever.d.ts +8 -0
  318. package/text-chunk/retrieve-text-chunks/TextChunkRetriever.js +1 -0
  319. package/text-chunk/retrieve-text-chunks/retrieveTextChunks.cjs +10 -0
  320. package/text-chunk/retrieve-text-chunks/retrieveTextChunks.d.ts +6 -0
  321. package/text-chunk/retrieve-text-chunks/retrieveTextChunks.js +6 -0
  322. package/text-chunk/split/SplitFunction.cjs +2 -0
  323. package/text-chunk/split/SplitFunction.d.ts +4 -0
  324. package/text-chunk/split/SplitFunction.js +1 -0
  325. package/text-chunk/split/splitOnSeparator.cjs +12 -0
  326. package/text-chunk/split/splitOnSeparator.d.ts +8 -0
  327. package/text-chunk/split/splitOnSeparator.js +7 -0
  328. package/text-chunk/split/splitRecursively.cjs +41 -0
  329. package/text-chunk/split/splitRecursively.d.ts +22 -0
  330. package/text-chunk/split/splitRecursively.js +33 -0
  331. package/util/DurationMeasurement.cjs +42 -0
  332. package/util/DurationMeasurement.d.ts +5 -0
  333. package/util/DurationMeasurement.js +38 -0
  334. package/util/ErrorHandler.cjs +2 -0
  335. package/util/ErrorHandler.d.ts +1 -0
  336. package/util/ErrorHandler.js +1 -0
  337. package/util/SafeResult.cjs +2 -0
  338. package/util/SafeResult.d.ts +8 -0
  339. package/util/SafeResult.js +1 -0
  340. package/util/api/AbortError.cjs +9 -0
  341. package/util/api/AbortError.d.ts +3 -0
  342. package/util/api/AbortError.js +5 -0
  343. package/util/api/ApiCallError.cjs +45 -0
  344. package/util/api/ApiCallError.d.ts +15 -0
  345. package/util/api/ApiCallError.js +41 -0
  346. package/util/api/RetryError.cjs +24 -0
  347. package/util/api/RetryError.d.ts +10 -0
  348. package/util/api/RetryError.js +20 -0
  349. package/util/api/RetryFunction.cjs +2 -0
  350. package/util/api/RetryFunction.d.ts +1 -0
  351. package/util/api/RetryFunction.js +1 -0
  352. package/util/api/ThrottleFunction.cjs +2 -0
  353. package/util/api/ThrottleFunction.d.ts +1 -0
  354. package/util/api/ThrottleFunction.js +1 -0
  355. package/util/api/callWithRetryAndThrottle.cjs +7 -0
  356. package/util/api/callWithRetryAndThrottle.d.ts +7 -0
  357. package/util/api/callWithRetryAndThrottle.js +3 -0
  358. package/util/api/postToApi.cjs +103 -0
  359. package/util/api/postToApi.d.ts +29 -0
  360. package/util/api/postToApi.js +96 -0
  361. package/util/api/retryNever.cjs +8 -0
  362. package/util/api/retryNever.d.ts +4 -0
  363. package/util/api/retryNever.js +4 -0
  364. package/util/api/retryWithExponentialBackoff.cjs +48 -0
  365. package/util/api/retryWithExponentialBackoff.d.ts +10 -0
  366. package/util/api/retryWithExponentialBackoff.js +44 -0
  367. package/util/api/throttleMaxConcurrency.cjs +65 -0
  368. package/util/api/throttleMaxConcurrency.d.ts +7 -0
  369. package/util/api/throttleMaxConcurrency.js +61 -0
  370. package/util/api/throttleUnlimitedConcurrency.cjs +8 -0
  371. package/util/api/throttleUnlimitedConcurrency.d.ts +5 -0
  372. package/util/api/throttleUnlimitedConcurrency.js +4 -0
  373. package/util/cosineSimilarity.cjs +26 -0
  374. package/util/cosineSimilarity.d.ts +11 -0
  375. package/util/cosineSimilarity.js +22 -0
  376. package/util/index.cjs +26 -0
  377. package/util/index.d.ts +10 -0
  378. package/util/index.js +10 -0
  379. package/util/never.cjs +6 -0
  380. package/util/never.d.ts +1 -0
  381. package/util/never.js +2 -0
  382. package/util/runSafe.cjs +15 -0
  383. package/util/runSafe.d.ts +2 -0
  384. package/util/runSafe.js +11 -0
  385. package/vector-index/VectorIndex.cjs +2 -0
  386. package/vector-index/VectorIndex.d.ts +18 -0
  387. package/vector-index/VectorIndex.js +1 -0
  388. package/vector-index/VectorIndexSimilarTextChunkRetriever.cjs +57 -0
  389. package/vector-index/VectorIndexSimilarTextChunkRetriever.d.ts +20 -0
  390. package/vector-index/VectorIndexSimilarTextChunkRetriever.js +53 -0
  391. package/vector-index/VectorIndexTextChunkStore.cjs +77 -0
  392. package/vector-index/VectorIndexTextChunkStore.d.ts +35 -0
  393. package/vector-index/VectorIndexTextChunkStore.js +73 -0
  394. package/vector-index/index.cjs +22 -0
  395. package/vector-index/index.d.ts +6 -0
  396. package/vector-index/index.js +6 -0
  397. package/vector-index/memory/MemoryVectorIndex.cjs +63 -0
  398. package/vector-index/memory/MemoryVectorIndex.d.ts +31 -0
  399. package/vector-index/memory/MemoryVectorIndex.js +56 -0
  400. package/vector-index/pinecone/PineconeVectorIndex.cjs +66 -0
  401. package/vector-index/pinecone/PineconeVectorIndex.d.ts +29 -0
  402. package/vector-index/pinecone/PineconeVectorIndex.js +62 -0
  403. package/vector-index/upsertTextChunks.cjs +15 -0
  404. package/vector-index/upsertTextChunks.d.ts +11 -0
  405. package/vector-index/upsertTextChunks.js +11 -0
@@ -0,0 +1,44 @@
1
+ import SecureJSON from "secure-json-parse";
2
+ import { z } from "zod";
3
+ import { ApiCallError } from "../../util/api/ApiCallError.js";
4
+ export const llamaCppErrorDataSchema = z.object({
5
+ error: z.string(),
6
+ });
7
+ export class LlamaCppError extends ApiCallError {
8
+ constructor({ data, statusCode, url, requestBodyValues, message = data.error, }) {
9
+ super({ message, statusCode, requestBodyValues, url });
10
+ Object.defineProperty(this, "data", {
11
+ enumerable: true,
12
+ configurable: true,
13
+ writable: true,
14
+ value: void 0
15
+ });
16
+ this.data = data;
17
+ }
18
+ }
19
+ export const failedLlamaCppCallResponseHandler = async ({ response, url, requestBodyValues }) => {
20
+ const responseBody = await response.text();
21
+ try {
22
+ const parsedError = llamaCppErrorDataSchema.parse(SecureJSON.parse(responseBody));
23
+ return new LlamaCppError({
24
+ url,
25
+ requestBodyValues,
26
+ statusCode: response.status,
27
+ data: parsedError,
28
+ });
29
+ }
30
+ catch (error) {
31
+ if (error instanceof Error) {
32
+ if (error.name === "AbortError" || error instanceof ApiCallError) {
33
+ throw error;
34
+ }
35
+ }
36
+ throw new ApiCallError({
37
+ message: responseBody,
38
+ cause: error,
39
+ statusCode: response.status,
40
+ url,
41
+ requestBodyValues,
42
+ });
43
+ }
44
+ };
@@ -0,0 +1,96 @@
1
+ "use strict";
2
+ var __importDefault = (this && this.__importDefault) || function (mod) {
3
+ return (mod && mod.__esModule) ? mod : { "default": mod };
4
+ };
5
+ Object.defineProperty(exports, "__esModule", { value: true });
6
+ exports.LlamaCppTextEmbeddingModel = void 0;
7
+ const zod_1 = __importDefault(require("zod"));
8
+ const AbstractModel_js_1 = require("../../model-function/AbstractModel.cjs");
9
+ const callWithRetryAndThrottle_js_1 = require("../../util/api/callWithRetryAndThrottle.cjs");
10
+ const postToApi_js_1 = require("../../util/api/postToApi.cjs");
11
+ const LlamaCppError_js_1 = require("./LlamaCppError.cjs");
12
+ const LlamaCppTokenizer_js_1 = require("./LlamaCppTokenizer.cjs");
13
+ class LlamaCppTextEmbeddingModel extends AbstractModel_js_1.AbstractModel {
14
+ constructor(settings = {}) {
15
+ super({ settings });
16
+ Object.defineProperty(this, "provider", {
17
+ enumerable: true,
18
+ configurable: true,
19
+ writable: true,
20
+ value: "llamacpp"
21
+ });
22
+ Object.defineProperty(this, "maxTextsPerCall", {
23
+ enumerable: true,
24
+ configurable: true,
25
+ writable: true,
26
+ value: 1
27
+ });
28
+ Object.defineProperty(this, "contextWindowSize", {
29
+ enumerable: true,
30
+ configurable: true,
31
+ writable: true,
32
+ value: undefined
33
+ });
34
+ Object.defineProperty(this, "embeddingDimensions", {
35
+ enumerable: true,
36
+ configurable: true,
37
+ writable: true,
38
+ value: undefined
39
+ });
40
+ Object.defineProperty(this, "tokenizer", {
41
+ enumerable: true,
42
+ configurable: true,
43
+ writable: true,
44
+ value: void 0
45
+ });
46
+ this.tokenizer = new LlamaCppTokenizer_js_1.LlamaCppTokenizer({
47
+ baseUrl: this.settings.baseUrl,
48
+ retry: this.settings.tokenizerSettings?.retry,
49
+ throttle: this.settings.tokenizerSettings?.throttle,
50
+ });
51
+ }
52
+ get modelName() {
53
+ return null;
54
+ }
55
+ async tokenize(text) {
56
+ return this.tokenizer.tokenize(text);
57
+ }
58
+ async callAPI(texts, options) {
59
+ if (texts.length > this.maxTextsPerCall) {
60
+ throw new Error(`The Llama.cpp embedding API only supports ${this.maxTextsPerCall} texts per API call.`);
61
+ }
62
+ const run = options?.run;
63
+ const settings = options?.settings;
64
+ const callSettings = Object.assign({}, this.settings, settings, {
65
+ abortSignal: run?.abortSignal,
66
+ content: texts[0],
67
+ });
68
+ return (0, callWithRetryAndThrottle_js_1.callWithRetryAndThrottle)({
69
+ retry: this.settings.retry,
70
+ throttle: this.settings.throttle,
71
+ call: async () => callLlamaCppEmbeddingAPI(callSettings),
72
+ });
73
+ }
74
+ generateEmbeddingResponse(texts, options) {
75
+ return this.callAPI(texts, options);
76
+ }
77
+ extractEmbeddings(response) {
78
+ return [response.embedding];
79
+ }
80
+ withSettings(additionalSettings) {
81
+ return new LlamaCppTextEmbeddingModel(Object.assign({}, this.settings, additionalSettings));
82
+ }
83
+ }
84
+ exports.LlamaCppTextEmbeddingModel = LlamaCppTextEmbeddingModel;
85
+ const llamaCppTextEmbeddingResponseSchema = zod_1.default.object({
86
+ embedding: zod_1.default.array(zod_1.default.number()),
87
+ });
88
+ async function callLlamaCppEmbeddingAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, content, }) {
89
+ return (0, postToApi_js_1.postJsonToApi)({
90
+ url: `${baseUrl}/embedding`,
91
+ body: { content },
92
+ failedResponseHandler: LlamaCppError_js_1.failedLlamaCppCallResponseHandler,
93
+ successfulResponseHandler: (0, postToApi_js_1.createJsonResponseHandler)(llamaCppTextEmbeddingResponseSchema),
94
+ abortSignal,
95
+ });
96
+ }
@@ -0,0 +1,40 @@
1
+ import z from "zod";
2
+ import { AbstractModel } from "../../model-function/AbstractModel.js";
3
+ import { FunctionOptions } from "../../model-function/FunctionOptions.js";
4
+ import { TextEmbeddingModel, TextEmbeddingModelSettings } from "../../model-function/embed-text/TextEmbeddingModel.js";
5
+ import { RetryFunction } from "../../util/api/RetryFunction.js";
6
+ import { ThrottleFunction } from "../../util/api/ThrottleFunction.js";
7
+ export interface LlamaCppEmbeddingModelSettings extends TextEmbeddingModelSettings {
8
+ baseUrl?: string;
9
+ retry?: RetryFunction;
10
+ throttle?: ThrottleFunction;
11
+ tokenizerSettings?: {
12
+ retry?: RetryFunction;
13
+ throttle?: ThrottleFunction;
14
+ };
15
+ }
16
+ export declare class LlamaCppTextEmbeddingModel extends AbstractModel<LlamaCppEmbeddingModelSettings> implements TextEmbeddingModel<LlamaCppTextEmbeddingResponse, LlamaCppEmbeddingModelSettings> {
17
+ constructor(settings?: LlamaCppEmbeddingModelSettings);
18
+ readonly provider: "llamacpp";
19
+ get modelName(): null;
20
+ readonly maxTextsPerCall = 1;
21
+ readonly contextWindowSize: undefined;
22
+ readonly embeddingDimensions: undefined;
23
+ private readonly tokenizer;
24
+ tokenize(text: string): Promise<number[]>;
25
+ callAPI(texts: Array<string>, options?: FunctionOptions<LlamaCppEmbeddingModelSettings>): Promise<LlamaCppTextEmbeddingResponse>;
26
+ generateEmbeddingResponse(texts: string[], options?: FunctionOptions<LlamaCppEmbeddingModelSettings>): Promise<{
27
+ embedding: number[];
28
+ }>;
29
+ extractEmbeddings(response: LlamaCppTextEmbeddingResponse): number[][];
30
+ withSettings(additionalSettings: Partial<LlamaCppEmbeddingModelSettings>): this;
31
+ }
32
+ declare const llamaCppTextEmbeddingResponseSchema: z.ZodObject<{
33
+ embedding: z.ZodArray<z.ZodNumber, "many">;
34
+ }, "strip", z.ZodTypeAny, {
35
+ embedding: number[];
36
+ }, {
37
+ embedding: number[];
38
+ }>;
39
+ export type LlamaCppTextEmbeddingResponse = z.infer<typeof llamaCppTextEmbeddingResponseSchema>;
40
+ export {};
@@ -0,0 +1,89 @@
1
+ import z from "zod";
2
+ import { AbstractModel } from "../../model-function/AbstractModel.js";
3
+ import { callWithRetryAndThrottle } from "../../util/api/callWithRetryAndThrottle.js";
4
+ import { createJsonResponseHandler, postJsonToApi, } from "../../util/api/postToApi.js";
5
+ import { failedLlamaCppCallResponseHandler } from "./LlamaCppError.js";
6
+ import { LlamaCppTokenizer } from "./LlamaCppTokenizer.js";
7
/**
 * Text embedding model that talks to the `/embedding` endpoint of a
 * llama.cpp server. Only one text can be embedded per API call.
 */
export class LlamaCppTextEmbeddingModel extends AbstractModel {
    /**
     * @param {object} [settings] Model settings (base URL, retry/throttle,
     * tokenizer settings).
     */
    constructor(settings = {}) {
        super({ settings });
        // Instance fields, defined in declaration order as ordinary
        // enumerable / configurable / writable data properties.
        const instanceFields = [
            ["provider", "llamacpp"],
            ["maxTextsPerCall", 1],
            ["contextWindowSize", undefined],
            ["embeddingDimensions", undefined],
            ["tokenizer", void 0],
        ];
        for (const [fieldName, value] of instanceFields) {
            Object.defineProperty(this, fieldName, {
                enumerable: true,
                configurable: true,
                writable: true,
                value,
            });
        }
        // The tokenizer shares the base URL but uses its own retry/throttle.
        this.tokenizer = new LlamaCppTokenizer({
            baseUrl: this.settings.baseUrl,
            retry: this.settings.tokenizerSettings?.retry,
            throttle: this.settings.tokenizerSettings?.throttle,
        });
    }
    /** Always `null`: no model name is reported for this provider. */
    get modelName() {
        return null;
    }
    /**
     * Tokenizes `text` with the model's tokenizer.
     * @param {string} text
     */
    async tokenize(text) {
        return this.tokenizer.tokenize(text);
    }
    /**
     * Embeds a single text through the API.
     * @param {string[]} texts At most `maxTextsPerCall` entries; only the first is sent.
     * @param {object} [options] Optional `run` (for its abort signal) and per-call `settings`.
     * @throws {Error} When more than `maxTextsPerCall` texts are supplied.
     */
    async callAPI(texts, options) {
        if (texts.length > this.maxTextsPerCall) {
            throw new Error(`The Llama.cpp embedding API only supports ${this.maxTextsPerCall} texts per API call.`);
        }
        const perCallValues = {
            abortSignal: options?.run?.abortSignal,
            content: texts[0],
        };
        // Merge into a fresh object so the model's own settings stay untouched.
        const callSettings = Object.assign({}, this.settings, options?.settings, perCallValues);
        return callWithRetryAndThrottle({
            retry: this.settings.retry,
            throttle: this.settings.throttle,
            call: async () => callLlamaCppEmbeddingAPI(callSettings),
        });
    }
    /** Delegates to `callAPI`. */
    generateEmbeddingResponse(texts, options) {
        return this.callAPI(texts, options);
    }
    /** Wraps the single embedding of `response` in an array. */
    extractEmbeddings(response) {
        const { embedding } = response;
        return [embedding];
    }
    /** Returns a new model whose settings are the current ones overlaid with `additionalSettings`. */
    withSettings(additionalSettings) {
        const mergedSettings = Object.assign({}, this.settings, additionalSettings);
        return new LlamaCppTextEmbeddingModel(mergedSettings);
    }
}
78
// Expected JSON shape of a successful `/embedding` response.
const llamaCppTextEmbeddingResponseSchema = z.object({
    embedding: z.number().array(),
});
81
/**
 * POSTs `{ content }` to `<baseUrl>/embedding` and returns the response
 * parsed against the embedding response schema.
 *
 * @param {object} params
 * @param {string} [params.baseUrl="http://127.0.0.1:8080"] Server base URL.
 * @param {AbortSignal} [params.abortSignal] Forwarded to the HTTP call.
 * @param {string} params.content Text to embed.
 */
async function callLlamaCppEmbeddingAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, content, }) {
    const request = {
        url: `${baseUrl}/embedding`,
        body: { content },
        failedResponseHandler: failedLlamaCppCallResponseHandler,
        successfulResponseHandler: createJsonResponseHandler(llamaCppTextEmbeddingResponseSchema),
        abortSignal,
    };
    return postJsonToApi(request);
}
@@ -0,0 +1,245 @@
1
+ "use strict";
2
+ var __importDefault = (this && this.__importDefault) || function (mod) {
3
+ return (mod && mod.__esModule) ? mod : { "default": mod };
4
+ };
5
+ Object.defineProperty(exports, "__esModule", { value: true });
6
+ exports.LlamaCppTextGenerationResponseFormat = exports.LlamaCppTextGenerationModel = void 0;
7
+ const secure_json_parse_1 = __importDefault(require("secure-json-parse"));
8
+ const zod_1 = __importDefault(require("zod"));
9
+ const AbstractModel_js_1 = require("../../model-function/AbstractModel.cjs");
10
+ const AsyncQueue_js_1 = require("../../model-function/generate-text/AsyncQueue.cjs");
11
+ const parseEventSourceReadableStream_js_1 = require("../../model-function/generate-text/parseEventSourceReadableStream.cjs");
12
+ const PromptMappingTextGenerationModel_js_1 = require("../../prompt/PromptMappingTextGenerationModel.cjs");
13
+ const callWithRetryAndThrottle_js_1 = require("../../util/api/callWithRetryAndThrottle.cjs");
14
+ const postToApi_js_1 = require("../../util/api/postToApi.cjs");
15
+ const LlamaCppError_js_1 = require("./LlamaCppError.cjs");
16
+ const LlamaCppTokenizer_js_1 = require("./LlamaCppTokenizer.cjs");
17
/**
 * Text generation model that talks to the `/completion` endpoint of a
 * llama.cpp server, in either JSON or streaming (delta) mode.
 */
class LlamaCppTextGenerationModel extends AbstractModel_js_1.AbstractModel {
    /**
     * @param {object} [settings] Model settings (base URL, sampling
     * parameters, retry/throttle, tokenizer settings).
     */
    constructor(settings = {}) {
        super({ settings });
        Object.defineProperty(this, "provider", {
            enumerable: true,
            configurable: true,
            writable: true,
            value: "llamacpp"
        });
        Object.defineProperty(this, "tokenizer", {
            enumerable: true,
            configurable: true,
            writable: true,
            value: void 0
        });
        // The tokenizer shares the base URL but uses its own retry/throttle.
        this.tokenizer = new LlamaCppTokenizer_js_1.LlamaCppTokenizer({
            baseUrl: this.settings.baseUrl,
            retry: this.settings.tokenizerSettings?.retry,
            throttle: this.settings.tokenizerSettings?.throttle,
        });
    }
    /** Always `null`: no model name is reported for this provider. */
    get modelName() {
        return null;
    }
    /** Context window size as configured in the settings (may be undefined). */
    get contextWindowSize() {
        return this.settings.contextWindowSize;
    }
    /**
     * Calls the completion API.
     *
     * @param prompt Prompt sent to the server.
     * @param {object} options Must contain `responseFormat` (with `stream`
     * and `handler`); may contain `run` (for its abort signal) and per-call
     * `settings` overrides.
     */
    async callAPI(prompt, options) {
        const { run, settings, responseFormat } = options;
        // Merge into a fresh object. Using `this.settings` as the
        // Object.assign target would write the per-call overrides, prompt,
        // abort signal and response format into the model's own settings,
        // leaking them into later calls and `withSettings` copies.
        const callSettings = Object.assign({}, this.settings, settings, {
            abortSignal: run?.abortSignal,
            prompt,
            responseFormat,
        });
        return (0, callWithRetryAndThrottle_js_1.callWithRetryAndThrottle)({
            retry: this.settings.retry,
            throttle: this.settings.throttle,
            call: async () => callLlamaCppTextGenerationAPI(callSettings),
        });
    }
    /** Counts the tokens the model's tokenizer produces for `prompt`. */
    async countPromptTokens(prompt) {
        const tokens = await this.tokenizer.tokenize(prompt);
        return tokens.length;
    }
    /** Calls the API in non-streaming JSON mode. */
    generateTextResponse(prompt, options) {
        return this.callAPI(prompt, {
            ...options,
            responseFormat: exports.LlamaCppTextGenerationResponseFormat.json,
        });
    }
    /** Returns the generated text (`content`) of a JSON response. */
    extractText(response) {
        return response.content;
    }
    /** Calls the API in streaming mode, using the `deltaIterable` response format. */
    generateDeltaStreamResponse(prompt, options) {
        return this.callAPI(prompt, {
            ...options,
            responseFormat: exports.LlamaCppTextGenerationResponseFormat.deltaIterable,
        });
    }
    /** Returns the newly generated text (`delta`) of a full delta. */
    extractTextDelta(fullDelta) {
        return fullDelta.delta;
    }
    /**
     * Wraps a copy of this model (with the mapping's stop tokens applied)
     * in a prompt-mapping model.
     */
    mapPrompt(promptMapping) {
        return new PromptMappingTextGenerationModel_js_1.PromptMappingTextGenerationModel({
            model: this.withStopTokens(promptMapping.stopTokens),
            promptMapping,
        });
    }
    /** Returns a new model whose settings are the current ones overlaid with `additionalSettings`. */
    withSettings(additionalSettings) {
        return new LlamaCppTextGenerationModel(Object.assign({}, this.settings, additionalSettings));
    }
    /** Completion token limit, stored as the `nPredict` setting. */
    get maxCompletionTokens() {
        return this.settings.nPredict;
    }
    /** Returns a new model with `nPredict` set to `maxCompletionTokens`. */
    withMaxCompletionTokens(maxCompletionTokens) {
        return this.withSettings({ nPredict: maxCompletionTokens });
    }
    /** Returns a new model with the `stop` setting set to `stopTokens`. */
    withStopTokens(stopTokens) {
        return this.withSettings({ stop: stopTokens });
    }
}
exports.LlamaCppTextGenerationModel = LlamaCppTextGenerationModel;
99
// `generation_settings` object of a completion response.
const llamaCppGenerationSettingsSchema = zod_1.default.object({
    frequency_penalty: zod_1.default.number(),
    ignore_eos: zod_1.default.boolean(),
    logit_bias: zod_1.default.array(zod_1.default.number()),
    mirostat: zod_1.default.number(),
    mirostat_eta: zod_1.default.number(),
    mirostat_tau: zod_1.default.number(),
    model: zod_1.default.string(),
    n_ctx: zod_1.default.number(),
    n_keep: zod_1.default.number(),
    n_predict: zod_1.default.number(),
    n_probs: zod_1.default.number(),
    penalize_nl: zod_1.default.boolean(),
    presence_penalty: zod_1.default.number(),
    repeat_last_n: zod_1.default.number(),
    repeat_penalty: zod_1.default.number(),
    seed: zod_1.default.number(),
    stop: zod_1.default.array(zod_1.default.string()),
    stream: zod_1.default.boolean(),
    temp: zod_1.default.number(),
    tfs_z: zod_1.default.number(),
    top_k: zod_1.default.number(),
    top_p: zod_1.default.number(),
    typical_p: zod_1.default.number(),
});
// `timings` object of a completion response; the rate fields may be null.
const llamaCppTimingsSchema = zod_1.default.object({
    predicted_ms: zod_1.default.number(),
    predicted_n: zod_1.default.number(),
    predicted_per_second: zod_1.default.number().nullable(),
    predicted_per_token_ms: zod_1.default.number().nullable(),
    prompt_ms: zod_1.default.number().nullable(),
    prompt_n: zod_1.default.number(),
    prompt_per_second: zod_1.default.number().nullable(),
    prompt_per_token_ms: zod_1.default.number().nullable(),
});
// Complete `/completion` response (`stop: true`). Used for non-streaming
// calls and as the final variant of the streaming union.
const llamaCppTextGenerationResponseSchema = zod_1.default.object({
    content: zod_1.default.string(),
    stop: zod_1.default.literal(true),
    generation_settings: llamaCppGenerationSettingsSchema,
    model: zod_1.default.string(),
    prompt: zod_1.default.string(),
    stopped_eos: zod_1.default.boolean(),
    stopped_limit: zod_1.default.boolean(),
    stopped_word: zod_1.default.boolean(),
    stopping_word: zod_1.default.string(),
    timings: llamaCppTimingsSchema,
    tokens_cached: zod_1.default.number(),
    tokens_evaluated: zod_1.default.number(),
    tokens_predicted: zod_1.default.number(),
    truncated: zod_1.default.boolean(),
});
148
// Intermediate stream chunk: carries only new text and `stop: false`.
const llamaCppTextStreamingPartialSchema = zod_1.default.object({
    content: zod_1.default.string(),
    stop: zod_1.default.literal(false),
});
// A streamed event is either an intermediate chunk or the complete final
// response; the `stop` flag tells them apart.
const llamaCppTextStreamingResponseSchema = zod_1.default.discriminatedUnion("stop", [
    llamaCppTextStreamingPartialSchema,
    llamaCppTextGenerationResponseSchema,
]);
155
/**
 * POSTs a completion request to `<baseUrl>/completion`.
 *
 * The camelCase settings are translated to the snake_case field names of
 * the request body. `responseFormat.stream` selects streaming and
 * `responseFormat.handler` processes the successful response.
 */
async function callLlamaCppTextGenerationAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, responseFormat, prompt, temperature, topK, topP, nPredict, nKeep, stop, tfsZ, typicalP, repeatPenalty, repeatLastN, penalizeNl, mirostat, mirostatTau, mirostatEta, seed, ignoreEos, logitBias, }) {
    const requestBody = {
        stream: responseFormat.stream,
        prompt,
        temperature,
        top_k: topK,
        top_p: topP,
        n_predict: nPredict,
        n_keep: nKeep,
        stop,
        tfs_z: tfsZ,
        typical_p: typicalP,
        repeat_penalty: repeatPenalty,
        repeat_last_n: repeatLastN,
        penalize_nl: penalizeNl,
        mirostat,
        mirostat_tau: mirostatTau,
        mirostat_eta: mirostatEta,
        seed,
        ignore_eos: ignoreEos,
        logit_bias: logitBias,
    };
    const endpoint = `${baseUrl}/completion`;
    return (0, postToApi_js_1.postJsonToApi)({
        url: endpoint,
        body: requestBody,
        failedResponseHandler: LlamaCppError_js_1.failedLlamaCppCallResponseHandler,
        successfulResponseHandler: responseFormat.handler,
        abortSignal,
    });
}
184
/**
 * Turns a server-sent-event stream from the completion endpoint into a
 * queue of delta events.
 *
 * Each valid event pushes `{ type: "delta", fullDelta }`, where
 * `fullDelta.content` is the text accumulated so far, `fullDelta.delta`
 * is the text of this event, and `fullDelta.isComplete` mirrors the
 * event's `stop` flag. Any failure (invalid JSON, schema mismatch, or a
 * rejection from the stream parser) pushes a single
 * `{ type: "error", error }` and closes the queue.
 *
 * @param stream Response body stream to read events from.
 * @returns The queue; it is returned immediately while the stream is
 * processed in the background.
 */
async function createLlamaCppFullDeltaIterableQueue(stream) {
    const queue = new AsyncQueue_js_1.AsyncQueue();
    let content = "";
    // Set once the queue has been closed, so that nothing is pushed afterwards.
    let finished = false;
    const fail = (error) => {
        if (finished) {
            return;
        }
        finished = true;
        queue.push({ type: "error", error });
        queue.close();
    };
    // Process the stream asynchronously (no 'await' on purpose). The result
    // is wrapped in Promise.resolve so that a rejection from the parser is
    // reported through the queue instead of becoming an unhandled rejection
    // that leaves consumers waiting on a queue that never closes.
    Promise.resolve((0, parseEventSourceReadableStream_js_1.parseEventSourceReadableStream)({
        stream,
        callback: (event) => {
            if (finished || event.type !== "event") {
                return;
            }
            try {
                const json = secure_json_parse_1.default.parse(event.data);
                const parseResult = llamaCppTextStreamingResponseSchema.safeParse(json);
                if (!parseResult.success) {
                    fail(parseResult.error);
                    return;
                }
                const chunk = parseResult.data;
                content += chunk.content;
                queue.push({
                    type: "delta",
                    fullDelta: {
                        content,
                        isComplete: chunk.stop,
                        delta: chunk.content,
                    },
                });
                if (chunk.stop) {
                    finished = true;
                    queue.close();
                }
            }
            catch (error) {
                fail(error);
            }
        },
    })).catch(fail);
    return queue;
}
229
+ exports.LlamaCppTextGenerationResponseFormat = {
230
+ /**
231
+ * Returns the response as a JSON object.
232
+ */
233
+ json: {
234
+ stream: false,
235
+ handler: (0, postToApi_js_1.createJsonResponseHandler)(llamaCppTextGenerationResponseSchema),
236
+ },
237
+ /**
238
+ * Returns an async iterable over the full deltas (all choices, including full current state at time of event)
239
+ * of the response stream.
240
+ */
241
+ deltaIterable: {
242
+ stream: true,
243
+ handler: async ({ response }) => createLlamaCppFullDeltaIterableQueue(response.body),
244
+ },
245
+ };