node-llama-cpp 3.0.0-beta.14 → 3.0.0-beta.15

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (312) hide show
  1. package/README.md +1 -1
  2. package/dist/ChatWrapper.js +4 -0
  3. package/dist/ChatWrapper.js.map +1 -1
  4. package/dist/bindings/AddonTypes.d.ts +21 -0
  5. package/dist/bindings/Llama.d.ts +4 -0
  6. package/dist/bindings/Llama.js +45 -4
  7. package/dist/bindings/Llama.js.map +1 -1
  8. package/dist/bindings/getLlama.d.ts +19 -1
  9. package/dist/bindings/getLlama.js +15 -5
  10. package/dist/bindings/getLlama.js.map +1 -1
  11. package/dist/bindings/types.d.ts +15 -0
  12. package/dist/bindings/types.js +27 -2
  13. package/dist/bindings/types.js.map +1 -1
  14. package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
  15. package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
  16. package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
  17. package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +1 -1
  18. package/dist/bindings/utils/cloneLlamaCppRepo.js +3 -2
  19. package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -1
  20. package/dist/bindings/utils/compileLLamaCpp.js +2 -2
  21. package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
  22. package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
  23. package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
  24. package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
  25. package/dist/bindings/utils/resolveCustomCmakeOptions.js +2 -2
  26. package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -1
  27. package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
  28. package/dist/chatWrappers/AlpacaChatWrapper.js +9 -2
  29. package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
  30. package/dist/chatWrappers/ChatMLChatWrapper.js +12 -10
  31. package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
  32. package/dist/chatWrappers/FalconChatWrapper.d.ts +2 -1
  33. package/dist/chatWrappers/FalconChatWrapper.js +28 -11
  34. package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
  35. package/dist/chatWrappers/FunctionaryChatWrapper.js +59 -45
  36. package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
  37. package/dist/chatWrappers/GemmaChatWrapper.js +9 -7
  38. package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -1
  39. package/dist/chatWrappers/GeneralChatWrapper.d.ts +2 -1
  40. package/dist/chatWrappers/GeneralChatWrapper.js +35 -12
  41. package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
  42. package/dist/chatWrappers/LlamaChatWrapper.d.ts +7 -0
  43. package/dist/chatWrappers/LlamaChatWrapper.js +26 -8
  44. package/dist/chatWrappers/LlamaChatWrapper.js.map +1 -1
  45. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +73 -0
  46. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +355 -0
  47. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
  48. package/dist/{TemplateChatWrapper.d.ts → chatWrappers/generic/TemplateChatWrapper.d.ts} +6 -9
  49. package/dist/{TemplateChatWrapper.js → chatWrappers/generic/TemplateChatWrapper.js} +31 -69
  50. package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
  51. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +33 -0
  52. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
  53. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
  54. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
  55. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +206 -0
  56. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
  57. package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +67 -0
  58. package/dist/chatWrappers/utils/resolveChatWrapper.js +206 -0
  59. package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
  60. package/dist/cli/cli.js +1 -1
  61. package/dist/cli/cli.js.map +1 -1
  62. package/dist/cli/commands/ChatCommand.d.ts +7 -4
  63. package/dist/cli/commands/ChatCommand.js +150 -60
  64. package/dist/cli/commands/ChatCommand.js.map +1 -1
  65. package/dist/cli/commands/ClearCommand.d.ts +1 -1
  66. package/dist/cli/commands/ClearCommand.js +5 -5
  67. package/dist/cli/commands/ClearCommand.js.map +1 -1
  68. package/dist/cli/commands/CompleteCommand.d.ts +3 -2
  69. package/dist/cli/commands/CompleteCommand.js +88 -41
  70. package/dist/cli/commands/CompleteCommand.js.map +1 -1
  71. package/dist/cli/commands/InfillCommand.d.ts +3 -2
  72. package/dist/cli/commands/InfillCommand.js +88 -41
  73. package/dist/cli/commands/InfillCommand.js.map +1 -1
  74. package/dist/cli/commands/{InspectCommand.d.ts → inspect/InspectCommand.d.ts} +1 -4
  75. package/dist/cli/commands/inspect/InspectCommand.js +17 -0
  76. package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
  77. package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +10 -0
  78. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +108 -0
  79. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
  80. package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
  81. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +98 -0
  82. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
  83. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +14 -0
  84. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +577 -0
  85. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
  86. package/dist/cli/utils/ConsoleTable.d.ts +23 -0
  87. package/dist/cli/utils/ConsoleTable.js +86 -0
  88. package/dist/cli/utils/ConsoleTable.js.map +1 -0
  89. package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
  90. package/dist/cli/utils/printCommonInfoLines.js +70 -0
  91. package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
  92. package/dist/cli/utils/printInfoLine.d.ts +10 -0
  93. package/dist/cli/utils/printInfoLine.js +45 -0
  94. package/dist/cli/utils/printInfoLine.js.map +1 -0
  95. package/dist/cli/utils/resolveCommandGgufPath.d.ts +1 -0
  96. package/dist/cli/utils/resolveCommandGgufPath.js +6 -0
  97. package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
  98. package/dist/config.d.ts +2 -0
  99. package/dist/config.js +6 -0
  100. package/dist/config.js.map +1 -1
  101. package/dist/evaluator/LlamaChat/LlamaChat.js +13 -5
  102. package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
  103. package/dist/evaluator/LlamaCompletion.js +5 -3
  104. package/dist/evaluator/LlamaCompletion.js.map +1 -1
  105. package/dist/evaluator/LlamaContext/LlamaContext.d.ts +40 -3
  106. package/dist/evaluator/LlamaContext/LlamaContext.js +245 -100
  107. package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
  108. package/dist/evaluator/LlamaContext/types.d.ts +57 -6
  109. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
  110. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
  111. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
  112. package/dist/evaluator/LlamaContext/utils/{resolveBatchItemsPrioritizingStrategy.js → resolveBatchItemsPrioritizationStrategy.js} +4 -4
  113. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
  114. package/dist/evaluator/LlamaEmbeddingContext.d.ts +23 -2
  115. package/dist/evaluator/LlamaEmbeddingContext.js +4 -5
  116. package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -1
  117. package/dist/evaluator/LlamaModel.d.ts +64 -6
  118. package/dist/evaluator/LlamaModel.js +297 -8
  119. package/dist/evaluator/LlamaModel.js.map +1 -1
  120. package/dist/evaluator/TokenMeter.d.ts +54 -0
  121. package/dist/evaluator/TokenMeter.js +86 -0
  122. package/dist/evaluator/TokenMeter.js.map +1 -0
  123. package/dist/gguf/GgufInsights.d.ts +40 -0
  124. package/dist/gguf/GgufInsights.js +350 -0
  125. package/dist/gguf/GgufInsights.js.map +1 -0
  126. package/dist/gguf/consts.d.ts +3 -0
  127. package/dist/gguf/consts.js +8 -0
  128. package/dist/gguf/consts.js.map +1 -0
  129. package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
  130. package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
  131. package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
  132. package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
  133. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
  134. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
  135. package/dist/gguf/fileReaders/GgufFileReader.d.ts +33 -0
  136. package/dist/gguf/fileReaders/GgufFileReader.js +76 -0
  137. package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
  138. package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +17 -0
  139. package/dist/gguf/fileReaders/GgufFsFileReader.js +45 -0
  140. package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
  141. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +22 -0
  142. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +63 -0
  143. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
  144. package/dist/gguf/parser/GgufV2Parser.d.ts +19 -0
  145. package/dist/gguf/parser/GgufV2Parser.js +115 -0
  146. package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
  147. package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
  148. package/dist/gguf/parser/GgufV3Parser.js +4 -0
  149. package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
  150. package/dist/gguf/parser/parseGguf.d.ts +8 -0
  151. package/dist/gguf/parser/parseGguf.js +58 -0
  152. package/dist/gguf/parser/parseGguf.js.map +1 -0
  153. package/dist/gguf/readGgufFileInfo.d.ts +30 -0
  154. package/dist/gguf/readGgufFileInfo.js +37 -0
  155. package/dist/gguf/readGgufFileInfo.js.map +1 -0
  156. package/dist/gguf/types/GgufFileInfoTypes.d.ts +52 -0
  157. package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
  158. package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
  159. package/dist/gguf/types/GgufMetadataTypes.d.ts +330 -0
  160. package/dist/gguf/types/GgufMetadataTypes.js +86 -0
  161. package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
  162. package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
  163. package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
  164. package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
  165. package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
  166. package/dist/gguf/utils/GgufReadOffset.js +18 -0
  167. package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
  168. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +5 -0
  169. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +38 -0
  170. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
  171. package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
  172. package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
  173. package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
  174. package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
  175. package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
  176. package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
  177. package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
  178. package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
  179. package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
  180. package/dist/index.d.ts +13 -7
  181. package/dist/index.js +11 -6
  182. package/dist/index.js.map +1 -1
  183. package/dist/types.d.ts +1 -1
  184. package/dist/utils/InsufficientMemoryError.d.ts +3 -0
  185. package/dist/utils/InsufficientMemoryError.js +6 -0
  186. package/dist/utils/InsufficientMemoryError.js.map +1 -0
  187. package/dist/utils/LlamaText.d.ts +25 -10
  188. package/dist/utils/LlamaText.js +205 -23
  189. package/dist/utils/LlamaText.js.map +1 -1
  190. package/dist/utils/StopGenerationDetector.js +3 -1
  191. package/dist/utils/StopGenerationDetector.js.map +1 -1
  192. package/dist/utils/findBestOption.d.ts +4 -0
  193. package/dist/utils/findBestOption.js +15 -0
  194. package/dist/utils/findBestOption.js.map +1 -0
  195. package/dist/utils/getQueuedTokensBeforeStopTrigger.js +3 -3
  196. package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -1
  197. package/dist/utils/gitReleaseBundles.js +68 -1
  198. package/dist/utils/gitReleaseBundles.js.map +1 -1
  199. package/dist/utils/mergeUnionTypes.d.ts +4 -0
  200. package/dist/utils/parseModelFileName.d.ts +1 -0
  201. package/dist/utils/parseModelFileName.js +6 -1
  202. package/dist/utils/parseModelFileName.js.map +1 -1
  203. package/dist/utils/prettyPrintObject.d.ts +10 -1
  204. package/dist/utils/prettyPrintObject.js +57 -13
  205. package/dist/utils/prettyPrintObject.js.map +1 -1
  206. package/dist/utils/spawnCommand.js.map +1 -1
  207. package/dist/utils/tokenizeInput.d.ts +1 -1
  208. package/dist/utils/tokenizeInput.js +3 -3
  209. package/dist/utils/tokenizeInput.js.map +1 -1
  210. package/dist/utils/withOra.d.ts +1 -0
  211. package/dist/utils/withOra.js +2 -2
  212. package/dist/utils/withOra.js.map +1 -1
  213. package/llama/CMakeLists.txt +5 -5
  214. package/llama/addon.cpp +117 -5
  215. package/llama/binariesGithubRelease.json +1 -1
  216. package/llama/gitRelease.bundle +0 -0
  217. package/llama/gpuInfo/cuda-gpu-info.cu +21 -0
  218. package/llama/gpuInfo/cuda-gpu-info.h +3 -0
  219. package/llama/gpuInfo/metal-gpu-info.h +4 -1
  220. package/llama/gpuInfo/metal-gpu-info.mm +14 -1
  221. package/llama/gpuInfo/vulkan-gpu-info.cpp +20 -2
  222. package/llama/gpuInfo/vulkan-gpu-info.h +2 -0
  223. package/llama/llama.cpp.info.json +1 -1
  224. package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
  225. package/llamaBins/linux-arm64/_nlcBuildMetadata.json +1 -1
  226. package/llamaBins/linux-arm64/llama-addon.node +0 -0
  227. package/llamaBins/linux-armv7l/_nlcBuildMetadata.json +1 -1
  228. package/llamaBins/linux-armv7l/llama-addon.node +0 -0
  229. package/llamaBins/linux-x64/_nlcBuildMetadata.json +1 -1
  230. package/llamaBins/linux-x64/llama-addon.node +0 -0
  231. package/llamaBins/linux-x64-cuda/_nlcBuildMetadata.json +1 -1
  232. package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
  233. package/llamaBins/linux-x64-vulkan/_nlcBuildMetadata.json +1 -1
  234. package/llamaBins/linux-x64-vulkan/llama-addon.node +0 -0
  235. package/llamaBins/mac-arm64-metal/_nlcBuildMetadata.json +1 -1
  236. package/llamaBins/mac-arm64-metal/default.metallib +0 -0
  237. package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
  238. package/llamaBins/mac-x64/_nlcBuildMetadata.json +1 -1
  239. package/llamaBins/mac-x64/llama-addon.node +0 -0
  240. package/llamaBins/win-arm64/_nlcBuildMetadata.json +1 -0
  241. package/llamaBins/win-arm64/llama-addon.exp +0 -0
  242. package/llamaBins/win-arm64/llama-addon.lib +0 -0
  243. package/llamaBins/win-arm64/llama-addon.node +0 -0
  244. package/llamaBins/win-x64/_nlcBuildMetadata.json +1 -1
  245. package/llamaBins/win-x64/llama-addon.node +0 -0
  246. package/llamaBins/win-x64-cuda/_nlcBuildMetadata.json +1 -1
  247. package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
  248. package/llamaBins/win-x64-vulkan/_nlcBuildMetadata.json +1 -1
  249. package/llamaBins/win-x64-vulkan/llama-addon.node +0 -0
  250. package/package.json +8 -6
  251. package/dist/TemplateChatWrapper.js.map +0 -1
  252. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.d.ts +0 -33
  253. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js +0 -49
  254. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js.map +0 -1
  255. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
  256. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -63
  257. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
  258. package/dist/cli/commands/InspectCommand.js +0 -113
  259. package/dist/cli/commands/InspectCommand.js.map +0 -1
  260. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
  261. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
  262. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
  263. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
  264. package/dist/gguf/GGUFInsights.d.ts +0 -28
  265. package/dist/gguf/GGUFInsights.js +0 -58
  266. package/dist/gguf/GGUFInsights.js.map +0 -1
  267. package/dist/gguf/GGUFMetadata.d.ts +0 -19
  268. package/dist/gguf/GGUFMetadata.js +0 -38
  269. package/dist/gguf/GGUFMetadata.js.map +0 -1
  270. package/dist/gguf/errors/InvalidGGUFMagicError.d.ts +0 -3
  271. package/dist/gguf/errors/InvalidGGUFMagicError.js +0 -6
  272. package/dist/gguf/errors/InvalidGGUFMagicError.js.map +0 -1
  273. package/dist/gguf/errors/MetadataNotParsedYetError.d.ts +0 -3
  274. package/dist/gguf/errors/MetadataNotParsedYetError.js +0 -6
  275. package/dist/gguf/errors/MetadataNotParsedYetError.js.map +0 -1
  276. package/dist/gguf/errors/MissingNodeLlamaError.d.ts +0 -3
  277. package/dist/gguf/errors/MissingNodeLlamaError.js +0 -6
  278. package/dist/gguf/errors/MissingNodeLlamaError.js.map +0 -1
  279. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.d.ts +0 -5
  280. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js +0 -11
  281. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js.map +0 -1
  282. package/dist/gguf/errors/UnsupportedMetadataTypeError.d.ts +0 -4
  283. package/dist/gguf/errors/UnsupportedMetadataTypeError.js +0 -8
  284. package/dist/gguf/errors/UnsupportedMetadataTypeError.js.map +0 -1
  285. package/dist/gguf/ggufParser/GGUFParser.d.ts +0 -18
  286. package/dist/gguf/ggufParser/GGUFParser.js +0 -123
  287. package/dist/gguf/ggufParser/GGUFParser.js.map +0 -1
  288. package/dist/gguf/ggufParser/GGUFTypes.d.ts +0 -257
  289. package/dist/gguf/ggufParser/GGUFTypes.js +0 -2
  290. package/dist/gguf/ggufParser/GGUFTypes.js.map +0 -1
  291. package/dist/gguf/ggufParser/checkArchitecture.d.ts +0 -14
  292. package/dist/gguf/ggufParser/checkArchitecture.js +0 -74
  293. package/dist/gguf/ggufParser/checkArchitecture.js.map +0 -1
  294. package/dist/gguf/ggufParser/stream/GGUFBaseStream.d.ts +0 -38
  295. package/dist/gguf/ggufParser/stream/GGUFBaseStream.js +0 -83
  296. package/dist/gguf/ggufParser/stream/GGUFBaseStream.js.map +0 -1
  297. package/dist/gguf/ggufParser/stream/GGUFFetchStream.d.ts +0 -14
  298. package/dist/gguf/ggufParser/stream/GGUFFetchStream.js +0 -35
  299. package/dist/gguf/ggufParser/stream/GGUFFetchStream.js.map +0 -1
  300. package/dist/gguf/ggufParser/stream/GGUFReadStream.d.ts +0 -15
  301. package/dist/gguf/ggufParser/stream/GGUFReadStream.js +0 -40
  302. package/dist/gguf/ggufParser/stream/GGUFReadStream.js.map +0 -1
  303. package/dist/utils/parseModelTypeDescription.d.ts +0 -6
  304. package/dist/utils/parseModelTypeDescription.js +0 -9
  305. package/dist/utils/parseModelTypeDescription.js.map +0 -1
  306. package/dist/utils/resolveChatWrapper.d.ts +0 -4
  307. package/dist/utils/resolveChatWrapper.js +0 -16
  308. package/dist/utils/resolveChatWrapper.js.map +0 -1
  309. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
  310. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
  311. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
  312. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
package/llama/addon.cpp CHANGED
@@ -9,7 +9,7 @@
9
9
  #include "llama.h"
10
10
  #include "napi.h"
11
11
 
12
- #ifdef GPU_INFO_USE_CUBLAS
12
+ #ifdef GPU_INFO_USE_CUDA
13
13
  # include "gpuInfo/cuda-gpu-info.h"
14
14
  #endif
15
15
  #ifdef GPU_INFO_USE_VULKAN
@@ -121,7 +121,7 @@ std::string addon_model_token_to_piece(const struct llama_model* model, llama_to
121
121
  return std::string(result.data(), result.size());
122
122
  }
123
123
 
124
- #ifdef GPU_INFO_USE_CUBLAS
124
+ #ifdef GPU_INFO_USE_CUDA
125
125
  void logCudaError(const char* message) {
126
126
  addonLlamaCppLogCallback(GGML_LOG_LEVEL_ERROR, (std::string("CUDA error: ") + std::string(message)).c_str(), nullptr);
127
127
  }
@@ -136,7 +136,7 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
136
136
  uint64_t total = 0;
137
137
  uint64_t used = 0;
138
138
 
139
- #ifdef GPU_INFO_USE_CUBLAS
139
+ #ifdef GPU_INFO_USE_CUDA
140
140
  size_t cudaDeviceTotal = 0;
141
141
  size_t cudaDeviceUsed = 0;
142
142
  bool cudeGetInfoSuccess = gpuInfoGetTotalCudaDevicesInfo(&cudaDeviceTotal, &cudaDeviceUsed, logCudaError);
@@ -161,7 +161,7 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
161
161
  #ifdef GPU_INFO_USE_METAL
162
162
  uint64_t metalDeviceTotal = 0;
163
163
  uint64_t metalDeviceUsed = 0;
164
- get_metal_gpu_info(&metalDeviceTotal, &metalDeviceUsed);
164
+ getMetalGpuInfo(&metalDeviceTotal, &metalDeviceUsed);
165
165
 
166
166
  total += metalDeviceTotal;
167
167
  used += metalDeviceUsed;
@@ -174,8 +174,34 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
174
174
  return result;
175
175
  }
176
176
 
177
+ Napi::Value getGpuDeviceInfo(const Napi::CallbackInfo& info) {
178
+ std::vector<std::string> deviceNames;
179
+
180
+ #ifdef GPU_INFO_USE_CUDA
181
+ gpuInfoGetCudaDeviceNames(&deviceNames, logCudaError);
182
+ #endif
183
+
184
+ #ifdef GPU_INFO_USE_VULKAN
185
+ gpuInfoGetVulkanDeviceNames(&deviceNames, logVulkanWarning);
186
+ #endif
187
+
188
+ #ifdef GPU_INFO_USE_METAL
189
+ getMetalGpuDeviceNames(&deviceNames);
190
+ #endif
191
+
192
+ Napi::Object result = Napi::Object::New(info.Env());
193
+
194
+ Napi::Array deviceNamesNapiArray = Napi::Array::New(info.Env(), deviceNames.size());
195
+ for (size_t i = 0; i < deviceNames.size(); ++i) {
196
+ deviceNamesNapiArray[i] = Napi::String::New(info.Env(), deviceNames[i]);
197
+ }
198
+ result.Set("deviceNames", deviceNamesNapiArray);
199
+
200
+ return result;
201
+ }
202
+
177
203
  Napi::Value getGpuType(const Napi::CallbackInfo& info) {
178
- #ifdef GPU_INFO_USE_CUBLAS
204
+ #ifdef GPU_INFO_USE_CUDA
179
205
  return Napi::String::New(info.Env(), "cuda");
180
206
  #endif
181
207
 
@@ -507,6 +533,16 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
507
533
 
508
534
  return Napi::Number::From(info.Env(), int32_t(tokenType));
509
535
  }
536
+ Napi::Value GetVocabularyType(const Napi::CallbackInfo& info) {
537
+ if (disposed) {
538
+ Napi::Error::New(info.Env(), "Model is disposed").ThrowAsJavaScriptException();
539
+ return info.Env().Undefined();
540
+ }
541
+
542
+ auto vocabularyType = llama_vocab_type(model);
543
+
544
+ return Napi::Number::From(info.Env(), int32_t(vocabularyType));
545
+ }
510
546
  Napi::Value ShouldPrependBosToken(const Napi::CallbackInfo& info) {
511
547
  const int addBos = llama_add_bos_token(model);
512
548
 
@@ -515,6 +551,10 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
515
551
  return Napi::Boolean::New(info.Env(), shouldPrependBos);
516
552
  }
517
553
 
554
+ Napi::Value GetModelSize(const Napi::CallbackInfo& info) {
555
+ return Napi::Number::From(info.Env(), llama_model_size(model));
556
+ }
557
+
518
558
  static void init(Napi::Object exports) {
519
559
  exports.Set(
520
560
  "AddonModel",
@@ -540,7 +580,9 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
540
580
  InstanceMethod("eotToken", &AddonModel::EotToken),
541
581
  InstanceMethod("getTokenString", &AddonModel::GetTokenString),
542
582
  InstanceMethod("getTokenType", &AddonModel::GetTokenType),
583
+ InstanceMethod("getVocabularyType", &AddonModel::GetVocabularyType),
543
584
  InstanceMethod("shouldPrependBosToken", &AddonModel::ShouldPrependBosToken),
585
+ InstanceMethod("getModelSize", &AddonModel::GetModelSize),
544
586
  InstanceMethod("dispose", &AddonModel::Dispose),
545
587
  }
546
588
  )
@@ -822,6 +864,10 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
822
864
  context_params.n_ubatch = context_params.n_batch; // the batch queue is managed in the JS side, so there's no need for managing it on the C++ side
823
865
  }
824
866
 
867
+ if (options.Has("sequences")) {
868
+ context_params.n_seq_max = options.Get("sequences").As<Napi::Number>().Uint32Value();
869
+ }
870
+
825
871
  if (options.Has("embeddings")) {
826
872
  context_params.embeddings = options.Get("embeddings").As<Napi::Boolean>().Value();
827
873
  }
@@ -1039,6 +1085,15 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
1039
1085
  return result;
1040
1086
  }
1041
1087
 
1088
+ Napi::Value GetStateSize(const Napi::CallbackInfo& info) {
1089
+ if (disposed) {
1090
+ Napi::Error::New(info.Env(), "Context is disposed").ThrowAsJavaScriptException();
1091
+ return info.Env().Undefined();
1092
+ }
1093
+
1094
+ return Napi::Number::From(info.Env(), llama_get_state_size(ctx));
1095
+ }
1096
+
1042
1097
  Napi::Value PrintTimings(const Napi::CallbackInfo& info) {
1043
1098
  llama_print_timings(ctx);
1044
1099
  llama_reset_timings(ctx);
@@ -1063,6 +1118,7 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
1063
1118
  InstanceMethod("sampleToken", &AddonContext::SampleToken),
1064
1119
  InstanceMethod("acceptGrammarEvaluationStateToken", &AddonContext::AcceptGrammarEvaluationStateToken),
1065
1120
  InstanceMethod("getEmbedding", &AddonContext::GetEmbedding),
1121
+ InstanceMethod("getStateSize", &AddonContext::GetStateSize),
1066
1122
  InstanceMethod("printTimings", &AddonContext::PrintTimings),
1067
1123
  InstanceMethod("dispose", &AddonContext::Dispose),
1068
1124
  }
@@ -1444,6 +1500,55 @@ Napi::Value systemInfo(const Napi::CallbackInfo& info) {
1444
1500
  return Napi::String::From(info.Env(), llama_print_system_info());
1445
1501
  }
1446
1502
 
1503
+ Napi::Value addonGetSupportsGpuOffloading(const Napi::CallbackInfo& info) {
1504
+ return Napi::Boolean::New(info.Env(), llama_supports_gpu_offload());
1505
+ }
1506
+
1507
+ Napi::Value addonGetSupportsMmap(const Napi::CallbackInfo& info) {
1508
+ return Napi::Boolean::New(info.Env(), llama_supports_mmap());
1509
+ }
1510
+
1511
+ Napi::Value addonGetSupportsMlock(const Napi::CallbackInfo& info) {
1512
+ return Napi::Boolean::New(info.Env(), llama_supports_mlock());
1513
+ }
1514
+
1515
+ Napi::Value addonGetBlockSizeForGgmlType(const Napi::CallbackInfo& info) {
1516
+ const int ggmlType = info[0].As<Napi::Number>().Int32Value();
1517
+
1518
+ if (ggmlType < 0 || ggmlType > GGML_TYPE_COUNT) {
1519
+ return info.Env().Undefined();
1520
+ }
1521
+
1522
+ const auto blockSize = ggml_blck_size(static_cast<ggml_type>(ggmlType));
1523
+
1524
+ return Napi::Number::New(info.Env(), blockSize);
1525
+ }
1526
+
1527
+ Napi::Value addonGetTypeSizeForGgmlType(const Napi::CallbackInfo& info) {
1528
+ const int ggmlType = info[0].As<Napi::Number>().Int32Value();
1529
+
1530
+ if (ggmlType < 0 || ggmlType > GGML_TYPE_COUNT) {
1531
+ return info.Env().Undefined();
1532
+ }
1533
+
1534
+ const auto typeSize = ggml_type_size(static_cast<ggml_type>(ggmlType));
1535
+
1536
+ return Napi::Number::New(info.Env(), typeSize);
1537
+ }
1538
+
1539
+ Napi::Value addonGetConsts(const Napi::CallbackInfo& info) {
1540
+ Napi::Object consts = Napi::Object::New(info.Env());
1541
+ consts.Set("ggmlMaxDims", Napi::Number::New(info.Env(), GGML_MAX_DIMS));
1542
+ consts.Set("ggmlTypeF16Size", Napi::Number::New(info.Env(), ggml_type_size(GGML_TYPE_F16)));
1543
+ consts.Set("ggmlTypeF32Size", Napi::Number::New(info.Env(), ggml_type_size(GGML_TYPE_F32)));
1544
+ consts.Set("ggmlTensorOverhead", Napi::Number::New(info.Env(), ggml_tensor_overhead()));
1545
+ consts.Set("llamaMaxRngState", Napi::Number::New(info.Env(), LLAMA_MAX_RNG_STATE));
1546
+ consts.Set("llamaPosSize", Napi::Number::New(info.Env(), sizeof(llama_pos)));
1547
+ consts.Set("llamaSeqIdSize", Napi::Number::New(info.Env(), sizeof(llama_seq_id)));
1548
+
1549
+ return consts;
1550
+ }
1551
+
1447
1552
  int addonGetGgmlLogLevelNumber(ggml_log_level level) {
1448
1553
  switch (level) {
1449
1554
  case GGML_LOG_LEVEL_ERROR: return 2;
@@ -1693,9 +1798,16 @@ static void addonFreeLlamaBackend(Napi::Env env, int* data) {
1693
1798
  Napi::Object registerCallback(Napi::Env env, Napi::Object exports) {
1694
1799
  exports.DefineProperties({
1695
1800
  Napi::PropertyDescriptor::Function("systemInfo", systemInfo),
1801
+ Napi::PropertyDescriptor::Function("getSupportsGpuOffloading", addonGetSupportsGpuOffloading),
1802
+ Napi::PropertyDescriptor::Function("getSupportsMmap", addonGetSupportsMmap),
1803
+ Napi::PropertyDescriptor::Function("getSupportsMlock", addonGetSupportsMlock),
1804
+ Napi::PropertyDescriptor::Function("getBlockSizeForGgmlType", addonGetBlockSizeForGgmlType),
1805
+ Napi::PropertyDescriptor::Function("getTypeSizeForGgmlType", addonGetTypeSizeForGgmlType),
1806
+ Napi::PropertyDescriptor::Function("getConsts", addonGetConsts),
1696
1807
  Napi::PropertyDescriptor::Function("setLogger", setLogger),
1697
1808
  Napi::PropertyDescriptor::Function("setLoggerLogLevel", setLoggerLogLevel),
1698
1809
  Napi::PropertyDescriptor::Function("getGpuVramInfo", getGpuVramInfo),
1810
+ Napi::PropertyDescriptor::Function("getGpuDeviceInfo", getGpuDeviceInfo),
1699
1811
  Napi::PropertyDescriptor::Function("getGpuType", getGpuType),
1700
1812
  Napi::PropertyDescriptor::Function("init", addonInit),
1701
1813
  Napi::PropertyDescriptor::Function("dispose", addonDispose),
@@ -1,3 +1,3 @@
1
1
  {
2
- "release": "b2440"
2
+ "release": "b2608"
3
3
  }
Binary file
@@ -1,4 +1,6 @@
1
1
  #include <stddef.h>
2
+ #include <vector>
3
+ #include <string>
2
4
 
3
5
  #if defined(GPU_INFO_USE_HIPBLAS)
4
6
  #include <hip/hip_runtime.h>
@@ -97,3 +99,22 @@ bool gpuInfoGetTotalCudaDevicesInfo(size_t * total, size_t * used, gpuInfoCudaEr
97
99
 
98
100
  return true;
99
101
  }
102
+
103
+ void gpuInfoGetCudaDeviceNames(std::vector<std::string> * deviceNames, gpuInfoCudaErrorLogCallback_t errorLogCallback) {
104
+ int deviceCount = gpuInfoGetCudaDeviceCount(errorLogCallback);
105
+
106
+ if (deviceCount < 0) {
107
+ return;
108
+ }
109
+
110
+ for (int i = 0; i < deviceCount; i++) {
111
+ cudaDeviceProp prop;
112
+ auto getDevicePropertiesResult = cudaGetDeviceProperties(&prop, i);
113
+
114
+ if (getDevicePropertiesResult != cudaSuccess) {
115
+ errorLogCallback(cudaGetErrorString(getDevicePropertiesResult));
116
+ } else {
117
+ (*deviceNames).push_back(std::string(prop.name));
118
+ }
119
+ }
120
+ }
@@ -1,7 +1,10 @@
1
1
  #pragma once
2
2
 
3
3
  #include <stddef.h>
4
+ #include <vector>
5
+ #include <string>
4
6
 
5
7
  typedef void (*gpuInfoCudaErrorLogCallback_t)(const char* message);
6
8
 
7
9
  bool gpuInfoGetTotalCudaDevicesInfo(size_t * total, size_t * used, gpuInfoCudaErrorLogCallback_t errorLogCallback);
10
+ void gpuInfoGetCudaDeviceNames(std::vector<std::string> * deviceNames, gpuInfoCudaErrorLogCallback_t errorLogCallback);
@@ -1,5 +1,8 @@
1
1
  #pragma once
2
2
 
3
3
  #include <stdint.h>
4
+ #include <string>
5
+ #include <vector>
4
6
 
5
- void get_metal_gpu_info(uint64_t * total, uint64_t * used);
7
+ void getMetalGpuInfo(uint64_t * total, uint64_t * used);
8
+ void getMetalGpuDeviceNames(std::vector<std::string> * deviceNames);
@@ -1,7 +1,9 @@
1
1
  #include <stdint.h>
2
+ #include <vector>
3
+ #include <string>
2
4
  #import <Metal/Metal.h>
3
5
 
4
- void get_metal_gpu_info(uint64_t * total, uint64_t * used) {
6
+ void getMetalGpuInfo(uint64_t * total, uint64_t * used) {
5
7
  id<MTLDevice> device = MTLCreateSystemDefaultDevice();
6
8
 
7
9
  if (device) {
@@ -15,3 +17,14 @@ void get_metal_gpu_info(uint64_t * total, uint64_t * used) {
15
17
  [device release];
16
18
  device = nil;
17
19
  }
20
+
21
+ void getMetalGpuDeviceNames(std::vector<std::string> * deviceNames) {
22
+ NSArray<id<MTLDevice>> *devices = MTLCopyAllDevices();
23
+
24
+ for (id<MTLDevice> device in devices) {
25
+ (*deviceNames).push_back(std::string(([NSString stringWithUTF8String:device.name.UTF8String]).UTF8String));
26
+ }
27
+
28
+ [devices release];
29
+ devices = nil;
30
+ }
@@ -1,10 +1,11 @@
1
1
  #include <stddef.h>
2
+ #include <vector>
2
3
 
3
4
  #include <vulkan/vulkan.hpp>
4
5
 
5
6
  typedef void (*gpuInfoVulkanWarningLogCallback_t)(const char* message);
6
7
 
7
- bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
8
+ static bool enumerateVulkanDevices(size_t* total, size_t* used, bool addDeviceNames, std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
8
9
  vk::ApplicationInfo appInfo("node-llama-cpp GPU info", 1, "llama.cpp", 1, VK_API_VERSION_1_2);
9
10
  vk::InstanceCreateInfo createInfo(vk::InstanceCreateFlags(), &appInfo, {}, {});
10
11
  vk::Instance instance = vk::createInstance(createInfo);
@@ -41,8 +42,14 @@ bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkan
41
42
 
42
43
  for (uint32_t i = 0; i < memProps.memoryHeapCount; ++i) {
43
44
  if (memProps.memoryHeaps[i].flags & vk::MemoryHeapFlagBits::eDeviceLocal) {
44
- totalMem += memProps.memoryHeaps[i].size;
45
+ const auto size = memProps.memoryHeaps[i].size;
46
+ totalMem += size;
45
47
  usedMem += memoryBudgetProperties.heapUsage[i];
48
+
49
+ if (size > 0 && addDeviceNames) {
50
+ (*deviceNames).push_back(std::string(deviceProps.deviceName.data()));
51
+ }
52
+
46
53
  break;
47
54
  }
48
55
  }
@@ -63,3 +70,14 @@ bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkan
63
70
  *used = usedMem;
64
71
  return true;
65
72
  }
73
+
74
+ bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
75
+ return enumerateVulkanDevices(total, used, false, nullptr, warningLogCallback);
76
+ }
77
+
78
+ bool gpuInfoGetVulkanDeviceNames(std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
79
+ size_t vulkanDeviceTotal = 0;
80
+ size_t vulkanDeviceUsed = 0;
81
+
82
+ return enumerateVulkanDevices(&vulkanDeviceTotal, &vulkanDeviceUsed, true, deviceNames, warningLogCallback);
83
+ }
@@ -1,7 +1,9 @@
1
1
  #pragma once
2
2
 
3
3
  #include <stddef.h>
4
+ #include <vector>
4
5
 
5
6
  typedef void (*gpuInfoVulkanWarningLogCallback_t)(const char* message);
6
7
 
7
8
  bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback);
9
+ bool gpuInfoGetVulkanDeviceNames(std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback);
@@ -1,4 +1,4 @@
1
1
  {
2
- "tag": "b2440",
2
+ "tag": "b2608",
3
3
  "llamaCppGithubRepo": "ggerganov/llama.cpp"
4
4
  }
@@ -0,0 +1,41 @@
1
+ set(CMAKE_SYSTEM_NAME Windows)
2
+ set(CMAKE_SYSTEM_PROCESSOR ARM64)
3
+
4
+ # Look for cl.exe in the Visual Studio installation directories
5
+ set(PROGRAMFILES "$ENV{ProgramFiles}")
6
+ set(PROGRAMFILES_X86 "$ENV{ProgramFiles\(x86\)}")
7
+
8
+ set(VS_INSTALL_PATHS
9
+ "${PROGRAMFILES_X86}/Microsoft Visual Studio"
10
+ "${PROGRAMFILES}/Microsoft Visual Studio"
11
+ "C:/Program Files (x86)/Microsoft Visual Studio"
12
+ "C:/Program Files/Microsoft Visual Studio"
13
+ )
14
+ foreach(PATH IN LISTS VS_INSTALL_PATHS)
15
+ if(CL_EXE_PATH)
16
+ break()
17
+ endif()
18
+
19
+ file(GLOB_RECURSE FOUND_CL_EXE "${PATH}/*/VC/Tools/MSVC/*/bin/Hostx64/arm64/cl.exe")
20
+ if(FOUND_CL_EXE)
21
+ list(GET FOUND_CL_EXE 0 CL_EXE_PATH)
22
+ break()
23
+ endif()
24
+
25
+ if(CL_EXE_PATH)
26
+ break()
27
+ endif()
28
+
29
+ file(GLOB_RECURSE FOUND_CL_EXE "${PATH}/**/*/VC/Tools/MSVC/*/bin/Hostx64/arm64/cl.exe")
30
+ if(FOUND_CL_EXE)
31
+ list(GET FOUND_CL_EXE 0 CL_EXE_PATH)
32
+ break()
33
+ endif()
34
+ endforeach()
35
+
36
+ if(NOT CL_EXE_PATH)
37
+ message(FATAL_ERROR "cl.exe not found for ARM architecture.")
38
+ else()
39
+ set(CMAKE_C_COMPILER "${CL_EXE_PATH}")
40
+ set(CMAKE_CXX_COMPILER "${CL_EXE_PATH}")
41
+ endif()
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"armv7l","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"armv7l","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"arm64","gpu":"metal","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"arm64","gpu":"metal","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
Binary file
@@ -0,0 +1 @@
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
Binary file
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
@@ -1 +1 @@
1
- {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2440"}}}
1
+ {"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "node-llama-cpp",
3
- "version": "3.0.0-beta.14",
3
+ "version": "3.0.0-beta.15",
4
4
  "description": "Run AI models locally on your machine with node.js bindings for llama.cpp. Force a JSON schema on the model output on the generation level",
5
5
  "main": "dist/index.js",
6
6
  "type": "module",
@@ -120,7 +120,7 @@
120
120
  "@types/cli-progress": "^3.11.0",
121
121
  "@types/cross-spawn": "^6.0.2",
122
122
  "@types/fs-extra": "^11.0.4",
123
- "@types/node": "^20.8.4",
123
+ "@types/node": "^20.11.29",
124
124
  "@types/proper-lockfile": "^4.1.4",
125
125
  "@types/semver": "^7.5.8",
126
126
  "@types/uuid": "^9.0.2",
@@ -128,8 +128,8 @@
128
128
  "@types/yargs": "^17.0.24",
129
129
  "@typescript-eslint/eslint-plugin": "^6.3.0",
130
130
  "@typescript-eslint/parser": "^6.3.0",
131
- "@vitest/coverage-v8": "^1.2.2",
132
- "@vitest/ui": "^1.2.2",
131
+ "@vitest/coverage-v8": "^1.4.0",
132
+ "@vitest/ui": "^1.4.0",
133
133
  "eslint": "^8.46.0",
134
134
  "eslint-plugin-import": "^2.28.0",
135
135
  "eslint-plugin-jsdoc": "^46.9.0",
@@ -146,10 +146,11 @@
146
146
  "typescript": "^5.2.2",
147
147
  "vite-node": "^1.4.0",
148
148
  "vitepress": "1.0.0-rc.22",
149
- "vitest": "^1.2.2",
149
+ "vitest": "^1.4.0",
150
150
  "zx": "^7.2.3"
151
151
  },
152
152
  "dependencies": {
153
+ "@huggingface/jinja": "^0.2.2",
153
154
  "async-retry": "^1.3.3",
154
155
  "bytes": "^3.1.2",
155
156
  "chalk": "^5.3.0",
@@ -160,7 +161,7 @@
160
161
  "cross-spawn": "^7.0.3",
161
162
  "env-var": "^7.3.1",
162
163
  "fs-extra": "^11.2.0",
163
- "lifecycle-utils": "^1.4.0",
164
+ "lifecycle-utils": "^1.4.1",
164
165
  "log-symbols": "^5.1.0",
165
166
  "node-addon-api": "^7.0.0",
166
167
  "octokit": "^3.1.0",
@@ -168,6 +169,7 @@
168
169
  "proper-lockfile": "^4.1.2",
169
170
  "semver": "^7.6.0",
170
171
  "simple-git": "^3.19.1",
172
+ "slice-ansi": "^7.1.0",
171
173
  "strip-ansi": "^7.1.0",
172
174
  "uuid": "^9.0.0",
173
175
  "which": "^4.0.0",
@@ -1 +0,0 @@
1
- {"version":3,"file":"TemplateChatWrapper.js","sourceRoot":"","sources":["../src/TemplateChatWrapper.ts"],"names":[],"mappings":"AACA,OAAO,EAAC,mBAAmB,EAAE,SAAS,EAAkB,YAAY,EAAC,MAAM,sBAAsB,CAAC;AAClG,OAAO,EAAC,WAAW,EAAsB,MAAM,kBAAkB,CAAC;AAClE,OAAO,EAAC,iBAAiB,EAAC,MAAM,8BAA8B,CAAC;AAY/D;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,MAAM,OAAO,mBAAoB,SAAQ,WAAW;IAChC,WAAW,GAAG,UAAU,CAAC;IAChB,QAAQ,CAAsB;IAEvC,QAAQ,CAAe;IACvB,eAAe,CAAsB;IACrC,aAAa,CAAS;IACtB,YAAY,CAAS;IACrB,cAAc,CAAS;IACvB,iCAAiC,CAAU;IAE3D,gBAAgB,CAAkB,mBAAmB,CAAuC;IAC5F,gBAAgB,CAAkB,0BAA0B,CAA8C;IAE1G,YAAmB,EACf,QAAQ,EACR,eAAe,EACf,aAAa,EACb,YAAY,EACZ,cAAc,GAAG,QAAQ,EACzB,2BAA2B,EAC3B,iCAAiC,GAAG,IAAI,EACf;QACzB,KAAK,EAAE,CAAC;QAER,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,eAAe,GAAG,eAAe,CAAC;QACvC,IAAI,CAAC,aAAa,GAAG,aAAa,CAAC;QACnC,IAAI,CAAC,YAAY,GAAG,YAAY,CAAC;QACjC,IAAI,CAAC,cAAc,GAAG,cAAc,CAAC;QACrC,IAAI,CAAC,iCAAiC,GAAG,iCAAiC,CAAC;QAE3E,IAAI,CAAC,mBAAmB,GAAG,iBAAiB,CAAC,QAAQ,CAAC,CAAC;QACvD,IAAI,CAAC,0BAA0B,GAAG,wBAAwB,CAAC,eAAe,CAAC,CAAC;QAE5E,IAAI,CAAC,QAAQ,GAAG;YACZ,GAAG,KAAK,CAAC,QAAQ;YACjB,SAAS,EAAE,gCAAgC,CAAC,2BAA2B,CAAC,IAAI,WAAW,CAAC,cAAc,CAAC,SAAS;SACnH,CAAC;IACN,CAAC;IAEe,mBAAmB,CAAC,OAAmC,EAAE,EAAC,kBAAkB,EAAE,sBAAsB,KAGhH,EAAE;QAIF,MAAM,oBAAoB,GAAG,IAAI,CAAC,2CAA2C,CAAC,OAAO,EAAE,kBAAkB,EAAE;YACvG,cAAc,EAAE,sBAAsB;SACzC,CAAC,CAAC;QAEH,MAAM,WAAW,GAIZ,EAAE,CAAC;QAER,IAAI,WAAW,GAAa,EAAE,CAAC;QAC/B,IAAI,SAAS,GAAa,EAAE,CAAC;QAC7B,IAAI,UAAU,GAAa,EAAE,CAAC;QAC9B,IAAI,qBAAqB,GAAuC,IAAI,CAAC;QAErE,SAAS,KAAK;YACV,IAAI,WAAW,CAAC,MAAM,GAAG,CAAC,IAAI,SAAS,CAAC,MAAM,GAAG,CAAC,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC;gBACvE,WAAW,CAAC,IAAI,CAAC;oBACb,MAAM,EAAE,WAAW,CAAC,IAAI,CAAC,MAAM,CAAC;oBAChC,IAAI,EAAE,SAAS,CAAC,IAAI,CAAC,MAAM,CAAC;oBAC5B,KAAK,EAAE,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC;iBACjC,CAAC,CAAC;YAEP,WAAW,GAAG,EAAE,CAAC;YACjB,SAAS,GAAG,EAAE,CAAC;YACf,UAAU,GAAG,EAAE,CAAC;QACpB,CAAC;QAED,MAAM,cAAc,GAAG,CAAC,IAAiC,EAAE,IAAY,EAAE,MAAsB,EAAE,EAAE;YAC/F,MAAM,EAAC,cAAc,EAAE,aAAa,EAAE,aAAa,EAAC,GAAG,IAAI,CAAC,0BAA0B,CAAC;YACvF,OAAO,SAAS,CAAC;gBACb,IAAI,YAAY,CAAC,CAAC,MAAM,IAAI,EAAE,CAAC,GAAG,cAAc,GAAG,IAAI,GAAG,aAAa,CAAC;gBACxE,IAAI;gBACJ,IAAI,YAAY,CAAC,aAAa,CAAC;aAClC,CAAC,CAAC;QACP,CAAC,CAAC;QAEF,KAAK,MAAM,IAAI,IAAI,oBAAoB,EAAE;YACrC,IAAI,IAAI,CAAC,IAAI,KAAK,QAAQ,EAAE;gBACxB,IAAI,CAAC,IAAI,CAAC,iCAAiC,IAAI,qBAAqB,KAAK,QAAQ;oBAC7E,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,QAAQ,CAAC;gBACjC,WAAW,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;aAC/B;iBAAM,IAAI,IAAI,CAAC,IAAI,KAAK,MAAM,EAAE;gBAC7B,IAAI,CAAC,IAAI,CAAC,iCAAiC,IAAI,CAAC,qBAAqB,KAAK,QAAQ,IAAI,qBAAqB,KAAK,MAAM,CAAC;oBACnH,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,MAAM,CAAC;gBAC/B,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;aAC7B;iBAAM,IAAI,IAAI,CAAC,IAAI,KAAK,OAAO,EAAE;gBAC9B,IAAI,CAAC,IAAI,CAAC,iCAAiC;oBACvC,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,OAAO,CAAC;gBAChC,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,yBAAyB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC;aAClE;SACJ;QAED,KAAK,EAAE,CAAC;QAER,MAAM,WAAW,GAAG,SAAS,CACzB,WAAW,CAAC,GAAG,CAAC,CAAC,EAAC,MAAM,EAAE,IAAI,EAAE,KAAK,EAAC,EAAE,KAAK,EAAE,EAAE;YAC7C,MAAM,WAAW,GAAG,KAAK,KAAK,CAAC,CAAC;YAChC,MAAM,UAAU,GAAG,KAAK,KAAK,WAAW,CAAC,MAAM,GAAG,CAAC,CAAC;YAEpD,MAAM,GAAG,GAAG,SAAS,CAAC;gBAClB,WAAW;oBACP,CAAC,CAAC,MAAM,CAAC,MAAM,KAAK,CAAC;wBACjB,CAAC,CAAC,IAAI,YAAY,CAAC,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,IAAI,EAAE,CAAC,GAAG,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;wBAChH,CAAC,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,IAAI,IAAI;4BACjD,CAAC,CAAC,SAAS,CAAC;gCACR,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,CAAC;gCAC7D,MAAM;gCACN,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;6BAC3D,CAAC;4BACF,CAAC,CAAC,cAAc,CAAC,QAAQ,EAAE,MAAM,EAAE,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;oBAClF,CAAC,CAAC,MAAM,CAAC,MAAM,KAAK,CAAC;wBACjB,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;wBACf,CAAC,CAAC,cAAc,CAAC,QAAQ,EAAE,MAAM,CAAC;gBAG1C,IAAI,CAAC,MAAM,KAAK,CAAC;oBACb,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;oBACf,CAAC,CAAC,cAAc,CAAC,MAAM,EAAE,IAAI,CAAC;gBAElC,KAAK,CAAC,MAAM,KAAK,CAAC;oBACd,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;oBACf,CAAC,CAAC,CAAC,UAAU;wBACT,CAAC,CAAC,cAAc,CAAC,OAAO,EAAE,KAAK,CAAC;wBAChC,CAAC,CAAC,SAAS,CAAC;4BACR,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC;4BAC3D,KAAK;yBACR,CAAC;aACb,CAAC,CAAC;YAEH,OAAO,SAAS,CACZ,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE;gBAC7B,IAAI,KAAK,YAAY,YAAY,EAAE;oBAC/B,MAAM,QAAQ,GAAG,GAAG,CAAC,GAAG,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;oBAErC,IAAI,QAAQ,IAAI,IAAI,IAAI,CAAC,CAAC,QAAQ,YAAY,YAAY,CAAC;wBACvD,OAAO,GAAG,CAAC,MAAM,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC;oBAE/B,OAAO,GAAG,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC;wBAC3B,IAAI,YAAY,CAAC,QAAQ,CAAC,KAAK,GAAG,KAAK,CAAC,KAAK,CAAC;qBACjD,CAAC,CAAC;iBACN;gBAED,OAAO,GAAG,CAAC,MAAM,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC;YAC/B,CAAC,EAAE,EAAsB,CAAC,CAC7B,CAAC;QACN,CAAC,CAAC,CACL,CAAC;QAEF,OAAO;YACH,WAAW;YACX,sBAAsB,EAAE;gBACpB,SAAS,CAAC,IAAI,mBAAmB,CAAC,KAAK,CAAC,CAAC;gBACzC,SAAS,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC;gBACpD,SAAS,CAAC,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC,CAAC;aACzE;SACJ,CAAC;IACN,CAAC;CACJ;AAUD,SAAS,gCAAgC,CAAC,QAAiD;IACvF,IAAI,QAAQ,IAAI,IAAI;QAChB,OAAO,IAAI,CAAC;IAEhB,MAAM,CAAC,oBAAoB,EAAE,0BAA0B,CAAC,GAAG,QAAQ,CAAC;IAEpE,IAAI,oBAAoB,IAAI,IAAI,IAAI,0BAA0B,IAAI,IAAI;QAClE,MAAM,IAAI,KAAK,CAAC,oEAAoE,CAAC,CAAC;IAE1F,MAAM,0BAA0B,GAAG,iBAAiB,CAAC,oBAAoB,EAAE,CAAC;YACxE,IAAI,EAAE,kBAAkB;YACxB,GAAG,EAAE,cAAc;SACtB,EAAE;YACC,IAAI,EAAE,oBAAoB;YAC1B,GAAG,EAAE,gBAAgB;SACxB,CAAC,CAAC,CAAC;IACJ,MAAM,gCAAgC,GAAG,iBAAiB,CAAC,0BAA0B,EAAE,CAAC;YACpF,IAAI,EAAE,wBAAwB;YAC9B,GAAG,EAAE,oBAAoB;SAC5B,CAAC,CAAC,CAAC;IAEJ,MAAM,UAAU,GAAG,0BAA0B,CAAC,YAAY,CAAC,MAAM,CAAC;IAClE,MAAM,gBAAgB,GAAG,0BAA0B,CAAC,cAAc,CAAC,MAAM,CAAC;IAC1E,MAAM,UAAU,GAAG,0BAA0B,CAAC,cAAc,CAAC,MAAM,CAAC;IAEpE,MAAM,YAAY,GAAG,gCAAgC,CAAC,kBAAkB,CAAC,MAAM,CAAC;IAChF,MAAM,YAAY,GAAG,gCAAgC,CAAC,kBAAkB,CAAC,MAAM,CAAC;IAEhF,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QACvB,MAAM,IAAI,KAAK,CAAC,iEAAiE,CAAC,CAAC;IAEvF,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QACvB,MAAM,IAAI,KAAK,CAAC,kEAAkE,CAAC,CAAC;IAExF,IAAI,YAAY,CAAC,MAAM,KAAK,CAAC;QACzB,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;IAEpG,IAAI,YAAY,CAAC,MAAM,KAAK,CAAC;QACzB,MAAM,IAAI,KAAK,CAAC,6EAA6E,CAAC,CAAC;IAEnG,OAAO;QACH,IAAI,EAAE;YACF,mBAAmB,EAAE,IAAI;YACzB,MAAM,EAAE,UAAU;YAClB,YAAY,EAAE,gBAAgB;YAC9B,MAAM,EAAE,UAAU;SACrB;QACD,MAAM,EAAE;YACJ,MAAM,EAAE,YAAY;YACpB,MAAM,EAAE,YAAY;SACvB;KACJ,CAAC;AACN,CAAC;AAED,SAAS,iBAAiB,CAAC,QAAsB;IAM7C,MAAM,cAAc,GAAG,iBAAiB,CAAC,QAAQ,EAAE,CAAC;YAChD,IAAI,EAAE,kBAAkB;YACxB,GAAG,EAAE,cAAc;YACnB,QAAQ,EAAE,IAAI;SACjB,EAAE;YACC,IAAI,EAAE,aAAa;YACnB,GAAG,EAAE,SAAS;SACjB,EAAE;YACC,IAAI,EAAE,gBAAgB;YACtB,GAAG,EAAE,YAAY;SACpB,CAAC,CAAC,CAAC;IAEJ,IAAI,cAAc,CAAC,UAAU,CAAC,MAAM,CAAC,MAAM,IAAI,CAAC;QAC5C,MAAM,IAAI,KAAK,CAAC,qDAAqD,CAAC,CAAC;IAE3E,OAAO;QACH,kBAAkB,EAAE,cAAc,CAAC,YAAY,EAAE,MAAM,IAAI,IAAI;QAC/D,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;QAC5C,gBAAgB,EAAE,cAAc,CAAC,UAAU,CAAC,MAAM;QAClD,gBAAgB,EAAE,cAAc,CAAC,UAAU,CAAC,MAAM;KACrD,CAAC;AACN,CAAC;AAED,SAAS,wBAAwB,CAAC,QAA6B;IAK3D,MAAM,cAAc,GAAG,iBAAiB,CAAC,QAAQ,EAAE,CAAC;YAChD,IAAI,EAAE,cAAc;YACpB,GAAG,EAAE,UAAU;SAClB,EAAE;YACC,IAAI,EAAE,aAAa;YACnB,GAAG,EAAE,SAAS;SACjB,CAAC,CAAC,CAAC;IAEJ,OAAO;QACH,cAAc,EAAE,cAAc,CAAC,QAAQ,CAAC,MAAM;QAC9C,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;QAC5C,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;KAC/C,CAAC;AACN,CAAC"}
@@ -1,33 +0,0 @@
1
- import { ModelTypeDescription } from "../AddonTypes.js";
2
- import { GeneralChatWrapper } from "../../chatWrappers/GeneralChatWrapper.js";
3
- import { LlamaChatWrapper } from "../../chatWrappers/LlamaChatWrapper.js";
4
- import { AlpacaChatWrapper } from "../../chatWrappers/AlpacaChatWrapper.js";
5
- import { FunctionaryChatWrapper } from "../../chatWrappers/FunctionaryChatWrapper.js";
6
- import { ChatMLChatWrapper } from "../../chatWrappers/ChatMLChatWrapper.js";
7
- import { FalconChatWrapper } from "../../chatWrappers/FalconChatWrapper.js";
8
- import { GemmaChatWrapper } from "../../chatWrappers/GemmaChatWrapper.js";
9
- export declare const chatWrapperTypeNames: readonly ["auto", "general", "llamaChat", "alpacaChat", "functionary", "chatML", "falconChat", "gemma"];
10
- export type ChatWrapperTypeName = (typeof chatWrapperTypeNames)[number];
11
- declare const chatWrappers: {
12
- readonly general: typeof GeneralChatWrapper;
13
- readonly llamaChat: typeof LlamaChatWrapper;
14
- readonly alpacaChat: typeof AlpacaChatWrapper;
15
- readonly functionary: typeof FunctionaryChatWrapper;
16
- readonly chatML: typeof ChatMLChatWrapper;
17
- readonly falconChat: typeof FalconChatWrapper;
18
- readonly gemma: typeof GemmaChatWrapper;
19
- };
20
- /**
21
- * @param configType
22
- * @param options
23
- */
24
- export declare function resolveChatWrapperBasedOnWrapperTypeName(configType: ChatWrapperTypeName, { bosString, filename, typeDescription, customWrapperSettings }?: {
25
- bosString?: string | null;
26
- filename?: string;
27
- /** @hidden this type alias is too long in the documentation */
28
- typeDescription?: ModelTypeDescription;
29
- customWrapperSettings?: {
30
- [wrapper in keyof typeof chatWrappers]?: ConstructorParameters<(typeof chatWrappers)[wrapper]>[0];
31
- };
32
- }): LlamaChatWrapper | ChatMLChatWrapper | GeneralChatWrapper | FalconChatWrapper | FunctionaryChatWrapper | GemmaChatWrapper;
33
- export {};