node-llama-cpp 3.0.0-beta.3 → 3.0.0-beta.30

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (690) hide show
  1. package/README.md +14 -11
  2. package/bins/linux-arm64/_nlcBuildMetadata.json +1 -0
  3. package/bins/linux-arm64/llama-addon.node +0 -0
  4. package/bins/linux-armv7l/_nlcBuildMetadata.json +1 -0
  5. package/bins/linux-armv7l/llama-addon.node +0 -0
  6. package/bins/linux-x64/_nlcBuildMetadata.json +1 -0
  7. package/bins/linux-x64/llama-addon.node +0 -0
  8. package/bins/linux-x64-cuda/_nlcBuildMetadata.json +1 -0
  9. package/bins/linux-x64-cuda/llama-addon.node +0 -0
  10. package/bins/linux-x64-vulkan/_nlcBuildMetadata.json +1 -0
  11. package/bins/linux-x64-vulkan/llama-addon.node +0 -0
  12. package/bins/mac-arm64-metal/_nlcBuildMetadata.json +1 -0
  13. package/bins/mac-arm64-metal/default.metallib +0 -0
  14. package/bins/mac-arm64-metal/llama-addon.node +0 -0
  15. package/bins/mac-x64/_nlcBuildMetadata.json +1 -0
  16. package/bins/mac-x64/llama-addon.node +0 -0
  17. package/bins/win-arm64/_nlcBuildMetadata.json +1 -0
  18. package/bins/win-arm64/llama-addon.exp +0 -0
  19. package/bins/win-arm64/llama-addon.lib +0 -0
  20. package/bins/win-arm64/llama-addon.node +0 -0
  21. package/bins/win-x64/_nlcBuildMetadata.json +1 -0
  22. package/bins/win-x64/llama-addon.exp +0 -0
  23. package/bins/win-x64/llama-addon.lib +0 -0
  24. package/bins/win-x64/llama-addon.node +0 -0
  25. package/bins/win-x64-cuda/_nlcBuildMetadata.json +1 -0
  26. package/bins/win-x64-cuda/llama-addon.exp +0 -0
  27. package/bins/win-x64-cuda/llama-addon.lib +0 -0
  28. package/bins/win-x64-cuda/llama-addon.node +0 -0
  29. package/bins/win-x64-vulkan/_nlcBuildMetadata.json +1 -0
  30. package/bins/win-x64-vulkan/llama-addon.exp +0 -0
  31. package/bins/win-x64-vulkan/llama-addon.lib +0 -0
  32. package/bins/win-x64-vulkan/llama-addon.node +0 -0
  33. package/dist/ChatWrapper.d.ts +8 -39
  34. package/dist/ChatWrapper.js +115 -72
  35. package/dist/ChatWrapper.js.map +1 -1
  36. package/dist/apiDocsIndex.d.ts +1 -0
  37. package/dist/apiDocsIndex.js +7 -0
  38. package/dist/apiDocsIndex.js.map +1 -0
  39. package/dist/{utils/getBin.d.ts → bindings/AddonTypes.d.ts} +54 -8
  40. package/dist/bindings/AddonTypes.js +2 -0
  41. package/dist/bindings/AddonTypes.js.map +1 -0
  42. package/dist/bindings/Llama.d.ts +47 -0
  43. package/dist/bindings/Llama.js +353 -0
  44. package/dist/bindings/Llama.js.map +1 -0
  45. package/dist/bindings/consts.d.ts +2 -0
  46. package/dist/bindings/consts.js +11 -0
  47. package/dist/bindings/consts.js.map +1 -0
  48. package/dist/bindings/getLlama.d.ts +148 -0
  49. package/dist/bindings/getLlama.js +401 -0
  50. package/dist/bindings/getLlama.js.map +1 -0
  51. package/dist/bindings/types.d.ts +56 -0
  52. package/dist/bindings/types.js +77 -0
  53. package/dist/bindings/types.js.map +1 -0
  54. package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
  55. package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
  56. package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
  57. package/dist/bindings/utils/NoBinaryFoundError.d.ts +2 -0
  58. package/dist/bindings/utils/NoBinaryFoundError.js +7 -0
  59. package/dist/bindings/utils/NoBinaryFoundError.js.map +1 -0
  60. package/dist/bindings/utils/asyncEvery.d.ts +5 -0
  61. package/dist/bindings/utils/asyncEvery.js +15 -0
  62. package/dist/bindings/utils/asyncEvery.js.map +1 -0
  63. package/dist/bindings/utils/asyncSome.d.ts +5 -0
  64. package/dist/bindings/utils/asyncSome.js +27 -0
  65. package/dist/bindings/utils/asyncSome.js.map +1 -0
  66. package/dist/{utils → bindings/utils}/binariesGithubRelease.js +1 -1
  67. package/dist/bindings/utils/binariesGithubRelease.js.map +1 -0
  68. package/dist/bindings/utils/clearAllLocalBuilds.d.ts +1 -0
  69. package/dist/bindings/utils/clearAllLocalBuilds.js +47 -0
  70. package/dist/bindings/utils/clearAllLocalBuilds.js.map +1 -0
  71. package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +11 -0
  72. package/dist/bindings/utils/cloneLlamaCppRepo.js +166 -0
  73. package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -0
  74. package/dist/bindings/utils/compileLLamaCpp.d.ts +17 -0
  75. package/dist/bindings/utils/compileLLamaCpp.js +226 -0
  76. package/dist/bindings/utils/compileLLamaCpp.js.map +1 -0
  77. package/dist/bindings/utils/detectAvailableComputeLayers.d.ts +14 -0
  78. package/dist/bindings/utils/detectAvailableComputeLayers.js +305 -0
  79. package/dist/bindings/utils/detectAvailableComputeLayers.js.map +1 -0
  80. package/dist/bindings/utils/detectGlibc.d.ts +4 -0
  81. package/dist/bindings/utils/detectGlibc.js +46 -0
  82. package/dist/bindings/utils/detectGlibc.js.map +1 -0
  83. package/dist/bindings/utils/getBestComputeLayersAvailable.d.ts +10 -0
  84. package/dist/bindings/utils/getBestComputeLayersAvailable.js +29 -0
  85. package/dist/bindings/utils/getBestComputeLayersAvailable.js.map +1 -0
  86. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.d.ts +5 -0
  87. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js +93 -0
  88. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js.map +1 -0
  89. package/dist/bindings/utils/getCanUsePrebuiltBinaries.d.ts +1 -0
  90. package/dist/bindings/utils/getCanUsePrebuiltBinaries.js +8 -0
  91. package/dist/bindings/utils/getCanUsePrebuiltBinaries.js.map +1 -0
  92. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.d.ts +2 -0
  93. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js +21 -0
  94. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js.map +1 -0
  95. package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +12 -0
  96. package/dist/bindings/utils/getGpuTypesToUseForOption.js +30 -0
  97. package/dist/bindings/utils/getGpuTypesToUseForOption.js.map +1 -0
  98. package/dist/bindings/utils/getLinuxDistroInfo.d.ts +9 -0
  99. package/dist/bindings/utils/getLinuxDistroInfo.js +46 -0
  100. package/dist/bindings/utils/getLinuxDistroInfo.js.map +1 -0
  101. package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
  102. package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
  103. package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
  104. package/dist/bindings/utils/getPlatform.d.ts +2 -0
  105. package/dist/bindings/utils/getPlatform.js +15 -0
  106. package/dist/bindings/utils/getPlatform.js.map +1 -0
  107. package/dist/bindings/utils/getPlatformInfo.d.ts +5 -0
  108. package/dist/bindings/utils/getPlatformInfo.js +28 -0
  109. package/dist/bindings/utils/getPlatformInfo.js.map +1 -0
  110. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.d.ts +3 -0
  111. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js +27 -0
  112. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js.map +1 -0
  113. package/dist/bindings/utils/hasFileInPath.d.ts +2 -0
  114. package/dist/bindings/utils/hasFileInPath.js +34 -0
  115. package/dist/bindings/utils/hasFileInPath.js.map +1 -0
  116. package/dist/bindings/utils/lastBuildInfo.d.ts +6 -0
  117. package/dist/bindings/utils/lastBuildInfo.js +17 -0
  118. package/dist/bindings/utils/lastBuildInfo.js.map +1 -0
  119. package/dist/bindings/utils/logBinaryUsageExampleToConsole.d.ts +2 -0
  120. package/dist/bindings/utils/logBinaryUsageExampleToConsole.js +22 -0
  121. package/dist/bindings/utils/logBinaryUsageExampleToConsole.js.map +1 -0
  122. package/dist/bindings/utils/logDistroInstallInstruction.d.ts +14 -0
  123. package/dist/bindings/utils/logDistroInstallInstruction.js +48 -0
  124. package/dist/bindings/utils/logDistroInstallInstruction.js.map +1 -0
  125. package/dist/bindings/utils/resolveCustomCmakeOptions.d.ts +1 -0
  126. package/dist/bindings/utils/resolveCustomCmakeOptions.js +47 -0
  127. package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -0
  128. package/dist/bindings/utils/testBindingBinary.d.ts +1 -0
  129. package/dist/bindings/utils/testBindingBinary.js +100 -0
  130. package/dist/bindings/utils/testBindingBinary.js.map +1 -0
  131. package/dist/bindings/utils/testCmakeBinary.d.ts +6 -0
  132. package/dist/bindings/utils/testCmakeBinary.js +32 -0
  133. package/dist/bindings/utils/testCmakeBinary.js.map +1 -0
  134. package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
  135. package/dist/chatWrappers/AlpacaChatWrapper.js +9 -2
  136. package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
  137. package/dist/chatWrappers/ChatMLChatWrapper.d.ts +2 -9
  138. package/dist/chatWrappers/ChatMLChatWrapper.js +23 -21
  139. package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
  140. package/dist/chatWrappers/FalconChatWrapper.d.ts +4 -10
  141. package/dist/chatWrappers/FalconChatWrapper.js +38 -21
  142. package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
  143. package/dist/chatWrappers/FunctionaryChatWrapper.d.ts +8 -32
  144. package/dist/chatWrappers/FunctionaryChatWrapper.js +323 -118
  145. package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
  146. package/dist/chatWrappers/GemmaChatWrapper.d.ts +7 -0
  147. package/dist/chatWrappers/GemmaChatWrapper.js +96 -0
  148. package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -0
  149. package/dist/chatWrappers/GeneralChatWrapper.d.ts +4 -10
  150. package/dist/chatWrappers/GeneralChatWrapper.js +45 -22
  151. package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
  152. package/dist/chatWrappers/Llama2ChatWrapper.d.ts +12 -0
  153. package/dist/chatWrappers/{LlamaChatWrapper.js → Llama2ChatWrapper.js} +38 -20
  154. package/dist/chatWrappers/Llama2ChatWrapper.js.map +1 -0
  155. package/dist/chatWrappers/Llama3ChatWrapper.d.ts +16 -0
  156. package/dist/chatWrappers/Llama3ChatWrapper.js +174 -0
  157. package/dist/chatWrappers/Llama3ChatWrapper.js.map +1 -0
  158. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +67 -0
  159. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +371 -0
  160. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
  161. package/dist/chatWrappers/generic/TemplateChatWrapper.d.ts +54 -0
  162. package/dist/chatWrappers/generic/TemplateChatWrapper.js +200 -0
  163. package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
  164. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +23 -0
  165. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
  166. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
  167. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.d.ts +42 -0
  168. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js +82 -0
  169. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js.map +1 -0
  170. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
  171. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +210 -0
  172. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
  173. package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +69 -0
  174. package/dist/chatWrappers/utils/resolveChatWrapper.js +243 -0
  175. package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
  176. package/dist/cli/cli.js +21 -7
  177. package/dist/cli/cli.js.map +1 -1
  178. package/dist/cli/commands/BuildCommand.d.ts +11 -4
  179. package/dist/cli/commands/BuildCommand.js +114 -41
  180. package/dist/cli/commands/BuildCommand.js.map +1 -1
  181. package/dist/cli/commands/ChatCommand.d.ts +18 -6
  182. package/dist/cli/commands/ChatCommand.js +299 -143
  183. package/dist/cli/commands/ChatCommand.js.map +1 -1
  184. package/dist/cli/commands/ClearCommand.d.ts +1 -1
  185. package/dist/cli/commands/ClearCommand.js +11 -12
  186. package/dist/cli/commands/ClearCommand.js.map +1 -1
  187. package/dist/cli/commands/CompleteCommand.d.ts +29 -0
  188. package/dist/cli/commands/CompleteCommand.js +365 -0
  189. package/dist/cli/commands/CompleteCommand.js.map +1 -0
  190. package/dist/cli/commands/DebugCommand.d.ts +7 -0
  191. package/dist/cli/commands/DebugCommand.js +54 -0
  192. package/dist/cli/commands/DebugCommand.js.map +1 -0
  193. package/dist/cli/commands/DownloadCommand.d.ts +7 -4
  194. package/dist/cli/commands/DownloadCommand.js +121 -70
  195. package/dist/cli/commands/DownloadCommand.js.map +1 -1
  196. package/dist/cli/commands/InfillCommand.d.ts +31 -0
  197. package/dist/cli/commands/InfillCommand.js +401 -0
  198. package/dist/cli/commands/InfillCommand.js.map +1 -0
  199. package/dist/cli/commands/InitCommand.d.ts +11 -0
  200. package/dist/cli/commands/InitCommand.js +195 -0
  201. package/dist/cli/commands/InitCommand.js.map +1 -0
  202. package/dist/cli/commands/OnPostInstallCommand.js +9 -10
  203. package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
  204. package/dist/cli/commands/PullCommand.d.ts +12 -0
  205. package/dist/cli/commands/PullCommand.js +117 -0
  206. package/dist/cli/commands/PullCommand.js.map +1 -0
  207. package/dist/cli/commands/inspect/InspectCommand.d.ts +4 -0
  208. package/dist/cli/commands/inspect/InspectCommand.js +19 -0
  209. package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
  210. package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +12 -0
  211. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +136 -0
  212. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
  213. package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
  214. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +164 -0
  215. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
  216. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +17 -0
  217. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +613 -0
  218. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
  219. package/dist/cli/projectTemplates.d.ts +7 -0
  220. package/dist/cli/projectTemplates.js +10 -0
  221. package/dist/cli/projectTemplates.js.map +1 -0
  222. package/dist/cli/recommendedModels.d.ts +2 -0
  223. package/dist/cli/recommendedModels.js +363 -0
  224. package/dist/cli/recommendedModels.js.map +1 -0
  225. package/dist/cli/startCreateCli.d.ts +2 -0
  226. package/dist/cli/startCreateCli.js +26 -0
  227. package/dist/cli/startCreateCli.js.map +1 -0
  228. package/dist/cli/utils/ConsoleInteraction.d.ts +23 -0
  229. package/dist/cli/utils/ConsoleInteraction.js +122 -0
  230. package/dist/cli/utils/ConsoleInteraction.js.map +1 -0
  231. package/dist/cli/utils/ConsoleTable.d.ts +23 -0
  232. package/dist/cli/utils/ConsoleTable.js +86 -0
  233. package/dist/cli/utils/ConsoleTable.js.map +1 -0
  234. package/dist/cli/utils/basicChooseFromListConsoleInteraction.d.ts +13 -0
  235. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js +111 -0
  236. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js.map +1 -0
  237. package/dist/cli/utils/consolePromptQuestion.d.ts +6 -0
  238. package/dist/cli/utils/consolePromptQuestion.js +82 -0
  239. package/dist/cli/utils/consolePromptQuestion.js.map +1 -0
  240. package/dist/cli/utils/getReadablePath.d.ts +1 -0
  241. package/dist/cli/utils/getReadablePath.js +14 -0
  242. package/dist/cli/utils/getReadablePath.js.map +1 -0
  243. package/dist/cli/utils/interactivelyAskForModel.d.ts +7 -0
  244. package/dist/cli/utils/interactivelyAskForModel.js +451 -0
  245. package/dist/cli/utils/interactivelyAskForModel.js.map +1 -0
  246. package/dist/cli/utils/logUsedGpuTypeOption.d.ts +2 -0
  247. package/dist/cli/utils/logUsedGpuTypeOption.js +9 -0
  248. package/dist/cli/utils/logUsedGpuTypeOption.js.map +1 -0
  249. package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
  250. package/dist/cli/utils/printCommonInfoLines.js +75 -0
  251. package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
  252. package/dist/cli/utils/printInfoLine.d.ts +12 -0
  253. package/dist/cli/utils/printInfoLine.js +54 -0
  254. package/dist/cli/utils/printInfoLine.js.map +1 -0
  255. package/dist/cli/utils/projectTemplates.d.ts +19 -0
  256. package/dist/cli/utils/projectTemplates.js +47 -0
  257. package/dist/cli/utils/projectTemplates.js.map +1 -0
  258. package/dist/cli/utils/resolveCommandGgufPath.d.ts +4 -0
  259. package/dist/cli/utils/resolveCommandGgufPath.js +71 -0
  260. package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
  261. package/dist/cli/utils/resolveHeaderFlag.d.ts +1 -0
  262. package/dist/cli/utils/resolveHeaderFlag.js +21 -0
  263. package/dist/cli/utils/resolveHeaderFlag.js.map +1 -0
  264. package/dist/cli/utils/resolveModelRecommendationFileOptions.d.ts +19 -0
  265. package/dist/cli/utils/resolveModelRecommendationFileOptions.js +7 -0
  266. package/dist/cli/utils/resolveModelRecommendationFileOptions.js.map +1 -0
  267. package/dist/cli/utils/splitAnsiToLines.d.ts +1 -0
  268. package/dist/cli/utils/splitAnsiToLines.js +32 -0
  269. package/dist/cli/utils/splitAnsiToLines.js.map +1 -0
  270. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.d.ts +2 -0
  271. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js +23 -0
  272. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js.map +1 -0
  273. package/dist/commands.d.ts +1 -0
  274. package/dist/commands.js +3 -0
  275. package/dist/commands.js.map +1 -1
  276. package/dist/config.d.ts +38 -5
  277. package/dist/config.js +61 -16
  278. package/dist/config.js.map +1 -1
  279. package/dist/consts.d.ts +3 -0
  280. package/dist/consts.js +10 -0
  281. package/dist/consts.js.map +1 -0
  282. package/dist/{llamaEvaluator → evaluator}/LlamaChat/LlamaChat.d.ts +112 -39
  283. package/dist/evaluator/LlamaChat/LlamaChat.js +1512 -0
  284. package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -0
  285. package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.d.ts +11 -0
  286. package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.js +55 -0
  287. package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.js.map +1 -0
  288. package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.d.ts +16 -0
  289. package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.js +45 -0
  290. package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.js.map +1 -0
  291. package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.d.ts +8 -0
  292. package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.js +12 -0
  293. package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.js.map +1 -0
  294. package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +42 -16
  295. package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -0
  296. package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +288 -0
  297. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js +419 -0
  298. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -0
  299. package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.d.ts +39 -0
  300. package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js +186 -0
  301. package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js.map +1 -0
  302. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/utils/defineChatSessionFunction.d.ts +3 -0
  303. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/utils/defineChatSessionFunction.js +3 -0
  304. package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +1 -0
  305. package/dist/evaluator/LlamaCompletion.d.ts +143 -0
  306. package/dist/evaluator/LlamaCompletion.js +418 -0
  307. package/dist/evaluator/LlamaCompletion.js.map +1 -0
  308. package/dist/{llamaEvaluator → evaluator}/LlamaContext/LlamaContext.d.ts +41 -21
  309. package/dist/{llamaEvaluator → evaluator}/LlamaContext/LlamaContext.js +270 -81
  310. package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -0
  311. package/dist/evaluator/LlamaContext/types.d.ts +140 -0
  312. package/dist/evaluator/LlamaContext/types.js.map +1 -0
  313. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
  314. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
  315. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
  316. package/dist/{llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js → evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js} +4 -4
  317. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
  318. package/dist/evaluator/LlamaEmbeddingContext.d.ts +51 -0
  319. package/dist/evaluator/LlamaEmbeddingContext.js +73 -0
  320. package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -0
  321. package/dist/{llamaEvaluator → evaluator}/LlamaGrammar.d.ts +10 -7
  322. package/dist/{llamaEvaluator → evaluator}/LlamaGrammar.js +14 -11
  323. package/dist/evaluator/LlamaGrammar.js.map +1 -0
  324. package/dist/{llamaEvaluator → evaluator}/LlamaGrammarEvaluationState.js +4 -4
  325. package/dist/evaluator/LlamaGrammarEvaluationState.js.map +1 -0
  326. package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.d.ts +2 -1
  327. package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.js +3 -3
  328. package/dist/evaluator/LlamaJsonSchemaGrammar.js.map +1 -0
  329. package/dist/evaluator/LlamaModel/LlamaModel.d.ts +236 -0
  330. package/dist/evaluator/LlamaModel/LlamaModel.js +679 -0
  331. package/dist/evaluator/LlamaModel/LlamaModel.js.map +1 -0
  332. package/dist/evaluator/LlamaModel/utils/TokenAttributes.d.ts +29 -0
  333. package/dist/evaluator/LlamaModel/utils/TokenAttributes.js +65 -0
  334. package/dist/evaluator/LlamaModel/utils/TokenAttributes.js.map +1 -0
  335. package/dist/evaluator/TokenBias.d.ts +22 -0
  336. package/dist/evaluator/TokenBias.js +33 -0
  337. package/dist/evaluator/TokenBias.js.map +1 -0
  338. package/dist/evaluator/TokenMeter.d.ts +54 -0
  339. package/dist/evaluator/TokenMeter.js +86 -0
  340. package/dist/evaluator/TokenMeter.js.map +1 -0
  341. package/dist/gguf/consts.d.ts +3 -0
  342. package/dist/gguf/consts.js +8 -0
  343. package/dist/gguf/consts.js.map +1 -0
  344. package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
  345. package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
  346. package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
  347. package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
  348. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
  349. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
  350. package/dist/gguf/fileReaders/GgufFileReader.d.ts +33 -0
  351. package/dist/gguf/fileReaders/GgufFileReader.js +76 -0
  352. package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
  353. package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +17 -0
  354. package/dist/gguf/fileReaders/GgufFsFileReader.js +46 -0
  355. package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
  356. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +22 -0
  357. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +63 -0
  358. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
  359. package/dist/gguf/insights/GgufInsights.d.ts +48 -0
  360. package/dist/gguf/insights/GgufInsights.js +381 -0
  361. package/dist/gguf/insights/GgufInsights.js.map +1 -0
  362. package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +87 -0
  363. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +141 -0
  364. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -0
  365. package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +18 -0
  366. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +76 -0
  367. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -0
  368. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +14 -0
  369. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +177 -0
  370. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -0
  371. package/dist/gguf/insights/utils/scoreLevels.d.ts +5 -0
  372. package/dist/gguf/insights/utils/scoreLevels.js +16 -0
  373. package/dist/gguf/insights/utils/scoreLevels.js.map +1 -0
  374. package/dist/gguf/parser/GgufV2Parser.d.ts +19 -0
  375. package/dist/gguf/parser/GgufV2Parser.js +115 -0
  376. package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
  377. package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
  378. package/dist/gguf/parser/GgufV3Parser.js +4 -0
  379. package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
  380. package/dist/gguf/parser/parseGguf.d.ts +8 -0
  381. package/dist/gguf/parser/parseGguf.js +63 -0
  382. package/dist/gguf/parser/parseGguf.js.map +1 -0
  383. package/dist/gguf/readGgufFileInfo.d.ts +33 -0
  384. package/dist/gguf/readGgufFileInfo.js +66 -0
  385. package/dist/gguf/readGgufFileInfo.js.map +1 -0
  386. package/dist/gguf/types/GgufFileInfoTypes.d.ts +84 -0
  387. package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
  388. package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
  389. package/dist/gguf/types/GgufMetadataTypes.d.ts +335 -0
  390. package/dist/gguf/types/GgufMetadataTypes.js +86 -0
  391. package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
  392. package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
  393. package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
  394. package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
  395. package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
  396. package/dist/gguf/utils/GgufReadOffset.js +18 -0
  397. package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
  398. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +5 -0
  399. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +38 -0
  400. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
  401. package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
  402. package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
  403. package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
  404. package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
  405. package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
  406. package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
  407. package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
  408. package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
  409. package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
  410. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.d.ts +2 -0
  411. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js +39 -0
  412. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js.map +1 -0
  413. package/dist/gguf/utils/resolveSplitGgufParts.d.ts +7 -0
  414. package/dist/gguf/utils/resolveSplitGgufParts.js +55 -0
  415. package/dist/gguf/utils/resolveSplitGgufParts.js.map +1 -0
  416. package/dist/index.d.ts +41 -18
  417. package/dist/index.js +36 -15
  418. package/dist/index.js.map +1 -1
  419. package/dist/state.d.ts +4 -0
  420. package/dist/state.js +14 -0
  421. package/dist/state.js.map +1 -1
  422. package/dist/types.d.ts +116 -5
  423. package/dist/types.js.map +1 -1
  424. package/dist/utils/DisposeGuard.d.ts +13 -0
  425. package/dist/utils/DisposeGuard.js +120 -0
  426. package/dist/utils/DisposeGuard.js.map +1 -0
  427. package/dist/utils/InsufficientMemoryError.d.ts +3 -0
  428. package/dist/utils/InsufficientMemoryError.js +6 -0
  429. package/dist/utils/InsufficientMemoryError.js.map +1 -0
  430. package/dist/utils/LlamaText.d.ts +70 -26
  431. package/dist/utils/LlamaText.js +469 -157
  432. package/dist/utils/LlamaText.js.map +1 -1
  433. package/dist/utils/LruCache.d.ts +12 -0
  434. package/dist/utils/LruCache.js +44 -0
  435. package/dist/utils/LruCache.js.map +1 -0
  436. package/dist/utils/ReplHistory.js.map +1 -1
  437. package/dist/utils/StopGenerationDetector.d.ts +25 -9
  438. package/dist/utils/StopGenerationDetector.js +93 -22
  439. package/dist/utils/StopGenerationDetector.js.map +1 -1
  440. package/dist/utils/TokenStreamRegulator.d.ts +9 -4
  441. package/dist/utils/TokenStreamRegulator.js +81 -8
  442. package/dist/utils/TokenStreamRegulator.js.map +1 -1
  443. package/dist/utils/UnsupportedError.d.ts +2 -0
  444. package/dist/utils/UnsupportedError.js +7 -0
  445. package/dist/utils/UnsupportedError.js.map +1 -0
  446. package/dist/utils/appendUserMessageToChatHistory.js.map +1 -1
  447. package/dist/utils/clearTempFolder.js.map +1 -1
  448. package/dist/utils/cmake.js +38 -20
  449. package/dist/utils/cmake.js.map +1 -1
  450. package/dist/utils/createModelDownloader.d.ts +108 -0
  451. package/dist/utils/createModelDownloader.js +231 -0
  452. package/dist/utils/createModelDownloader.js.map +1 -0
  453. package/dist/utils/findBestOption.d.ts +4 -0
  454. package/dist/utils/findBestOption.js +15 -0
  455. package/dist/utils/findBestOption.js.map +1 -0
  456. package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.d.ts +1 -0
  457. package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js +23 -12
  458. package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js.map +1 -1
  459. package/dist/utils/gbnfJson/GbnfGrammarGenerator.js.map +1 -1
  460. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.d.ts +5 -0
  461. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js +11 -0
  462. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js.map +1 -0
  463. package/dist/utils/gbnfJson/terminals/GbnfArray.d.ts +3 -1
  464. package/dist/utils/gbnfJson/terminals/GbnfArray.js +10 -5
  465. package/dist/utils/gbnfJson/terminals/GbnfArray.js.map +1 -1
  466. package/dist/utils/gbnfJson/terminals/GbnfBoolean.d.ts +1 -1
  467. package/dist/utils/gbnfJson/terminals/GbnfBoolean.js.map +1 -1
  468. package/dist/utils/gbnfJson/terminals/GbnfBooleanValue.js.map +1 -1
  469. package/dist/utils/gbnfJson/terminals/GbnfGrammar.js.map +1 -1
  470. package/dist/utils/gbnfJson/terminals/GbnfNull.d.ts +1 -1
  471. package/dist/utils/gbnfJson/terminals/GbnfNull.js.map +1 -1
  472. package/dist/utils/gbnfJson/terminals/GbnfNumber.d.ts +1 -1
  473. package/dist/utils/gbnfJson/terminals/GbnfNumber.js.map +1 -1
  474. package/dist/utils/gbnfJson/terminals/GbnfNumberValue.js.map +1 -1
  475. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.d.ts +3 -1
  476. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js +9 -4
  477. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js.map +1 -1
  478. package/dist/utils/gbnfJson/terminals/GbnfOr.js.map +1 -1
  479. package/dist/utils/gbnfJson/terminals/GbnfRepetition.d.ts +9 -0
  480. package/dist/utils/gbnfJson/terminals/GbnfRepetition.js +37 -0
  481. package/dist/utils/gbnfJson/terminals/GbnfRepetition.js.map +1 -0
  482. package/dist/utils/gbnfJson/terminals/GbnfString.d.ts +1 -1
  483. package/dist/utils/gbnfJson/terminals/GbnfString.js +23 -5
  484. package/dist/utils/gbnfJson/terminals/GbnfString.js.map +1 -1
  485. package/dist/utils/gbnfJson/terminals/GbnfStringValue.js.map +1 -1
  486. package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.js.map +1 -1
  487. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.d.ts +7 -4
  488. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js +37 -9
  489. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js.map +1 -1
  490. package/dist/utils/gbnfJson/terminals/gbnfConsts.d.ts +5 -4
  491. package/dist/utils/gbnfJson/terminals/gbnfConsts.js +14 -3
  492. package/dist/utils/gbnfJson/terminals/gbnfConsts.js.map +1 -1
  493. package/dist/utils/gbnfJson/types.d.ts +3 -0
  494. package/dist/utils/gbnfJson/types.js.map +1 -1
  495. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.d.ts +10 -0
  496. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js +15 -0
  497. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js.map +1 -0
  498. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.d.ts +2 -1
  499. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js +6 -5
  500. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js.map +1 -1
  501. package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js +2 -2
  502. package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js.map +1 -1
  503. package/dist/utils/getBuildDefaults.d.ts +1 -2
  504. package/dist/utils/getBuildDefaults.js +2 -3
  505. package/dist/utils/getBuildDefaults.js.map +1 -1
  506. package/dist/utils/getConsoleLogPrefix.d.ts +1 -0
  507. package/dist/utils/getConsoleLogPrefix.js +10 -0
  508. package/dist/utils/getConsoleLogPrefix.js.map +1 -0
  509. package/dist/utils/getGrammarsFolder.d.ts +2 -1
  510. package/dist/utils/getGrammarsFolder.js +8 -7
  511. package/dist/utils/getGrammarsFolder.js.map +1 -1
  512. package/dist/utils/getModuleVersion.d.ts +1 -0
  513. package/dist/utils/getModuleVersion.js +13 -0
  514. package/dist/utils/getModuleVersion.js.map +1 -0
  515. package/dist/utils/getQueuedTokensBeforeStopTrigger.d.ts +6 -0
  516. package/dist/utils/getQueuedTokensBeforeStopTrigger.js +22 -0
  517. package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -0
  518. package/dist/utils/getReadableContextSize.d.ts +1 -0
  519. package/dist/utils/getReadableContextSize.js +7 -0
  520. package/dist/utils/getReadableContextSize.js.map +1 -0
  521. package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js +15 -11
  522. package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js.map +1 -1
  523. package/dist/utils/gitReleaseBundles.js +73 -5
  524. package/dist/utils/gitReleaseBundles.js.map +1 -1
  525. package/dist/utils/hashString.d.ts +1 -0
  526. package/dist/utils/hashString.js +8 -0
  527. package/dist/utils/hashString.js.map +1 -0
  528. package/dist/utils/isLockfileActive.d.ts +4 -0
  529. package/dist/utils/isLockfileActive.js +12 -0
  530. package/dist/utils/isLockfileActive.js.map +1 -0
  531. package/dist/utils/isToken.d.ts +2 -0
  532. package/dist/utils/isToken.js +4 -0
  533. package/dist/utils/isToken.js.map +1 -0
  534. package/dist/utils/isUrl.d.ts +1 -0
  535. package/dist/utils/isUrl.js +15 -0
  536. package/dist/utils/isUrl.js.map +1 -0
  537. package/dist/utils/mergeUnionTypes.d.ts +10 -0
  538. package/dist/utils/mergeUnionTypes.js +2 -0
  539. package/dist/utils/mergeUnionTypes.js.map +1 -0
  540. package/dist/utils/parseModelFileName.d.ts +1 -0
  541. package/dist/utils/parseModelFileName.js +6 -1
  542. package/dist/utils/parseModelFileName.js.map +1 -1
  543. package/dist/utils/parseTextTemplate.d.ts +66 -0
  544. package/dist/utils/parseTextTemplate.js +116 -0
  545. package/dist/utils/parseTextTemplate.js.map +1 -0
  546. package/dist/utils/prettyPrintObject.d.ts +10 -0
  547. package/dist/utils/prettyPrintObject.js +84 -0
  548. package/dist/utils/prettyPrintObject.js.map +1 -0
  549. package/dist/utils/removeNullFields.d.ts +2 -1
  550. package/dist/utils/removeNullFields.js +8 -0
  551. package/dist/utils/removeNullFields.js.map +1 -1
  552. package/dist/utils/resolveGithubRelease.d.ts +2 -0
  553. package/dist/utils/resolveGithubRelease.js +36 -0
  554. package/dist/utils/resolveGithubRelease.js.map +1 -0
  555. package/dist/utils/runtime.d.ts +4 -0
  556. package/dist/utils/runtime.js +8 -0
  557. package/dist/utils/runtime.js.map +1 -0
  558. package/dist/utils/safeEventCallback.d.ts +6 -0
  559. package/dist/utils/safeEventCallback.js +29 -0
  560. package/dist/utils/safeEventCallback.js.map +1 -0
  561. package/dist/utils/spawnCommand.d.ts +11 -1
  562. package/dist/utils/spawnCommand.js +56 -6
  563. package/dist/utils/spawnCommand.js.map +1 -1
  564. package/dist/utils/tokenizeInput.d.ts +3 -0
  565. package/dist/utils/tokenizeInput.js +12 -0
  566. package/dist/utils/tokenizeInput.js.map +1 -0
  567. package/dist/utils/truncateTextAndRoundToWords.d.ts +2 -0
  568. package/dist/utils/truncateTextAndRoundToWords.js +30 -0
  569. package/dist/utils/truncateTextAndRoundToWords.js.map +1 -1
  570. package/dist/utils/utilTypes.d.ts +3 -0
  571. package/dist/utils/utilTypes.js +2 -0
  572. package/dist/utils/utilTypes.js.map +1 -0
  573. package/dist/utils/waitForLockfileRelease.d.ts +5 -0
  574. package/dist/utils/waitForLockfileRelease.js +20 -0
  575. package/dist/utils/waitForLockfileRelease.js.map +1 -0
  576. package/dist/utils/withLockfile.d.ts +7 -0
  577. package/dist/utils/withLockfile.js +44 -0
  578. package/dist/utils/withLockfile.js.map +1 -0
  579. package/dist/utils/withOra.d.ts +2 -0
  580. package/dist/utils/withOra.js +22 -6
  581. package/dist/utils/withOra.js.map +1 -1
  582. package/dist/utils/withProgressLog.d.ts +23 -0
  583. package/dist/utils/withProgressLog.js +211 -0
  584. package/dist/utils/withProgressLog.js.map +1 -0
  585. package/dist/utils/withStatusLogs.d.ts +2 -1
  586. package/dist/utils/withStatusLogs.js +12 -9
  587. package/dist/utils/withStatusLogs.js.map +1 -1
  588. package/dist/utils/wrapAbortSignal.d.ts +2 -0
  589. package/dist/utils/wrapAbortSignal.js +9 -0
  590. package/dist/utils/wrapAbortSignal.js.map +1 -0
  591. package/llama/.clang-format +1 -2
  592. package/llama/CMakeLists.txt +115 -4
  593. package/llama/addon.cpp +1300 -97
  594. package/llama/binariesGithubRelease.json +1 -1
  595. package/llama/gitRelease.bundle +0 -0
  596. package/llama/gpuInfo/cuda-gpu-info.cu +120 -0
  597. package/llama/gpuInfo/cuda-gpu-info.h +10 -0
  598. package/llama/gpuInfo/metal-gpu-info.h +8 -0
  599. package/llama/gpuInfo/metal-gpu-info.mm +30 -0
  600. package/llama/gpuInfo/vulkan-gpu-info.cpp +83 -0
  601. package/llama/gpuInfo/vulkan-gpu-info.h +9 -0
  602. package/llama/grammars/README.md +58 -5
  603. package/llama/grammars/json.gbnf +4 -4
  604. package/llama/grammars/json_arr.gbnf +4 -4
  605. package/llama/llama.cpp.info.json +4 -0
  606. package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
  607. package/package.json +78 -53
  608. package/templates/packed/electron-typescript-react.json +1 -0
  609. package/templates/packed/node-typescript.json +1 -0
  610. package/dist/AbortError.d.ts +0 -2
  611. package/dist/AbortError.js +0 -7
  612. package/dist/AbortError.js.map +0 -1
  613. package/dist/chatWrappers/LlamaChatWrapper.d.ts +0 -13
  614. package/dist/chatWrappers/LlamaChatWrapper.js.map +0 -1
  615. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
  616. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -57
  617. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
  618. package/dist/llamaEvaluator/LlamaBins.d.ts +0 -18
  619. package/dist/llamaEvaluator/LlamaBins.js +0 -5
  620. package/dist/llamaEvaluator/LlamaBins.js.map +0 -1
  621. package/dist/llamaEvaluator/LlamaChat/LlamaChat.js +0 -704
  622. package/dist/llamaEvaluator/LlamaChat/LlamaChat.js.map +0 -1
  623. package/dist/llamaEvaluator/LlamaChat/utils/FunctionCallGrammar.d.ts +0 -21
  624. package/dist/llamaEvaluator/LlamaChat/utils/FunctionCallGrammar.js +0 -120
  625. package/dist/llamaEvaluator/LlamaChat/utils/FunctionCallGrammar.js.map +0 -1
  626. package/dist/llamaEvaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +0 -1
  627. package/dist/llamaEvaluator/LlamaChatSession/LlamaChatSession.d.ts +0 -146
  628. package/dist/llamaEvaluator/LlamaChatSession/LlamaChatSession.js +0 -211
  629. package/dist/llamaEvaluator/LlamaChatSession/LlamaChatSession.js.map +0 -1
  630. package/dist/llamaEvaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +0 -1
  631. package/dist/llamaEvaluator/LlamaContext/LlamaContext.js.map +0 -1
  632. package/dist/llamaEvaluator/LlamaContext/types.d.ts +0 -82
  633. package/dist/llamaEvaluator/LlamaContext/types.js.map +0 -1
  634. package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
  635. package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
  636. package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
  637. package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
  638. package/dist/llamaEvaluator/LlamaEmbeddingContext.d.ts +0 -35
  639. package/dist/llamaEvaluator/LlamaEmbeddingContext.js +0 -73
  640. package/dist/llamaEvaluator/LlamaEmbeddingContext.js.map +0 -1
  641. package/dist/llamaEvaluator/LlamaGrammar.js.map +0 -1
  642. package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js.map +0 -1
  643. package/dist/llamaEvaluator/LlamaJsonSchemaGrammar.js.map +0 -1
  644. package/dist/llamaEvaluator/LlamaModel.d.ts +0 -119
  645. package/dist/llamaEvaluator/LlamaModel.js +0 -322
  646. package/dist/llamaEvaluator/LlamaModel.js.map +0 -1
  647. package/dist/utils/binariesGithubRelease.js.map +0 -1
  648. package/dist/utils/clearLlamaBuild.d.ts +0 -1
  649. package/dist/utils/clearLlamaBuild.js +0 -12
  650. package/dist/utils/clearLlamaBuild.js.map +0 -1
  651. package/dist/utils/cloneLlamaCppRepo.d.ts +0 -2
  652. package/dist/utils/cloneLlamaCppRepo.js +0 -102
  653. package/dist/utils/cloneLlamaCppRepo.js.map +0 -1
  654. package/dist/utils/compileLLamaCpp.d.ts +0 -8
  655. package/dist/utils/compileLLamaCpp.js +0 -132
  656. package/dist/utils/compileLLamaCpp.js.map +0 -1
  657. package/dist/utils/getBin.js +0 -78
  658. package/dist/utils/getBin.js.map +0 -1
  659. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.d.ts +0 -2
  660. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js +0 -9
  661. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js.map +0 -1
  662. package/dist/utils/getReleaseInfo.d.ts +0 -7
  663. package/dist/utils/getReleaseInfo.js +0 -30
  664. package/dist/utils/getReleaseInfo.js.map +0 -1
  665. package/dist/utils/parseModelTypeDescription.d.ts +0 -6
  666. package/dist/utils/parseModelTypeDescription.js +0 -9
  667. package/dist/utils/parseModelTypeDescription.js.map +0 -1
  668. package/dist/utils/resolveChatWrapper.d.ts +0 -4
  669. package/dist/utils/resolveChatWrapper.js +0 -16
  670. package/dist/utils/resolveChatWrapper.js.map +0 -1
  671. package/dist/utils/usedBinFlag.d.ts +0 -6
  672. package/dist/utils/usedBinFlag.js +0 -15
  673. package/dist/utils/usedBinFlag.js.map +0 -1
  674. package/llama/usedBin.json +0 -3
  675. package/llamaBins/linux-arm64/llama-addon.node +0 -0
  676. package/llamaBins/linux-armv7l/llama-addon.node +0 -0
  677. package/llamaBins/linux-x64/llama-addon.node +0 -0
  678. package/llamaBins/mac-arm64/llama-addon.node +0 -0
  679. package/llamaBins/mac-x64/llama-addon.node +0 -0
  680. package/llamaBins/win-x64/llama-addon.exp +0 -0
  681. package/llamaBins/win-x64/llama-addon.lib +0 -0
  682. package/llamaBins/win-x64/llama-addon.node +0 -0
  683. /package/dist/{utils → bindings/utils}/binariesGithubRelease.d.ts +0 -0
  684. /package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.d.ts +0 -0
  685. /package/dist/{llamaEvaluator → evaluator}/LlamaContext/types.js +0 -0
  686. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
  687. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
  688. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
  689. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
  690. /package/dist/{llamaEvaluator → evaluator}/LlamaGrammarEvaluationState.d.ts +0 -0
@@ -0,0 +1,679 @@
1
+ import process from "process";
2
+ import path from "path";
3
+ import { AsyncDisposeAggregator, DisposedError, EventRelay, withLock } from "lifecycle-utils";
4
+ import { removeNullFields } from "../../utils/removeNullFields.js";
5
+ import { DisposeGuard } from "../../utils/DisposeGuard.js";
6
+ import { LlamaLocks, LlamaLogLevel, LlamaVocabularyType, LlamaVocabularyTypeValues } from "../../bindings/types.js";
7
+ import { readGgufFileInfo } from "../../gguf/readGgufFileInfo.js";
8
+ import { GgufInsights } from "../../gguf/insights/GgufInsights.js";
9
+ import { getConsoleLogPrefix } from "../../utils/getConsoleLogPrefix.js";
10
+ import { getReadablePath } from "../../cli/utils/getReadablePath.js";
11
+ import { LlamaContext } from "../LlamaContext/LlamaContext.js";
12
+ import { LlamaEmbeddingContext } from "../LlamaEmbeddingContext.js";
13
+ import { TokenAttribute, TokenAttributes } from "./utils/TokenAttributes.js";
14
+ const defaultLoraThreads = 6;
15
+ const defaultLoraScale = 1;
16
+ const defaultUseMmap = true;
17
+ export class LlamaModel {
18
+ /** @internal */ _llama;
19
+ /** @internal */ _model;
20
+ /** @internal */ _backendModelDisposeGuard;
21
+ /** @internal */ _tokens;
22
+ /** @internal */ _modelPath;
23
+ /** @internal */ _fileInfo;
24
+ /** @internal */ _fileInsights;
25
+ /** @internal */ _gpuLayers;
26
+ /** @internal */ _filename;
27
+ /** @internal */ _disposedState = { disposed: false };
28
+ /** @internal */ _disposeAggregator = new AsyncDisposeAggregator();
29
+ /** @internal */ _llamaPreventDisposalHandle;
30
+ /** @internal */ _typeDescription;
31
+ /** @internal */ _trainContextSize;
32
+ /** @internal */ _embeddingVectorSize;
33
+ /** @internal */ _vocabularyType;
34
+ tokenizer;
35
+ onDispose = new EventRelay();
36
+ constructor({ modelPath, gpuLayers, vocabOnly, useMmap, useMlock, checkTensors, onLoadProgress, loadSignal }, { _llama, _fileInfo, _fileInsights }) {
37
+ this._llama = _llama;
38
+ this._fileInfo = _fileInfo;
39
+ this._modelPath = path.resolve(process.cwd(), modelPath);
40
+ this._fileInsights = _fileInsights;
41
+ this._gpuLayers = gpuLayers;
42
+ this._backendModelDisposeGuard = new DisposeGuard([this._llama._backendDisposeGuard]);
43
+ this._llamaPreventDisposalHandle = this._llama._backendDisposeGuard.createPreventDisposalHandle();
44
+ this._model = new this._llama._bindings.AddonModel(this._modelPath, removeNullFields({
45
+ addonExports: this._llama._bindings,
46
+ gpuLayers,
47
+ vocabOnly,
48
+ useMmap,
49
+ useMlock: _llama.supportsMlock
50
+ ? useMlock
51
+ : undefined,
52
+ checkTensors: checkTensors ?? false,
53
+ onLoadProgress: onLoadProgress == null
54
+ ? undefined
55
+ : (loadPercentage) => {
56
+ try {
57
+ onLoadProgress(loadPercentage);
58
+ }
59
+ catch (err) {
60
+ // the native addon code calls this function, so there's no use to throw an error here
61
+ console.error(err);
62
+ }
63
+ },
64
+ hasLoadAbortSignal: loadSignal != null
65
+ }));
66
+ this._tokens = LlamaModelTokens._create(this._model, this._disposedState);
67
+ this._filename = path.basename(modelPath);
68
+ this._disposeAggregator.add(() => {
69
+ this._disposedState.disposed = true;
70
+ });
71
+ this._disposeAggregator.add(this.onDispose.dispatchEvent);
72
+ this._disposeAggregator.add(this._llama.onDispose.createListener(disposeModelIfReferenced.bind(null, new WeakRef(this))));
73
+ this._disposeAggregator.add(async () => {
74
+ await this._backendModelDisposeGuard.acquireDisposeLock();
75
+ await this._model.dispose();
76
+ this._llamaPreventDisposalHandle.dispose();
77
+ });
78
+ this.tokenize = this.tokenize.bind(this);
79
+ this.detokenize = this.detokenize.bind(this);
80
+ this.isSpecialToken = this.isSpecialToken.bind(this);
81
+ this.tokenize.detokenize = this.detokenize;
82
+ this.tokenize.isSpecialToken = this.isSpecialToken;
83
+ this.tokenizer = this.tokenize;
84
+ }
85
+ async dispose() {
86
+ if (this._disposedState.disposed)
87
+ return;
88
+ this._disposedState.disposed = true;
89
+ await this._disposeAggregator.dispose();
90
+ }
91
+ /** @hidden */
92
+ async [Symbol.asyncDispose]() {
93
+ await this.dispose();
94
+ }
95
+ get disposed() {
96
+ return this._disposedState.disposed;
97
+ }
98
+ get tokens() {
99
+ return this._tokens;
100
+ }
101
+ get filename() {
102
+ return this._filename;
103
+ }
104
+ get fileInfo() {
105
+ return this._fileInfo;
106
+ }
107
+ get fileInsights() {
108
+ return this._fileInsights;
109
+ }
110
+ /**
111
+ * Number of layers offloaded to the GPU.
112
+ * If GPU support is disabled, this will always be `0`.
113
+ */
114
+ get gpuLayers() {
115
+ return this._gpuLayers;
116
+ }
117
+ /**
118
+ * Total model size in memory in bytes
119
+ */
120
+ get size() {
121
+ this._ensureNotDisposed();
122
+ return this._model.getModelSize();
123
+ }
124
+ tokenize(text, specialTokens = false, options) {
125
+ this._ensureNotDisposed();
126
+ if (text === "")
127
+ return [];
128
+ if (specialTokens === "builtin") {
129
+ const builtinToken = text;
130
+ switch (builtinToken) {
131
+ case "BOS": return this.tokens.bos == null ? [] : [this.tokens.bos];
132
+ case "EOS": return this.tokens.eos == null ? [] : [this.tokens.eos];
133
+ case "NL": return this.tokens.nl == null ? [] : [this.tokens.nl];
134
+ case "EOT": return this.tokens.infill.eot == null ? [] : [this.tokens.infill.eot];
135
+ }
136
+ void (builtinToken);
137
+ throw new Error(`Unknown builtin special token: ${builtinToken}`);
138
+ }
139
+ if (options === "trimLeadingSpace") {
140
+ if (specialTokens) {
141
+ const countLeadingSpaces = (text) => {
142
+ let count = 0;
143
+ for (; count < text.length; count++) {
144
+ if (text[count] !== " ")
145
+ break;
146
+ }
147
+ return count;
148
+ };
149
+ const textLeadingSpaces = countLeadingSpaces(text);
150
+ const [workaroundToken, workaroundTokenString] = (this.tokens.bos != null && this.tokens.bosString != null)
151
+ ? [this.tokens.bos, this.tokens.bosString]
152
+ : (this.tokens.eos != null && this.tokens.eosString != null)
153
+ ? [this.tokens.eos, this.tokens.eosString]
154
+ : (this.tokens.nl != null && this.tokens.nlString != null)
155
+ ? [this.tokens.nl, this.tokens.nlString]
156
+ : (this.tokens.infill.eot != null && this.tokens.infill.eotString != null)
157
+ ? [this.tokens.infill.eot, this.tokens.infill.eotString]
158
+ : [null, null];
159
+ if (workaroundToken != null && workaroundTokenString != null) {
160
+ const tokens = Array.from(this._model.tokenize(workaroundTokenString + text, true));
161
+ const workaroundTokenIndex = tokens.indexOf(workaroundToken);
162
+ // only use the tokenized output if it can be corrected, otherwise fallback to the default tokenization
163
+ if (workaroundTokenIndex >= 0 && workaroundTokenIndex <= 1) {
164
+ tokens.splice(0, workaroundTokenIndex + 1);
165
+ if (countLeadingSpaces(this.detokenize(tokens, true)) === textLeadingSpaces)
166
+ return tokens;
167
+ }
168
+ }
169
+ const workaroundTokensString = "\n";
170
+ const workaroundTokens = Array.from(this._model.tokenize(workaroundTokensString, true));
171
+ if (text.startsWith(workaroundTokensString)) {
172
+ const tokens = Array.from(this._model.tokenize(text, true));
173
+ if (this.detokenize(tokens, true).startsWith(workaroundTokensString))
174
+ return tokens;
175
+ }
176
+ const tokens = Array.from(this._model.tokenize(workaroundTokensString + text, true));
177
+ // only use the tokenized output if it can be corrected, otherwise fallback to the default tokenization
178
+ if (workaroundTokens.length > 0 && workaroundTokens.every((token, index) => tokens[index] === token)) {
179
+ tokens.splice(0, workaroundTokens.length);
180
+ if (countLeadingSpaces(this.detokenize(tokens, true)) === textLeadingSpaces)
181
+ return tokens;
182
+ }
183
+ }
184
+ else {
185
+ const workaroundTokensString = "\n";
186
+ const workaroundTokens = Array.from(this._model.tokenize(workaroundTokensString, false));
187
+ if (text.startsWith(workaroundTokensString)) {
188
+ const tokens = Array.from(this._model.tokenize(text, false));
189
+ if (this.detokenize(tokens, false).startsWith(workaroundTokensString))
190
+ return tokens;
191
+ }
192
+ const tokens = Array.from(this._model.tokenize(workaroundTokensString + text, false));
193
+ // only use the tokenized output if it can be corrected, otherwise fallback to the default tokenization
194
+ if (workaroundTokens.length > 0 && workaroundTokens.every((token, index) => tokens[index] === token)) {
195
+ tokens.splice(0, workaroundTokens.length);
196
+ return tokens;
197
+ }
198
+ }
199
+ }
200
+ return Array.from(this._model.tokenize(text, specialTokens));
201
+ }
202
+ /**
203
+ * Transform tokens into text
204
+ * @param tokens - the tokens to detokenize.
205
+ * @param [specialTokens] - if set to `true`, special tokens will be detokenized to their corresponding token text representation.
206
+ * Recommended for debugging purposes only.
207
+ * Defaults to `false`.
208
+ */
209
+ detokenize(tokens, specialTokens = false) {
210
+ this._ensureNotDisposed();
211
+ if (tokens.length === 0)
212
+ return "";
213
+ return this._model.detokenize(Uint32Array.from(tokens), Boolean(specialTokens));
214
+ }
215
+ getTokenAttributes(token) {
216
+ if (this.vocabularyType === LlamaVocabularyType.none)
217
+ return TokenAttributes._create(token, TokenAttribute.undefined);
218
+ return TokenAttributes._create(token, this._model.getTokenAttributes(token));
219
+ }
220
+ /** Check whether the given token is a special token (a control-type token or a token with no normal text representation) */
221
+ isSpecialToken(token) {
222
+ if (token == null)
223
+ return false;
224
+ if (this.getTokenAttributes(token).control)
225
+ return true;
226
+ const normalText = this.detokenize([token], false);
227
+ if (normalText === "")
228
+ return this.detokenize([token], true) !== "";
229
+ return false;
230
+ }
231
+ /** Check whether the given token is an EOG (End Of Generation) token, like EOS or EOT. */
232
+ isEogToken(token) {
233
+ if (token == null)
234
+ return false;
235
+ return token === this.tokens.eos || token === this.tokens.infill.eot || this._model.isEogToken(token);
236
+ }
237
+ async createContext(options = {}) {
238
+ return await withLock(this._llama._memoryLock, LlamaLocks.loadToMemory, options.createSignal, async () => {
239
+ const preventDisposalHandle = this._backendModelDisposeGuard.createPreventDisposalHandle();
240
+ try {
241
+ return await LlamaContext._create(options, { _model: this });
242
+ }
243
+ finally {
244
+ preventDisposalHandle.dispose();
245
+ }
246
+ });
247
+ }
248
+ async createEmbeddingContext(options = {}) {
249
+ return await withLock(this._llama._memoryLock, LlamaLocks.loadToMemory, options.createSignal, async () => {
250
+ const preventDisposalHandle = this._backendModelDisposeGuard.createPreventDisposalHandle();
251
+ try {
252
+ return await LlamaEmbeddingContext._create({ _model: this }, options);
253
+ }
254
+ finally {
255
+ preventDisposalHandle.dispose();
256
+ }
257
+ });
258
+ }
259
+ /**
260
+ * Get warnings about the model file that would affect its usage.
261
+ *
262
+ * These warnings include all the warnings generated by `GgufInsights`, but are more comprehensive.
263
+ */
264
+ getWarnings() {
265
+ this._ensureNotDisposed();
266
+ const warnings = this._fileInsights.getWarnings(this._modelPath);
267
+ const modelFilePathText = `("${getReadablePath(this._modelPath)}")`;
268
+ try {
269
+ const specialTokenString = this.tokens.bosString || this.tokens.eosString || this.tokens.infill.eotString;
270
+ if (specialTokenString != null && specialTokenString !== "") {
271
+ const beforeTextNoSpecialTokens = "some test text here";
272
+ const afterTextNoSpecialTokens = this.detokenize(this.tokenize(beforeTextNoSpecialTokens, false, "trimLeadingSpace"));
273
+ if (beforeTextNoSpecialTokens !== afterTextNoSpecialTokens)
274
+ warnings.push(`Using this model ${modelFilePathText} to tokenize text and then detokenize it resulted in a different text. ` +
275
+ "There might be an issue with the model or the tokenizer implementation. " +
276
+ "Using this model may not work as intended");
277
+ const beforeTextWithSpecialTokens = specialTokenString + beforeTextNoSpecialTokens;
278
+ const afterTextWithSpecialTokens = this.detokenize(this.tokenize(beforeTextWithSpecialTokens, true, "trimLeadingSpace"), true);
279
+ if (beforeTextWithSpecialTokens !== afterTextWithSpecialTokens)
280
+ warnings.push(`Using this model ${modelFilePathText} to tokenize text with special tokens and then ` +
281
+ "detokenize it resulted in a different text. " +
282
+ "There might be an issue with the model or the tokenizer implementation. " +
283
+ "Using this model may not work as intended");
284
+ }
285
+ }
286
+ catch (err) {
287
+ // do nothing
288
+ }
289
+ return warnings;
290
+ }
291
+ /** @hidden `ModelTypeDescription` type alias is too long in the documentation */
292
+ get typeDescription() {
293
+ this._ensureNotDisposed();
294
+ if (this._typeDescription == null)
295
+ this._typeDescription = this._model.getModelDescription();
296
+ return this._typeDescription;
297
+ }
298
+ /** The context size the model was trained on */
299
+ get trainContextSize() {
300
+ this._ensureNotDisposed();
301
+ if (this._trainContextSize == null)
302
+ this._trainContextSize = this._model.getTrainContextSize();
303
+ return this._trainContextSize;
304
+ }
305
+ /** The size of an embedding vector the model can produce */
306
+ get embeddingVectorSize() {
307
+ this._ensureNotDisposed();
308
+ if (this._embeddingVectorSize == null)
309
+ this._embeddingVectorSize = this._model.getEmbeddingVectorSize();
310
+ return this._embeddingVectorSize;
311
+ }
312
+ get vocabularyType() {
313
+ this._ensureNotDisposed();
314
+ if (this._vocabularyType == null) {
315
+ const vocabType = this._model.getVocabularyType();
316
+ this._vocabularyType = LlamaVocabularyTypeValues[vocabType];
317
+ if (this._vocabularyType == null) {
318
+ console.warn(getConsoleLogPrefix() + "Unknown vocabulary type:", vocabType);
319
+ this._vocabularyType = LlamaVocabularyType.none;
320
+ }
321
+ }
322
+ return this._vocabularyType;
323
+ }
324
+ /** @internal */
325
+ _ensureNotDisposed() {
326
+ if (this._disposedState.disposed)
327
+ throw new DisposedError();
328
+ }
329
+ /** @internal */
330
+ async _loadLora({ loraFilePath, baseModelPath, scale, threads }) {
331
+ await this._model.loadLora(path.resolve(process.cwd(), loraFilePath), scale ?? defaultLoraScale, Math.max(0, Math.floor(threads)), baseModelPath == null
332
+ ? undefined
333
+ : path.resolve(process.cwd(), baseModelPath));
334
+ }
335
+ /** @internal */
336
+ static async _create(modelOptions, { _llama }) {
337
+ const { loadSignal } = modelOptions;
338
+ let useMmap = modelOptions.useMmap ?? defaultUseMmap;
339
+ const loraOptions = typeof modelOptions.lora === "string"
340
+ ? { adapters: [{ loraFilePath: modelOptions.lora }] }
341
+ : modelOptions.lora;
342
+ if (loraOptions?.adapters != null && loraOptions.adapters.length > 0)
343
+ useMmap = false; // using LoRA with nmap crashes the process
344
+ const fileInfo = await readGgufFileInfo(modelOptions.modelPath, {
345
+ sourceType: "filesystem",
346
+ signal: loadSignal
347
+ });
348
+ const ggufInsights = await GgufInsights.from(fileInfo, _llama);
349
+ const gpuLayers = await ggufInsights.configurationResolver.resolveModelGpuLayers(modelOptions.gpuLayers, {
350
+ ignoreMemorySafetyChecks: modelOptions.ignoreMemorySafetyChecks
351
+ });
352
+ const vramRequiredEstimate = ggufInsights.estimateModelResourceRequirements({ gpuLayers: gpuLayers }).gpuVram;
353
+ const model = new LlamaModel({ ...modelOptions, gpuLayers, useMmap }, { _fileInfo: fileInfo, _fileInsights: ggufInsights, _llama });
354
+ const modelCreationMemoryReservation = modelOptions.ignoreMemorySafetyChecks
355
+ ? null
356
+ : _llama._vramOrchestrator.reserveMemory(vramRequiredEstimate);
357
+ const loggedWarnings = new Set();
358
+ function onAbort() {
359
+ model._model.abortActiveModelLoad();
360
+ loadSignal?.removeEventListener("abort", onAbort);
361
+ }
362
+ function logWarnings(warnings) {
363
+ for (const warning of warnings) {
364
+ if (loggedWarnings.has(warning))
365
+ continue;
366
+ _llama._log(LlamaLogLevel.warn, warning);
367
+ loggedWarnings.add(warning);
368
+ }
369
+ }
370
+ if (loadSignal != null) {
371
+ if (loadSignal.aborted)
372
+ throw loadSignal.reason;
373
+ loadSignal.addEventListener("abort", onAbort);
374
+ }
375
+ logWarnings(ggufInsights.getWarnings(modelOptions.modelPath));
376
+ try {
377
+ const modelLoaded = await model._model.init();
378
+ if (loadSignal?.aborted) {
379
+ if (modelLoaded)
380
+ await model._model.dispose();
381
+ throw loadSignal.reason;
382
+ }
383
+ else if (!modelLoaded)
384
+ throw new Error("Failed to load model");
385
+ loadSignal?.removeEventListener("abort", onAbort);
386
+ logWarnings(model.getWarnings());
387
+ if (loraOptions != null && loraOptions.adapters.length > 0) {
388
+ const loraThreads = loraOptions.threads ?? defaultLoraThreads;
389
+ let loadedAdapters = 0;
390
+ for (const adapter of loraOptions.adapters) {
391
+ try {
392
+ await model._loadLora({
393
+ loraFilePath: adapter.loraFilePath,
394
+ baseModelPath: adapter.baseModelPath,
395
+ scale: adapter.scale,
396
+ threads: loraThreads
397
+ });
398
+ loadedAdapters++;
399
+ try {
400
+ loraOptions.onLoadProgress?.(loadedAdapters / loraOptions.adapters.length);
401
+ }
402
+ catch (err) {
403
+ console.error(err);
404
+ }
405
+ }
406
+ catch (err) {
407
+ await model._model.dispose();
408
+ throw err;
409
+ }
410
+ if (loadSignal?.aborted) {
411
+ await model._model.dispose();
412
+ throw loadSignal.reason;
413
+ }
414
+ }
415
+ logWarnings(model.getWarnings());
416
+ }
417
+ else if (loraOptions?.onLoadProgress != null) {
418
+ try {
419
+ loraOptions.onLoadProgress(1);
420
+ }
421
+ catch (err) {
422
+ console.error(err);
423
+ }
424
+ }
425
+ return model;
426
+ }
427
+ finally {
428
+ loadSignal?.removeEventListener("abort", onAbort);
429
+ modelCreationMemoryReservation?.dispose?.();
430
+ }
431
+ }
432
+ }
433
+ export class LlamaModelTokens {
434
+ /** @internal */ _model;
435
+ /** @internal */ _disposedState;
436
+ /** @internal */ _infillTokens;
437
+ /** @internal */ _bosToken;
438
+ /** @internal */ _eosToken;
439
+ /** @internal */ _nlToken;
440
+ /** @internal */ _bosString;
441
+ /** @internal */ _eosString;
442
+ /** @internal */ _nlString;
443
+ /** @internal */ _shouldPrependBosToken;
444
+ constructor(model, disposedState) {
445
+ this._model = model;
446
+ this._disposedState = disposedState;
447
+ }
448
+ /**
449
+ * @returns infill tokens
450
+ */
451
+ get infill() {
452
+ this._ensureNotDisposed();
453
+ if (this._infillTokens == null)
454
+ this._infillTokens = LlamaModelInfillTokens._create(this._model, this._disposedState);
455
+ return this._infillTokens;
456
+ }
457
+ /**
458
+ * @returns The BOS (Beginning Of Sequence) token.
459
+ */
460
+ get bos() {
461
+ this._ensureNotDisposed();
462
+ if (this._bosToken == null)
463
+ this._bosToken = this._model.tokenBos();
464
+ if (this._bosToken === -1)
465
+ return null;
466
+ return this._bosToken;
467
+ }
468
+ /**
469
+ * @returns The EOS (End Of Sequence) token.
470
+ */
471
+ get eos() {
472
+ this._ensureNotDisposed();
473
+ if (this._eosToken == null)
474
+ this._eosToken = this._model.tokenEos();
475
+ if (this._eosToken === -1)
476
+ return null;
477
+ return this._eosToken;
478
+ }
479
+ /**
480
+ * @returns The NL (New Line) token.
481
+ */
482
+ get nl() {
483
+ this._ensureNotDisposed();
484
+ if (this._nlToken == null)
485
+ this._nlToken = this._model.tokenNl();
486
+ if (this._nlToken === -1)
487
+ return null;
488
+ return this._nlToken;
489
+ }
490
+ /**
491
+ * @returns The BOS (Beginning Of Sequence) token as a string.
492
+ */
493
+ get bosString() {
494
+ this._ensureNotDisposed();
495
+ const bosToken = this.bos;
496
+ if (bosToken == null)
497
+ return null;
498
+ if (this._bosString == null)
499
+ this._bosString = this._model.getTokenString(bosToken);
500
+ return this._bosString;
501
+ }
502
+ /**
503
+ * @returns The EOS (End Of Sequence) token as a string.
504
+ */
505
+ get eosString() {
506
+ this._ensureNotDisposed();
507
+ const eosToken = this.eos;
508
+ if (eosToken == null)
509
+ return null;
510
+ if (this._eosString == null)
511
+ this._eosString = this._model.getTokenString(eosToken);
512
+ return this._eosString;
513
+ }
514
+ /**
515
+ * @returns The NL (New Line) token as a string.
516
+ */
517
+ get nlString() {
518
+ this._ensureNotDisposed();
519
+ const nlToken = this.nl;
520
+ if (nlToken == null)
521
+ return null;
522
+ if (this._nlString == null)
523
+ this._nlString = this._model.getTokenString(nlToken);
524
+ return this._nlString;
525
+ }
526
+ /**
527
+ * @returns Whether we should prepend a BOS (Beginning Of Sequence) token for evaluations with this model.
528
+ */
529
+ get shouldPrependBosToken() {
530
+ this._ensureNotDisposed();
531
+ if (this._shouldPrependBosToken == null)
532
+ this._shouldPrependBosToken = this.bos != null && this._model.shouldPrependBosToken();
533
+ return this._shouldPrependBosToken;
534
+ }
535
+ /** @internal */
536
+ _ensureNotDisposed() {
537
+ if (this._disposedState.disposed)
538
+ throw new DisposedError();
539
+ }
540
+ /** @internal */
541
+ static _create(model, disposedState) {
542
+ return new LlamaModelTokens(model, disposedState);
543
+ }
544
+ }
545
+ export class LlamaModelInfillTokens {
546
+ /** @internal */ _model;
547
+ /** @internal */ _disposedState;
548
+ /** @internal */ _prefixToken;
549
+ /** @internal */ _middleToken;
550
+ /** @internal */ _suffixToken;
551
+ /** @internal */ _eotToken;
552
+ /** @internal */ _prefixString;
553
+ /** @internal */ _middleString;
554
+ /** @internal */ _suffixString;
555
+ /** @internal */ _eotString;
556
+ constructor(model, disposedState) {
557
+ this._model = model;
558
+ this._disposedState = disposedState;
559
+ }
560
+ /**
561
+ * @returns The beginning of infill prefix token.
562
+ */
563
+ get prefix() {
564
+ this._ensureNotDisposed();
565
+ if (this._prefixToken == null)
566
+ this._prefixToken = this._resolveSpecialToken(this._model.prefixToken(), ["<fim_prefix>"]);
567
+ if (this._prefixToken === -1)
568
+ return null;
569
+ return this._prefixToken;
570
+ }
571
+ /**
572
+ * @returns The beginning of infill middle token.
573
+ */
574
+ get middle() {
575
+ this._ensureNotDisposed();
576
+ if (this._middleToken == null)
577
+ this._middleToken = this._resolveSpecialToken(this._model.middleToken(), ["<fim_middle>"]);
578
+ if (this._middleToken === -1)
579
+ return null;
580
+ return this._middleToken;
581
+ }
582
+ /**
583
+ * @returns The beginning of infill suffix token.
584
+ */
585
+ get suffix() {
586
+ this._ensureNotDisposed();
587
+ if (this._suffixToken == null)
588
+ this._suffixToken = this._resolveSpecialToken(this._model.suffixToken(), ["<fim_suffix>"]);
589
+ if (this._suffixToken === -1)
590
+ return null;
591
+ return this._suffixToken;
592
+ }
593
+ /**
594
+ * @returns End of infill middle token (End Of Text).
595
+ */
596
+ get eot() {
597
+ this._ensureNotDisposed();
598
+ if (this._eotToken == null)
599
+ this._eotToken = this._model.eotToken();
600
+ if (this._eotToken === -1)
601
+ return null;
602
+ return this._eotToken;
603
+ }
604
+ /**
605
+ * @returns The beginning of infill prefix token as a string.
606
+ */
607
+ get prefixString() {
608
+ this._ensureNotDisposed();
609
+ const prefixToken = this.prefix;
610
+ if (prefixToken == null)
611
+ return null;
612
+ if (this._prefixString == null)
613
+ this._prefixString = this._model.getTokenString(prefixToken);
614
+ return this._prefixString;
615
+ }
616
+ /**
617
+ * @returns The beginning of infill middle token as a string.
618
+ */
619
+ get middleString() {
620
+ this._ensureNotDisposed();
621
+ const middleToken = this.middle;
622
+ if (middleToken == null)
623
+ return null;
624
+ if (this._middleString == null)
625
+ this._middleString = this._model.getTokenString(middleToken);
626
+ return this._middleString;
627
+ }
628
+ /**
629
+ * @returns The beginning of infill suffix token as a string.
630
+ */
631
+ get suffixString() {
632
+ this._ensureNotDisposed();
633
+ const suffixToken = this.suffix;
634
+ if (suffixToken == null)
635
+ return null;
636
+ if (this._suffixString == null)
637
+ this._suffixString = this._model.getTokenString(suffixToken);
638
+ return this._suffixString;
639
+ }
640
+ /**
641
+ * @returns End of infill middle token (End Of Text) as a string.
642
+ */
643
+ get eotString() {
644
+ this._ensureNotDisposed();
645
+ const eotToken = this.eot;
646
+ if (eotToken == null)
647
+ return null;
648
+ if (this._eotString == null)
649
+ this._eotString = this._model.getTokenString(eotToken);
650
+ return this._eotString;
651
+ }
652
+ /** @internal */
653
+ _ensureNotDisposed() {
654
+ if (this._disposedState.disposed)
655
+ throw new DisposedError();
656
+ }
657
+ /** @internal */
658
+ _resolveSpecialToken(token, fallbackTexts) {
659
+ if (token != null && token !== -1)
660
+ return token;
661
+ for (const text of fallbackTexts) {
662
+ const tokens = this._model.tokenize(text, true);
663
+ if (tokens.length !== 1)
664
+ continue;
665
+ return tokens[0];
666
+ }
667
+ return -1;
668
+ }
669
+ /** @internal */
670
+ static _create(model, disposedState) {
671
+ return new LlamaModelInfillTokens(model, disposedState);
672
+ }
673
+ }
674
+ function disposeModelIfReferenced(modelRef) {
675
+ const model = modelRef.deref();
676
+ if (model != null)
677
+ void model.dispose();
678
+ }
679
+ //# sourceMappingURL=LlamaModel.js.map