node-llama-cpp 3.0.0-beta.2 → 3.0.0-beta.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (639)
  1. package/README.md +14 -11
  2. package/dist/ChatWrapper.d.ts +2 -15
  3. package/dist/ChatWrapper.js +28 -33
  4. package/dist/ChatWrapper.js.map +1 -1
  5. package/dist/apiDocsOverrides.d.ts +1 -0
  6. package/dist/apiDocsOverrides.js +5 -0
  7. package/dist/apiDocsOverrides.js.map +1 -0
  8. package/dist/{utils/getBin.d.ts → bindings/AddonTypes.d.ts} +54 -7
  9. package/dist/bindings/AddonTypes.js +2 -0
  10. package/dist/bindings/AddonTypes.js.map +1 -0
  11. package/dist/bindings/Llama.d.ts +47 -0
  12. package/dist/bindings/Llama.js +343 -0
  13. package/dist/bindings/Llama.js.map +1 -0
  14. package/dist/bindings/consts.d.ts +2 -0
  15. package/dist/bindings/consts.js +11 -0
  16. package/dist/bindings/consts.js.map +1 -0
  17. package/dist/bindings/getLlama.d.ts +145 -0
  18. package/dist/bindings/getLlama.js +389 -0
  19. package/dist/bindings/getLlama.js.map +1 -0
  20. package/dist/bindings/types.d.ts +55 -0
  21. package/dist/bindings/types.js +77 -0
  22. package/dist/bindings/types.js.map +1 -0
  23. package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
  24. package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
  25. package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
  26. package/dist/bindings/utils/NoBinaryFoundError.d.ts +2 -0
  27. package/dist/bindings/utils/NoBinaryFoundError.js +7 -0
  28. package/dist/bindings/utils/NoBinaryFoundError.js.map +1 -0
  29. package/dist/bindings/utils/asyncEvery.d.ts +5 -0
  30. package/dist/bindings/utils/asyncEvery.js +15 -0
  31. package/dist/bindings/utils/asyncEvery.js.map +1 -0
  32. package/dist/bindings/utils/asyncSome.d.ts +5 -0
  33. package/dist/bindings/utils/asyncSome.js +27 -0
  34. package/dist/bindings/utils/asyncSome.js.map +1 -0
  35. package/dist/{utils → bindings/utils}/binariesGithubRelease.js +1 -1
  36. package/dist/bindings/utils/binariesGithubRelease.js.map +1 -0
  37. package/dist/bindings/utils/clearAllLocalBuilds.d.ts +1 -0
  38. package/dist/bindings/utils/clearAllLocalBuilds.js +47 -0
  39. package/dist/bindings/utils/clearAllLocalBuilds.js.map +1 -0
  40. package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +11 -0
  41. package/dist/bindings/utils/cloneLlamaCppRepo.js +166 -0
  42. package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -0
  43. package/dist/bindings/utils/compileLLamaCpp.d.ts +15 -0
  44. package/dist/bindings/utils/compileLLamaCpp.js +221 -0
  45. package/dist/bindings/utils/compileLLamaCpp.js.map +1 -0
  46. package/dist/bindings/utils/detectAvailableComputeLayers.d.ts +14 -0
  47. package/dist/bindings/utils/detectAvailableComputeLayers.js +304 -0
  48. package/dist/bindings/utils/detectAvailableComputeLayers.js.map +1 -0
  49. package/dist/bindings/utils/detectGlibc.d.ts +4 -0
  50. package/dist/bindings/utils/detectGlibc.js +46 -0
  51. package/dist/bindings/utils/detectGlibc.js.map +1 -0
  52. package/dist/bindings/utils/getBestComputeLayersAvailable.d.ts +9 -0
  53. package/dist/bindings/utils/getBestComputeLayersAvailable.js +29 -0
  54. package/dist/bindings/utils/getBestComputeLayersAvailable.js.map +1 -0
  55. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.d.ts +5 -0
  56. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js +93 -0
  57. package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js.map +1 -0
  58. package/dist/bindings/utils/getCanUsePrebuiltBinaries.d.ts +1 -0
  59. package/dist/bindings/utils/getCanUsePrebuiltBinaries.js +8 -0
  60. package/dist/bindings/utils/getCanUsePrebuiltBinaries.js.map +1 -0
  61. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.d.ts +2 -0
  62. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js +21 -0
  63. package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js.map +1 -0
  64. package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +11 -0
  65. package/dist/bindings/utils/getGpuTypesToUseForOption.js +30 -0
  66. package/dist/bindings/utils/getGpuTypesToUseForOption.js.map +1 -0
  67. package/dist/bindings/utils/getLinuxDistroInfo.d.ts +9 -0
  68. package/dist/bindings/utils/getLinuxDistroInfo.js +46 -0
  69. package/dist/bindings/utils/getLinuxDistroInfo.js.map +1 -0
  70. package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
  71. package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
  72. package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
  73. package/dist/bindings/utils/getPlatform.d.ts +2 -0
  74. package/dist/bindings/utils/getPlatform.js +15 -0
  75. package/dist/bindings/utils/getPlatform.js.map +1 -0
  76. package/dist/bindings/utils/getPlatformInfo.d.ts +5 -0
  77. package/dist/bindings/utils/getPlatformInfo.js +28 -0
  78. package/dist/bindings/utils/getPlatformInfo.js.map +1 -0
  79. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.d.ts +3 -0
  80. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js +27 -0
  81. package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js.map +1 -0
  82. package/dist/bindings/utils/hasFileInPath.d.ts +2 -0
  83. package/dist/bindings/utils/hasFileInPath.js +34 -0
  84. package/dist/bindings/utils/hasFileInPath.js.map +1 -0
  85. package/dist/bindings/utils/lastBuildInfo.d.ts +6 -0
  86. package/dist/bindings/utils/lastBuildInfo.js +17 -0
  87. package/dist/bindings/utils/lastBuildInfo.js.map +1 -0
  88. package/dist/bindings/utils/logBinaryUsageExampleToConsole.d.ts +2 -0
  89. package/dist/bindings/utils/logBinaryUsageExampleToConsole.js +22 -0
  90. package/dist/bindings/utils/logBinaryUsageExampleToConsole.js.map +1 -0
  91. package/dist/bindings/utils/logDistroInstallInstruction.d.ts +14 -0
  92. package/dist/bindings/utils/logDistroInstallInstruction.js +48 -0
  93. package/dist/bindings/utils/logDistroInstallInstruction.js.map +1 -0
  94. package/dist/bindings/utils/resolveCustomCmakeOptions.d.ts +1 -0
  95. package/dist/bindings/utils/resolveCustomCmakeOptions.js +45 -0
  96. package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -0
  97. package/dist/bindings/utils/testBindingBinary.d.ts +1 -0
  98. package/dist/bindings/utils/testBindingBinary.js +98 -0
  99. package/dist/bindings/utils/testBindingBinary.js.map +1 -0
  100. package/dist/bindings/utils/testCmakeBinary.d.ts +5 -0
  101. package/dist/bindings/utils/testCmakeBinary.js +32 -0
  102. package/dist/bindings/utils/testCmakeBinary.js.map +1 -0
  103. package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
  104. package/dist/chatWrappers/AlpacaChatWrapper.js +9 -2
  105. package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
  106. package/dist/chatWrappers/ChatMLChatWrapper.d.ts +5 -0
  107. package/dist/chatWrappers/ChatMLChatWrapper.js +13 -11
  108. package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
  109. package/dist/chatWrappers/FalconChatWrapper.d.ts +2 -1
  110. package/dist/chatWrappers/FalconChatWrapper.js +28 -11
  111. package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
  112. package/dist/chatWrappers/FunctionaryChatWrapper.js +86 -73
  113. package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
  114. package/dist/chatWrappers/{LlamaChatWrapper.d.ts → GemmaChatWrapper.d.ts} +6 -1
  115. package/dist/chatWrappers/GemmaChatWrapper.js +88 -0
  116. package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -0
  117. package/dist/chatWrappers/GeneralChatWrapper.d.ts +2 -1
  118. package/dist/chatWrappers/GeneralChatWrapper.js +35 -12
  119. package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
  120. package/dist/chatWrappers/Llama2ChatWrapper.d.ts +20 -0
  121. package/dist/chatWrappers/{LlamaChatWrapper.js → Llama2ChatWrapper.js} +29 -11
  122. package/dist/chatWrappers/Llama2ChatWrapper.js.map +1 -0
  123. package/dist/chatWrappers/Llama3ChatWrapper.d.ts +31 -0
  124. package/dist/chatWrappers/Llama3ChatWrapper.js +129 -0
  125. package/dist/chatWrappers/Llama3ChatWrapper.js.map +1 -0
  126. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +73 -0
  127. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +359 -0
  128. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
  129. package/dist/chatWrappers/generic/TemplateChatWrapper.d.ts +64 -0
  130. package/dist/chatWrappers/generic/TemplateChatWrapper.js +200 -0
  131. package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
  132. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +33 -0
  133. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
  134. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
  135. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.d.ts +42 -0
  136. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js +82 -0
  137. package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js.map +1 -0
  138. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
  139. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +206 -0
  140. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
  141. package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +69 -0
  142. package/dist/chatWrappers/utils/resolveChatWrapper.js +214 -0
  143. package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
  144. package/dist/cli/cli.js +21 -7
  145. package/dist/cli/cli.js.map +1 -1
  146. package/dist/cli/commands/BuildCommand.d.ts +6 -4
  147. package/dist/cli/commands/BuildCommand.js +103 -41
  148. package/dist/cli/commands/BuildCommand.js.map +1 -1
  149. package/dist/cli/commands/ChatCommand.d.ts +18 -6
  150. package/dist/cli/commands/ChatCommand.js +298 -142
  151. package/dist/cli/commands/ChatCommand.js.map +1 -1
  152. package/dist/cli/commands/ClearCommand.d.ts +1 -1
  153. package/dist/cli/commands/ClearCommand.js +11 -12
  154. package/dist/cli/commands/ClearCommand.js.map +1 -1
  155. package/dist/cli/commands/CompleteCommand.d.ts +29 -0
  156. package/dist/cli/commands/CompleteCommand.js +365 -0
  157. package/dist/cli/commands/CompleteCommand.js.map +1 -0
  158. package/dist/cli/commands/DebugCommand.d.ts +7 -0
  159. package/dist/cli/commands/DebugCommand.js +54 -0
  160. package/dist/cli/commands/DebugCommand.js.map +1 -0
  161. package/dist/cli/commands/DownloadCommand.d.ts +6 -4
  162. package/dist/cli/commands/DownloadCommand.js +120 -69
  163. package/dist/cli/commands/DownloadCommand.js.map +1 -1
  164. package/dist/cli/commands/InfillCommand.d.ts +31 -0
  165. package/dist/cli/commands/InfillCommand.js +401 -0
  166. package/dist/cli/commands/InfillCommand.js.map +1 -0
  167. package/dist/cli/commands/InitCommand.d.ts +11 -0
  168. package/dist/cli/commands/InitCommand.js +195 -0
  169. package/dist/cli/commands/InitCommand.js.map +1 -0
  170. package/dist/cli/commands/OnPostInstallCommand.js +9 -10
  171. package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
  172. package/dist/cli/commands/PullCommand.d.ts +12 -0
  173. package/dist/cli/commands/PullCommand.js +117 -0
  174. package/dist/cli/commands/PullCommand.js.map +1 -0
  175. package/dist/cli/commands/inspect/InspectCommand.d.ts +4 -0
  176. package/dist/cli/commands/inspect/InspectCommand.js +19 -0
  177. package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
  178. package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +12 -0
  179. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +136 -0
  180. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
  181. package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
  182. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +138 -0
  183. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
  184. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +17 -0
  185. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +613 -0
  186. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
  187. package/dist/cli/projectTemplates.d.ts +7 -0
  188. package/dist/cli/projectTemplates.js +10 -0
  189. package/dist/cli/projectTemplates.js.map +1 -0
  190. package/dist/cli/recommendedModels.d.ts +2 -0
  191. package/dist/cli/recommendedModels.js +342 -0
  192. package/dist/cli/recommendedModels.js.map +1 -0
  193. package/dist/cli/startCreateCli.d.ts +2 -0
  194. package/dist/cli/startCreateCli.js +26 -0
  195. package/dist/cli/startCreateCli.js.map +1 -0
  196. package/dist/cli/utils/ConsoleInteraction.d.ts +23 -0
  197. package/dist/cli/utils/ConsoleInteraction.js +122 -0
  198. package/dist/cli/utils/ConsoleInteraction.js.map +1 -0
  199. package/dist/cli/utils/ConsoleTable.d.ts +23 -0
  200. package/dist/cli/utils/ConsoleTable.js +86 -0
  201. package/dist/cli/utils/ConsoleTable.js.map +1 -0
  202. package/dist/cli/utils/basicChooseFromListConsoleInteraction.d.ts +13 -0
  203. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js +111 -0
  204. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js.map +1 -0
  205. package/dist/cli/utils/consolePromptQuestion.d.ts +6 -0
  206. package/dist/cli/utils/consolePromptQuestion.js +82 -0
  207. package/dist/cli/utils/consolePromptQuestion.js.map +1 -0
  208. package/dist/cli/utils/getReadablePath.d.ts +1 -0
  209. package/dist/cli/utils/getReadablePath.js +14 -0
  210. package/dist/cli/utils/getReadablePath.js.map +1 -0
  211. package/dist/cli/utils/interactivelyAskForModel.d.ts +7 -0
  212. package/dist/cli/utils/interactivelyAskForModel.js +451 -0
  213. package/dist/cli/utils/interactivelyAskForModel.js.map +1 -0
  214. package/dist/cli/utils/logUsedGpuTypeOption.d.ts +2 -0
  215. package/dist/cli/utils/logUsedGpuTypeOption.js +9 -0
  216. package/dist/cli/utils/logUsedGpuTypeOption.js.map +1 -0
  217. package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
  218. package/dist/cli/utils/printCommonInfoLines.js +71 -0
  219. package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
  220. package/dist/cli/utils/printInfoLine.d.ts +12 -0
  221. package/dist/cli/utils/printInfoLine.js +54 -0
  222. package/dist/cli/utils/printInfoLine.js.map +1 -0
  223. package/dist/cli/utils/projectTemplates.d.ts +19 -0
  224. package/dist/cli/utils/projectTemplates.js +47 -0
  225. package/dist/cli/utils/projectTemplates.js.map +1 -0
  226. package/dist/cli/utils/resolveCommandGgufPath.d.ts +4 -0
  227. package/dist/cli/utils/resolveCommandGgufPath.js +71 -0
  228. package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
  229. package/dist/cli/utils/resolveHeaderFlag.d.ts +1 -0
  230. package/dist/cli/utils/resolveHeaderFlag.js +21 -0
  231. package/dist/cli/utils/resolveHeaderFlag.js.map +1 -0
  232. package/dist/cli/utils/resolveModelRecommendationFileOptions.d.ts +19 -0
  233. package/dist/cli/utils/resolveModelRecommendationFileOptions.js +7 -0
  234. package/dist/cli/utils/resolveModelRecommendationFileOptions.js.map +1 -0
  235. package/dist/cli/utils/splitAnsiToLines.d.ts +1 -0
  236. package/dist/cli/utils/splitAnsiToLines.js +32 -0
  237. package/dist/cli/utils/splitAnsiToLines.js.map +1 -0
  238. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.d.ts +2 -0
  239. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js +23 -0
  240. package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js.map +1 -0
  241. package/dist/commands.d.ts +1 -0
  242. package/dist/commands.js +3 -0
  243. package/dist/commands.js.map +1 -1
  244. package/dist/config.d.ts +38 -5
  245. package/dist/config.js +61 -16
  246. package/dist/config.js.map +1 -1
  247. package/dist/consts.d.ts +3 -0
  248. package/dist/consts.js +10 -0
  249. package/dist/consts.js.map +1 -0
  250. package/dist/{llamaEvaluator → evaluator}/LlamaChat/LlamaChat.d.ts +37 -35
  251. package/dist/{llamaEvaluator → evaluator}/LlamaChat/LlamaChat.js +298 -221
  252. package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -0
  253. package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/FunctionCallGrammar.d.ts +2 -1
  254. package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/FunctionCallGrammar.js +5 -3
  255. package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.js.map +1 -0
  256. package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +18 -0
  257. package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -0
  258. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/LlamaChatSession.d.ts +40 -3
  259. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/LlamaChatSession.js +28 -7
  260. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -0
  261. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/utils/defineChatSessionFunction.d.ts +3 -0
  262. package/dist/{llamaEvaluator → evaluator}/LlamaChatSession/utils/defineChatSessionFunction.js +3 -0
  263. package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +1 -0
  264. package/dist/evaluator/LlamaCompletion.d.ts +155 -0
  265. package/dist/evaluator/LlamaCompletion.js +405 -0
  266. package/dist/evaluator/LlamaCompletion.js.map +1 -0
  267. package/dist/{llamaEvaluator → evaluator}/LlamaContext/LlamaContext.d.ts +41 -20
  268. package/dist/{llamaEvaluator → evaluator}/LlamaContext/LlamaContext.js +271 -81
  269. package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -0
  270. package/dist/evaluator/LlamaContext/types.d.ts +140 -0
  271. package/dist/evaluator/LlamaContext/types.js.map +1 -0
  272. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
  273. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
  274. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
  275. package/dist/{llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js → evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js} +4 -4
  276. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
  277. package/dist/evaluator/LlamaEmbeddingContext.d.ts +51 -0
  278. package/dist/evaluator/LlamaEmbeddingContext.js +73 -0
  279. package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -0
  280. package/dist/{llamaEvaluator → evaluator}/LlamaGrammar.d.ts +8 -5
  281. package/dist/{llamaEvaluator → evaluator}/LlamaGrammar.js +13 -10
  282. package/dist/evaluator/LlamaGrammar.js.map +1 -0
  283. package/dist/{llamaEvaluator → evaluator}/LlamaGrammarEvaluationState.js +4 -4
  284. package/dist/evaluator/LlamaGrammarEvaluationState.js.map +1 -0
  285. package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.d.ts +2 -1
  286. package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.js +3 -3
  287. package/dist/evaluator/LlamaJsonSchemaGrammar.js.map +1 -0
  288. package/dist/evaluator/LlamaModel.d.ts +230 -0
  289. package/dist/evaluator/LlamaModel.js +597 -0
  290. package/dist/evaluator/LlamaModel.js.map +1 -0
  291. package/dist/evaluator/TokenBias.d.ts +22 -0
  292. package/dist/evaluator/TokenBias.js +33 -0
  293. package/dist/evaluator/TokenBias.js.map +1 -0
  294. package/dist/evaluator/TokenMeter.d.ts +54 -0
  295. package/dist/evaluator/TokenMeter.js +86 -0
  296. package/dist/evaluator/TokenMeter.js.map +1 -0
  297. package/dist/gguf/consts.d.ts +3 -0
  298. package/dist/gguf/consts.js +8 -0
  299. package/dist/gguf/consts.js.map +1 -0
  300. package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
  301. package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
  302. package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
  303. package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
  304. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
  305. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
  306. package/dist/gguf/fileReaders/GgufFileReader.d.ts +33 -0
  307. package/dist/gguf/fileReaders/GgufFileReader.js +76 -0
  308. package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
  309. package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +17 -0
  310. package/dist/gguf/fileReaders/GgufFsFileReader.js +45 -0
  311. package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
  312. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +22 -0
  313. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +63 -0
  314. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
  315. package/dist/gguf/insights/GgufInsights.d.ts +42 -0
  316. package/dist/gguf/insights/GgufInsights.js +361 -0
  317. package/dist/gguf/insights/GgufInsights.js.map +1 -0
  318. package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +87 -0
  319. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +136 -0
  320. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -0
  321. package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +18 -0
  322. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +76 -0
  323. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -0
  324. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +14 -0
  325. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +177 -0
  326. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -0
  327. package/dist/gguf/insights/utils/scoreLevels.d.ts +5 -0
  328. package/dist/gguf/insights/utils/scoreLevels.js +16 -0
  329. package/dist/gguf/insights/utils/scoreLevels.js.map +1 -0
  330. package/dist/gguf/parser/GgufV2Parser.d.ts +19 -0
  331. package/dist/gguf/parser/GgufV2Parser.js +115 -0
  332. package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
  333. package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
  334. package/dist/gguf/parser/GgufV3Parser.js +4 -0
  335. package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
  336. package/dist/gguf/parser/parseGguf.d.ts +8 -0
  337. package/dist/gguf/parser/parseGguf.js +63 -0
  338. package/dist/gguf/parser/parseGguf.js.map +1 -0
  339. package/dist/gguf/readGgufFileInfo.d.ts +33 -0
  340. package/dist/gguf/readGgufFileInfo.js +66 -0
  341. package/dist/gguf/readGgufFileInfo.js.map +1 -0
  342. package/dist/gguf/types/GgufFileInfoTypes.d.ts +84 -0
  343. package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
  344. package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
  345. package/dist/gguf/types/GgufMetadataTypes.d.ts +334 -0
  346. package/dist/gguf/types/GgufMetadataTypes.js +86 -0
  347. package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
  348. package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
  349. package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
  350. package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
  351. package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
  352. package/dist/gguf/utils/GgufReadOffset.js +18 -0
  353. package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
  354. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +5 -0
  355. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +38 -0
  356. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
  357. package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
  358. package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
  359. package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
  360. package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
  361. package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
  362. package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
  363. package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
  364. package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
  365. package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
  366. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.d.ts +2 -0
  367. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js +39 -0
  368. package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js.map +1 -0
  369. package/dist/gguf/utils/resolveSplitGgufParts.d.ts +7 -0
  370. package/dist/gguf/utils/resolveSplitGgufParts.js +55 -0
  371. package/dist/gguf/utils/resolveSplitGgufParts.js.map +1 -0
  372. package/dist/index.d.ts +37 -17
  373. package/dist/index.js +33 -14
  374. package/dist/index.js.map +1 -1
  375. package/dist/state.d.ts +4 -0
  376. package/dist/state.js +14 -0
  377. package/dist/state.js.map +1 -1
  378. package/dist/types.d.ts +53 -2
  379. package/dist/types.js.map +1 -1
  380. package/dist/utils/DisposeGuard.d.ts +13 -0
  381. package/dist/utils/DisposeGuard.js +120 -0
  382. package/dist/utils/DisposeGuard.js.map +1 -0
  383. package/dist/utils/InsufficientMemoryError.d.ts +3 -0
  384. package/dist/utils/InsufficientMemoryError.js +6 -0
  385. package/dist/utils/InsufficientMemoryError.js.map +1 -0
  386. package/dist/utils/LlamaText.d.ts +50 -25
  387. package/dist/utils/LlamaText.js +367 -155
  388. package/dist/utils/LlamaText.js.map +1 -1
  389. package/dist/utils/StopGenerationDetector.d.ts +1 -1
  390. package/dist/utils/StopGenerationDetector.js +23 -18
  391. package/dist/utils/StopGenerationDetector.js.map +1 -1
  392. package/dist/utils/TokenStreamRegulator.d.ts +8 -4
  393. package/dist/utils/TokenStreamRegulator.js +78 -8
  394. package/dist/utils/TokenStreamRegulator.js.map +1 -1
  395. package/dist/utils/UnsupportedError.d.ts +2 -0
  396. package/dist/utils/UnsupportedError.js +7 -0
  397. package/dist/utils/UnsupportedError.js.map +1 -0
  398. package/dist/utils/cmake.js +38 -20
  399. package/dist/utils/cmake.js.map +1 -1
  400. package/dist/utils/createModelDownloader.d.ts +102 -0
  401. package/dist/utils/createModelDownloader.js +226 -0
  402. package/dist/utils/createModelDownloader.js.map +1 -0
  403. package/dist/utils/findBestOption.d.ts +4 -0
  404. package/dist/utils/findBestOption.js +15 -0
  405. package/dist/utils/findBestOption.js.map +1 -0
  406. package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js +18 -8
  407. package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js.map +1 -1
  408. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.d.ts +5 -0
  409. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js +11 -0
  410. package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js.map +1 -0
  411. package/dist/utils/gbnfJson/terminals/GbnfArray.d.ts +3 -1
  412. package/dist/utils/gbnfJson/terminals/GbnfArray.js +10 -5
  413. package/dist/utils/gbnfJson/terminals/GbnfArray.js.map +1 -1
  414. package/dist/utils/gbnfJson/terminals/GbnfBoolean.d.ts +1 -1
  415. package/dist/utils/gbnfJson/terminals/GbnfBoolean.js.map +1 -1
  416. package/dist/utils/gbnfJson/terminals/GbnfBooleanValue.js.map +1 -1
  417. package/dist/utils/gbnfJson/terminals/GbnfGrammar.js.map +1 -1
  418. package/dist/utils/gbnfJson/terminals/GbnfNull.d.ts +1 -1
  419. package/dist/utils/gbnfJson/terminals/GbnfNull.js.map +1 -1
  420. package/dist/utils/gbnfJson/terminals/GbnfNumber.d.ts +1 -1
  421. package/dist/utils/gbnfJson/terminals/GbnfNumber.js.map +1 -1
  422. package/dist/utils/gbnfJson/terminals/GbnfNumberValue.js.map +1 -1
  423. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.d.ts +3 -1
  424. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js +9 -4
  425. package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js.map +1 -1
  426. package/dist/utils/gbnfJson/terminals/GbnfOr.js.map +1 -1
  427. package/dist/utils/gbnfJson/terminals/GbnfRepetition.d.ts +9 -0
  428. package/dist/utils/gbnfJson/terminals/GbnfRepetition.js +37 -0
  429. package/dist/utils/gbnfJson/terminals/GbnfRepetition.js.map +1 -0
  430. package/dist/utils/gbnfJson/terminals/GbnfString.d.ts +1 -1
  431. package/dist/utils/gbnfJson/terminals/GbnfString.js +23 -5
  432. package/dist/utils/gbnfJson/terminals/GbnfString.js.map +1 -1
  433. package/dist/utils/gbnfJson/terminals/GbnfStringValue.js.map +1 -1
  434. package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.js.map +1 -1
  435. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.d.ts +7 -4
  436. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js +37 -9
  437. package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js.map +1 -1
  438. package/dist/utils/gbnfJson/terminals/gbnfConsts.d.ts +5 -4
  439. package/dist/utils/gbnfJson/terminals/gbnfConsts.js +14 -3
  440. package/dist/utils/gbnfJson/terminals/gbnfConsts.js.map +1 -1
  441. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.d.ts +10 -0
  442. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js +15 -0
  443. package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js.map +1 -0
  444. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.d.ts +2 -1
  445. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js +6 -5
  446. package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js.map +1 -1
  447. package/dist/utils/getBuildDefaults.d.ts +1 -2
  448. package/dist/utils/getBuildDefaults.js +2 -3
  449. package/dist/utils/getBuildDefaults.js.map +1 -1
  450. package/dist/utils/getConsoleLogPrefix.d.ts +1 -0
  451. package/dist/utils/getConsoleLogPrefix.js +10 -0
  452. package/dist/utils/getConsoleLogPrefix.js.map +1 -0
  453. package/dist/utils/getGrammarsFolder.d.ts +2 -1
  454. package/dist/utils/getGrammarsFolder.js +8 -7
  455. package/dist/utils/getGrammarsFolder.js.map +1 -1
  456. package/dist/utils/getModuleVersion.d.ts +1 -0
  457. package/dist/utils/getModuleVersion.js +13 -0
  458. package/dist/utils/getModuleVersion.js.map +1 -0
  459. package/dist/utils/getQueuedTokensBeforeStopTrigger.d.ts +6 -0
  460. package/dist/utils/getQueuedTokensBeforeStopTrigger.js +22 -0
  461. package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -0
  462. package/dist/utils/getReadableContextSize.d.ts +1 -0
  463. package/dist/utils/getReadableContextSize.js +7 -0
  464. package/dist/utils/getReadableContextSize.js.map +1 -0
  465. package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js +15 -11
  466. package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js.map +1 -1
  467. package/dist/utils/gitReleaseBundles.js +73 -5
  468. package/dist/utils/gitReleaseBundles.js.map +1 -1
  469. package/dist/utils/hashString.d.ts +1 -0
  470. package/dist/utils/hashString.js +8 -0
  471. package/dist/utils/hashString.js.map +1 -0
  472. package/dist/utils/isLockfileActive.d.ts +4 -0
  473. package/dist/utils/isLockfileActive.js +12 -0
  474. package/dist/utils/isLockfileActive.js.map +1 -0
  475. package/dist/utils/isToken.d.ts +2 -0
  476. package/dist/utils/isToken.js +4 -0
  477. package/dist/utils/isToken.js.map +1 -0
  478. package/dist/utils/isUrl.d.ts +1 -0
  479. package/dist/utils/isUrl.js +15 -0
  480. package/dist/utils/isUrl.js.map +1 -0
  481. package/dist/utils/mergeUnionTypes.d.ts +10 -0
  482. package/dist/utils/mergeUnionTypes.js +2 -0
  483. package/dist/utils/mergeUnionTypes.js.map +1 -0
  484. package/dist/utils/parseModelFileName.d.ts +1 -0
  485. package/dist/utils/parseModelFileName.js +6 -1
  486. package/dist/utils/parseModelFileName.js.map +1 -1
  487. package/dist/utils/parseTextTemplate.d.ts +66 -0
  488. package/dist/utils/parseTextTemplate.js +116 -0
  489. package/dist/utils/parseTextTemplate.js.map +1 -0
  490. package/dist/utils/prettyPrintObject.d.ts +10 -0
  491. package/dist/utils/prettyPrintObject.js +84 -0
  492. package/dist/utils/prettyPrintObject.js.map +1 -0
  493. package/dist/utils/removeNullFields.d.ts +2 -1
  494. package/dist/utils/removeNullFields.js +8 -0
  495. package/dist/utils/removeNullFields.js.map +1 -1
  496. package/dist/utils/resolveGithubRelease.d.ts +2 -0
  497. package/dist/utils/resolveGithubRelease.js +36 -0
  498. package/dist/utils/resolveGithubRelease.js.map +1 -0
  499. package/dist/utils/runtime.d.ts +4 -0
  500. package/dist/utils/runtime.js +8 -0
  501. package/dist/utils/runtime.js.map +1 -0
  502. package/dist/utils/spawnCommand.d.ts +11 -1
  503. package/dist/utils/spawnCommand.js +56 -6
  504. package/dist/utils/spawnCommand.js.map +1 -1
  505. package/dist/utils/tokenizeInput.d.ts +3 -0
  506. package/dist/utils/tokenizeInput.js +12 -0
  507. package/dist/utils/tokenizeInput.js.map +1 -0
  508. package/dist/utils/utilTypes.d.ts +3 -0
  509. package/dist/utils/utilTypes.js +2 -0
  510. package/dist/utils/utilTypes.js.map +1 -0
  511. package/dist/utils/waitForLockfileRelease.d.ts +5 -0
  512. package/dist/utils/waitForLockfileRelease.js +20 -0
  513. package/dist/utils/waitForLockfileRelease.js.map +1 -0
  514. package/dist/utils/withLockfile.d.ts +7 -0
  515. package/dist/utils/withLockfile.js +44 -0
  516. package/dist/utils/withLockfile.js.map +1 -0
  517. package/dist/utils/withOra.d.ts +2 -0
  518. package/dist/utils/withOra.js +22 -6
  519. package/dist/utils/withOra.js.map +1 -1
  520. package/dist/utils/withProgressLog.d.ts +23 -0
  521. package/dist/utils/withProgressLog.js +211 -0
  522. package/dist/utils/withProgressLog.js.map +1 -0
  523. package/dist/utils/withStatusLogs.d.ts +2 -1
  524. package/dist/utils/withStatusLogs.js +12 -9
  525. package/dist/utils/withStatusLogs.js.map +1 -1
  526. package/llama/.clang-format +1 -2
  527. package/llama/CMakeLists.txt +115 -4
  528. package/llama/addon.cpp +1318 -99
  529. package/llama/binariesGithubRelease.json +1 -1
  530. package/llama/gitRelease.bundle +0 -0
  531. package/llama/gpuInfo/cuda-gpu-info.cu +120 -0
  532. package/llama/gpuInfo/cuda-gpu-info.h +10 -0
  533. package/llama/gpuInfo/metal-gpu-info.h +8 -0
  534. package/llama/gpuInfo/metal-gpu-info.mm +30 -0
  535. package/llama/gpuInfo/vulkan-gpu-info.cpp +83 -0
  536. package/llama/gpuInfo/vulkan-gpu-info.h +9 -0
  537. package/llama/grammars/README.md +11 -1
  538. package/llama/grammars/json.gbnf +1 -1
  539. package/llama/grammars/json_arr.gbnf +1 -1
  540. package/llama/llama.cpp.info.json +4 -0
  541. package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
  542. package/llamaBins/linux-arm64/_nlcBuildMetadata.json +1 -0
  543. package/llamaBins/linux-arm64/llama-addon.node +0 -0
  544. package/llamaBins/linux-armv7l/_nlcBuildMetadata.json +1 -0
  545. package/llamaBins/linux-armv7l/llama-addon.node +0 -0
  546. package/llamaBins/linux-x64/_nlcBuildMetadata.json +1 -0
  547. package/llamaBins/linux-x64/llama-addon.node +0 -0
  548. package/llamaBins/linux-x64-cuda/_nlcBuildMetadata.json +1 -0
  549. package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
  550. package/llamaBins/linux-x64-vulkan/_nlcBuildMetadata.json +1 -0
  551. package/llamaBins/linux-x64-vulkan/llama-addon.node +0 -0
  552. package/llamaBins/mac-arm64-metal/_nlcBuildMetadata.json +1 -0
  553. package/llamaBins/mac-arm64-metal/default.metallib +0 -0
  554. package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
  555. package/llamaBins/mac-x64/_nlcBuildMetadata.json +1 -0
  556. package/llamaBins/mac-x64/llama-addon.node +0 -0
  557. package/llamaBins/win-arm64/_nlcBuildMetadata.json +1 -0
  558. package/llamaBins/win-arm64/llama-addon.exp +0 -0
  559. package/llamaBins/win-arm64/llama-addon.lib +0 -0
  560. package/llamaBins/win-arm64/llama-addon.node +0 -0
  561. package/llamaBins/win-x64/_nlcBuildMetadata.json +1 -0
  562. package/llamaBins/win-x64/llama-addon.exp +0 -0
  563. package/llamaBins/win-x64/llama-addon.lib +0 -0
  564. package/llamaBins/win-x64/llama-addon.node +0 -0
  565. package/llamaBins/win-x64-cuda/_nlcBuildMetadata.json +1 -0
  566. package/llamaBins/win-x64-cuda/llama-addon.exp +0 -0
  567. package/llamaBins/win-x64-cuda/llama-addon.lib +0 -0
  568. package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
  569. package/llamaBins/win-x64-vulkan/_nlcBuildMetadata.json +1 -0
  570. package/llamaBins/win-x64-vulkan/llama-addon.exp +0 -0
  571. package/llamaBins/win-x64-vulkan/llama-addon.lib +0 -0
  572. package/llamaBins/win-x64-vulkan/llama-addon.node +0 -0
  573. package/package.json +61 -34
  574. package/templates/package.json +10 -0
  575. package/dist/AbortError.d.ts +0 -2
  576. package/dist/AbortError.js +0 -7
  577. package/dist/AbortError.js.map +0 -1
  578. package/dist/chatWrappers/LlamaChatWrapper.js.map +0 -1
  579. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
  580. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -55
  581. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
  582. package/dist/llamaEvaluator/LlamaBins.d.ts +0 -18
  583. package/dist/llamaEvaluator/LlamaBins.js +0 -5
  584. package/dist/llamaEvaluator/LlamaBins.js.map +0 -1
  585. package/dist/llamaEvaluator/LlamaChat/LlamaChat.js.map +0 -1
  586. package/dist/llamaEvaluator/LlamaChat/utils/FunctionCallGrammar.js.map +0 -1
  587. package/dist/llamaEvaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +0 -1
  588. package/dist/llamaEvaluator/LlamaChatSession/LlamaChatSession.js.map +0 -1
  589. package/dist/llamaEvaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +0 -1
  590. package/dist/llamaEvaluator/LlamaContext/LlamaContext.js.map +0 -1
  591. package/dist/llamaEvaluator/LlamaContext/types.d.ts +0 -86
  592. package/dist/llamaEvaluator/LlamaContext/types.js.map +0 -1
  593. package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
  594. package/dist/llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
  595. package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
  596. package/dist/llamaEvaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
  597. package/dist/llamaEvaluator/LlamaGrammar.js.map +0 -1
  598. package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js.map +0 -1
  599. package/dist/llamaEvaluator/LlamaJsonSchemaGrammar.js.map +0 -1
  600. package/dist/llamaEvaluator/LlamaModel.d.ts +0 -119
  601. package/dist/llamaEvaluator/LlamaModel.js +0 -322
  602. package/dist/llamaEvaluator/LlamaModel.js.map +0 -1
  603. package/dist/utils/binariesGithubRelease.js.map +0 -1
  604. package/dist/utils/clearLlamaBuild.d.ts +0 -1
  605. package/dist/utils/clearLlamaBuild.js +0 -12
  606. package/dist/utils/clearLlamaBuild.js.map +0 -1
  607. package/dist/utils/cloneLlamaCppRepo.d.ts +0 -2
  608. package/dist/utils/cloneLlamaCppRepo.js +0 -102
  609. package/dist/utils/cloneLlamaCppRepo.js.map +0 -1
  610. package/dist/utils/compileLLamaCpp.d.ts +0 -8
  611. package/dist/utils/compileLLamaCpp.js +0 -132
  612. package/dist/utils/compileLLamaCpp.js.map +0 -1
  613. package/dist/utils/getBin.js +0 -78
  614. package/dist/utils/getBin.js.map +0 -1
  615. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.d.ts +0 -2
  616. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js +0 -9
  617. package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js.map +0 -1
  618. package/dist/utils/getReleaseInfo.d.ts +0 -7
  619. package/dist/utils/getReleaseInfo.js +0 -30
  620. package/dist/utils/getReleaseInfo.js.map +0 -1
  621. package/dist/utils/parseModelTypeDescription.d.ts +0 -6
  622. package/dist/utils/parseModelTypeDescription.js +0 -9
  623. package/dist/utils/parseModelTypeDescription.js.map +0 -1
  624. package/dist/utils/resolveChatWrapper.d.ts +0 -4
  625. package/dist/utils/resolveChatWrapper.js +0 -16
  626. package/dist/utils/resolveChatWrapper.js.map +0 -1
  627. package/dist/utils/usedBinFlag.d.ts +0 -6
  628. package/dist/utils/usedBinFlag.js +0 -15
  629. package/dist/utils/usedBinFlag.js.map +0 -1
  630. package/llama/usedBin.json +0 -3
  631. package/llamaBins/mac-arm64/llama-addon.node +0 -0
  632. /package/dist/{utils → bindings/utils}/binariesGithubRelease.d.ts +0 -0
  633. /package/dist/{llamaEvaluator → evaluator}/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.d.ts +0 -0
  634. /package/dist/{llamaEvaluator → evaluator}/LlamaContext/types.js +0 -0
  635. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
  636. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
  637. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
  638. /package/dist/{llamaEvaluator/LlamaContext/utils/batchItemsPrioritizingStrategies → evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
  639. /package/dist/{llamaEvaluator → evaluator}/LlamaGrammarEvaluationState.d.ts +0 -0
@@ -0,0 +1,66 @@
1
+ import { isUrl } from "../utils/isUrl.js";
2
+ import { parseGguf } from "./parser/parseGguf.js";
3
+ import { GgufNetworkFetchFileReader } from "./fileReaders/GgufNetworkFetchFileReader.js";
4
+ import { GgufFsFileReader } from "./fileReaders/GgufFsFileReader.js";
5
+ import { ggufDefaultFetchRetryOptions } from "./consts.js";
6
+ import { normalizeGgufDownloadUrl } from "./utils/normalizeGgufDownloadUrl.js";
7
+ import { resolveSplitGgufParts } from "./utils/resolveSplitGgufParts.js";
8
+ /**
9
+ * Read a GGUF file and return its metadata and tensor info (unless `readTensorInfo` is set to `false`).
10
+ * Only the parts of the file required for the metadata and tensor info are read.
11
+ */
12
+ export async function readGgufFileInfo(pathOrUrl, { readTensorInfo = true, sourceType, ignoreKeys = [], logWarnings = true, fetchRetryOptions = ggufDefaultFetchRetryOptions, fetchHeaders = {}, spliceSplitFiles = true, signal } = {}) {
13
+ const useNetworkReader = sourceType === "network" || (sourceType == null && isUrl(pathOrUrl));
14
+ function createFileReader(pathOrUrl) {
15
+ if (useNetworkReader) {
16
+ return new GgufNetworkFetchFileReader({
17
+ url: normalizeGgufDownloadUrl(pathOrUrl),
18
+ retryOptions: fetchRetryOptions,
19
+ headers: fetchHeaders,
20
+ signal
21
+ });
22
+ }
23
+ else if (sourceType === "filesystem" || sourceType == null) {
24
+ return new GgufFsFileReader({
25
+ filePath: pathOrUrl,
26
+ signal
27
+ });
28
+ }
29
+ void (sourceType);
30
+ throw new Error(`Unsupported sourceType: ${sourceType}`);
31
+ }
32
+ async function readSingleFile(pathOrUrl) {
33
+ const fileReader = createFileReader(pathOrUrl);
34
+ return await parseGguf({
35
+ fileReader,
36
+ ignoreKeys,
37
+ readTensorInfo,
38
+ logWarnings
39
+ });
40
+ }
41
+ if (!spliceSplitFiles)
42
+ return await readSingleFile(pathOrUrl);
43
+ const allSplitPartPaths = resolveSplitGgufParts(pathOrUrl);
44
+ if (allSplitPartPaths.length === 1)
45
+ return await readSingleFile(allSplitPartPaths[0]);
46
+ const [first, ...rest] = await Promise.all(allSplitPartPaths.map((partPath) => readSingleFile(partPath)));
47
+ return {
48
+ version: first.version,
49
+ tensorCount: first.tensorCount,
50
+ metadata: first.metadata,
51
+ architectureMetadata: first.architectureMetadata,
52
+ tensorInfo: first.tensorInfo,
53
+ metadataSize: first.metadataSize,
54
+ splicedParts: allSplitPartPaths.length,
55
+ totalTensorInfoSize: first.totalTensorInfoSize == null
56
+ ? undefined
57
+ : (first.totalTensorInfoSize + rest.reduce((acc, part) => (acc + (part.totalTensorInfoSize ?? 0)), 0)),
58
+ totalTensorCount: Number(first.totalTensorCount) + rest.reduce((acc, part) => acc + Number(part.totalTensorCount), 0),
59
+ totalMetadataSize: first.totalMetadataSize + rest.reduce((acc, part) => acc + part.totalMetadataSize, 0),
60
+ fullTensorInfo: first.fullTensorInfo == null
61
+ ? undefined
62
+ : [first, ...rest].flatMap(part => (part.fullTensorInfo ?? [])),
63
+ tensorInfoSize: first.tensorInfoSize
64
+ };
65
+ }
66
+ //# sourceMappingURL=readGgufFileInfo.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"readGgufFileInfo.js","sourceRoot":"","sources":["../../src/gguf/readGgufFileInfo.ts"],"names":[],"mappings":"AACA,OAAO,EAAC,KAAK,EAAC,MAAM,mBAAmB,CAAC;AACxC,OAAO,EAAC,SAAS,EAAC,MAAM,uBAAuB,CAAC;AAChD,OAAO,EAAC,0BAA0B,EAAC,MAAM,6CAA6C,CAAC;AACvF,OAAO,EAAC,gBAAgB,EAAC,MAAM,mCAAmC,CAAC;AACnE,OAAO,EAAC,4BAA4B,EAAC,MAAM,aAAa,CAAC;AACzD,OAAO,EAAC,wBAAwB,EAAC,MAAM,qCAAqC,CAAC;AAC7E,OAAO,EAAC,qBAAqB,EAAC,MAAM,kCAAkC,CAAC;AAIvE;;;GAGG;AACH,MAAM,CAAC,KAAK,UAAU,gBAAgB,CAAC,SAAiB,EAAE,EACtD,cAAc,GAAG,IAAI,EACrB,UAAU,EACV,UAAU,GAAG,EAAE,EACf,WAAW,GAAG,IAAI,EAClB,iBAAiB,GAAG,4BAA4B,EAChD,YAAY,GAAG,EAAE,EACjB,gBAAgB,GAAG,IAAI,EACvB,MAAM,KAiCN,EAAE;IACF,MAAM,gBAAgB,GAAG,UAAU,KAAK,SAAS,IAAI,CAAC,UAAU,IAAI,IAAI,IAAI,KAAK,CAAC,SAAS,CAAC,CAAC,CAAC;IAE9F,SAAS,gBAAgB,CAAC,SAAiB;QACvC,IAAI,gBAAgB,EAAE;YAClB,OAAO,IAAI,0BAA0B,CAAC;gBAClC,GAAG,EAAE,wBAAwB,CAAC,SAAS,CAAC;gBACxC,YAAY,EAAE,iBAAiB;gBAC/B,OAAO,EAAE,YAAY;gBACrB,MAAM;aACT,CAAC,CAAC;SACN;aAAM,IAAI,UAAU,KAAK,YAAY,IAAI,UAAU,IAAI,IAAI,EAAE;YAC1D,OAAO,IAAI,gBAAgB,CAAC;gBACxB,QAAQ,EAAE,SAAS;gBACnB,MAAM;aACT,CAAC,CAAC;SACN;QAED,KAAK,CAAC,UAA0B,CAAC,CAAC;QAClC,MAAM,IAAI,KAAK,CAAC,2BAA2B,UAAU,EAAE,CAAC,CAAC;IAC7D,CAAC;IAED,KAAK,UAAU,cAAc,CAAC,SAAiB;QAC3C,MAAM,UAAU,GAAG,gBAAgB,CAAC,SAAS,CAAC,CAAC;QAC/C,OAAO,MAAM,SAAS,CAAC;YACnB,UAAU;YACV,UAAU;YACV,cAAc;YACd,WAAW;SACd,CAAC,CAAC;IACP,CAAC;IAED,IAAI,CAAC,gBAAgB;QACjB,OAAO,MAAM,cAAc,CAAC,SAAS,CAAC,CAAC;IAE3C,MAAM,iBAAiB,GAAG,qBAAqB,CAAC,SAAS,CAAC,CAAC;IAE3D,IAAI,iBAAiB,CAAC,MAAM,KAAK,CAAC;QAC9B,OAAO,MAAM,cAAc,CAAC,iBAAiB,CAAC,CAAC,CAAC,CAAC,CAAC;IAEtD,MAAM,CAAC,KAAK,EAAE,GAAG,IAAI,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CACtC,iBAAiB,CAAC,GAAG,CAAC,CAAC,QAAQ,EAAE,EAAE,CAAC,cAAc,CAAC,QAAQ,CAAC,CAAC,CAChE,CAAC;IAEF,OAAO;QACH,OAAO,EAAE,KAAK,CAAC,OAAO;QACtB,WAAW,EAAE,KAAK,CAAC,WAAW;QAC9B,QAAQ,EAAE,KAAK,CAAC,QAAQ;QACxB,oBAAoB,EAAE,KAAK,CAAC,oBAAoB;QAChD,UAAU,EAAE,KAAK,CAAC,UAAU;QAC5B,YAAY,EAAE,KAAK,CAAC,YAAY;QAChC,YAAY,EAAE,iBAAiB,CAAC,MAAM;QACtC,mBAAmB,EAAE,KAAK,CAAC,mBAAmB,IAAI,IAAI;YAC
lD,CAAC,CAAC,SAAS;YACX,CAAC,CAAC,CAAC,KAAK,CAAC,mBAAmB,GAAG,IAAI,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,IAAI,EAAE,EAAE,CAAC,CAAC,GAAG,GAAG,CAAC,IAAI,CAAC,mBAAmB,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;QAC1G,gBAAgB,EAAE,MAAM,CAAC,KAAK,CAAC,gBAAgB,CAAC,GAAG,IAAI,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,IAAI,EAAE,EAAE,CAAC,GAAG,GAAG,MAAM,CAAC,IAAI,CAAC,gBAAgB,CAAC,EAAE,CAAC,CAAC;QACrH,iBAAiB,EAAE,KAAK,CAAC,iBAAiB,GAAG,IAAI,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,IAAI,EAAE,EAAE,CAAC,GAAG,GAAG,IAAI,CAAC,iBAAiB,EAAE,CAAC,CAAC;QACxG,cAAc,EAAE,KAAK,CAAC,cAAc,IAAI,IAAI;YACxC,CAAC,CAAC,SAAS;YACX,CAAC,CAAC,CAAC,KAAK,EAAE,GAAG,IAAI,CAAC,CAAC,OAAO,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,cAAc,IAAI,EAAE,CAAC,CAAC;QACnE,cAAc,EAAE,KAAK,CAAC,cAAc;KAChB,CAAC;AAC7B,CAAC"}
@@ -0,0 +1,84 @@
1
+ import type { GgufReadOffset } from "../utils/GgufReadOffset.js";
2
+ import type { GgufFileReader } from "../fileReaders/GgufFileReader.js";
3
+ import type { MergeOptionalUnionTypes } from "../../utils/mergeUnionTypes.js";
4
+ import type { GgufArchitectureType, GgufMetadata } from "./GgufMetadataTypes.js";
5
+ import type { GgufTensorInfo } from "./GgufTensorInfoTypes.js";
6
+ export type MetadataValue = string | number | bigint | boolean | MetadataValue[];
7
+ export type MetadataKeyValueRecord = Record<string, MetadataValue>;
8
+ export type MetadataNestedObject = {
9
+ [key: string]: MetadataValue | MetadataNestedObject;
10
+ };
11
+ export type GgufFileInfo = {
12
+ readonly version: 2 | 3 | number;
13
+ readonly tensorCount: number | bigint;
14
+ readonly metadata: GgufMetadata;
15
+ readonly metadataSize: number;
16
+ /** Same value as `metadata[metadata.general.architecture]`, but with merged types for convenience */
17
+ readonly architectureMetadata: MergeOptionalUnionTypes<Exclude<GgufMetadata[GgufArchitectureType], undefined>>;
18
+ /** can be `undefined` if `readTensorInfo` is set to `false` */
19
+ readonly tensorInfo?: GgufTensorInfo[];
20
+ /** can be `undefined` if `readTensorInfo` is set to `false` */
21
+ readonly tensorInfoSize?: number;
22
+ /**
23
+ * For spliced metadata of multiple file parts,
24
+ * this will be the number of file parts read and spliced into this metadata.
25
+ *
26
+ * When no splicing is done, this will be `1`.
27
+ */
28
+ readonly splicedParts: number;
29
+ /**
30
+ * For spliced metadata of multiple file parts, this will be the total tensor count from all the parts
31
+ *
32
+ * When no splicing is done, this will be the same as `tensorCount`.
33
+ */
34
+ readonly totalTensorCount: number | bigint;
35
+ /**
36
+ * For spliced metadata of multiple file parts, this will be the total metadata size from all the parts
37
+ *
38
+ * When no splicing is done, this will be the same as `metadataSize`.
39
+ */
40
+ readonly totalMetadataSize: number;
41
+ /**
42
+ * For spliced metadata of multiple file parts, this will be the spliced tensorInfo from all the parts.
43
+ * Can be `undefined` if `readTensorInfo` is set to `false`
44
+ *
45
+ * When no splicing is done, this will be the same as `tensorInfo`.
46
+ */
47
+ readonly fullTensorInfo?: GgufTensorInfo[];
48
+ /**
49
+ * For spliced metadata of multiple file parts, this will be the total tensor info size from all the parts
50
+ *
51
+ * When no splicing is done, this will be the same as `tensorInfoSize`.
52
+ */
53
+ readonly totalTensorInfoSize?: number;
54
+ };
55
+ export declare const enum GgufValueType {
56
+ Uint8 = 0,
57
+ Int8 = 1,
58
+ Uint16 = 2,
59
+ Int16 = 3,
60
+ Uint32 = 4,
61
+ Int32 = 5,
62
+ Float32 = 6,
63
+ Bool = 7,
64
+ String = 8,
65
+ Array = 9,
66
+ Uint64 = 10,
67
+ Int64 = 11,
68
+ Float64 = 12
69
+ }
70
+ export type GgufVersionParserOptions = {
71
+ fileReader: GgufFileReader;
72
+ readTensorInfo?: boolean;
73
+ ignoreKeys?: string[];
74
+ version: number;
75
+ readOffset: GgufReadOffset;
76
+ logWarnings: boolean;
77
+ };
78
+ export type GgufVersionParserResult = {
79
+ tensorCount: number | bigint;
80
+ metadata: GgufMetadata;
81
+ tensorInfo?: GgufTensorInfo[];
82
+ metadataSize: number;
83
+ tensorInfoSize?: number;
84
+ };
@@ -0,0 +1,18 @@
1
+ // source: `enum gguf_type` in `ggml.h` in the `llama.cpp` source code
2
+ export var GgufValueType;
3
+ (function (GgufValueType) {
4
+ GgufValueType[GgufValueType["Uint8"] = 0] = "Uint8";
5
+ GgufValueType[GgufValueType["Int8"] = 1] = "Int8";
6
+ GgufValueType[GgufValueType["Uint16"] = 2] = "Uint16";
7
+ GgufValueType[GgufValueType["Int16"] = 3] = "Int16";
8
+ GgufValueType[GgufValueType["Uint32"] = 4] = "Uint32";
9
+ GgufValueType[GgufValueType["Int32"] = 5] = "Int32";
10
+ GgufValueType[GgufValueType["Float32"] = 6] = "Float32";
11
+ GgufValueType[GgufValueType["Bool"] = 7] = "Bool";
12
+ GgufValueType[GgufValueType["String"] = 8] = "String";
13
+ GgufValueType[GgufValueType["Array"] = 9] = "Array";
14
+ GgufValueType[GgufValueType["Uint64"] = 10] = "Uint64";
15
+ GgufValueType[GgufValueType["Int64"] = 11] = "Int64";
16
+ GgufValueType[GgufValueType["Float64"] = 12] = "Float64";
17
+ })(GgufValueType || (GgufValueType = {}));
18
+ //# sourceMappingURL=GgufFileInfoTypes.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"GgufFileInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufFileInfoTypes.ts"],"names":[],"mappings":"AAkEA,sEAAsE;AACtE,MAAM,CAAN,IAAkB,aAcjB;AAdD,WAAkB,aAAa;IAC3B,mDAAS,CAAA;IACT,iDAAQ,CAAA;IACR,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,uDAAW,CAAA;IACX,iDAAQ,CAAA;IACR,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,sDAAW,CAAA;IACX,oDAAU,CAAA;IACV,wDAAY,CAAA;AAChB,CAAC,EAdiB,aAAa,KAAb,aAAa,QAc9B"}
@@ -0,0 +1,334 @@
1
+ export declare const enum GgufArchitectureType {
2
+ llama = "llama",
3
+ falcon = "falcon",
4
+ gpt2 = "gpt2",
5
+ gptj = "gptj",
6
+ gptneox = "gptneox",
7
+ mpt = "mpt",
8
+ baichuan = "baichuan",
9
+ starcoder = "starcoder",
10
+ persimmon = "persimmon",
11
+ refact = "refact",
12
+ bert = "bert",
13
+ nomicBert = "nomic-bert",
14
+ bloom = "bloom",
15
+ stablelm = "stablelm",
16
+ qwen = "qwen",
17
+ qwen2 = "qwen2",
18
+ phi2 = "phi2",
19
+ plamo = "plamo",
20
+ codeshell = "codeshell",
21
+ orion = "orion",
22
+ internlm2 = "internlm2",
23
+ minicpm = "minicpm",
24
+ gemma = "gemma",
25
+ starcoder2 = "starcoder2",
26
+ mamba = "mamba",
27
+ commandR = "command-r",
28
+ rwkv = "rwkv"
29
+ }
30
+ export type GgufMetadata<A extends GgufArchitectureType = GgufArchitectureType> = {
31
+ readonly general: GgufMetadataGeneral<A>;
32
+ readonly tokenizer: GgufMetadataTokenizer;
33
+ } & (GgufArchitectureType extends A ? {
34
+ readonly [key in GgufArchitectureType]?: key extends keyof GgufMetadataLlmToType ? GgufMetadataLlmToType[key] : GgufMetadataDefaultArchitectureType;
35
+ } : {
36
+ readonly [key in A]: key extends keyof GgufMetadataLlmToType ? GgufMetadataLlmToType[key] : GgufMetadataDefaultArchitectureType;
37
+ });
38
+ export type GgufMetadataLlmToType = {
39
+ [GgufArchitectureType.llama]: GgufMetadataLlmLLaMA;
40
+ [GgufArchitectureType.mpt]: GgufMetadataMPT;
41
+ [GgufArchitectureType.gptneox]: GgufMetadataGPTNeoX;
42
+ [GgufArchitectureType.gptj]: GgufMetadataGPTJ;
43
+ [GgufArchitectureType.gpt2]: GgufMetadataGPT2;
44
+ [GgufArchitectureType.bloom]: GgufMetadataBloom;
45
+ [GgufArchitectureType.falcon]: GgufMetadataFalcon;
46
+ [GgufArchitectureType.mamba]: GgufMetadataMamba;
47
+ [GgufArchitectureType.rwkv]: GgufMetadataRWKV;
48
+ };
49
+ export declare enum GgufFileType {
50
+ ALL_F32 = 0,
51
+ MOSTLY_F16 = 1,
52
+ MOSTLY_Q4_0 = 2,
53
+ MOSTLY_Q4_1 = 3,
54
+ MOSTLY_Q4_1_SOME_F16 = 4,
55
+ MOSTLY_Q4_2 = 5,
56
+ MOSTLY_Q4_3 = 6,
57
+ MOSTLY_Q8_0 = 7,
58
+ MOSTLY_Q5_0 = 8,
59
+ MOSTLY_Q5_1 = 9,
60
+ MOSTLY_Q2_K = 10,
61
+ MOSTLY_Q3_K_S = 11,
62
+ MOSTLY_Q3_K_M = 12,
63
+ MOSTLY_Q3_K_L = 13,
64
+ MOSTLY_Q4_K_S = 14,
65
+ MOSTLY_Q4_K_M = 15,
66
+ MOSTLY_Q5_K_S = 16,
67
+ MOSTLY_Q5_K_M = 17,
68
+ MOSTLY_Q6_K = 18,
69
+ MOSTLY_IQ2_XXS = 19,
70
+ MOSTLY_IQ2_XS = 20,
71
+ MOSTLY_Q2_K_S = 21,
72
+ MOSTLY_IQ3_XS = 22,
73
+ MOSTLY_IQ3_XXS = 23,
74
+ MOSTLY_IQ1_S = 24,
75
+ MOSTLY_IQ4_NL = 25,
76
+ MOSTLY_IQ3_S = 26,
77
+ MOSTLY_IQ3_M = 27,
78
+ MOSTLY_IQ2_S = 28,
79
+ MOSTLY_IQ2_M = 29,
80
+ MOSTLY_IQ4_XS = 30
81
+ }
82
+ export type GgufMetadataGeneral<A extends GgufArchitectureType = GgufArchitectureType> = {
83
+ readonly architecture: A;
84
+ /**
85
+ * The version of the quantization format. Not required if the model is not
86
+ * quantized (i.e. no tensors are quantized). If any tensors are quantized,
87
+ * this must be present. This is separate to the quantization scheme of the
88
+ * tensors themselves; the quantization version may change without changing the
89
+ * scheme's name (e.g. the quantization scheme is Q5_K, and the quantization
90
+ * version is 4).
91
+ */
92
+ readonly quantization_version: string;
93
+ /**
94
+ * the global alignment to use, as described above. This can vary to allow
95
+ * for different alignment schemes, but it must be a multiple of 8. Some
96
+ * writers may not write the alignment. If the alignment is not specified,
97
+ * assume it is `32`.
98
+ */
99
+ readonly alignment?: string;
100
+ /**
101
+ * The name of the model. This should be a human-readable name that can be
102
+ * used to identify the model. It should be unique within the community
103
+ * that the model is defined in.
104
+ */
105
+ readonly name?: string;
106
+ readonly author?: string;
107
+ /**
108
+ * URL to the model's homepage. This can be a GitHub repo, a paper, etc.
109
+ */
110
+ readonly url?: string;
111
+ /**
112
+ * free-form description of the model including anything that isn't
113
+ * covered by the other fields
114
+ */
115
+ readonly description?: string;
116
+ /**
117
+ * License of the model, expressed as a SPDX license expression
118
+ * (e.g. `MIT OR Apache-2.0`). *Should not* include any other information,
119
+ * such as the license text or the URL to the license.
120
+ */
121
+ readonly license?: string;
122
+ /**
123
+ * Information about where this model came from. This is useful for tracking
124
+ * the provenance of the model, and for finding the original source if the
125
+ * model is modified. For a model that was converted from GGML, for
126
+ * example, these keys would point to the model that was converted from.
127
+ */
128
+ readonly source?: {
129
+ /**
130
+ * URL to the source of the model. Can be a GitHub repo, a paper, etc.
131
+ */
132
+ readonly url?: string;
133
+ readonly huggingface?: {
134
+ readonly repository?: string;
135
+ };
136
+ };
137
+ /**
138
+ * An enumerated value describing the type of the majority of the tensors
139
+ * in the file. Optional; can be inferred from the tensor types.
140
+ */
141
+ readonly file_type?: GgufFileType | undefined;
142
+ };
143
+ export declare const enum GgufMetadataTokenizerTokenType {
144
+ undefined = 0,
145
+ normal = 1,
146
+ unknown = 2,
147
+ control = 3,
148
+ userDefined = 4,
149
+ unused = 5,
150
+ byte = 6
151
+ }
152
+ export type GgufMetadataTokenizer = {
153
+ readonly ggml: {
154
+ readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | "replit" | "rwkv" | string;
155
+ readonly tokens: readonly string[];
156
+ readonly token_type: GgufMetadataTokenizerTokenType[];
157
+ readonly token_type_count?: number;
158
+ readonly scores?: readonly number[];
159
+ readonly merges?: readonly string[];
160
+ readonly bos_token_id?: number;
161
+ readonly eos_token_id?: number;
162
+ readonly unknown_token_id?: number;
163
+ readonly separator_token_id?: number;
164
+ readonly padding_token_id?: number;
165
+ readonly add_bos_token?: boolean;
166
+ readonly add_eos_token?: boolean;
167
+ readonly add_space_prefix?: boolean;
168
+ readonly added_tokens?: readonly string[];
169
+ readonly prefix_token_id?: number;
170
+ readonly suffix_token_id?: number;
171
+ readonly middle_token_id?: number;
172
+ readonly eot_token_id?: number;
173
+ };
174
+ readonly huggingface?: {
175
+ readonly json?: string;
176
+ };
177
+ readonly chat_template?: string;
178
+ };
179
+ export declare const enum GgufMetadataArchitecturePoolingType {
180
+ unspecified = -1,
181
+ none = 0,
182
+ mean = 1,
183
+ max = 2
184
+ }
185
+ export type GgufMetadataDefaultArchitectureType = {
186
+ readonly vocab_size?: number;
187
+ readonly context_length?: number;
188
+ readonly embedding_length?: number;
189
+ readonly block_count?: number;
190
+ readonly feed_forward_length?: number;
191
+ readonly use_parallel_residual?: boolean;
192
+ readonly tensor_data_layout?: string;
193
+ readonly expert_count?: number;
194
+ readonly expert_used_count?: number;
195
+ readonly pooling_type?: GgufMetadataArchitecturePoolingType;
196
+ readonly logit_scale?: number;
197
+ readonly attention?: {
198
+ readonly head_count?: number;
199
+ readonly head_count_kv?: number;
200
+ readonly max_alibi_bias?: number;
201
+ readonly clamp_kqv?: number;
202
+ readonly layer_norm_epsilon?: number;
203
+ readonly layer_norm_rms_epsilon?: number;
204
+ readonly key_length?: number;
205
+ readonly value_length?: number;
206
+ readonly causal?: boolean;
207
+ };
208
+ readonly rope?: {
209
+ readonly dimension_count?: number;
210
+ readonly freq_base?: number;
211
+ readonly scale_linear?: number;
212
+ readonly scaling?: {
213
+ readonly type?: "none" | "linear" | "yarn" | string;
214
+ readonly factor?: number;
215
+ readonly original_context_length?: number;
216
+ readonly finetuned?: boolean;
217
+ };
218
+ };
219
+ readonly ssm?: {
220
+ readonly conv_kernel?: number;
221
+ readonly inner_size?: number;
222
+ readonly state_size?: number;
223
+ readonly time_step_rank?: number;
224
+ };
225
+ };
226
+ export type GgufMetadataLlmLLaMA = {
227
+ readonly context_length: number;
228
+ readonly embedding_length: number;
229
+ readonly block_count: number;
230
+ readonly feed_forward_length: number;
231
+ readonly attention: {
232
+ readonly head_count: number;
233
+ readonly layer_norm_rms_epsilon: number;
234
+ readonly head_count_kv?: number;
235
+ };
236
+ readonly rope: {
237
+ readonly dimension_count: number;
238
+ readonly scale?: number;
239
+ };
240
+ readonly expert_count?: number;
241
+ readonly expert_used_count?: number;
242
+ readonly tensor_data_layout?: string;
243
+ };
244
+ export type GgufMetadataMPT = {
245
+ readonly context_length: number;
246
+ readonly embedding_length: number;
247
+ readonly block_count: number;
248
+ readonly attention: {
249
+ readonly head_count: number;
250
+ readonly alibi_bias_max: number;
251
+ readonly clip_kqv: number;
252
+ readonly layer_norm_epsilon: number;
253
+ };
254
+ };
255
+ export type GgufMetadataGPTNeoX = {
256
+ readonly context_length: number;
257
+ readonly embedding_length: number;
258
+ readonly block_count: number;
259
+ readonly use_parallel_residual: boolean;
260
+ readonly rope: {
261
+ readonly dimension_count: number;
262
+ readonly scale?: number;
263
+ };
264
+ readonly attention: {
265
+ readonly head_count: number;
266
+ readonly layer_norm_epsilon: number;
267
+ };
268
+ };
269
+ export type GgufMetadataGPTJ = {
270
+ readonly context_length: number;
271
+ readonly embedding_length: number;
272
+ readonly block_count: number;
273
+ readonly rope: {
274
+ readonly dimension_count: number;
275
+ readonly scale?: number;
276
+ };
277
+ readonly attention: {
278
+ readonly head_count: number;
279
+ readonly layer_norm_epsilon: number;
280
+ };
281
+ };
282
+ export type GgufMetadataGPT2 = {
283
+ readonly context_length: number;
284
+ readonly embedding_length: number;
285
+ readonly block_count: number;
286
+ readonly attention: {
287
+ readonly head_count: number;
288
+ readonly layer_norm_epsilon: number;
289
+ };
290
+ };
291
+ export type GgufMetadataBloom = {
292
+ readonly context_length: number;
293
+ readonly embedding_length: number;
294
+ readonly block_count: number;
295
+ readonly feed_forward_length: number;
296
+ readonly attention: {
297
+ readonly head_count: number;
298
+ readonly layer_norm_epsilon: number;
299
+ };
300
+ };
301
+ export type GgufMetadataFalcon = {
302
+ readonly context_length: number;
303
+ readonly embedding_length: number;
304
+ readonly block_count: number;
305
+ readonly attention: {
306
+ readonly head_count: number;
307
+ readonly head_count_kv: number;
308
+ readonly use_norm: boolean;
309
+ readonly layer_norm_epsilon: number;
310
+ };
311
+ readonly tensor_data_layout?: string;
312
+ };
313
+ export type GgufMetadataMamba = {
314
+ readonly context_length: number;
315
+ readonly embedding_length: number;
316
+ readonly block_count: number;
317
+ readonly ssm: {
318
+ readonly conv_kernel: number;
319
+ readonly inner_size: number;
320
+ readonly state_size: number;
321
+ readonly time_step_rank: number;
322
+ };
323
+ readonly attention: {
324
+ readonly layer_norm_rms_epsilon: number;
325
+ };
326
+ };
327
+ export type GgufMetadataRWKV = {
328
+ readonly architecture_version: 4 | number;
329
+ readonly context_length: number;
330
+ readonly block_count: number;
331
+ readonly embedding_length: number;
332
+ readonly feed_forward_length: number;
333
+ };
334
+ export declare function isGgufMetadataOfArchitectureType<A extends GgufArchitectureType>(metadata: GgufMetadata, type: A): metadata is GgufMetadata<A>;
@@ -0,0 +1,86 @@
1
/**
 * String-valued enum of GGUF architecture identifiers.
 *
 * Every member maps a key to its identifier string. Key and value are the same
 * text except for `nomicBert` ("nomic-bert") and `commandR` ("command-r").
 */
export var GgufArchitectureType = GgufArchitectureType || {};
Object.assign(GgufArchitectureType, {
    llama: "llama",
    falcon: "falcon",
    gpt2: "gpt2",
    gptj: "gptj",
    gptneox: "gptneox",
    mpt: "mpt",
    baichuan: "baichuan",
    starcoder: "starcoder",
    persimmon: "persimmon",
    refact: "refact",
    bert: "bert",
    nomicBert: "nomic-bert",
    bloom: "bloom",
    stablelm: "stablelm",
    qwen: "qwen",
    qwen2: "qwen2",
    phi2: "phi2",
    plamo: "plamo",
    codeshell: "codeshell",
    orion: "orion",
    internlm2: "internlm2",
    minicpm: "minicpm",
    gemma: "gemma",
    starcoder2: "starcoder2",
    mamba: "mamba",
    commandR: "command-r",
    rwkv: "rwkv",
});
31
// source: `enum llama_ftype` in `llama.h` in the `llama.cpp` source code
/**
 * Numeric enum of GGUF file types with two-way lookup:
 * `GgufFileType[name]` yields the number and `GgufFileType[number]` yields the name.
 * Each name's position in the list below is its numeric value (0 through 30).
 */
export var GgufFileType = GgufFileType || {};
[
    "ALL_F32",
    "MOSTLY_F16",
    "MOSTLY_Q4_0",
    "MOSTLY_Q4_1",
    "MOSTLY_Q4_1_SOME_F16",
    "MOSTLY_Q4_2",
    "MOSTLY_Q4_3",
    "MOSTLY_Q8_0",
    "MOSTLY_Q5_0",
    "MOSTLY_Q5_1",
    "MOSTLY_Q2_K",
    "MOSTLY_Q3_K_S",
    "MOSTLY_Q3_K_M",
    "MOSTLY_Q3_K_L",
    "MOSTLY_Q4_K_S",
    "MOSTLY_Q4_K_M",
    "MOSTLY_Q5_K_S",
    "MOSTLY_Q5_K_M",
    "MOSTLY_Q6_K",
    "MOSTLY_IQ2_XXS",
    "MOSTLY_IQ2_XS",
    "MOSTLY_Q2_K_S",
    "MOSTLY_IQ3_XS",
    "MOSTLY_IQ3_XXS",
    "MOSTLY_IQ1_S",
    "MOSTLY_IQ4_NL",
    "MOSTLY_IQ3_S",
    "MOSTLY_IQ3_M",
    "MOSTLY_IQ2_S",
    "MOSTLY_IQ2_M",
    "MOSTLY_IQ4_XS",
].forEach((memberName, memberValue) => {
    GgufFileType[memberName] = memberValue; // name -> number
    GgufFileType[memberValue] = memberName; // number -> name (reverse lookup)
});
66
/**
 * Numeric enum of tokenizer token types with two-way lookup
 * (name -> number and number -> name). Values run from 0 (`undefined`)
 * to 6 (`byte`), in the order listed below.
 */
export var GgufMetadataTokenizerTokenType = GgufMetadataTokenizerTokenType || {};
{
    const orderedNames = ["undefined", "normal", "unknown", "control", "userDefined", "unused", "byte"];
    for (const [ordinal, label] of orderedNames.entries()) {
        GgufMetadataTokenizerTokenType[label] = ordinal;
        GgufMetadataTokenizerTokenType[ordinal] = label;
    }
}
76
/**
 * Numeric enum of pooling types with two-way lookup (name -> number and
 * number -> name). `unspecified` is the only negative member (-1).
 *
 * NOTE(review): upstream llama.cpp appears to name value 2 `CLS`; confirm
 * that `max` is the intended name here.
 */
export var GgufMetadataArchitecturePoolingType = GgufMetadataArchitecturePoolingType || {};
for (const [label, code] of [
    ["unspecified", -1],
    ["none", 0],
    ["mean", 1],
    ["max", 2],
]) {
    GgufMetadataArchitecturePoolingType[label] = code;
    GgufMetadataArchitecturePoolingType[code] = label;
}
83
/**
 * Type guard that checks whether GGUF metadata declares the given architecture.
 *
 * @param {object | null | undefined} metadata - Metadata object; only `metadata.general.architecture` is read.
 * @param {string} type - Architecture identifier to compare against.
 * @returns {boolean} `true` only when the metadata carries an architecture value
 *   that is strictly equal to `type`; `false` when the architecture is missing.
 */
export function isGgufMetadataOfArchitectureType(metadata, type) {
    const architecture = metadata?.general?.architecture;
    // A missing architecture must never count as a match. Without this guard,
    // `undefined === undefined` reports a match when both the metadata field
    // and `type` are absent.
    if (architecture == null)
        return false;
    return architecture === type;
}
86
+ //# sourceMappingURL=GgufMetadataTypes.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,oBA4BjB;AA5BD,WAAkB,oBAAoB;IAClC,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,mCAAW,CAAA;IACX,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,+CAAuB,CAAA;IACvB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,gDAAwB,CAAA;IACxB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,qCAAa,CAAA;AACjB,CAAC,EA5BiB,oBAAoB,KAApB,oBAAoB,QA4BrC;AA+BD,yEAAyE;AACzE,MAAM,CAAN,IAAY,YAgCX;AAhCD,WAAY,YAAY;IACpB,qDAAW,CAAA;IACX,2DAAc,CAAA;IACd,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,+EAAwB,CAAA;IACxB,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,8DAAgB,CAAA;IAChB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,8DAAgB,CAAA;IAChB,oEAAmB,CAAA;IACnB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,oEAAmB,CAAA;IACnB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;AACtB,CAAC,EAhCW,YAAY,KAAZ,YAAY,QAgCvB;AAyED,MAAM,CAAN,IAAkB,8BAQjB;AARD,WAAkB,8BAA8B;IAC5C,6FAAa,CAAA;IACb,uFAAU,CAAA;IACV,yFAAW,CAAA;IACX,yFAAW,CAAA;IACX,iGAAe,CAAA;IACf,uFAAU,CAAA;IACV,mFAAQ,CAAA;AACZ,CAAC,EARiB,8BAA8B,KAA9B,8BAA8B,QAQ/C;AA8BD,MAAM,CAAN,IAAkB,mCAKjB;AALD,WAAkB,mCAAmC;IACjD,4GAAgB,CAAA;IAChB,6FAAQ,CAAA;IACR,6FAAQ,CAAA;IACR,2FAAO,CAAA;AACX,CAAC,EALiB,mCAAmC,KAAnC,mCAAmC,QAKpD;AAuND,MAAM,UAAU,gCAAgC,CAC5C,QAAsB,EAAE,IAAO;IAE/B,OAAO,QAAQ,EAAE,OAAO,EAAE,YAAY,KAAK,IAAI,CAAC;AACpD,CAAC"}
@@ -0,0 +1,37 @@
1
+ export type GgufTensorInfo = { // Read-only descriptor of a single tensor entry: its name, dimensions, ggml type and offset.
2
+ readonly name: string;
3
+ readonly dimensions: readonly (number | bigint)[]; // Read-only array; each entry may be a number or a bigint - presumably bigint covers values beyond the safe-integer range, TODO confirm.
4
+ readonly ggmlType: GgmlType;
5
+ readonly offset: number | bigint; // May be a number or a bigint, like the entries of `dimensions`.
6
+ };
7
+ export declare const enum GgmlType { // Const enum of numeric tensor type ids, 0 through 28; presumably mirrors `enum ggml_type` in ggml's `ggml.h` - TODO confirm.
8
+ F32 = 0,
9
+ F16 = 1,
10
+ Q4_0 = 2,
11
+ Q4_1 = 3,
12
+ Q4_2 = 4,
13
+ Q4_3 = 5,
14
+ Q5_0 = 6,
15
+ Q5_1 = 7,
16
+ Q8_0 = 8,
17
+ Q8_1 = 9,
18
+ Q2_K = 10,
19
+ Q3_K = 11,
20
+ Q4_K = 12,
21
+ Q5_K = 13,
22
+ Q6_K = 14,
23
+ Q8_K = 15,
24
+ IQ2_XXS = 16,
25
+ IQ2_XS = 17,
26
+ IQ3_XXS = 18,
27
+ IQ1_S = 19,
28
+ IQ4_NL = 20,
29
+ IQ3_S = 21,
30
+ IQ2_S = 22,
31
+ IQ4_XS = 23,
32
+ I8 = 24,
33
+ I16 = 25,
34
+ I32 = 26,
35
+ I64 = 27,
36
+ F64 = 28
37
+ }
@@ -0,0 +1,33 @@
1
/**
 * Numeric enum of ggml tensor type ids with two-way lookup:
 * `GgmlType[name]` yields the number and `GgmlType[number]` yields the name.
 * Each name's position in the list below is its numeric value (0 through 28).
 */
export var GgmlType = GgmlType || {};
{
    const typeNamesById = [
        "F32", "F16",
        "Q4_0", "Q4_1", "Q4_2", "Q4_3",
        "Q5_0", "Q5_1",
        "Q8_0", "Q8_1",
        "Q2_K", "Q3_K", "Q4_K", "Q5_K", "Q6_K", "Q8_K",
        "IQ2_XXS", "IQ2_XS", "IQ3_XXS", "IQ1_S", "IQ4_NL", "IQ3_S", "IQ2_S", "IQ4_XS",
        "I8", "I16", "I32", "I64",
        "F64",
    ];
    for (let typeId = 0; typeId < typeNamesById.length; typeId++) {
        const typeName = typeNamesById[typeId];
        GgmlType[typeName] = typeId;
        GgmlType[typeId] = typeName;
    }
}
33
+ //# sourceMappingURL=GgufTensorInfoTypes.js.map