node-llama-cpp 3.0.0-beta.14 → 3.0.0-beta.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (383) hide show
  1. package/README.md +1 -1
  2. package/dist/ChatWrapper.js +4 -0
  3. package/dist/ChatWrapper.js.map +1 -1
  4. package/dist/bindings/AddonTypes.d.ts +23 -0
  5. package/dist/bindings/Llama.d.ts +11 -0
  6. package/dist/bindings/Llama.js +56 -4
  7. package/dist/bindings/Llama.js.map +1 -1
  8. package/dist/bindings/getLlama.d.ts +20 -2
  9. package/dist/bindings/getLlama.js +15 -5
  10. package/dist/bindings/getLlama.js.map +1 -1
  11. package/dist/bindings/types.d.ts +15 -0
  12. package/dist/bindings/types.js +27 -2
  13. package/dist/bindings/types.js.map +1 -1
  14. package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
  15. package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
  16. package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
  17. package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +1 -1
  18. package/dist/bindings/utils/cloneLlamaCppRepo.js +26 -25
  19. package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -1
  20. package/dist/bindings/utils/compileLLamaCpp.js +2 -2
  21. package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
  22. package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
  23. package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
  24. package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
  25. package/dist/bindings/utils/resolveCustomCmakeOptions.js +2 -2
  26. package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -1
  27. package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
  28. package/dist/chatWrappers/AlpacaChatWrapper.js +9 -2
  29. package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
  30. package/dist/chatWrappers/ChatMLChatWrapper.js +12 -10
  31. package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
  32. package/dist/chatWrappers/FalconChatWrapper.d.ts +2 -1
  33. package/dist/chatWrappers/FalconChatWrapper.js +28 -11
  34. package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
  35. package/dist/chatWrappers/FunctionaryChatWrapper.js +59 -45
  36. package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
  37. package/dist/chatWrappers/GemmaChatWrapper.js +9 -7
  38. package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -1
  39. package/dist/chatWrappers/GeneralChatWrapper.d.ts +2 -1
  40. package/dist/chatWrappers/GeneralChatWrapper.js +35 -12
  41. package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
  42. package/dist/chatWrappers/LlamaChatWrapper.d.ts +7 -0
  43. package/dist/chatWrappers/LlamaChatWrapper.js +26 -8
  44. package/dist/chatWrappers/LlamaChatWrapper.js.map +1 -1
  45. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +73 -0
  46. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +355 -0
  47. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
  48. package/dist/{TemplateChatWrapper.d.ts → chatWrappers/generic/TemplateChatWrapper.d.ts} +6 -9
  49. package/dist/{TemplateChatWrapper.js → chatWrappers/generic/TemplateChatWrapper.js} +31 -69
  50. package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
  51. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +33 -0
  52. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
  53. package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
  54. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
  55. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +206 -0
  56. package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
  57. package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +67 -0
  58. package/dist/chatWrappers/utils/resolveChatWrapper.js +208 -0
  59. package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
  60. package/dist/cli/cli.js +1 -1
  61. package/dist/cli/cli.js.map +1 -1
  62. package/dist/cli/commands/BuildCommand.js +1 -1
  63. package/dist/cli/commands/BuildCommand.js.map +1 -1
  64. package/dist/cli/commands/ChatCommand.d.ts +9 -5
  65. package/dist/cli/commands/ChatCommand.js +203 -118
  66. package/dist/cli/commands/ChatCommand.js.map +1 -1
  67. package/dist/cli/commands/ClearCommand.d.ts +1 -1
  68. package/dist/cli/commands/ClearCommand.js +5 -5
  69. package/dist/cli/commands/ClearCommand.js.map +1 -1
  70. package/dist/cli/commands/CompleteCommand.d.ts +5 -3
  71. package/dist/cli/commands/CompleteCommand.js +136 -85
  72. package/dist/cli/commands/CompleteCommand.js.map +1 -1
  73. package/dist/cli/commands/DebugCommand.js +4 -4
  74. package/dist/cli/commands/DownloadCommand.js +3 -4
  75. package/dist/cli/commands/DownloadCommand.js.map +1 -1
  76. package/dist/cli/commands/InfillCommand.d.ts +5 -3
  77. package/dist/cli/commands/InfillCommand.js +138 -89
  78. package/dist/cli/commands/InfillCommand.js.map +1 -1
  79. package/dist/cli/commands/{InspectCommand.d.ts → inspect/InspectCommand.d.ts} +1 -4
  80. package/dist/cli/commands/inspect/InspectCommand.js +17 -0
  81. package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
  82. package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +11 -0
  83. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +121 -0
  84. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
  85. package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
  86. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +136 -0
  87. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
  88. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +15 -0
  89. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +579 -0
  90. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
  91. package/dist/cli/recommendedModels.d.ts +2 -0
  92. package/dist/cli/recommendedModels.js +281 -0
  93. package/dist/cli/recommendedModels.js.map +1 -0
  94. package/dist/cli/utils/ConsoleInteraction.d.ts +23 -0
  95. package/dist/cli/utils/ConsoleInteraction.js +122 -0
  96. package/dist/cli/utils/ConsoleInteraction.js.map +1 -0
  97. package/dist/cli/utils/ConsoleTable.d.ts +23 -0
  98. package/dist/cli/utils/ConsoleTable.js +86 -0
  99. package/dist/cli/utils/ConsoleTable.js.map +1 -0
  100. package/dist/cli/utils/basicChooseFromListConsoleInteraction.d.ts +13 -0
  101. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js +111 -0
  102. package/dist/cli/utils/basicChooseFromListConsoleInteraction.js.map +1 -0
  103. package/dist/cli/utils/consolePromptQuestion.d.ts +5 -0
  104. package/dist/cli/utils/consolePromptQuestion.js +80 -0
  105. package/dist/cli/utils/consolePromptQuestion.js.map +1 -0
  106. package/dist/cli/utils/getReadablePath.d.ts +1 -0
  107. package/dist/cli/utils/getReadablePath.js +14 -0
  108. package/dist/cli/utils/getReadablePath.js.map +1 -0
  109. package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
  110. package/dist/cli/utils/printCommonInfoLines.js +70 -0
  111. package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
  112. package/dist/cli/utils/printInfoLine.d.ts +12 -0
  113. package/dist/cli/utils/printInfoLine.js +54 -0
  114. package/dist/cli/utils/printInfoLine.js.map +1 -0
  115. package/dist/cli/utils/resolveCommandGgufPath.d.ts +2 -0
  116. package/dist/cli/utils/resolveCommandGgufPath.js +494 -0
  117. package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
  118. package/dist/cli/utils/resolveHeaderFlag.d.ts +1 -0
  119. package/dist/cli/utils/resolveHeaderFlag.js +21 -0
  120. package/dist/cli/utils/resolveHeaderFlag.js.map +1 -0
  121. package/dist/cli/utils/resolveModelRecommendationFileOptions.d.ts +19 -0
  122. package/dist/cli/utils/resolveModelRecommendationFileOptions.js +7 -0
  123. package/dist/cli/utils/resolveModelRecommendationFileOptions.js.map +1 -0
  124. package/dist/cli/utils/splitAnsiToLines.d.ts +1 -0
  125. package/dist/cli/utils/splitAnsiToLines.js +17 -0
  126. package/dist/cli/utils/splitAnsiToLines.js.map +1 -0
  127. package/dist/config.d.ts +5 -0
  128. package/dist/config.js +11 -2
  129. package/dist/config.js.map +1 -1
  130. package/dist/consts.d.ts +2 -0
  131. package/dist/consts.js +8 -0
  132. package/dist/consts.js.map +1 -1
  133. package/dist/evaluator/LlamaChat/LlamaChat.d.ts +8 -1
  134. package/dist/evaluator/LlamaChat/LlamaChat.js +15 -6
  135. package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
  136. package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +9 -2
  137. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js +5 -3
  138. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -1
  139. package/dist/evaluator/LlamaCompletion.d.ts +9 -2
  140. package/dist/evaluator/LlamaCompletion.js +11 -6
  141. package/dist/evaluator/LlamaCompletion.js.map +1 -1
  142. package/dist/evaluator/LlamaContext/LlamaContext.d.ts +30 -3
  143. package/dist/evaluator/LlamaContext/LlamaContext.js +227 -102
  144. package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
  145. package/dist/evaluator/LlamaContext/types.d.ts +57 -6
  146. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
  147. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
  148. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
  149. package/dist/evaluator/LlamaContext/utils/{resolveBatchItemsPrioritizingStrategy.js → resolveBatchItemsPrioritizationStrategy.js} +4 -4
  150. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
  151. package/dist/evaluator/LlamaEmbeddingContext.d.ts +23 -2
  152. package/dist/evaluator/LlamaEmbeddingContext.js +4 -5
  153. package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -1
  154. package/dist/evaluator/LlamaGrammar.d.ts +3 -2
  155. package/dist/evaluator/LlamaGrammar.js +3 -2
  156. package/dist/evaluator/LlamaGrammar.js.map +1 -1
  157. package/dist/evaluator/LlamaModel.d.ts +56 -6
  158. package/dist/evaluator/LlamaModel.js +99 -7
  159. package/dist/evaluator/LlamaModel.js.map +1 -1
  160. package/dist/evaluator/TokenBias.d.ts +22 -0
  161. package/dist/evaluator/TokenBias.js +33 -0
  162. package/dist/evaluator/TokenBias.js.map +1 -0
  163. package/dist/evaluator/TokenMeter.d.ts +54 -0
  164. package/dist/evaluator/TokenMeter.js +86 -0
  165. package/dist/evaluator/TokenMeter.js.map +1 -0
  166. package/dist/gguf/consts.d.ts +3 -0
  167. package/dist/gguf/consts.js +8 -0
  168. package/dist/gguf/consts.js.map +1 -0
  169. package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
  170. package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
  171. package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
  172. package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
  173. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
  174. package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
  175. package/dist/gguf/fileReaders/GgufFileReader.d.ts +33 -0
  176. package/dist/gguf/fileReaders/GgufFileReader.js +76 -0
  177. package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
  178. package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +17 -0
  179. package/dist/gguf/fileReaders/GgufFsFileReader.js +45 -0
  180. package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
  181. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +22 -0
  182. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +63 -0
  183. package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
  184. package/dist/gguf/insights/GgufInsights.d.ts +42 -0
  185. package/dist/gguf/insights/GgufInsights.js +361 -0
  186. package/dist/gguf/insights/GgufInsights.js.map +1 -0
  187. package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +87 -0
  188. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +136 -0
  189. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -0
  190. package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +18 -0
  191. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +52 -0
  192. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -0
  193. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +14 -0
  194. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +177 -0
  195. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -0
  196. package/dist/gguf/insights/utils/scoreLevels.d.ts +5 -0
  197. package/dist/gguf/insights/utils/scoreLevels.js +16 -0
  198. package/dist/gguf/insights/utils/scoreLevels.js.map +1 -0
  199. package/dist/gguf/parser/GgufV2Parser.d.ts +19 -0
  200. package/dist/gguf/parser/GgufV2Parser.js +115 -0
  201. package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
  202. package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
  203. package/dist/gguf/parser/GgufV3Parser.js +4 -0
  204. package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
  205. package/dist/gguf/parser/parseGguf.d.ts +8 -0
  206. package/dist/gguf/parser/parseGguf.js +58 -0
  207. package/dist/gguf/parser/parseGguf.js.map +1 -0
  208. package/dist/gguf/readGgufFileInfo.d.ts +30 -0
  209. package/dist/gguf/readGgufFileInfo.js +38 -0
  210. package/dist/gguf/readGgufFileInfo.js.map +1 -0
  211. package/dist/gguf/types/GgufFileInfoTypes.d.ts +52 -0
  212. package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
  213. package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
  214. package/dist/gguf/types/GgufMetadataTypes.d.ts +330 -0
  215. package/dist/gguf/types/GgufMetadataTypes.js +86 -0
  216. package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
  217. package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
  218. package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
  219. package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
  220. package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
  221. package/dist/gguf/utils/GgufReadOffset.js +18 -0
  222. package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
  223. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +5 -0
  224. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +38 -0
  225. package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
  226. package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
  227. package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
  228. package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
  229. package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
  230. package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
  231. package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
  232. package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
  233. package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
  234. package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
  235. package/dist/index.d.ts +14 -7
  236. package/dist/index.js +12 -6
  237. package/dist/index.js.map +1 -1
  238. package/dist/types.d.ts +1 -1
  239. package/dist/utils/InsufficientMemoryError.d.ts +3 -0
  240. package/dist/utils/InsufficientMemoryError.js +6 -0
  241. package/dist/utils/InsufficientMemoryError.js.map +1 -0
  242. package/dist/utils/LlamaText.d.ts +25 -10
  243. package/dist/utils/LlamaText.js +205 -23
  244. package/dist/utils/LlamaText.js.map +1 -1
  245. package/dist/utils/StopGenerationDetector.js +3 -1
  246. package/dist/utils/StopGenerationDetector.js.map +1 -1
  247. package/dist/utils/findBestOption.d.ts +4 -0
  248. package/dist/utils/findBestOption.js +15 -0
  249. package/dist/utils/findBestOption.js.map +1 -0
  250. package/dist/utils/getConsoleLogPrefix.js +1 -1
  251. package/dist/utils/getQueuedTokensBeforeStopTrigger.js +3 -3
  252. package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -1
  253. package/dist/utils/getReadableContextSize.d.ts +1 -0
  254. package/dist/utils/getReadableContextSize.js +7 -0
  255. package/dist/utils/getReadableContextSize.js.map +1 -0
  256. package/dist/utils/gitReleaseBundles.js +68 -1
  257. package/dist/utils/gitReleaseBundles.js.map +1 -1
  258. package/dist/utils/isToken.d.ts +2 -0
  259. package/dist/utils/isToken.js +4 -0
  260. package/dist/utils/isToken.js.map +1 -0
  261. package/dist/utils/isUrl.d.ts +1 -0
  262. package/dist/utils/isUrl.js +15 -0
  263. package/dist/utils/isUrl.js.map +1 -0
  264. package/dist/utils/mergeUnionTypes.d.ts +4 -0
  265. package/dist/utils/parseModelFileName.d.ts +1 -0
  266. package/dist/utils/parseModelFileName.js +6 -1
  267. package/dist/utils/parseModelFileName.js.map +1 -1
  268. package/dist/utils/prettyPrintObject.d.ts +10 -1
  269. package/dist/utils/prettyPrintObject.js +57 -13
  270. package/dist/utils/prettyPrintObject.js.map +1 -1
  271. package/dist/utils/spawnCommand.js.map +1 -1
  272. package/dist/utils/tokenizeInput.d.ts +1 -1
  273. package/dist/utils/tokenizeInput.js +6 -3
  274. package/dist/utils/tokenizeInput.js.map +1 -1
  275. package/dist/utils/withOra.d.ts +2 -0
  276. package/dist/utils/withOra.js +14 -8
  277. package/dist/utils/withOra.js.map +1 -1
  278. package/dist/utils/withProgressLog.d.ts +23 -0
  279. package/dist/utils/withProgressLog.js +211 -0
  280. package/dist/utils/withProgressLog.js.map +1 -0
  281. package/dist/utils/withStatusLogs.js +1 -1
  282. package/dist/utils/withStatusLogs.js.map +1 -1
  283. package/llama/CMakeLists.txt +5 -5
  284. package/llama/addon.cpp +159 -9
  285. package/llama/binariesGithubRelease.json +1 -1
  286. package/llama/gitRelease.bundle +0 -0
  287. package/llama/gpuInfo/cuda-gpu-info.cu +21 -0
  288. package/llama/gpuInfo/cuda-gpu-info.h +3 -0
  289. package/llama/gpuInfo/metal-gpu-info.h +4 -1
  290. package/llama/gpuInfo/metal-gpu-info.mm +14 -1
  291. package/llama/gpuInfo/vulkan-gpu-info.cpp +20 -2
  292. package/llama/gpuInfo/vulkan-gpu-info.h +2 -0
  293. package/llama/grammars/README.md +10 -0
  294. package/llama/llama.cpp.info.json +1 -1
  295. package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
  296. package/llamaBins/linux-arm64/_nlcBuildMetadata.json +1 -1
  297. package/llamaBins/linux-arm64/llama-addon.node +0 -0
  298. package/llamaBins/linux-armv7l/_nlcBuildMetadata.json +1 -1
  299. package/llamaBins/linux-armv7l/llama-addon.node +0 -0
  300. package/llamaBins/linux-x64/_nlcBuildMetadata.json +1 -1
  301. package/llamaBins/linux-x64/llama-addon.node +0 -0
  302. package/llamaBins/linux-x64-cuda/_nlcBuildMetadata.json +1 -1
  303. package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
  304. package/llamaBins/linux-x64-vulkan/_nlcBuildMetadata.json +1 -1
  305. package/llamaBins/linux-x64-vulkan/llama-addon.node +0 -0
  306. package/llamaBins/mac-arm64-metal/_nlcBuildMetadata.json +1 -1
  307. package/llamaBins/mac-arm64-metal/default.metallib +0 -0
  308. package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
  309. package/llamaBins/mac-x64/_nlcBuildMetadata.json +1 -1
  310. package/llamaBins/mac-x64/llama-addon.node +0 -0
  311. package/llamaBins/win-arm64/_nlcBuildMetadata.json +1 -0
  312. package/llamaBins/win-arm64/llama-addon.exp +0 -0
  313. package/llamaBins/win-arm64/llama-addon.lib +0 -0
  314. package/llamaBins/win-arm64/llama-addon.node +0 -0
  315. package/llamaBins/win-x64/_nlcBuildMetadata.json +1 -1
  316. package/llamaBins/win-x64/llama-addon.node +0 -0
  317. package/llamaBins/win-x64-cuda/_nlcBuildMetadata.json +1 -1
  318. package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
  319. package/llamaBins/win-x64-vulkan/_nlcBuildMetadata.json +1 -1
  320. package/llamaBins/win-x64-vulkan/llama-addon.node +0 -0
  321. package/package.json +15 -12
  322. package/dist/TemplateChatWrapper.js.map +0 -1
  323. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.d.ts +0 -33
  324. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js +0 -49
  325. package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js.map +0 -1
  326. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
  327. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -63
  328. package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
  329. package/dist/cli/commands/InspectCommand.js +0 -113
  330. package/dist/cli/commands/InspectCommand.js.map +0 -1
  331. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
  332. package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
  333. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
  334. package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
  335. package/dist/gguf/GGUFInsights.d.ts +0 -28
  336. package/dist/gguf/GGUFInsights.js +0 -58
  337. package/dist/gguf/GGUFInsights.js.map +0 -1
  338. package/dist/gguf/GGUFMetadata.d.ts +0 -19
  339. package/dist/gguf/GGUFMetadata.js +0 -38
  340. package/dist/gguf/GGUFMetadata.js.map +0 -1
  341. package/dist/gguf/errors/InvalidGGUFMagicError.d.ts +0 -3
  342. package/dist/gguf/errors/InvalidGGUFMagicError.js +0 -6
  343. package/dist/gguf/errors/InvalidGGUFMagicError.js.map +0 -1
  344. package/dist/gguf/errors/MetadataNotParsedYetError.d.ts +0 -3
  345. package/dist/gguf/errors/MetadataNotParsedYetError.js +0 -6
  346. package/dist/gguf/errors/MetadataNotParsedYetError.js.map +0 -1
  347. package/dist/gguf/errors/MissingNodeLlamaError.d.ts +0 -3
  348. package/dist/gguf/errors/MissingNodeLlamaError.js +0 -6
  349. package/dist/gguf/errors/MissingNodeLlamaError.js.map +0 -1
  350. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.d.ts +0 -5
  351. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js +0 -11
  352. package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js.map +0 -1
  353. package/dist/gguf/errors/UnsupportedMetadataTypeError.d.ts +0 -4
  354. package/dist/gguf/errors/UnsupportedMetadataTypeError.js +0 -8
  355. package/dist/gguf/errors/UnsupportedMetadataTypeError.js.map +0 -1
  356. package/dist/gguf/ggufParser/GGUFParser.d.ts +0 -18
  357. package/dist/gguf/ggufParser/GGUFParser.js +0 -123
  358. package/dist/gguf/ggufParser/GGUFParser.js.map +0 -1
  359. package/dist/gguf/ggufParser/GGUFTypes.d.ts +0 -257
  360. package/dist/gguf/ggufParser/GGUFTypes.js +0 -2
  361. package/dist/gguf/ggufParser/GGUFTypes.js.map +0 -1
  362. package/dist/gguf/ggufParser/checkArchitecture.d.ts +0 -14
  363. package/dist/gguf/ggufParser/checkArchitecture.js +0 -74
  364. package/dist/gguf/ggufParser/checkArchitecture.js.map +0 -1
  365. package/dist/gguf/ggufParser/stream/GGUFBaseStream.d.ts +0 -38
  366. package/dist/gguf/ggufParser/stream/GGUFBaseStream.js +0 -83
  367. package/dist/gguf/ggufParser/stream/GGUFBaseStream.js.map +0 -1
  368. package/dist/gguf/ggufParser/stream/GGUFFetchStream.d.ts +0 -14
  369. package/dist/gguf/ggufParser/stream/GGUFFetchStream.js +0 -35
  370. package/dist/gguf/ggufParser/stream/GGUFFetchStream.js.map +0 -1
  371. package/dist/gguf/ggufParser/stream/GGUFReadStream.d.ts +0 -15
  372. package/dist/gguf/ggufParser/stream/GGUFReadStream.js +0 -40
  373. package/dist/gguf/ggufParser/stream/GGUFReadStream.js.map +0 -1
  374. package/dist/utils/parseModelTypeDescription.d.ts +0 -6
  375. package/dist/utils/parseModelTypeDescription.js +0 -9
  376. package/dist/utils/parseModelTypeDescription.js.map +0 -1
  377. package/dist/utils/resolveChatWrapper.d.ts +0 -4
  378. package/dist/utils/resolveChatWrapper.js +0 -16
  379. package/dist/utils/resolveChatWrapper.js.map +0 -1
  380. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
  381. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
  382. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
  383. /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
@@ -0,0 +1,45 @@
1
+ import fs from "node:fs/promises";
2
+ import { withLock } from "lifecycle-utils";
3
+ import { GgufReadOffset } from "../utils/GgufReadOffset.js";
4
+ import { defaultExtraAllocationSize } from "../consts.js";
5
+ import { GgufFileReader } from "./GgufFileReader.js";
6
+ export class GgufFsFileReader extends GgufFileReader {
7
+ filePath;
8
+ _signal;
9
+ constructor({ filePath, signal }) {
10
+ super();
11
+ this.filePath = filePath;
12
+ this._signal = signal;
13
+ }
14
+ async readByteRange(offset, length) {
15
+ const readOffset = GgufReadOffset.resolveReadOffset(offset);
16
+ const endOffset = readOffset.offset + length;
17
+ if (endOffset >= this._buffer.length)
18
+ await this._readToExpandBufferUpToOffset(endOffset);
19
+ const res = this._buffer.subarray(readOffset.offset, endOffset);
20
+ readOffset.moveBy(length);
21
+ return res;
22
+ }
23
+ async _readToExpandBufferUpToOffset(endOffset, extraAllocationSize = defaultExtraAllocationSize) {
24
+ return await withLock(this, "modifyBuffer", this._signal, async () => {
25
+ if (endOffset < this._buffer.length)
26
+ return;
27
+ const missingBytesBuffer = await this._readByteRange(this._buffer.length, endOffset + extraAllocationSize - this._buffer.length);
28
+ this._addToBuffer(missingBytesBuffer);
29
+ });
30
+ }
31
+ async _readByteRange(start, length) {
32
+ const fd = await fs.open(this.filePath, "r");
33
+ try {
34
+ if (this._signal?.aborted)
35
+ throw this._signal.reason;
36
+ const buffer = Buffer.alloc(length);
37
+ await fd.read(buffer, 0, length, start);
38
+ return buffer;
39
+ }
40
+ finally {
41
+ await fd.close();
42
+ }
43
+ }
44
+ }
45
+ //# sourceMappingURL=GgufFsFileReader.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"GgufFsFileReader.js","sourceRoot":"","sources":["../../../src/gguf/fileReaders/GgufFsFileReader.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,kBAAkB,CAAC;AAClC,OAAO,EAAC,QAAQ,EAAC,MAAM,iBAAiB,CAAC;AACzC,OAAO,EAAC,cAAc,EAAC,MAAM,4BAA4B,CAAC;AAC1D,OAAO,EAAC,0BAA0B,EAAC,MAAM,cAAc,CAAC;AACxD,OAAO,EAAC,cAAc,EAAC,MAAM,qBAAqB,CAAC;AAOnD,MAAM,OAAO,gBAAiB,SAAQ,cAAc;IAChC,QAAQ,CAAS;IAChB,OAAO,CAAe;IAEvC,YAAmB,EAAC,QAAQ,EAAE,MAAM,EAA0B;QAC1D,KAAK,EAAE,CAAC;QACR,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC;IAC1B,CAAC;IAEM,KAAK,CAAC,aAAa,CAAC,MAA+B,EAAE,MAAc;QACtE,MAAM,UAAU,GAAG,cAAc,CAAC,iBAAiB,CAAC,MAAM,CAAC,CAAC;QAC5D,MAAM,SAAS,GAAG,UAAU,CAAC,MAAM,GAAG,MAAM,CAAC;QAE7C,IAAI,SAAS,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM;YAChC,MAAM,IAAI,CAAC,6BAA6B,CAAC,SAAS,CAAC,CAAC;QAExD,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;QAChE,UAAU,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;QAC1B,OAAO,GAAG,CAAC;IACf,CAAC;IAEO,KAAK,CAAC,6BAA6B,CAAC,SAAiB,EAAE,sBAA8B,0BAA0B;QACnH,OAAO,MAAM,QAAQ,CAAC,IAAI,EAAE,cAAc,EAAE,IAAI,CAAC,OAAO,EAAE,KAAK,IAAI,EAAE;YACjE,IAAI,SAAS,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM;gBAC/B,OAAO;YAEX,MAAM,kBAAkB,GAAG,MAAM,IAAI,CAAC,cAAc,CAChD,IAAI,CAAC,OAAO,CAAC,MAAM,EACnB,SAAS,GAAG,mBAAmB,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,CACxD,CAAC;YAEF,IAAI,CAAC,YAAY,CAAC,kBAAkB,CAAC,CAAC;QAC1C,CAAC,CAAC,CAAC;IACP,CAAC;IAEO,KAAK,CAAC,cAAc,CAAC,KAAa,EAAE,MAAc;QACtD,MAAM,EAAE,GAAG,MAAM,EAAE,CAAC,IAAI,CAAC,IAAI,CAAC,QAAQ,EAAE,GAAG,CAAC,CAAC;QAC7C,IAAI;YACA,IAAI,IAAI,CAAC,OAAO,EAAE,OAAO;gBACrB,MAAM,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC;YAE9B,MAAM,MAAM,GAAG,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC;YACpC,MAAM,EAAE,CAAC,IAAI,CAAC,MAAM,EAAE,CAAC,EAAE,MAAM,EAAE,KAAK,CAAC,CAAC;YACxC,OAAO,MAAM,CAAC;SACjB;gBAAS;YACN,MAAM,EAAE,CAAC,KAAK,EAAE,CAAC;SACpB;IACL,CAAC;CACJ"}
@@ -0,0 +1,22 @@
1
+ /// <reference types="node" />
2
+ /// <reference types="node" />
3
+ import retry from "async-retry";
4
+ import { GgufReadOffset } from "../utils/GgufReadOffset.js";
5
+ import { GgufFileReader } from "./GgufFileReader.js";
6
+ type GgufFetchFileReaderOptions = {
7
+ url: string;
8
+ retryOptions?: retry.Options;
9
+ headers?: Record<string, string>;
10
+ signal?: AbortSignal;
11
+ };
12
+ export declare class GgufNetworkFetchFileReader extends GgufFileReader {
13
+ readonly url: string;
14
+ readonly retryOptions: retry.Options;
15
+ readonly headers: Record<string, string>;
16
+ private readonly _signal?;
17
+ constructor({ url, retryOptions, headers, signal }: GgufFetchFileReaderOptions);
18
+ readByteRange(offset: number | GgufReadOffset, length: number): Promise<Buffer>;
19
+ private _fetchToExpandBufferUpToOffset;
20
+ private _fetchByteRange;
21
+ }
22
+ export {};
@@ -0,0 +1,63 @@
1
+ import retry from "async-retry";
2
+ import { withLock } from "lifecycle-utils";
3
+ import { GgufReadOffset } from "../utils/GgufReadOffset.js";
4
+ import { defaultExtraAllocationSize, ggufDefaultFetchRetryOptions } from "../consts.js";
5
+ import { GgufFileReader } from "./GgufFileReader.js";
6
+ export class GgufNetworkFetchFileReader extends GgufFileReader {
7
+ url;
8
+ retryOptions;
9
+ headers;
10
+ _signal;
11
+ constructor({ url, retryOptions = ggufDefaultFetchRetryOptions, headers, signal }) {
12
+ super();
13
+ this.url = url;
14
+ this.retryOptions = retryOptions;
15
+ this.headers = headers ?? {};
16
+ this._signal = signal;
17
+ }
18
+ async readByteRange(offset, length) {
19
+ const readOffset = GgufReadOffset.resolveReadOffset(offset);
20
+ const endOffset = readOffset.offset + length;
21
+ if (endOffset >= this._buffer.length)
22
+ await this._fetchToExpandBufferUpToOffset(endOffset);
23
+ const res = this._buffer.subarray(readOffset.offset, endOffset);
24
+ readOffset.moveBy(length);
25
+ return res;
26
+ }
27
+ async _fetchToExpandBufferUpToOffset(endOffset, extraAllocationSize = defaultExtraAllocationSize) {
28
+ await withLock(this, "modifyBuffer", this._signal, async () => {
29
+ if (endOffset < this._buffer.length)
30
+ return;
31
+ const missingBytesBuffer = await retry(async (bail) => {
32
+ try {
33
+ return await this._fetchByteRange(this._buffer.length, endOffset + extraAllocationSize - this._buffer.length);
34
+ }
35
+ catch (err) {
36
+ if (this._signal?.aborted) {
37
+ bail(this._signal.reason);
38
+ throw this._signal.reason;
39
+ }
40
+ throw err;
41
+ }
42
+ }, this.retryOptions);
43
+ if (this._signal?.aborted)
44
+ throw this._signal.reason;
45
+ this._addToBuffer(missingBytesBuffer);
46
+ });
47
+ }
48
+ async _fetchByteRange(start, length) {
49
+ const response = await fetch(this.url, {
50
+ headers: {
51
+ ...this.headers,
52
+ Range: `bytes=${start}-${start + length}`,
53
+ accept: "*/*"
54
+ },
55
+ signal: this._signal
56
+ });
57
+ if (!response.ok)
58
+ throw new Error(`Failed to fetch byte range: ${response.status} ${response.statusText}`);
59
+ const arrayBuffer = await response.arrayBuffer();
60
+ return Buffer.from(arrayBuffer);
61
+ }
62
+ }
63
+ //# sourceMappingURL=GgufNetworkFetchFileReader.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"GgufNetworkFetchFileReader.js","sourceRoot":"","sources":["../../../src/gguf/fileReaders/GgufNetworkFetchFileReader.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,MAAM,aAAa,CAAC;AAChC,OAAO,EAAC,QAAQ,EAAC,MAAM,iBAAiB,CAAC;AACzC,OAAO,EAAC,cAAc,EAAC,MAAM,4BAA4B,CAAC;AAC1D,OAAO,EAAC,0BAA0B,EAAE,4BAA4B,EAAC,MAAM,cAAc,CAAC;AACtF,OAAO,EAAC,cAAc,EAAC,MAAM,qBAAqB,CAAC;AASnD,MAAM,OAAO,0BAA2B,SAAQ,cAAc;IAC1C,GAAG,CAAS;IACZ,YAAY,CAAgB;IAC5B,OAAO,CAAyB;IAC/B,OAAO,CAAe;IAEvC,YAAmB,EAAC,GAAG,EAAE,YAAY,GAAG,4BAA4B,EAAE,OAAO,EAAE,MAAM,EAA6B;QAC9G,KAAK,EAAE,CAAC;QACR,IAAI,CAAC,GAAG,GAAG,GAAG,CAAC;QACf,IAAI,CAAC,YAAY,GAAG,YAAY,CAAC;QACjC,IAAI,CAAC,OAAO,GAAG,OAAO,IAAI,EAAE,CAAC;QAC7B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC;IAC1B,CAAC;IAEM,KAAK,CAAC,aAAa,CAAC,MAA+B,EAAE,MAAc;QACtE,MAAM,UAAU,GAAG,cAAc,CAAC,iBAAiB,CAAC,MAAM,CAAC,CAAC;QAC5D,MAAM,SAAS,GAAG,UAAU,CAAC,MAAM,GAAG,MAAM,CAAC;QAE7C,IAAI,SAAS,IAAI,IAAI,CAAC,OAAO,CAAC,MAAM;YAChC,MAAM,IAAI,CAAC,8BAA8B,CAAC,SAAS,CAAC,CAAC;QAEzD,MAAM,GAAG,GAAG,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;QAChE,UAAU,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;QAC1B,OAAO,GAAG,CAAC;IACf,CAAC;IAEO,KAAK,CAAC,8BAA8B,CAAC,SAAiB,EAAE,sBAA8B,0BAA0B;QACpH,MAAM,QAAQ,CAAC,IAAI,EAAE,cAAc,EAAE,IAAI,CAAC,OAAO,EAAE,KAAK,IAAI,EAAE;YAC1D,IAAI,SAAS,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM;gBAC/B,OAAO;YAEX,MAAM,kBAAkB,GAAG,MAAM,KAAK,CAAC,KAAK,EAAE,IAAI,EAAE,EAAE;gBAClD,IAAI;oBACA,OAAO,MAAM,IAAI,CAAC,eAAe,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,SAAS,GAAG,mBAAmB,GAAG,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;iBACjH;gBAAC,OAAO,GAAG,EAAE;oBACV,IAAI,IAAI,CAAC,OAAO,EAAE,OAAO,EAAE;wBACvB,IAAI,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;wBAC1B,MAAM,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC;qBAC7B;oBAED,MAAM,GAAG,CAAC;iBACb;YACL,CAAC,EAAE,IAAI,CAAC,YAAY,CAAC,CAAC;YAEtB,IAAI,IAAI,CAAC,OAAO,EAAE,OAAO;gBACrB,MAAM,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC;YAE9B,IAAI,CAAC,YAAY,CAAC,kBAAkB,CAAC,CAAC;QAC1C,CAAC,CAAC,CAAC;IACP,CAAC;IAEO,KAAK,CAAC,eAAe,CAAC,KAAa,EAAE,MAAc;QACvD,MAAM,QAAQ,GAAG,MAAM,KAAK,CAAC,IAAI,CAAC,GAAG,EAAE;YACnC,OAAO,EAAE;gBACL,GAAG,IAAI,CAAC,OAAO;gBACf,KAAK,EAAE,SAAS,KAAK,IAAI,KAAK,GAAG,MAAM,EAAE;gBACzC,MAAM,EAAE,KAAK;aAChB;YACD,MAAM,EAAE,IAAI,CAAC,OAAO;SACvB,CAAC,CAAC;QAEH,IAAI,CAAC,QAAQ,CAAC,EAAE;YACZ,MAAM,IAAI,KAAK,CAAC,+BAA+B,QAAQ,CAAC,MAAM,IAAI,QAAQ,CAAC,UAAU,EAAE,CAAC,CAAC;QAE7F,MAAM,WAAW,GAAG,MAAM,QAAQ,CAAC,WAAW,EAAE,CAAC;QACjD,OAAO,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;IACpC,CAAC;CACJ"}
@@ -0,0 +1,42 @@
1
+ import { Llama } from "../../bindings/Llama.js";
2
+ import { GgufFileInfo } from "../types/GgufFileInfoTypes.js";
3
+ import { GgufInsightsConfigurationResolver } from "./GgufInsightsConfigurationResolver.js";
4
+ export type GgufInsightsResourceRequirements = {
5
+ cpuRam: number;
6
+ gpuVram: number;
7
+ };
8
+ export declare class GgufInsights {
9
+ private constructor();
10
+ get ggufFileInfo(): GgufFileInfo;
11
+ get configurationResolver(): GgufInsightsConfigurationResolver;
12
+ /** The context size the model was trained on */
13
+ get trainContextSize(): number | undefined;
14
+ /** The size of an embedding vector the model can produce */
15
+ get embeddingVectorSize(): number | undefined;
16
+ get totalLayers(): number;
17
+ get modelSize(): number;
18
+ estimateModelResourceRequirements({ gpuLayers }: {
19
+ gpuLayers: number;
20
+ }): GgufInsightsResourceRequirements;
21
+ /**
22
+ * Estimates the memory required to create a context of the given parameters based on the implementation details of `llama.cpp`.
23
+ * The calculation doesn't include a precise estimation of the graph overhead memory, so it uses a rough estimate for that.
24
+ * The estimation for the graph overhead memory will be improved in the future to be more precise, but it's good enough for now.
25
+ */
26
+ estimateContextResourceRequirements({ contextSize, modelGpuLayers, batchSize, sequences, isEmbeddingContext, includeGraphOverhead }: {
27
+ contextSize: number;
28
+ modelGpuLayers: number;
29
+ batchSize?: number;
30
+ sequences?: number;
31
+ isEmbeddingContext?: boolean;
32
+ includeGraphOverhead?: boolean;
33
+ }): GgufInsightsResourceRequirements;
34
+ /**
35
+ * @param ggufFileInfo
36
+ * @param llama - If you already have a `Llama` instance, pass it to reuse it for the `GgufInsights` instance.
37
+ * If you don't pass a `Llama` instance, a basic `Llama` instance is created as a fallback - it's a slim instance that
38
+ * doesn't instantiate a `llama.cpp` backend, so it won't utilize the GPU at all, and be shared with other `GgufInsights` instances
39
+ * that need a fallback `Llama` instance.
40
+ */
41
+ static from(ggufFileInfo: GgufFileInfo, llama?: Llama): Promise<GgufInsights>;
42
+ }
@@ -0,0 +1,361 @@
1
+ import { getLlamaWithoutBackend } from "../../bindings/utils/getLlamaWithoutBackend.js";
2
+ import { getDefaultContextBatchSize, getDefaultContextSequences } from "../../evaluator/LlamaContext/LlamaContext.js";
3
+ import { GgufArchitectureType } from "../types/GgufMetadataTypes.js";
4
+ import { GgufInsightsConfigurationResolver } from "./GgufInsightsConfigurationResolver.js";
5
+ export class GgufInsights {
6
+ /** @internal */ _llama;
7
+ /** @internal */ _modelSize;
8
+ /** @internal */ _totalLayers = null;
9
+ /** @internal */ _ggufFileInfo;
10
+ /** @internal */ _configurationResolver;
11
+ constructor(ggufFileInfo, llama) {
12
+ this._llama = llama;
13
+ this._ggufFileInfo = ggufFileInfo;
14
+ this._modelSize = calculateTensorsSize(ggufFileInfo.tensorInfo ?? [], llama);
15
+ this._configurationResolver = GgufInsightsConfigurationResolver._create(this);
16
+ }
17
+ get ggufFileInfo() {
18
+ return this._ggufFileInfo;
19
+ }
20
+ get configurationResolver() {
21
+ return this._configurationResolver;
22
+ }
23
+ /** The context size the model was trained on */
24
+ get trainContextSize() {
25
+ return this._ggufFileInfo.architectureMetadata.context_length;
26
+ }
27
+ /** The size of an embedding vector the model can produce */
28
+ get embeddingVectorSize() {
29
+ return this._ggufFileInfo.architectureMetadata.embedding_length;
30
+ }
31
+ get totalLayers() {
32
+ if (this._totalLayers != null)
33
+ return this._totalLayers;
34
+ const outputLayers = 1;
35
+ this._totalLayers = this._getFileLayers() + outputLayers;
36
+ return this._totalLayers;
37
+ }
38
+ get modelSize() {
39
+ return this._modelSize;
40
+ }
41
+ estimateModelResourceRequirements({ gpuLayers }) {
42
+ const { cpu, gpu } = this._getTensorResourceSplit(gpuLayers);
43
+ return {
44
+ cpuRam: calculateTensorsSize(cpu, this._llama),
45
+ gpuVram: calculateTensorsSize(gpu, this._llama)
46
+ };
47
+ }
48
+ /**
49
+ * Estimates the memory required to create a context of the given parameters based on the implementation details of `llama.cpp`.
50
+ * The calculation doesn't include a precise estimation of the graph overhead memory, so it uses a rough estimate for that.
51
+ * The estimation for the graph overhead memory will be improved in the future to be more precise, but it's good enough for now.
52
+ */
53
+ estimateContextResourceRequirements({ contextSize, modelGpuLayers, batchSize, sequences, isEmbeddingContext = false, includeGraphOverhead = true }) {
54
+ if (sequences == null)
55
+ sequences = getDefaultContextSequences();
56
+ if (batchSize == null)
57
+ batchSize = getDefaultContextBatchSize({ contextSize, sequences });
58
+ const actualContextSize = contextSize * sequences;
59
+ const totalLayers = this.totalLayers;
60
+ const finalGpuLayers = Math.max(0, Math.min(modelGpuLayers ?? totalLayers, totalLayers));
61
+ const finalCpuLayers = totalLayers - finalGpuLayers;
62
+ const llmData = this._ggufFileInfo.architectureMetadata;
63
+ const vocabularySize = llmData.vocab_size ?? this._ggufFileInfo.metadata.tokenizer.ggml.tokens.length;
64
+ const logitsSize = vocabularySize * batchSize;
65
+ const embedSize = isEmbeddingContext
66
+ ? (llmData.embedding_length ?? 0) * batchSize
67
+ : 0;
68
+ const sizeTBytes = 8; // sizeof(size_t)
69
+ const floatBytes = 4; // sizeof(float)
70
+ const uint32TBytes = 4; // sizeof(uint32_t)
71
+ const int32TBytes = 4; // sizeof(int32_t)
72
+ // source: `llama_get_state_size` in `llama.cpp`
73
+ const sRngSize = sizeTBytes;
74
+ const sRng = this._llama._consts.llamaMaxRngState;
75
+ const sNOutputs = sizeTBytes;
76
+ const sNOutputPos = batchSize * int32TBytes;
77
+ const sLogitsSize = sizeTBytes;
78
+ const sLogits = logitsSize * floatBytes;
79
+ const sEmbeddingSize = sizeTBytes;
80
+ const sEmbedding = embedSize * floatBytes;
81
+ const sKvBufSize = sizeTBytes;
82
+ const sKvHead = uint32TBytes;
83
+ const sKvSize = uint32TBytes;
84
+ const sKvUsed = uint32TBytes;
85
+ const sKv = 2 * int32TBytes * modelGpuLayers * this._llama._consts.ggmlTensorOverhead;
86
+ const sKvCell = this._llama._consts.llamaPosSize + sizeTBytes + this._llama._consts.llamaSeqIdSize;
87
+ const kvSelfLength = this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.mamba
88
+ ? Math.max(1, sequences)
89
+ : actualContextSize;
90
+ const sKvCells = kvSelfLength * sKvCell;
91
+ const overheadMemory = (sRngSize +
92
+ sRng +
93
+ sNOutputs +
94
+ sNOutputPos +
95
+ sLogitsSize +
96
+ sLogits +
97
+ sEmbeddingSize +
98
+ sEmbedding +
99
+ sKvBufSize +
100
+ sKvHead +
101
+ sKvSize +
102
+ sKvUsed +
103
+ sKv +
104
+ sKvCells);
105
+ // Estimates the memory allocated by `ggml_backend_sched_reserve` in `llama_new_context_with_model` in `llama.cpp`.
106
+ // If you read this line and have better insights on how to estimate this memory, please open a PR to improve it :)
107
+ const estimateGraphOverheadMemory = () => {
108
+ const s1MB = Math.pow(1024, 2);
109
+ const tensorInfo = this._ggufFileInfo.tensorInfo ?? [];
110
+ let defaultCalculationAdjustment = 0;
111
+ if (batchSize == null)
112
+ return 0;
113
+ if (this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.llama) {
114
+ const expertCount = this._ggufFileInfo.architectureMetadata.expert_count ?? 0;
115
+ const headCount = this._ggufFileInfo.architectureMetadata.attention?.head_count ?? 0;
116
+ const embeddingLength = llmData.embedding_length ?? 0;
117
+ if (expertCount > 0) {
118
+ const expertsUsedCount = this._ggufFileInfo.architectureMetadata.expert_used_count ?? 2;
119
+ return int32TBytes * batchSize * (((expertsUsedCount + 1) * embeddingLength) + (actualContextSize * headCount));
120
+ }
121
+ return int32TBytes * batchSize * (embeddingLength + (actualContextSize * headCount));
122
+ }
123
+ else if (this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.qwen2) {
124
+ if (modelGpuLayers === this.totalLayers) {
125
+ defaultCalculationAdjustment -= (s1MB * 340) * (this.trainContextSize == null
126
+ ? 1
127
+ : actualContextSize / this.trainContextSize);
128
+ }
129
+ else {
130
+ defaultCalculationAdjustment -= (s1MB * 250) + ((s1MB * 50) * (this.trainContextSize == null
131
+ ? 1
132
+ : actualContextSize / this.trainContextSize));
133
+ }
134
+ }
135
+ else if (this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.gemma) {
136
+ // only works properly when all layers are on the GPU, which is why it's commented out:
137
+ // return int32TBytes * batchSize * ((llmData.embedding_length ?? 0));
138
+ if (modelGpuLayers === this.totalLayers) {
139
+ defaultCalculationAdjustment += (s1MB * 40) - ((s1MB * 270) * (this.trainContextSize == null
140
+ ? 1
141
+ : actualContextSize / this.trainContextSize));
142
+ }
143
+ else {
144
+ defaultCalculationAdjustment += -(s1MB * 550) + ((s1MB * 150) * (this.trainContextSize == null
145
+ ? 1
146
+ : Math.max(0, (1 - (actualContextSize / this.trainContextSize)))));
147
+ }
148
+ }
149
+ else if (this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.stablelm) {
150
+ const headCount = this._ggufFileInfo.architectureMetadata.attention?.head_count ?? 0;
151
+ return (int32TBytes * batchSize * actualContextSize * headCount) - (50 * s1MB);
152
+ // if (modelGpuLayers === this.totalLayers) {
153
+ // defaultCalculationAdjustment += -(s1MB * 20) + (
154
+ // (s1MB * 250) * (
155
+ // this.trainContextSize == null
156
+ // ? 1
157
+ // : actualContextSize / this.trainContextSize
158
+ // )
159
+ // );
160
+ // } else {
161
+ // defaultCalculationAdjustment += -(s1MB * 40) + (
162
+ // (s1MB * 300) * (
163
+ // this.trainContextSize == null
164
+ // ? 1
165
+ // : actualContextSize / this.trainContextSize
166
+ // )
167
+ // );
168
+ // }
169
+ }
170
+ const totalElements = tensorInfo.length === 0
171
+ ? this.totalLayers * (((llmData.embedding_length ?? 0) +
172
+ (llmData.feed_forward_length ?? 0)) / 2)
173
+ : tensorInfo.reduce((res, tensor) => {
174
+ return res + tensor.dimensions.reduce((res, dim) => res + Number(dim), 0);
175
+ }, 0);
176
+ // magic numbers for estimation. will be improved in the future
177
+ return (totalElements * 77.655 * (actualContextSize / 4096)) + defaultCalculationAdjustment;
178
+ };
179
+ const graphOverheadMemory = !includeGraphOverhead
180
+ ? 0
181
+ : estimateGraphOverheadMemory();
182
+ const usingGpu = finalGpuLayers !== 0;
183
+ const cpuRam = (!usingGpu
184
+ ? (overheadMemory + graphOverheadMemory)
185
+ : 0) +
186
+ this._estimateKvMemorySizeInBytes(actualContextSize, finalCpuLayers);
187
+ const gpuVram = usingGpu
188
+ ? (overheadMemory +
189
+ graphOverheadMemory +
190
+ this._estimateKvMemorySizeInBytes(actualContextSize, finalGpuLayers < totalLayers
191
+ ? (finalGpuLayers + 1)
192
+ : finalGpuLayers))
193
+ : 0;
194
+ return {
195
+ cpuRam,
196
+ gpuVram
197
+ };
198
+ }
199
+ /**
200
+ * Get the split tensor resources for CPU and GPU based on the number of GPU layers
201
+ * @internal
202
+ */
203
+ _getTensorResourceSplit(gpuLayers) {
204
+ const tensorInfo = this._ggufFileInfo.tensorInfo ?? [];
205
+ if (gpuLayers === 0) {
206
+ return {
207
+ cpu: tensorInfo,
208
+ gpu: []
209
+ };
210
+ }
211
+ const fileLayers = this._getFileLayers();
212
+ const startGpuLayer = Math.max(0, fileLayers - gpuLayers);
213
+ const gpuTensors = [];
214
+ const cpuTensors = [];
215
+ for (const singleTensorInfo of tensorInfo) {
216
+ const { layerNumber } = parseTensorName(singleTensorInfo.name);
217
+ if (gpuLayers !== this.totalLayers) {
218
+ const architecture = this._ggufFileInfo.metadata?.general?.architecture;
219
+ if (architecture === GgufArchitectureType.qwen2 || architecture === GgufArchitectureType.gemma) {
220
+ if (layerNumber != null && layerNumber >= startGpuLayer)
221
+ gpuTensors.push(singleTensorInfo);
222
+ else
223
+ cpuTensors.push(singleTensorInfo);
224
+ continue;
225
+ }
226
+ }
227
+ if (layerNumber == null || layerNumber >= startGpuLayer)
228
+ gpuTensors.push(singleTensorInfo);
229
+ else
230
+ cpuTensors.push(singleTensorInfo);
231
+ }
232
+ return {
233
+ cpu: cpuTensors,
234
+ gpu: gpuTensors
235
+ };
236
+ }
237
+ /** @internal */
238
+ _determineNumberOfLayersFromTensorInfo() {
239
+ const layerNumbers = new Set();
240
+ for (const singleTensorInfo of (this._ggufFileInfo.tensorInfo ?? [])) {
241
+ const { layerNumber } = parseTensorName(singleTensorInfo.name);
242
+ if (layerNumber != null)
243
+ layerNumbers.add(layerNumber);
244
+ }
245
+ return layerNumbers.size;
246
+ }
247
+ /** @internal */
248
+ _getFileLayers() {
249
+ return this._ggufFileInfo.architectureMetadata.block_count ?? this._determineNumberOfLayersFromTensorInfo();
250
+ }
251
+ /** @internal */
252
+ _estimateKvMemorySizeInBytes(contextSize, layers) {
253
+ // source: `llama_kv_cache_init` in `llama.cpp`
254
+ const nHead = this._ggufFileInfo.architectureMetadata.attention?.head_count ?? 0;
255
+ const nEmbd = this._ggufFileInfo.architectureMetadata.embedding_length ?? 0;
256
+ const nEmbdHeadK = this._ggufFileInfo.architectureMetadata.attention?.key_length ?? ((nHead == 0) ? 0 : (nEmbd / nHead));
257
+ const nHeadKv = this._ggufFileInfo.architectureMetadata.attention?.head_count_kv ?? nHead;
258
+ const modelNEmbdKGqa = nEmbdHeadK * nHeadKv;
259
+ const ssmDConv = this._ggufFileInfo.architectureMetadata.ssm?.conv_kernel ?? 0;
260
+ const ssmDInner = this._ggufFileInfo.architectureMetadata.ssm?.inner_size ?? 0;
261
+ const modelNEmbdKS = (ssmDConv > 0 ? (ssmDConv - 1) : 0) * ssmDInner;
262
+ const nEmbdHeadV = this._ggufFileInfo.architectureMetadata.attention?.value_length ?? ((nHead == 0) ? 0 : nEmbd / nHead);
263
+ const modelNEmbdVGqa = nEmbdHeadV * nHeadKv;
264
+ const ssmDState = this._ggufFileInfo.architectureMetadata.ssm?.state_size ?? 0;
265
+ const modelNEmbdVS = ssmDState * ssmDInner;
266
+ const totalNEmbdKGqa = modelNEmbdKGqa + modelNEmbdKS;
267
+ const totalNEmbdVGqa = modelNEmbdVGqa + modelNEmbdVS;
268
+ const keyTypeSize = this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.mamba
269
+ // if `type_k` of `llama_context_params` changes to be configurable in `LlamaContext`,
270
+ // this would have to depend on that value
271
+ ? this._llama._consts.ggmlTypeF32Size
272
+ : this._llama._consts.ggmlTypeF16Size;
273
+ const valueTypeSize = this._ggufFileInfo.metadata.general.architecture === GgufArchitectureType.mamba
274
+ // if `type_v` of `llama_context_params` changes to be configurable in `LlamaContext`,
275
+ // this would have to depend on that value
276
+ ? this._llama._consts.ggmlTypeF32Size
277
+ : this._llama._consts.ggmlTypeF16Size;
278
+ const keyTensorsSize = layers * totalNEmbdKGqa * contextSize * keyTypeSize;
279
+ const valueTensorsSize = layers * totalNEmbdVGqa * contextSize * valueTypeSize;
280
+ return keyTensorsSize + valueTensorsSize;
281
+ }
282
+ /**
283
+ * @param ggufFileInfo
284
+ * @param llama - If you already have a `Llama` instance, pass it to reuse it for the `GgufInsights` instance.
285
+ * If you don't pass a `Llama` instance, a basic `Llama` instance is created as a fallback - it's a slim instance that
286
+ * doesn't instantiate a `llama.cpp` backend, so it won't utilize the GPU at all, and be shared with other `GgufInsights` instances
287
+ * that need a fallback `Llama` instance.
288
+ */
289
+ static async from(ggufFileInfo, llama) {
290
+ let resolvedLlama = llama;
291
+ if (resolvedLlama == null)
292
+ resolvedLlama = await getLlamaWithoutBackend();
293
+ return new GgufInsights(ggufFileInfo, resolvedLlama);
294
+ }
295
+ }
296
+ function parseTensorName(tensorName) {
297
+ if (tensorName == null)
298
+ return { layerNumber: undefined };
299
+ const layerTensorPrefix = "blk.";
300
+ if (!tensorName.startsWith(layerTensorPrefix))
301
+ return { layerNumber: undefined };
302
+ const dotIndex = tensorName.indexOf(".", layerTensorPrefix.length);
303
+ const layerNumberString = tensorName.slice(layerTensorPrefix.length, dotIndex < 0
304
+ ? tensorName.length
305
+ : dotIndex);
306
+ const layerNumber = parseInt(layerNumberString);
307
+ if (Number.isFinite(layerNumber))
308
+ return { layerNumber };
309
+ return { layerNumber: undefined };
310
+ }
311
+ function calculateTensorsSize(tensorsInfo, llama) {
312
+ let size = 0;
313
+ for (const tensorInfo of tensorsInfo)
314
+ size += calculateTensorSize(tensorInfo, llama);
315
+ return size;
316
+ }
317
+ function calculateTensorSize(tensor, llama) {
318
+ const typeSize = llama._bindings.getTypeSizeForGgmlType(tensor.ggmlType);
319
+ const blockSize = llama._bindings.getBlockSizeForGgmlType(tensor.ggmlType);
320
+ const ggmlMaxDims = llama._consts.ggmlMaxDims;
321
+ if (typeSize == null || blockSize == null)
322
+ throw new Error("Invalid type or block size");
323
+ const { ne, nb } = getTensorNeAndNb(tensor, { typeSize, blockSize, ggmlMaxDims });
324
+ if (blockSize === 1) {
325
+ let totalBytes = typeSize;
326
+ for (let i = 0; i < ggmlMaxDims; i++) {
327
+ totalBytes += (ne[i] - 1) * nb[i];
328
+ }
329
+ return totalBytes;
330
+ }
331
+ else {
332
+ let totalBytes = Math.floor((ne[0] * nb[0]) / blockSize);
333
+ for (let i = 1; i < ggmlMaxDims; i++) {
334
+ totalBytes += (ne[i] - 1) * nb[i];
335
+ }
336
+ return totalBytes;
337
+ }
338
+ }
339
+ function getTensorNeAndNb(tensor, { typeSize, blockSize, ggmlMaxDims }) {
340
+ // number of elements
341
+ // source: `ggml_new_tensor_impl` in `ggml.c`
342
+ const ne = [
343
+ ...tensor.dimensions,
344
+ ...(Array(Math.max(0, ggmlMaxDims - tensor.dimensions.length)).fill(1))
345
+ ].slice(0, ggmlMaxDims);
346
+ // number of bytes
347
+ // source: `ggml_new_tensor_impl` in `ggml.c`
348
+ const nb = [
349
+ typeSize,
350
+ Math.floor(typeSize * (ne[0] / blockSize)),
351
+ ...Array(ggmlMaxDims - 2).fill(0)
352
+ ];
353
+ for (let i = 2; i < ggmlMaxDims; i++) {
354
+ nb[i] = nb[i - 1] * ne[i - 1];
355
+ }
356
+ return {
357
+ ne,
358
+ nb
359
+ };
360
+ }
361
+ //# sourceMappingURL=GgufInsights.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"GgufInsights.js","sourceRoot":"","sources":["../../../src/gguf/insights/GgufInsights.ts"],"names":[],"mappings":"AACA,OAAO,EAAC,sBAAsB,EAAC,MAAM,gDAAgD,CAAC;AACtF,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,8CAA8C,CAAC;AAGpH,OAAO,EAAC,oBAAoB,EAAC,MAAM,+BAA+B,CAAC;AACnE,OAAO,EAAC,iCAAiC,EAAC,MAAM,wCAAwC,CAAC;AAOzF,MAAM,OAAO,YAAY;IACrB,gBAAgB,CAAiB,MAAM,CAAQ;IAC/C,gBAAgB,CAAkB,UAAU,CAAS;IACrD,gBAAgB,CAAS,YAAY,GAAkB,IAAI,CAAC;IAC5D,gBAAgB,CAAkB,aAAa,CAAe;IAC9D,gBAAgB,CAAkB,sBAAsB,CAAoC;IAE5F,YAAoB,YAA0B,EAAE,KAAY;QACxD,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC;QACpB,IAAI,CAAC,aAAa,GAAG,YAAY,CAAC;QAElC,IAAI,CAAC,UAAU,GAAG,oBAAoB,CAAC,YAAY,CAAC,UAAU,IAAI,EAAE,EAAE,KAAK,CAAC,CAAC;QAC7E,IAAI,CAAC,sBAAsB,GAAG,iCAAiC,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;IAClF,CAAC;IAED,IAAW,YAAY;QACnB,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED,IAAW,qBAAqB;QAC5B,OAAO,IAAI,CAAC,sBAAsB,CAAC;IACvC,CAAC;IAED,gDAAgD;IAChD,IAAW,gBAAgB;QACvB,OAAO,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,cAAc,CAAC;IAClE,CAAC;IAED,4DAA4D;IAC5D,IAAW,mBAAmB;QAC1B,OAAO,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,gBAAgB,CAAC;IACpE,CAAC;IAED,IAAW,WAAW;QAClB,IAAI,IAAI,CAAC,YAAY,IAAI,IAAI;YACzB,OAAO,IAAI,CAAC,YAAY,CAAC;QAE7B,MAAM,YAAY,GAAG,CAAC,CAAC;QACvB,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,cAAc,EAAE,GAAG,YAAY,CAAC;QAEzD,OAAO,IAAI,CAAC,YAAY,CAAC;IAC7B,CAAC;IAED,IAAW,SAAS;QAChB,OAAO,IAAI,CAAC,UAAU,CAAC;IAC3B,CAAC;IAEM,iCAAiC,CAAC,EAAC,SAAS,EAAsB;QACrE,MAAM,EAAC,GAAG,EAAE,GAAG,EAAC,GAAG,IAAI,CAAC,uBAAuB,CAAC,SAAS,CAAC,CAAC;QAE3D,OAAO;YACH,MAAM,EAAE,oBAAoB,CAAC,GAAG,EAAE,IAAI,CAAC,MAAM,CAAC;YAC9C,OAAO,EAAE,oBAAoB,CAAC,GAAG,EAAE,IAAI,CAAC,MAAM,CAAC;SAClD,CAAC;IACN,CAAC;IAED;;;;OAIG;IACI,mCAAmC,CAAC,EACvC,WAAW,EAAE,cAAc,EAAE,SAAS,EAAE,SAAS,EAAE,kBAAkB,GAAG,KAAK,EAAE,oBAAoB,GAAG,IAAI,EAI7G;QACG,IAAI,SAAS,IAAI,IAAI;YAAE,SAAS,GAAG,0BAA0B,EAAE,CAAC;QAChE,IAAI,SAAS,IAAI,IAAI;YAAE,SAAS,GAAG,0BAA0B,CAAC,EAAC,WAAW,EAAE,SAAS,EAAC,CAAC,CAAC;QAExF,MAAM,iBAAiB,GAAG,WAAW,GAAG,SAAS,CAAC;QAElD,MAAM,WAAW,GAAG,IAAI,CAAC,WAAW,CAAC;QACrC,MAAM,cAAc,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,cAAc,IAAI,WAAW,EAAE,WAAW,CAAC,CAAC,CAAC;QACzF,MAAM,cAAc,GAAG,WAAW,GAAG,cAAc,CAAC;QACpD,MAAM,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC;QAExD,MAAM,cAAc,GAAG,OAAO,CAAC,UAAU,IAAI,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,SAAS,CAAC,IAAI,CAAC,MAAM,CAAC,MAAM,CAAC;QACtG,MAAM,UAAU,GAAG,cAAc,GAAG,SAAS,CAAC;QAC9C,MAAM,SAAS,GAAG,kBAAkB;YAChC,CAAC,CAAC,CAAC,OAAO,CAAC,gBAAgB,IAAI,CAAC,CAAC,GAAG,SAAS;YAC7C,CAAC,CAAC,CAAC,CAAC;QAER,MAAM,UAAU,GAAG,CAAC,CAAC,CAAC,iBAAiB;QACvC,MAAM,UAAU,GAAG,CAAC,CAAC,CAAC,gBAAgB;QACtC,MAAM,YAAY,GAAG,CAAC,CAAC,CAAC,mBAAmB;QAC3C,MAAM,WAAW,GAAG,CAAC,CAAC,CAAC,kBAAkB;QAEzC,gDAAgD;QAChD,MAAM,QAAQ,GAAG,UAAU,CAAC;QAC5B,MAAM,IAAI,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,gBAAgB,CAAC;QAClD,MAAM,SAAS,GAAG,UAAU,CAAC;QAC7B,MAAM,WAAW,GAAG,SAAS,GAAG,WAAW,CAAC;QAC5C,MAAM,WAAW,GAAG,UAAU,CAAC;QAC/B,MAAM,OAAO,GAAG,UAAU,GAAG,UAAU,CAAC;QACxC,MAAM,cAAc,GAAG,UAAU,CAAC;QAClC,MAAM,UAAU,GAAG,SAAS,GAAG,UAAU,CAAC;QAC1C,MAAM,UAAU,GAAG,UAAU,CAAC;QAC9B,MAAM,OAAO,GAAG,YAAY,CAAC;QAC7B,MAAM,OAAO,GAAG,YAAY,CAAC;QAC7B,MAAM,OAAO,GAAG,YAAY,CAAC;QAC7B,MAAM,GAAG,GAAG,CAAC,GAAG,WAAW,GAAG,cAAc,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,kBAAkB,CAAC;QACtF,MAAM,OAAO,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,YAAY,GAAG,UAAU,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,cAAc,CAAC;QACnG,MAAM,YAAY,GAAG,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK;YAChG,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,SAAS,CAAC;YACxB,CAAC,CAAC,iBAAiB,CAAC;QACxB,MAAM,QAAQ,GAAG,YAAY,GAAG,OAAO,CAAC;QAExC,MAAM,cAAc,GAAG,CACnB,QAAQ;YACR,IAAI;YACJ,SAAS;YACT,WAAW;YACX,WAAW;YACX,OAAO;YACP,cAAc;YACd,UAAU;YACV,UAAU;YACV,OAAO;YACP,OAAO;YACP,OAAO;YACP,GAAG;YACH,QAAQ,CACX,CAAC;QAEF,mHAAmH;QACnH,mHAAmH;QACnH,MAAM,2BAA2B,GAAG,GAAG,EAAE;YACrC,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;YAC/B,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,UAAU,IAAI,EAAE,CAAC;YAEvD,IAAI,4BAA4B,GAAG,CAAC,CAAC;YAErC,IAAI,SAAS,IAAI,IAAI;gBACjB,OAAO,CAAC,CAAC;YAEb,IAAI,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK,EAAE;gBACjF,MAAM,WAAW,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,YAAY,IAAI,CAAC,CAAC;gBAC9E,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,UAAU,IAAI,CAAC,CAAC;gBACrF,MAAM,eAAe,GAAG,OAAO,CAAC,gBAAgB,IAAI,CAAC,CAAC;gBAEtD,IAAI,WAAW,GAAG,CAAC,EAAE;oBACjB,MAAM,gBAAgB,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,iBAAiB,IAAI,CAAC,CAAC;oBAExF,OAAO,WAAW,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,gBAAgB,GAAG,CAAC,CAAC,GAAG,eAAe,CAAC,GAAG,CAAC,iBAAiB,GAAG,SAAS,CAAC,CAAC,CAAC;iBACnH;gBAED,OAAO,WAAW,GAAG,SAAS,GAAG,CAAC,eAAe,GAAG,CAAC,iBAAiB,GAAG,SAAS,CAAC,CAAC,CAAC;aACxF;iBAAM,IAAI,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK,EAAE;gBACxF,IAAI,cAAc,KAAK,IAAI,CAAC,WAAW,EAAE;oBACrC,4BAA4B,IAAI,CAAC,IAAI,GAAG,GAAG,CAAC,GAAG,CAC3C,IAAI,CAAC,gBAAgB,IAAI,IAAI;wBACzB,CAAC,CAAC,CAAC;wBACH,CAAC,CAAC,iBAAiB,GAAG,IAAI,CAAC,gBAAgB,CAClD,CAAC;iBACL;qBAAM;oBACH,4BAA4B,IAAI,CAAC,IAAI,GAAG,GAAG,CAAC,GAAG,CAC3C,CAAC,IAAI,GAAG,EAAE,CAAC,GAAG,CACV,IAAI,CAAC,gBAAgB,IAAI,IAAI;wBACzB,CAAC,CAAC,CAAC;wBACH,CAAC,CAAC,iBAAiB,GAAG,IAAI,CAAC,gBAAgB,CAClD,CACJ,CAAC;iBACL;aACJ;iBAAM,IAAI,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK,EAAE;gBACxF,uFAAuF;gBACvF,sEAAsE;gBAEtE,IAAI,cAAc,KAAK,IAAI,CAAC,WAAW,EAAE;oBACrC,4BAA4B,IAAI,CAAC,IAAI,GAAG,EAAE,CAAC,GAAG,CAC1C,CAAC,IAAI,GAAG,GAAG,CAAC,GAAG,CACX,IAAI,CAAC,gBAAgB,IAAI,IAAI;wBACzB,CAAC,CAAC,CAAC;wBACH,CAAC,CAAC,iBAAiB,GAAG,IAAI,CAAC,gBAAgB,CAClD,CACJ,CAAC;iBACL;qBAAM;oBACH,4BAA4B,IAAI,CAAC,CAAC,IAAI,GAAG,GAAG,CAAC,GAAG,CAC5C,CAAC,IAAI,GAAG,GAAG,CAAC,GAAG,CACX,IAAI,CAAC,gBAAgB,IAAI,IAAI;wBACzB,CAAC,CAAC,CAAC;wBACH,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,CAAC,CAAC,GAAG,CAAC,iBAAiB,GAAG,IAAI,CAAC,gBAAgB,CAAC,CAAC,CAAC,CACvE,CACJ,CAAC;iBACL;aACJ;iBAAM,IAAI,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,QAAQ,EAAE;gBAC3F,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,UAAU,IAAI,CAAC,CAAC;gBAErF,OAAO,CAAC,WAAW,GAAG,SAAS,GAAG,iBAAiB,GAAG,SAAS,CAAC,GAAG,CAAC,EAAE,GAAG,IAAI,CAAC,CAAC;gBAE/E,6CAA6C;gBAC7C,uDAAuD;gBACvD,2BAA2B;gBAC3B,4CAA4C;gBAC5C,sBAAsB;gBACtB,8DAA8D;gBAC9D,YAAY;gBACZ,SAAS;gBACT,WAAW;gBACX,uDAAuD;gBACvD,2BAA2B;gBAC3B,4CAA4C;gBAC5C,sBAAsB;gBACtB,8DAA8D;gBAC9D,YAAY;gBACZ,SAAS;gBACT,IAAI;aACP;YAED,MAAM,aAAa,GAAG,UAAU,CAAC,MAAM,KAAK,CAAC;gBACzC,CAAC,CAAC,IAAI,CAAC,WAAW,GAAG,CACjB,CACI,CAAC,OAAO,CAAC,gBAAgB,IAAI,CAAC,CAAC;oBAC/B,CAAC,OAAO,CAAC,mBAAmB,IAAI,CAAC,CAAC,CACrC,GAAG,CAAC,CACR;gBACD,CAAC,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,MAAM,EAAE,EAAE;oBAChC,OAAO,GAAG,GAAG,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC,GAAW,EAAE,GAAG,EAAE,EAAE,CAAC,GAAG,GAAG,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC;gBACtF,CAAC,EAAE,CAAC,CAAC,CAAC;YAEV,+DAA+D;YAC/D,OAAO,CAAC,aAAa,GAAG,MAAM,GAAG,CAAC,iBAAiB,GAAG,IAAI,CAAC,CAAC,GAAG,4BAA4B,CAAC;QAChG,CAAC,CAAC;QAEF,MAAM,mBAAmB,GAAG,CAAC,oBAAoB;YAC7C,CAAC,CAAC,CAAC;YACH,CAAC,CAAC,2BAA2B,EAAE,CAAC;QAEpC,MAAM,QAAQ,GAAG,cAAc,KAAK,CAAC,CAAC;QAEtC,MAAM,MAAM,GAAG,CACX,CAAC,QAAQ;YACL,CAAC,CAAC,CAAC,cAAc,GAAG,mBAAmB,CAAC;YACxC,CAAC,CAAC,CAAC,CACV;YACG,IAAI,CAAC,4BAA4B,CAAC,iBAAiB,EAAE,cAAc,CAAC,CAAC;QACzE,MAAM,OAAO,GAAG,QAAQ;YACpB,CAAC,CAAC,CACE,cAAc;gBACd,mBAAmB;gBACnB,IAAI,CAAC,4BAA4B,CAC7B,iBAAiB,EACjB,cAAc,GAAG,WAAW;oBACxB,CAAC,CAAC,CAAC,cAAc,GAAG,CAAC,CAAC;oBACtB,CAAC,CAAC,cAAc,CACvB,CACJ;YACD,CAAC,CAAC,CAAC,CAAC;QAER,OAAO;YACH,MAAM;YACN,OAAO;SACV,CAAC;IACN,CAAC;IAED;;;OAGG;IACI,uBAAuB,CAAC,SAAiB;QAI5C,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,UAAU,IAAI,EAAE,CAAC;QAEvD,IAAI,SAAS,KAAK,CAAC,EAAE;YACjB,OAAO;gBACH,GAAG,EAAE,UAAU;gBACf,GAAG,EAAE,EAAE;aACV,CAAC;SACL;QAED,MAAM,UAAU,GAAG,IAAI,CAAC,cAAc,EAAE,CAAC;QACzC,MAAM,aAAa,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,SAAS,CAAC,CAAC;QAE1D,MAAM,UAAU,GAAqB,EAAE,CAAC;QACxC,MAAM,UAAU,GAAqB,EAAE,CAAC;QAExC,KAAK,MAAM,gBAAgB,IAAI,UAAU,EAAE;YACvC,MAAM,EAAC,WAAW,EAAC,GAAG,eAAe,CAAC,gBAAgB,CAAC,IAAI,CAAC,CAAC;YAE7D,IAAI,SAAS,KAAK,IAAI,CAAC,WAAW,EAAE;gBAChC,MAAM,YAAY,GAAG,IAAI,CAAC,aAAa,CAAC,QAAQ,EAAE,OAAO,EAAE,YAAY,CAAC;gBAExE,IAAI,YAAY,KAAK,oBAAoB,CAAC,KAAK,IAAI,YAAY,KAAK,oBAAoB,CAAC,KAAK,EAAE;oBAC5F,IAAI,WAAW,IAAI,IAAI,IAAI,WAAW,IAAI,aAAa;wBACnD,UAAU,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;;wBAElC,UAAU,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;oBAEtC,SAAS;iBACZ;aACJ;YAED,IAAI,WAAW,IAAI,IAAI,IAAI,WAAW,IAAI,aAAa;gBACnD,UAAU,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;;gBAElC,UAAU,CAAC,IAAI,CAAC,gBAAgB,CAAC,CAAC;SACzC;QAED,OAAO;YACH,GAAG,EAAE,UAAU;YACf,GAAG,EAAE,UAAU;SAClB,CAAC;IACN,CAAC;IAED,gBAAgB;IACT,sCAAsC;QACzC,MAAM,YAAY,GAAG,IAAI,GAAG,EAAU,CAAC;QAEvC,KAAK,MAAM,gBAAgB,IAAI,CAAC,IAAI,CAAC,aAAa,CAAC,UAAU,IAAI,EAAE,CAAC,EAAE;YAClE,MAAM,EAAC,WAAW,EAAC,GAAG,eAAe,CAAC,gBAAgB,CAAC,IAAI,CAAC,CAAC;YAE7D,IAAI,WAAW,IAAI,IAAI;gBACnB,YAAY,CAAC,GAAG,CAAC,WAAW,CAAC,CAAC;SACrC;QAED,OAAO,YAAY,CAAC,IAAI,CAAC;IAC7B,CAAC;IAED,gBAAgB;IACT,cAAc;QACjB,OAAO,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,WAAW,IAAI,IAAI,CAAC,sCAAsC,EAAE,CAAC;IAChH,CAAC;IAED,gBAAgB;IACT,4BAA4B,CAAC,WAAmB,EAAE,MAAc;QACnE,+CAA+C;QAC/C,MAAM,KAAK,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,UAAU,IAAI,CAAC,CAAC;QACjF,MAAM,KAAK,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,gBAAgB,IAAI,CAAC,CAAC;QAC5E,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,UAAU,IAAI,CAAC,CAAC,KAAK,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,KAAK,GAAG,KAAK,CAAC,CAAC,CAAC;QACzH,MAAM,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,aAAa,IAAI,KAAK,CAAC;QAC1F,MAAM,cAAc,GAAG,UAAU,GAAG,OAAO,CAAC;QAE5C,MAAM,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,GAAG,EAAE,WAAW,IAAI,CAAC,CAAC;QAC/E,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,GAAG,EAAE,UAAU,IAAI,CAAC,CAAC;QAC/E,MAAM,YAAY,GAAG,CAAC,QAAQ,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,SAAS,CAAC;QAErE,MAAM,UAAU,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,SAAS,EAAE,YAAY,IAAI,CAAC,CAAC,KAAK,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,KAAK,GAAG,KAAK,CAAC,CAAC;QACzH,MAAM,cAAc,GAAG,UAAU,GAAG,OAAO,CAAC;QAE5C,MAAM,SAAS,GAAG,IAAI,CAAC,aAAa,CAAC,oBAAoB,CAAC,GAAG,EAAE,UAAU,IAAI,CAAC,CAAC;QAC/E,MAAM,YAAY,GAAG,SAAS,GAAG,SAAS,CAAC;QAE3C,MAAM,cAAc,GAAG,cAAc,GAAG,YAAY,CAAC;QACrD,MAAM,cAAc,GAAG,cAAc,GAAG,YAAY,CAAC;QAErD,MAAM,WAAW,GAAG,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK;YAC/F,sFAAsF;YACtF,0CAA0C;YAC1C,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,eAAe;YACrC,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,eAAe,CAAC;QAC1C,MAAM,aAAa,GAAG,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,OAAO,CAAC,YAAY,KAAK,oBAAoB,CAAC,KAAK;YACjG,sFAAsF;YACtF,0CAA0C;YAC1C,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,eAAe;YACrC,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,eAAe,CAAC;QAE1C,MAAM,cAAc,GAAG,MAAM,GAAG,cAAc,GAAG,WAAW,GAAG,WAAW,CAAC;QAC3E,MAAM,gBAAgB,GAAG,MAAM,GAAG,cAAc,GAAG,WAAW,GAAG,aAAa,CAAC;QAE/E,OAAO,cAAc,GAAG,gBAAgB,CAAC;IAC7C,CAAC;IAED;;;;;;OAMG;IACI,MAAM,CAAC,KAAK,CAAC,IAAI,CAAC,YAA0B,EAAE,KAAa;QAC9D,IAAI,aAAa,GAAG,KAAK,CAAC;QAC1B,IAAI,aAAa,IAAI,IAAI;YACrB,aAAa,GAAG,MAAM,sBAAsB,EAAE,CAAC;QAEnD,OAAO,IAAI,YAAY,CAAC,YAAY,EAAE,aAAa,CAAC,CAAC;IACzD,CAAC;CACJ;AAED,SAAS,eAAe,CAAC,UAAmB;IAGxC,IAAI,UAAU,IAAI,IAAI;QAClB,OAAO,EAAC,WAAW,EAAE,SAAS,EAAC,CAAC;IAEpC,MAAM,iBAAiB,GAAG,MAAM,CAAC;IACjC,IAAI,CAAC,UAAU,CAAC,UAAU,CAAC,iBAAiB,CAAC;QACzC,OAAO,EAAC,WAAW,EAAE,SAAS,EAAC,CAAC;IAEpC,MAAM,QAAQ,GAAG,UAAU,CAAC,OAAO,CAAC,GAAG,EAAE,iBAAiB,CAAC,MAAM,CAAC,CAAC;IACnE,MAAM,iBAAiB,GAAG,UAAU,CAAC,KAAK,CACtC,iBAAiB,CAAC,MAAM,EACxB,QAAQ,GAAG,CAAC;QACR,CAAC,CAAC,UAAU,CAAC,MAAM;QACnB,CAAC,CAAC,QAAQ,CACjB,CAAC;IAEF,MAAM,WAAW,GAAG,QAAQ,CAAC,iBAAiB,CAAC,CAAC;IAChD,IAAI,MAAM,CAAC,QAAQ,CAAC,WAAW,CAAC;QAC5B,OAAO,EAAC,WAAW,EAAC,CAAC;IAEzB,OAAO,EAAC,WAAW,EAAE,SAAS,EAAC,CAAC;AACpC,CAAC;AAED,SAAS,oBAAoB,CAAC,WAA6B,EAAE,KAAY;IACrE,IAAI,IAAI,GAAG,CAAC,CAAC;IACb,KAAK,MAAM,UAAU,IAAI,WAAW;QAChC,IAAI,IAAI,mBAAmB,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC;IAEnD,OAAO,IAAI,CAAC;AAChB,CAAC;AAED,SAAS,mBAAmB,CAAC,MAAsB,EAAE,KAAY;IAC7D,MAAM,QAAQ,GAAG,KAAK,CAAC,SAAS,CAAC,sBAAsB,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;IACzE,MAAM,SAAS,GAAG,KAAK,CAAC,SAAS,CAAC,uBAAuB,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;IAC3E,MAAM,WAAW,GAAG,KAAK,CAAC,OAAO,CAAC,WAAW,CAAC;IAE9C,IAAI,QAAQ,IAAI,IAAI,IAAI,SAAS,IAAI,IAAI;QACrC,MAAM,IAAI,KAAK,CAAC,4BAA4B,CAAC,CAAC;IAElD,MAAM,EAAC,EAAE,EAAE,EAAE,EAAC,GAAG,gBAAgB,CAAC,MAAM,EAAE,EAAC,QAAQ,EAAE,SAAS,EAAE,WAAW,EAAC,CAAC,CAAC;IAE9E,IAAI,SAAS,KAAK,CAAC,EAAE;QACjB,IAAI,UAAU,GAAG,QAAQ,CAAC;QAC1B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,WAAW,EAAE,CAAC,EAAE,EAAE;YAClC,UAAU,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,CAAC;SACrC;QAED,OAAO,UAAU,CAAC;KACrB;SAAM;QACH,IAAI,UAAU,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,CAAC,GAAG,SAAS,CAAC,CAAC;QACzD,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,WAAW,EAAE,CAAC,EAAE,EAAE;YAClC,UAAU,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,CAAC;SACrC;QAED,OAAO,UAAU,CAAC;KACrB;AACL,CAAC;AAED,SAAS,gBAAgB,CAAC,MAAsB,EAAE,EAC9C,QAAQ,EAAE,SAAS,EAAE,WAAW,EAGnC;IACG,qBAAqB;IACrB,6CAA6C;IAC7C,MAAM,EAAE,GAAG;QACP,GAAG,MAAM,CAAC,UAAU;QACpB,GAAG,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,WAAW,GAAG,MAAM,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;KAC1E,CAAC,KAAK,CAAC,CAAC,EAAE,WAAW,CAAC,CAAC;IAExB,kBAAkB;IAClB,6CAA6C;IAC7C,MAAM,EAAE,GAAG;QACP,QAAQ;QACR,IAAI,CAAC,KAAK,CAAC,QAAQ,GAAG,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,SAAS,CAAC,CAAC;QAC1C,GAAG,KAAK,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC;KACpC,CAAC;IACF,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,WAAW,EAAE,CAAC,EAAE,EAAE;QAClC,EAAE,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;KACjC;IAED,OAAO;QACH,EAAE;QACF,EAAE;KACL,CAAC;AACN,CAAC"}
@@ -0,0 +1,87 @@
1
+ import { BuildGpu } from "../../bindings/types.js";
2
+ import { LlamaModelOptions } from "../../evaluator/LlamaModel.js";
3
+ import { LlamaContextOptions } from "../../evaluator/LlamaContext/types.js";
4
+ import type { GgufInsights } from "./GgufInsights.js";
5
+ export declare class GgufInsightsConfigurationResolver {
6
+ private constructor();
7
+ get ggufInsights(): GgufInsights;
8
+ /**
9
+ * Score the compatibility of the model configuration with the current GPU and VRAM state.
10
+ * Assumes a model is loaded with the default `"auto"` configurations.
11
+ * Scored based on the following criteria:
12
+ * - The number of GPU layers that can be offloaded to the GPU (only if there's a GPU. If there's no GPU then by how small the model is)
13
+ * - Whether all layers can be offloaded to the GPU (gives additional points)
14
+ * - Whether the resolved context size is at least as large as the specified `contextSize`
15
+ *
16
+ * IF the resolved context size is larger than the specified context size, for each multiplier of the specified `contextSize`
17
+ * that the resolved context size is larger by, 1 bonus point is given in the `bonusScore`.
18
+ *
19
+ * `contextSize` defaults to `4096` (if the model train context size is lower than this, the model train context size is used instead).
20
+ */
21
+ scoreModelConfigurationCompatibility({ contextSize, embeddingContext }?: {
22
+ contextSize?: number;
23
+ embeddingContext?: boolean;
24
+ }, { getVramState, getRamState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading }?: {
25
+ getVramState?(): {
26
+ total: number;
27
+ free: number;
28
+ };
29
+ getRamState?(): {
30
+ total: number;
31
+ free: number;
32
+ };
33
+ llamaVramPaddingSize?: number;
34
+ llamaGpu?: BuildGpu;
35
+ llamaSupportsGpuOffloading?: boolean;
36
+ }): {
37
+ /**
38
+ * A number between `0` (inclusive) and `1` (inclusive) representing the compatibility score.
39
+ */
40
+ compatibilityScore: number;
41
+ /**
42
+ * A number starting at `0` with no upper limit representing the bonus score.
43
+ * For each multiplier of the specified `contextSize` that the resolved context size is larger by, 1 bonus point is given.
44
+ */
45
+ bonusScore: number;
46
+ /**
47
+ * The total score, which is the sum of the compatibility and bonus scores.
48
+ */
49
+ totalScore: number;
50
+ /**
51
+ * The resolved values used to calculate the scores.
52
+ */
53
+ resolvedValues: {
54
+ gpuLayers: number;
55
+ contextSize: number;
56
+ modelRamUsage: number;
57
+ contextRamUsage: number;
58
+ totalRamUsage: number;
59
+ modelVramUsage: number;
60
+ contextVramUsage: number;
61
+ totalVramUsage: number;
62
+ };
63
+ };
64
+ resolveModelGpuLayers(gpuLayers: LlamaModelOptions["gpuLayers"], { ignoreMemorySafetyChecks, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading }?: {
65
+ ignoreMemorySafetyChecks?: boolean;
66
+ getVramState?(): {
67
+ total: number;
68
+ free: number;
69
+ };
70
+ llamaVramPaddingSize?: number;
71
+ llamaGpu?: BuildGpu;
72
+ llamaSupportsGpuOffloading?: boolean;
73
+ }): number;
74
+ resolveContextContextSize(contextSize: LlamaContextOptions["contextSize"], { modelGpuLayers, batchSize, sequences, modelTrainContextSize, getVramState, llamaGpu, ignoreMemorySafetyChecks, isEmbeddingContext }: {
75
+ modelGpuLayers: number;
76
+ modelTrainContextSize: number;
77
+ batchSize?: LlamaContextOptions["batchSize"];
78
+ sequences?: number;
79
+ getVramState?(): {
80
+ total: number;
81
+ free: number;
82
+ };
83
+ llamaGpu?: BuildGpu;
84
+ ignoreMemorySafetyChecks?: boolean;
85
+ isEmbeddingContext?: boolean;
86
+ }): number;
87
+ }