node-llama-cpp 3.17.1 → 3.18.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (121) hide show
  1. package/dist/bindings/AddonTypes.d.ts +13 -0
  2. package/dist/bindings/Llama.js +20 -2
  3. package/dist/bindings/Llama.js.map +1 -1
  4. package/dist/bindings/getLlama.d.ts +1 -1
  5. package/dist/bindings/getLlama.js +19 -8
  6. package/dist/bindings/getLlama.js.map +1 -1
  7. package/dist/bindings/utils/compileLLamaCpp.d.ts +2 -1
  8. package/dist/bindings/utils/compileLLamaCpp.js +8 -0
  9. package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
  10. package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +1 -1
  11. package/dist/bindings/utils/getLlamaGpuTypes.js +2 -0
  12. package/dist/bindings/utils/getLlamaGpuTypes.js.map +1 -1
  13. package/dist/chatWrappers/QwenChatWrapper.d.ts +7 -0
  14. package/dist/chatWrappers/QwenChatWrapper.js +176 -56
  15. package/dist/chatWrappers/QwenChatWrapper.js.map +1 -1
  16. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +127 -88
  17. package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -1
  18. package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.d.ts +16 -10
  19. package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.js +115 -5
  20. package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.js.map +1 -1
  21. package/dist/chatWrappers/generic/utils/extractSegmentSettingsFromTokenizerAndChatTemplate.js +1 -0
  22. package/dist/chatWrappers/generic/utils/extractSegmentSettingsFromTokenizerAndChatTemplate.js.map +1 -1
  23. package/dist/cli/commands/ChatCommand.d.ts +3 -0
  24. package/dist/cli/commands/ChatCommand.js +34 -5
  25. package/dist/cli/commands/ChatCommand.js.map +1 -1
  26. package/dist/cli/commands/CompleteCommand.d.ts +3 -0
  27. package/dist/cli/commands/CompleteCommand.js +34 -4
  28. package/dist/cli/commands/CompleteCommand.js.map +1 -1
  29. package/dist/cli/commands/InfillCommand.d.ts +3 -0
  30. package/dist/cli/commands/InfillCommand.js +34 -4
  31. package/dist/cli/commands/InfillCommand.js.map +1 -1
  32. package/dist/cli/commands/OnPostInstallCommand.js +31 -4
  33. package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
  34. package/dist/cli/commands/inspect/commands/InspectEstimateCommand.d.ts +3 -0
  35. package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js +28 -1
  36. package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js.map +1 -1
  37. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +5 -0
  38. package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -1
  39. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +51 -4
  40. package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -1
  41. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +3 -0
  42. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +46 -5
  43. package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -1
  44. package/dist/cli/utils/interactivelyAskForModel.d.ts +4 -1
  45. package/dist/cli/utils/interactivelyAskForModel.js +21 -7
  46. package/dist/cli/utils/interactivelyAskForModel.js.map +1 -1
  47. package/dist/cli/utils/packageJsonConfig.d.ts +6 -0
  48. package/dist/cli/utils/packageJsonConfig.js +51 -0
  49. package/dist/cli/utils/packageJsonConfig.js.map +1 -0
  50. package/dist/cli/utils/packageManager.d.ts +1 -0
  51. package/dist/cli/utils/packageManager.js +15 -0
  52. package/dist/cli/utils/packageManager.js.map +1 -0
  53. package/dist/cli/utils/printCommonInfoLines.js +9 -0
  54. package/dist/cli/utils/printCommonInfoLines.js.map +1 -1
  55. package/dist/cli/utils/resolveCommandGgufPath.d.ts +4 -1
  56. package/dist/cli/utils/resolveCommandGgufPath.js +9 -2
  57. package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -1
  58. package/dist/cli/utils/resolveNpmrcConfig.d.ts +18 -0
  59. package/dist/cli/utils/resolveNpmrcConfig.js +129 -0
  60. package/dist/cli/utils/resolveNpmrcConfig.js.map +1 -0
  61. package/dist/config.d.ts +6 -1
  62. package/dist/config.js +12 -2
  63. package/dist/config.js.map +1 -1
  64. package/dist/evaluator/LlamaChat/LlamaChat.d.ts +8 -2
  65. package/dist/evaluator/LlamaChat/LlamaChat.js +99 -6
  66. package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
  67. package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +8 -2
  68. package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -1
  69. package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +8 -2
  70. package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -1
  71. package/dist/evaluator/LlamaContext/LlamaContext.d.ts +91 -0
  72. package/dist/evaluator/LlamaContext/LlamaContext.js +215 -19
  73. package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
  74. package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.d.ts +27 -0
  75. package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.js +130 -0
  76. package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.js.map +1 -0
  77. package/dist/evaluator/LlamaContext/types.d.ts +32 -1
  78. package/dist/evaluator/LlamaModel/LlamaModel.d.ts +33 -0
  79. package/dist/evaluator/LlamaModel/LlamaModel.js +24 -3
  80. package/dist/evaluator/LlamaModel/LlamaModel.js.map +1 -1
  81. package/dist/gguf/insights/GgufInsights.d.ts +12 -1
  82. package/dist/gguf/insights/GgufInsights.js +246 -49
  83. package/dist/gguf/insights/GgufInsights.js.map +1 -1
  84. package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +13 -4
  85. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +17 -5
  86. package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -1
  87. package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +4 -1
  88. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +7 -1
  89. package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -1
  90. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +4 -1
  91. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +16 -4
  92. package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -1
  93. package/dist/gguf/types/GgufMetadataTypes.d.ts +18 -2
  94. package/dist/gguf/types/GgufMetadataTypes.js +6 -0
  95. package/dist/gguf/types/GgufMetadataTypes.js.map +1 -1
  96. package/dist/gguf/types/GgufTensorInfoTypes.d.ts +4 -2
  97. package/dist/gguf/types/GgufTensorInfoTypes.js +11 -1
  98. package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -1
  99. package/dist/gguf/utils/getGgufFileTypeName.d.ts +1 -1
  100. package/dist/gguf/utils/ggufQuantNames.js +1 -0
  101. package/dist/gguf/utils/ggufQuantNames.js.map +1 -1
  102. package/dist/tsconfig.tsbuildinfo +1 -1
  103. package/dist/types.d.ts +1 -0
  104. package/dist/utils/getBuildDefaults.d.ts +1 -1
  105. package/dist/utils/getFirstWritableDir.d.ts +8 -0
  106. package/dist/utils/getFirstWritableDir.js +60 -0
  107. package/dist/utils/getFirstWritableDir.js.map +1 -0
  108. package/dist/utils/getTempDir.d.ts +10 -0
  109. package/dist/utils/getTempDir.js +121 -0
  110. package/dist/utils/getTempDir.js.map +1 -0
  111. package/dist/utils/prettyPrintObject.js +1 -1
  112. package/dist/utils/prettyPrintObject.js.map +1 -1
  113. package/dist/utils/resolveModelFile.js +19 -8
  114. package/dist/utils/resolveModelFile.js.map +1 -1
  115. package/llama/addon/AddonContext.cpp +182 -0
  116. package/llama/addon/AddonContext.h +27 -0
  117. package/llama/addon/addon.cpp +1 -0
  118. package/llama/binariesGithubRelease.json +1 -1
  119. package/llama/gitRelease.bundle +0 -0
  120. package/llama/llama.cpp.info.json +1 -1
  121. package/package.json +24 -24
@@ -24,9 +24,11 @@ export class GgufInsightsConfigurationResolver {
24
24
  * @param options
25
25
  * @param hardwareOverrides
26
26
  */
27
- async resolveAndScoreConfig({ targetGpuLayers, targetContextSize, embeddingContext = false, flashAttention = false, swaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
27
+ async resolveAndScoreConfig({ targetGpuLayers, targetContextSize, embeddingContext = false, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
28
28
  const compatibilityScore = await this.scoreModelConfigurationCompatibility({
29
29
  flashAttention,
30
+ kvCacheKeyType,
31
+ kvCacheValueType,
30
32
  swaFullCache,
31
33
  contextSize: targetContextSize,
32
34
  embeddingContext,
@@ -64,7 +66,7 @@ export class GgufInsightsConfigurationResolver {
64
66
  *
65
67
  * `contextSize` defaults to `4096` (if the model train context size is lower than this, the model train context size is used instead).
66
68
  */
67
- async scoreModelConfigurationCompatibility({ contextSize = Math.min(4096, this._ggufInsights.trainContextSize ?? 4096), embeddingContext = false, flashAttention = false, swaFullCache = false, maximumFittedContextSizeMultiplier = 100, maximumUnfitConfigurationResourceMultiplier = 100, forceStrictContextSize = false, forceGpuLayers, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
69
+ async scoreModelConfigurationCompatibility({ contextSize = Math.min(4096, this._ggufInsights.trainContextSize ?? 4096), embeddingContext = false, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, maximumFittedContextSizeMultiplier = 100, maximumUnfitConfigurationResourceMultiplier = 100, forceStrictContextSize = false, forceGpuLayers, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
68
70
  const [vramState, ramState, swapState] = await Promise.all([
69
71
  getVramState(),
70
72
  getRamState(),
@@ -95,6 +97,8 @@ export class GgufInsightsConfigurationResolver {
95
97
  llamaSupportsGpuOffloading,
96
98
  defaultContextFlashAttention: flashAttention,
97
99
  defaultContextSwaFullCache: swaFullCache,
100
+ defaultContextKvCacheKeyType: kvCacheKeyType,
101
+ defaultContextKvCacheValueType: kvCacheValueType,
98
102
  ignoreMemorySafetyChecks: forceGpuLayers != null,
99
103
  useMmap
100
104
  });
@@ -137,6 +141,8 @@ export class GgufInsightsConfigurationResolver {
137
141
  modelTrainContextSize: this._ggufInsights.trainContextSize ?? defaultTrainContextSizeForEstimationPurposes,
138
142
  ignoreMemorySafetyChecks: forceStrictContextSize,
139
143
  flashAttention,
144
+ kvCacheKeyType,
145
+ kvCacheValueType,
140
146
  swaFullCache
141
147
  });
142
148
  contextFitsMemory = true;
@@ -157,7 +163,9 @@ export class GgufInsightsConfigurationResolver {
157
163
  isEmbeddingContext: embeddingContext,
158
164
  modelGpuLayers: resolvedGpuLayers,
159
165
  flashAttention,
160
- swaFullCache
166
+ swaFullCache,
167
+ kvCacheKeyType,
168
+ kvCacheValueType
161
169
  });
162
170
  const rankPoints = {
163
171
  gpuLayers: 60,
@@ -213,7 +221,7 @@ export class GgufInsightsConfigurationResolver {
213
221
  }
214
222
  };
215
223
  }
216
- async resolveModelGpuLayers(gpuLayers, { ignoreMemorySafetyChecks = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading, defaultContextFlashAttention = false, defaultContextSwaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}) {
224
+ async resolveModelGpuLayers(gpuLayers, { ignoreMemorySafetyChecks = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading, defaultContextFlashAttention = false, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}) {
217
225
  return resolveModelGpuLayersOption(gpuLayers, {
218
226
  ggufInsights: this._ggufInsights,
219
227
  ignoreMemorySafetyChecks,
@@ -222,6 +230,8 @@ export class GgufInsightsConfigurationResolver {
222
230
  llamaGpu,
223
231
  llamaSupportsGpuOffloading,
224
232
  defaultContextFlashAttention,
233
+ defaultContextKvCacheKeyType,
234
+ defaultContextKvCacheValueType,
225
235
  defaultContextSwaFullCache,
226
236
  useMmap
227
237
  });
@@ -231,7 +241,7 @@ export class GgufInsightsConfigurationResolver {
231
241
  *
232
242
  * If there's no context size that can fit the available resources, an `InsufficientMemoryError` is thrown.
233
243
  */
234
- async resolveContextContextSize(contextSize, { modelGpuLayers, batchSize, modelTrainContextSize, flashAttention = false, swaFullCache = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaGpu = this._ggufInsights._llama.gpu, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, sequences = getDefaultContextSequences() }) {
244
+ async resolveContextContextSize(contextSize, { modelGpuLayers, batchSize, modelTrainContextSize, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaGpu = this._ggufInsights._llama.gpu, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, sequences = getDefaultContextSequences() }) {
235
245
  return await resolveContextContextSizeOption({
236
246
  contextSize,
237
247
  batchSize,
@@ -240,6 +250,8 @@ export class GgufInsightsConfigurationResolver {
240
250
  modelGpuLayers,
241
251
  modelTrainContextSize,
242
252
  flashAttention,
253
+ kvCacheKeyType,
254
+ kvCacheValueType,
243
255
  swaFullCache,
244
256
  getVramState,
245
257
  getRamState,
@@ -1 +1 @@
1
- {"version":3,"file":"GgufInsightsConfigurationResolver.js","sourceRoot":"","sources":["../../../src/gguf/insights/GgufInsightsConfigurationResolver.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,0BAA0B,EAAC,MAAM,8CAA8C,CAAC;AACxF,OAAO,EAAC,uBAAuB,EAAC,MAAM,wCAAwC,CAAC;AAC/E,OAAO,EAAC,2BAA2B,EAAC,MAAM,wCAAwC,CAAC;AACnF,OAAO,EAAC,+BAA+B,EAAC,MAAM,4CAA4C,CAAC;AAC3F,OAAO,EAAC,WAAW,EAAC,MAAM,wBAAwB,CAAC;AACnD,OAAO,EAAC,0BAA0B,EAAC,MAAM,uCAAuC,CAAC;AAGjF,MAAM,CAAC,MAAM,4CAA4C,GAAG,IAAI,CAAC;AACjE,MAAM,kDAAkD,GAAG,IAAI,CAAC;AAGhE,MAAM,OAAO,iCAAiC;IAC1C,gBAAgB,CAAkB,aAAa,CAAe;IAE9D,YAAoB,YAA0B;QAC1C,IAAI,CAAC,aAAa,GAAG,YAAY,CAAC;IACtC,CAAC;IAED,IAAW,YAAY;QACnB,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;;;;;;;;OASG;IACI,KAAK,CAAC,qBAAqB,CAAC,EAC/B,eAAe,EACf,iBAAiB,EACjB,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAQhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QACF,MAAM,kBAAkB,GAAG,MAAM,IAAI,CAAC,oCAAoC,CAAC;YACvE,cAAc;YACd,YAAY;YACZ,WAAW,EAAE,iBAAiB;YAC9B,gBAAgB;YAChB,cAAc,EAAE,eAAe;YAC/B,sBAAsB,EAAE,iBAAiB,IAAI,IAAI;YACjD,OAAO;SACV,EAAE;YACC,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;SAC7B,CAAC,CAAC;QAEH,OAAO,kBAAkB,CAAC;IAC9B,CAAC;IAED;;;;;;;;;;;;;;;;;;;;OAoBG;IACI,KAAK,CAAC,oCAAoC,CAAC,EAC9C,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,IAAI,CAAC,EACzE,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,kCAAkC,GAAG,GAAG,EACxC,2CAA2C,GAAG,GAAG,EACjD,sBAAsB,GAAG,KAAK,EAC9B,cAAc,EACd,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAkBhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QAiCF,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,IAAI,iBAAiB,GAAG,CAAC,cAAc,IAAI,IAAI,IAAI,cAAc,IAAI,KAAK,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,WAAW;YAC/B,CAAC,CAAC,cAAc,CAAC;QACrB,IAAI,kBAAkB,GAAG,KAAK,CAAC;QAE/B,IAAI,CAAC;YACD,iBAAiB,GAAG,MAAM,IAAI,CAAC,qBAAqB,CAChD,cAAc,IAAI,IAAI;gBAClB,CAAC,CAAC,cAAc;gBAChB,CAAC,CAAC,gBAAgB;oBACd,CAAC,CAAC;wBACE,UAAU,EAAE;4BACR,gBAAgB,EAAE,IAAI;4BACtB,WAAW,EAAE,sBAAsB;gCAC/B,CAAC,CAAC,WAAW;gCACb,CAAC,CAAC,SAAS;yBAClB;qBACJ;oBACD,CAAC,CAAC,sBAAsB,IAAI,IAAI;wBAC5B,CAAC,CAAC,EAAC,UAAU,EAAE,EAAC,WAAW,EAAC,EAAC;wBAC7B,CAAC,CAAC,MAAM,EACpB;gBACI,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,SAAS;gBACnC,oBAAoB;gBACpB,QAAQ;gBACR,0BAA0B;gBAC1B,4BAA4B,EAAE,cAAc;gBAC5C,0BAA0B,EAAE,YAAY;gBACxC,wBAAwB,EAAE,cAAc,IAAI,IAAI;gBAChD,OAAO;aACV,CACJ,CAAC;YACF,kBAAkB,GAAG,IAAI,CAAC;QAC9B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,SAAS,GAAG,0BAA0B,IAAI,QAAQ,KAAK,KAAK,CAAC;QACnE,MAAM,2BAA2B,GAAG,IAAI,CAAC,aAAa,CAAC,iCAAiC,CAAC;YACrF,SAAS,EAAE,iBAAiB;YAC5B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,mBAAmB,GAAG,sBAAsB;YAC5C,CAAC,CAAC,WAAW;YACb,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,IAAI,CAAC,YAAY,CAAC,gBAAgB,IAAI,kDAAkD,EACxF,kDAAkD,CACrD,CAAC;QACN,IAAI,iBAAiB,GAAG,KAAK,CAAC;QAE9B,IAAI,CAAC;YACD,mBAAmB,GAAG,MAAM,IAAI,CAAC,yBAAyB,CAAC,MAAM,EAAE;gBAC/D,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,SAAS,CAAC,IAAI,GAAG,2BAA2B,CAAC,OAAO,CAAC;oBACvE,WAAW,EAAE,SAAS,CAAC,WAAW;iBACrC,CAAC;gBACF,WAAW,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACtB,KAAK,EAAE,QAAQ,CAAC,KAAK;oBACrB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,QAAQ,CAAC,IAAI,GAAG,2BAA2B,CAAC,MAAM;wBAClD,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC,CAChF;iBACJ,CAAC;gBACF,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,SAAS,CAAC,IAAI,GAAG,IAAI,CAAC,GAAG,CACrB,CAAC,EACD,2BAA2B,CAAC,MAAM;wBAClC,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;wBAC7E,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CACnB,CACJ;iBACJ,CAAC;gBACF,QAAQ;gBACR,kBAAkB,EAAE,gBAAgB;gBACpC,cAAc,EAAE,iBAAiB;gBACjC,qBAAqB,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,4CAA4C;gBAC1G,wBAAwB,EAAE,sBAAsB;gBAChD,cAAc;gBACd,YAAY;aACf,CAAC,CAAC;YACH,iBAAiB,GAAG,IAAI,CAAC;YAEzB,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBAC9D,iBAAiB,GAAG,KAAK,CAAC;gBAC1B,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;iBAAM,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBACrE,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;QACL,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,6BAA6B,GAAG,IAAI,CAAC,aAAa,CAAC,mCAAmC,CAAC;YACzF,WAAW,EAAE,mBAAmB;YAChC,kBAAkB,EAAE,gBAAgB;YACpC,cAAc,EAAE,iBAAiB;YACjC,cAAc;YACd,YAAY;SACf,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG;YACf,SAAS,EAAE,EAAE;YACb,qBAAqB,EAAE,EAAE;YACzB,WAAW,EAAE,EAAE;YACf,iBAAiB,EAAE,EAAE;YACrB,qBAAqB,EAAE,EAAE,EAAE,sDAAsD;YACjF,gBAAgB,EAAE,EAAE;SACd,CAAC;QAEX,MAAM,eAAe,GAAG,UAAU,CAAC,SAAS,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,iBAAiB,GAAG,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;QAC/G,MAAM,2BAA2B,GAAG,UAAU,CAAC,qBAAqB,GAAG,CACnE,iBAAiB,KAAK,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAC/D,CAAC;QACF,MAAM,iBAAiB,GAAG,iBAAiB;YACvC,CAAC,CAAC,UAAU,CAAC,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC;YACzE,CAAC,CAAC,CAAC,CAAC;QACR,MAAM,uBAAuB,GAAG,UAAU,CAAC,iBAAiB,GAAG,CAC3D,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI;YAC/C,CAAC,CAAC,CAAC;YACH,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI;gBAClE,CAAC,CAAC,GAAG;gBACL,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,KAAK;oBAClD,CAAC,CAAC,GAAG;oBACL,CAAC,CAAC,CACE,GAAG,GAAG,IAAI,CAAC,GAAG,CACV,GAAG,EACH,GAAG,GAAG,CACF,CAAC,2BAA2B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,QAAQ,CAAC,KAAK,CACzE,CACJ,CACJ,CAChB,CAAC;QACF,MAAM,sBAAsB,GAAG,iBAAiB;YAC5C,CAAC,CAAC,CACE,EAAE,GAAG,IAAI,CAAC,GAAG,CACT,CAAC,EACD,CACI,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC,GAAG,WAAW,CAC/D,GAAG,kCAAkC,CACzC,CACJ;YACD,CAAC,CAAC,CAAC,CAAC;QAER,IAAI,kBAAkB,GAAG,SAAS;YAC9B,CAAC,CAAC,CACE,CAAC,eAAe,GAAG,2BAA2B,GAAG,iBAAiB,GAAG,uBAAuB,CAAC;gBAC7F,CAAC,UAAU,CAAC,SAAS,GAAG,UAAU,CAAC,qBAAqB,GAAG,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,CAAC,CACpH;YACD,CAAC,CAAC,CACE,CAAC,iBAAiB,GAAG,uBAAuB,GAAG,6BAA6B,CAAC,IAAI,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;gBAC3G,CAAC,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,GAAG,UAAU,CAAC,qBAAqB,CAAC,CAAC,CAAC;QACpG,IAAI,UAAU,GAAG,sBAAsB,GAAG,UAAU,CAAC,gBAAgB,CAAC;QAEtE,IAAI,CAAC,kBAAkB,IAAI,CAAC,iBAAiB;YACzC,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,GAAG,SAAS,CAAC,KAAK;YAC7F,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,EAC9G,CAAC;YACC,MAAM,oBAAoB,GAAG,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,CAAC;YACzG,MAAM,mBAAmB,GAAG,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,CAAC;YAEtG,kBAAkB,GAAG,CAAC,CAAC;YACvB,UAAU,GAAG,CACT,CAAC,CAAC,GAAG,CAAC,oBAAoB,GAAG,CAAC,SAAS,CAAC,KAAK,GAAG,2CAA2C,CAAC,CAAC,CAAC;gBAC9F,CAAC,CAAC,GAAG,CAAC,mBAAmB,GAAG,CAAC,CAAC,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,2CAA2C,CAAC,CAAC,CAAC,CACnH,GAAG,CAAC,CAAC;QACV,CAAC;QAED,OAAO;YACH,kBAAkB;YAClB,UAAU;YACV,UAAU,EAAE,kBAAkB,GAAG,UAAU;YAE3C,cAAc,EAAE;gBACZ,SAAS,EAAE,iBAAiB;gBAC5B,WAAW,EAAE,mBAAmB;gBAEhC,aAAa,EAAE,2BAA2B,CAAC,MAAM;gBACjD,eAAe,EAAE,6BAA6B,CAAC,MAAM;gBACrD,aAAa,EAAE,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM;gBAExF,cAAc,EAAE,2BAA2B,CAAC,OAAO;gBACnD,gBAAgB,EAAE,6BAA6B,CAAC,OAAO;gBACvD,cAAc,EAAE,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO;aAC9F;SACJ,CAAC;IACN,CAAC;IAEM,KAAK,CAAC,qBAAqB,CAAC,SAA0C,EAAE,EAC3E,wBAAwB,GAAG,KAAK,EAChC,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAAE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EAC1G,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,EAC5E,4BAA4B,GAAG,KAAK,EACpC,0BAA0B,GAAG,KAAK,EAClC,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAKhD,EAAE;QACF,OAAO,2BAA2B,CAAC,SAAS,EAAE;YAC1C,YAAY,EAAE,IAAI,CAAC,aAAa;YAChC,wBAAwB;YACxB,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;YAC1B,4BAA4B;YAC5B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;IACP,CAAC;IAED;;;;OAIG;IACI,KAAK,CAAC,yBAAyB,CAAC,WAA+C,EAAE,EACpF,cAAc,EACd,SAAS,EACT,qBAAqB,EACrB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,wBAAwB,GAAG,KAAK,EAChC,kBAAkB,GAAG,KAAK,EAC1B,SAAS,GAAG,0BAA0B,EAAE,EAc3C;QACG,OAAO,MAAM,+BAA+B,CAAC;YACzC,WAAW;YACX,SAAS;YACT,SAAS;YACT,iBAAiB,EAAE,IAAI,CAAC,aAAa;YACrC,cAAc;YACd,qBAAqB;YACrB,cAAc;YACd,YAAY;YACZ,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,QAAQ;YACR,wBAAwB;YACxB,kBAAkB;SACrB,CAAC,CAAC;IACP,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,YAA0B;QAC5C,OAAO,IAAI,iCAAiC,CAAC,YAAY,CAAC,CAAC;IAC/D,CAAC;CACJ;AAED,SAAS,6BAA6B,CAAC,SAAiB;IACpD,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;IAC/B,OAAO,EAAE,GAAG,WAAW,CAAC,SAAS,EAAE,CAAC;YAChC,KAAK,EAAE,IAAI;YACX,GAAG,EAAE,IAAI,GAAG,GAAG;YACf,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,GAAG;YACjB,GAAG,EAAE,IAAI,GAAG,CAAC;YACb,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,CAAC;YACf,MAAM,EAAE,CAAC;SACZ,CAAC,CAAC,CAAC;AACR,CAAC"}
1
+ {"version":3,"file":"GgufInsightsConfigurationResolver.js","sourceRoot":"","sources":["../../../src/gguf/insights/GgufInsightsConfigurationResolver.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,0BAA0B,EAAC,MAAM,8CAA8C,CAAC;AACxF,OAAO,EAAC,uBAAuB,EAAC,MAAM,wCAAwC,CAAC;AAE/E,OAAO,EAAC,2BAA2B,EAAC,MAAM,wCAAwC,CAAC;AACnF,OAAO,EAAC,+BAA+B,EAAC,MAAM,4CAA4C,CAAC;AAC3F,OAAO,EAAC,WAAW,EAAC,MAAM,wBAAwB,CAAC;AACnD,OAAO,EAAC,0BAA0B,EAAC,MAAM,uCAAuC,CAAC;AAGjF,MAAM,CAAC,MAAM,4CAA4C,GAAG,IAAI,CAAC;AACjE,MAAM,kDAAkD,GAAG,IAAI,CAAC;AAGhE,MAAM,OAAO,iCAAiC;IAC1C,gBAAgB,CAAkB,aAAa,CAAe;IAE9D,YAAoB,YAA0B;QAC1C,IAAI,CAAC,aAAa,GAAG,YAAY,CAAC;IACtC,CAAC;IAED,IAAW,YAAY;QACnB,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;;;;;;;;OASG;IACI,KAAK,CAAC,qBAAqB,CAAC,EAC/B,eAAe,EACf,iBAAiB,EACjB,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAUhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QACF,MAAM,kBAAkB,GAAG,MAAM,IAAI,CAAC,oCAAoC,CAAC;YACvE,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,WAAW,EAAE,iBAAiB;YAC9B,gBAAgB;YAChB,cAAc,EAAE,eAAe;YAC/B,sBAAsB,EAAE,iBAAiB,IAAI,IAAI;YACjD,OAAO;SACV,EAAE;YACC,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;SAC7B,CAAC,CAAC;QAEH,OAAO,kBAAkB,CAAC;IAC9B,CAAC;IAED;;;;;;;;;;;;;;;;;;;;OAoBG;IACI,KAAK,CAAC,oCAAoC,CAAC,EAC9C,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,IAAI,CAAC,EACzE,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,kCAAkC,GAAG,GAAG,EACxC,2CAA2C,GAAG,GAAG,EACjD,sBAAsB,GAAG,KAAK,EAC9B,cAAc,EACd,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAoBhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QAiCF,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,IAAI,iBAAiB,GAAG,CAAC,cAAc,IAAI,IAAI,IAAI,cAAc,IAAI,KAAK,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,WAAW;YAC/B,CAAC,CAAC,cAAc,CAAC;QACrB,IAAI,kBAAkB,GAAG,KAAK,CAAC;QAE/B,IAAI,CAAC;YACD,iBAAiB,GAAG,MAAM,IAAI,CAAC,qBAAqB,CAChD,cAAc,IAAI,IAAI;gBAClB,CAAC,CAAC,cAAc;gBAChB,CAAC,CAAC,gBAAgB;oBACd,CAAC,CAAC;wBACE,UAAU,EAAE;4BACR,gBAAgB,EAAE,IAAI;4BACtB,WAAW,EAAE,sBAAsB;gCAC/B,CAAC,CAAC,WAAW;gCACb,CAAC,CAAC,SAAS;yBAClB;qBACJ;oBACD,CAAC,CAAC,sBAAsB,IAAI,IAAI;wBAC5B,CAAC,CAAC,EAAC,UAAU,EAAE,EAAC,WAAW,EAAC,EAAC;wBAC7B,CAAC,CAAC,MAAM,EACpB;gBACI,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,SAAS;gBACnC,oBAAoB;gBACpB,QAAQ;gBACR,0BAA0B;gBAC1B,4BAA4B,EAAE,cAAc;gBAC5C,0BAA0B,EAAE,YAAY;gBACxC,4BAA4B,EAAE,cAAc;gBAC5C,8BAA8B,EAAE,gBAAgB;gBAChD,wBAAwB,EAAE,cAAc,IAAI,IAAI;gBAChD,OAAO;aACV,CACJ,CAAC;YACF,kBAAkB,GAAG,IAAI,CAAC;QAC9B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,SAAS,GAAG,0BAA0B,IAAI,QAAQ,KAAK,KAAK,CAAC;QACnE,MAAM,2BAA2B,GAAG,IAAI,CAAC,aAAa,CAAC,iCAAiC,CAAC;YACrF,SAAS,EAAE,iBAAiB;YAC5B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,mBAAmB,GAAG,sBAAsB;YAC5C,CAAC,CAAC,WAAW;YACb,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,IAAI,CAAC,YAAY,CAAC,gBAAgB,IAAI,kDAAkD,EACxF,kDAAkD,CACrD,CAAC;QACN,IAAI,iBAAiB,GAAG,KAAK,CAAC;QAE9B,IAAI,CAAC;YACD,mBAAmB,GAAG,MAAM,IAAI,CAAC,yBAAyB,CAAC,MAAM,EAAE;gBAC/D,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,SAAS,CAAC,IAAI,GAAG,2BAA2B,CAAC,OAAO,CAAC;oBACvE,WAAW,EAAE,SAAS,CAAC,WAAW;iBACrC,CAAC;gBACF,WAAW,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACtB,KAAK,EAAE,QAAQ,CAAC,KAAK;oBACrB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,QAAQ,CAAC,IAAI,GAAG,2BAA2B,CAAC,MAAM;wBAClD,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC,CAChF;iBACJ,CAAC;gBACF,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,SAAS,CAAC,IAAI,GAAG,IAAI,CAAC,GAAG,CACrB,CAAC,EACD,2BAA2B,CAAC,MAAM;wBAClC,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;wBAC7E,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CACnB,CACJ;iBACJ,CAAC;gBACF,QAAQ;gBACR,kBAAkB,EAAE,gBAAgB;gBACpC,cAAc,EAAE,iBAAiB;gBACjC,qBAAqB,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,4CAA4C;gBAC1G,wBAAwB,EAAE,sBAAsB;gBAChD,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;aACf,CAAC,CAAC;YACH,iBAAiB,GAAG,IAAI,CAAC;YAEzB,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBAC9D,iBAAiB,GAAG,KAAK,CAAC;gBAC1B,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;iBAAM,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBACrE,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;QACL,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,6BAA6B,GAAG,IAAI,CAAC,aAAa,CAAC,mCAAmC,CAAC;YACzF,WAAW,EAAE,mBAAmB;YAChC,kBAAkB,EAAE,gBAAgB;YACpC,cAAc,EAAE,iBAAiB;YACjC,cAAc;YACd,YAAY;YACZ,cAAc;YACd,gBAAgB;SACnB,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG;YACf,SAAS,EAAE,EAAE;YACb,qBAAqB,EAAE,EAAE;YACzB,WAAW,EAAE,EAAE;YACf,iBAAiB,EAAE,EAAE;YACrB,qBAAqB,EAAE,EAAE,EAAE,sDAAsD;YACjF,gBAAgB,EAAE,EAAE;SACd,CAAC;QAEX,MAAM,eAAe,GAAG,UAAU,CAAC,SAAS,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,iBAAiB,GAAG,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;QAC/G,MAAM,2BAA2B,GAAG,UAAU,CAAC,qBAAqB,GAAG,CACnE,iBAAiB,KAAK,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAC/D,CAAC;QACF,MAAM,iBAAiB,GAAG,iBAAiB;YACvC,CAAC,CAAC,UAAU,CAAC,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC;YACzE,CAAC,CAAC,CAAC,CAAC;QACR,MAAM,uBAAuB,GAAG,UAAU,CAAC,iBAAiB,GAAG,CAC3D,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI;YAC/C,CAAC,CAAC,CAAC;YACH,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI;gBAClE,CAAC,CAAC,GAAG;gBACL,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,KAAK;oBAClD,CAAC,CAAC,GAAG;oBACL,CAAC,CAAC,CACE,GAAG,GAAG,IAAI,CAAC,GAAG,CACV,GAAG,EACH,GAAG,GAAG,CACF,CAAC,2BAA2B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,QAAQ,CAAC,KAAK,CACzE,CACJ,CACJ,CAChB,CAAC;QACF,MAAM,sBAAsB,GAAG,iBAAiB;YAC5C,CAAC,CAAC,CACE,EAAE,GAAG,IAAI,CAAC,GAAG,CACT,CAAC,EACD,CACI,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC,GAAG,WAAW,CAC/D,GAAG,kCAAkC,CACzC,CACJ;YACD,CAAC,CAAC,CAAC,CAAC;QAER,IAAI,kBAAkB,GAAG,SAAS;YAC9B,CAAC,CAAC,CACE,CAAC,eAAe,GAAG,2BAA2B,GAAG,iBAAiB,GAAG,uBAAuB,CAAC;gBAC7F,CAAC,UAAU,CAAC,SAAS,GAAG,UAAU,CAAC,qBAAqB,GAAG,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,CAAC,CACpH;YACD,CAAC,CAAC,CACE,CAAC,iBAAiB,GAAG,uBAAuB,GAAG,6BAA6B,CAAC,IAAI,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;gBAC3G,CAAC,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,GAAG,UAAU,CAAC,qBAAqB,CAAC,CAAC,CAAC;QACpG,IAAI,UAAU,GAAG,sBAAsB,GAAG,UAAU,CAAC,gBAAgB,CAAC;QAEtE,IAAI,CAAC,kBAAkB,IAAI,CAAC,iBAAiB;YACzC,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,GAAG,SAAS,CAAC,KAAK;YAC7F,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,EAC9G,CAAC;YACC,MAAM,oBAAoB,GAAG,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,CAAC;YACzG,MAAM,mBAAmB,GAAG,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,CAAC;YAEtG,kBAAkB,GAAG,CAAC,CAAC;YACvB,UAAU,GAAG,CACT,CAAC,CAAC,GAAG,CAAC,oBAAoB,GAAG,CAAC,SAAS,CAAC,KAAK,GAAG,2CAA2C,CAAC,CAAC,CAAC;gBAC9F,CAAC,CAAC,GAAG,CAAC,mBAAmB,GAAG,CAAC,CAAC,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,2CAA2C,CAAC,CAAC,CAAC,CACnH,GAAG,CAAC,CAAC;QACV,CAAC;QAED,OAAO;YACH,kBAAkB;YAClB,UAAU;YACV,UAAU,EAAE,kBAAkB,GAAG,UAAU;YAE3C,cAAc,EAAE;gBACZ,SAAS,EAAE,iBAAiB;gBAC5B,WAAW,EAAE,mBAAmB;gBAEhC,aAAa,EAAE,2BAA2B,CAAC,MAAM;gBACjD,eAAe,EAAE,6BAA6B,CAAC,MAAM;gBACrD,aAAa,EAAE,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM;gBAExF,cAAc,EAAE,2BAA2B,CAAC,OAAO;gBACnD,gBAAgB,EAAE,6BAA6B,CAAC,OAAO;gBACvD,cAAc,EAAE,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO;aAC9F;SACJ,CAAC;IACN,CAAC;IAEM,KAAK,CAAC,qBAAqB,CAAC,SAA0C,EAAE,EAC3E,wBAAwB,GAAG,KAAK,EAChC,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAAE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EAC1G,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,EAC5E,4BAA4B,GAAG,KAAK,EACpC,4BAA4B,EAC5B,8BAA8B,EAC9B,0BAA0B,GAAG,KAAK,EAClC,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAMhD,EAAE;QACF,OAAO,2BAA2B,CAAC,SAAS,EAAE;YAC1C,YAAY,EAAE,IAAI,CAAC,aAAa;YAChC,wBAAwB;YACxB,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;YAC1B,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;IACP,CAAC;IAED;;;;OAIG;IACI,KAAK,CAAC,yBAAyB,CAAC,WAA+C,EAAE,EACpF,cAAc,EACd,SAAS,EACT,qBAAqB,EACrB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,wBAAwB,GAAG,KAAK,EAChC,kBAAkB,GAAG,KAAK,EAC1B,SAAS,GAAG,0BAA0B,EAAE,EAgB3C;QACG,OAAO,MAAM,+BAA+B,CAAC;YACzC,WAAW;YACX,SAAS;YACT,SAAS;YACT,iBAAiB,EAAE,IAAI,CAAC,aAAa;YACrC,cAAc;YACd,qBAAqB;YACrB,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,QAAQ;YACR,wBAAwB;YACxB,kBAAkB;SACrB,CAAC,CAAC;IACP,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,YAA0B;QAC5C,OAAO,IAAI,iCAAiC,CAAC,YAAY,CAAC,CAAC;IAC/D,CAAC;CACJ;AAED,SAAS,6BAA6B,CAAC,SAAiB;IACpD,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;IAC/B,OAAO,EAAE,GAAG,WAAW,CAAC,SAAS,EAAE,CAAC;YAChC,KAAK,EAAE,IAAI;YACX,GAAG,EAAE,IAAI,GAAG,GAAG;YACf,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,GAAG;YACjB,GAAG,EAAE,IAAI,GAAG,CAAC;YACb,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,CAAC;YACf,MAAM,EAAE,CAAC;SACZ,CAAC,CAAC,CAAC;AACR,CAAC"}
@@ -1,7 +1,8 @@
1
1
  import { LlamaContextOptions } from "../../../evaluator/LlamaContext/types.js";
2
2
  import { GgufInsights } from "../GgufInsights.js";
3
3
  import { BuildGpu } from "../../../bindings/types.js";
4
- export declare function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks, isEmbeddingContext, maxContextSizeSwapUse }: {
4
+ import type { GgmlType } from "../../types/GgufTensorInfoTypes.js";
5
+ export declare function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks, isEmbeddingContext, maxContextSizeSwapUse }: {
5
6
  contextSize?: LlamaContextOptions["contextSize"];
6
7
  batchSize?: LlamaContextOptions["batchSize"];
7
8
  sequences: number;
@@ -9,6 +10,8 @@ export declare function resolveContextContextSizeOption({ contextSize, batchSize
9
10
  modelGpuLayers: number;
10
11
  modelTrainContextSize: number;
11
12
  flashAttention: boolean;
13
+ kvCacheKeyType?: GgmlType;
14
+ kvCacheValueType?: GgmlType;
12
15
  swaFullCache: boolean;
13
16
  getVramState(): Promise<{
14
17
  total: number;
@@ -3,7 +3,7 @@ import { getDefaultContextBatchSize, getDefaultModelContextSize } from "../../..
3
3
  import { InsufficientMemoryError } from "../../../utils/InsufficientMemoryError.js";
4
4
  import { getRamUsageFromUnifiedVram } from "./getRamUsageFromUnifiedVram.js";
5
5
  const defaultMaxContextSizeSwapUse = 2048;
6
- export async function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, maxContextSizeSwapUse = defaultMaxContextSizeSwapUse }) {
6
+ export async function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, maxContextSizeSwapUse = defaultMaxContextSizeSwapUse }) {
7
7
  if (contextSize == null)
8
8
  contextSize = "auto";
9
9
  if (typeof contextSize === "number") {
@@ -21,6 +21,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
21
21
  modelGpuLayers: modelGpuLayers,
22
22
  sequences,
23
23
  flashAttention,
24
+ kvCacheKeyType,
25
+ kvCacheValueType,
24
26
  swaFullCache,
25
27
  isEmbeddingContext
26
28
  });
@@ -51,6 +53,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
51
53
  modelGpuLayers: modelGpuLayers,
52
54
  sequences,
53
55
  flashAttention,
56
+ kvCacheKeyType,
57
+ kvCacheValueType,
54
58
  swaFullCache,
55
59
  isEmbeddingContext
56
60
  });
@@ -90,6 +94,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
90
94
  modelGpuLayers: modelGpuLayers,
91
95
  sequences,
92
96
  flashAttention,
97
+ kvCacheKeyType,
98
+ kvCacheValueType,
93
99
  swaFullCache,
94
100
  isEmbeddingContext
95
101
  });
@@ -1 +1 @@
1
- {"version":3,"file":"resolveContextContextSizeOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveContextContextSizeOption.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,0BAA0B,EAAC,MAAM,iCAAiC,CAAC;AAE3E,MAAM,4BAA4B,GAAG,IAAI,CAAC;AAE1C,MAAM,CAAC,KAAK,UAAU,+BAA+B,CAAC,EAClD,WAAW,EAAE,SAAS,EAAE,SAAS,EAAE,iBAAiB,EAAE,cAAc,EAAE,qBAAqB,EAAE,cAAc,EAAE,YAAY,EACzH,YAAY,EAAE,WAAW,EAAE,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,kBAAkB,GAAG,KAAK,EACrG,qBAAqB,GAAG,4BAA4B,EAiBvD;IACG,IAAI,WAAW,IAAI,IAAI;QACnB,WAAW,GAAG,MAAM,CAAC;IAEzB,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QAClC,MAAM,mBAAmB,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,CAAC,CAAC;QAEjE,IAAI,wBAAwB;YACxB,OAAO,mBAAmB,CAAC;QAE/B,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YACtF,WAAW,EAAE,mBAAmB;YAChC,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,mBAAmB,EAAE,SAAS,EAAC,CAAC;YACjG,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,IAAI,2BAA2B,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YACpD,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aACvK,IAAI,2BAA2B,CAAC,MAAM,GAAG,CAC1C,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAC9G;YACG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;QAE5N,OAAO,mBAAmB,CAAC;IAC/B,CAAC;SAAM,IAAI,WAAW,KAAK,MAAM,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QACnE,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QAEH,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,EACxF,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,CACxE,CAAC;QAEN,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,mCAAmC;YACrC,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,mCAAmC,EACtD,mCAAmC,CACtC,CAAC;QAEN,IAAI,4BAA4B,GAAkB,IAAI,CAAC;QACvD,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,cAAc,GAAG,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC3E,KAAK,IAAI,eAAe,GAAG,cAAc,EAAE,eAAe,IAAI,cAAc,IAAI,eAAe,IAAI,cAAc,GAAG,CAAC;YACjH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;gBACtF,WAAW,EAAE,eAAe;gBAC5B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,eAAe,EAAE,SAAS,EAAC,CAAC;gBAC7F,cAAc,EAAE,cAAc;gBAC9B,SAAS;gBACT,cAAc;gBACd,YAAY;gBACZ,kBAAkB;aACrB,CAAC,CAAC;YAEH,IAAI,2BAA2B,CAAC,OAAO,IAAI,SAAS,CAAC,IAAI;gBACrD,2BAA2B,CAAC,MAAM,IAAI,CAClC,QAAQ,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,GAAG,CACzF,eAAe,IAAI,qBAAqB;oBACpC,CAAC,CAAC,SAAS,CAAC,IAAI;oBAChB,CAAC,CAAC,CAAC,CACV,CACJ,EACH,CAAC;gBACC,IAAI,4BAA4B,IAAI,IAAI,IAAI,eAAe,IAAI,4BAA4B,EAAE,CAAC;oBAC1F,4BAA4B,GAAG,eAAe,CAAC;oBAE/C,IAAI,IAAI,KAAK,CAAC,CAAC;wBACX,MAAM;yBACL,IAAI,IAAI,GAAG,CAAC;wBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;gBAClD,CAAC;YACL,CAAC;iBAAM,IAAI,IAAI,GAAG,CAAC;gBACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YAE9C,IAAI,eAAe,IAAI,cAAc,IAAI,IAAI,KAAK,CAAC,CAAC;gBAChD,MAAM;YAEV,eAAe,IAAI,IAAI,CAAC;YACxB,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBACnC,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACvD,CAAC;iBAAM,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBAC1C,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;QAED,IAAI,4BAA4B,IAAI,IAAI;YACpC,OAAO,4BAA4B,CAAC;QAExC,IAAI,wBAAwB;YACxB,OAAO,cAAc,CAAC;QAE1B,MAAM,kCAAkC,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YAC7F,WAAW,EAAE,cAAc;YAC3B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,cAAc,EAAE,SAAS,EAAC,CAAC;YAC5F,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,MAAM,eAAe,GAAG,0BAA0B,CAAC,kCAAkC,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;QAC1G,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAC3D,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YAE5F,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,+CAA+C,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAC3N,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAChE,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aAClK,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YACjG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAClN,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,eAAe;YAChF,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,qCAAqC,CAAC,CAAC;;YAElK,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,2CAA2C,CAAC,CAAC;IAChL,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,0BAA0B,WAAW,GAAG,CAAC,CAAC;AAC9D,CAAC"}
1
+ {"version":3,"file":"resolveContextContextSizeOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveContextContextSizeOption.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,0BAA0B,EAAC,MAAM,iCAAiC,CAAC;AAG3E,MAAM,4BAA4B,GAAG,IAAI,CAAC;AAE1C,MAAM,CAAC,KAAK,UAAU,+BAA+B,CAAC,EAClD,WAAW,EAAE,SAAS,EAAE,SAAS,EAAE,iBAAiB,EAAE,cAAc,EAAE,qBAAqB,EAAE,cAAc,EAC3G,cAAc,EAAE,gBAAgB,EAAE,YAAY,EAC9C,YAAY,EAAE,WAAW,EAAE,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,kBAAkB,GAAG,KAAK,EACrG,qBAAqB,GAAG,4BAA4B,EAmBvD;IACG,IAAI,WAAW,IAAI,IAAI;QACnB,WAAW,GAAG,MAAM,CAAC;IAEzB,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QAClC,MAAM,mBAAmB,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,CAAC,CAAC;QAEjE,IAAI,wBAAwB;YACxB,OAAO,mBAAmB,CAAC;QAE/B,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YACtF,WAAW,EAAE,mBAAmB;YAChC,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,mBAAmB,EAAE,SAAS,EAAC,CAAC;YACjG,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,IAAI,2BAA2B,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YACpD,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aACvK,IAAI,2BAA2B,CAAC,MAAM,GAAG,CAC1C,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAC9G;YACG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;QAE5N,OAAO,mBAAmB,CAAC;IAC/B,CAAC;SAAM,IAAI,WAAW,KAAK,MAAM,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QACnE,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QAEH,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,EACxF,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,CACxE,CAAC;QAEN,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,mCAAmC;YACrC,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,mCAAmC,EACtD,mCAAmC,CACtC,CAAC;QAEN,IAAI,4BAA4B,GAAkB,IAAI,CAAC;QACvD,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,cAAc,GAAG,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC3E,KAAK,IAAI,eAAe,GAAG,cAAc,EAAE,eAAe,IAAI,cAAc,IAAI,eAAe,IAAI,cAAc,GAAG,CAAC;YACjH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;gBACtF,WAAW,EAAE,eAAe;gBAC5B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,eAAe,EAAE,SAAS,EAAC,CAAC;gBAC7F,cAAc,EAAE,cAAc;gBAC9B,SAAS;gBACT,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;gBACZ,kBAAkB;aACrB,CAAC,CAAC;YAEH,IAAI,2BAA2B,CAAC,OAAO,IAAI,SAAS,CAAC,IAAI;gBACrD,2BAA2B,CAAC,MAAM,IAAI,CAClC,QAAQ,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,GAAG,CACzF,eAAe,IAAI,qBAAqB;oBACpC,CAAC,CAAC,SAAS,CAAC,IAAI;oBAChB,CAAC,CAAC,CAAC,CACV,CACJ,EACH,CAAC;gBACC,IAAI,4BAA4B,IAAI,IAAI,IAAI,eAAe,IAAI,4BAA4B,EAAE,CAAC;oBAC1F,4BAA4B,GAAG,eAAe,CAAC;oBAE/C,IAAI,IAAI,KAAK,CAAC,CAAC;wBACX,MAAM;yBACL,IAAI,IAAI,GAAG,CAAC;wBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;gBAClD,CAAC;YACL,CAAC;iBAAM,IAAI,IAAI,GAAG,CAAC;gBACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YAE9C,IAAI,eAAe,IAAI,cAAc,IAAI,IAAI,KAAK,CAAC,CAAC;gBAChD,MAAM;YAEV,eAAe,IAAI,IAAI,CAAC;YACxB,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBACnC,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACvD,CAAC;iBAAM,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBAC1C,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;QAED,IAAI,4BAA4B,IAAI,IAAI;YACpC,OAAO,4BAA4B,CAAC;QAExC,IAAI,wBAAwB;YACxB,OAAO,cAAc,CAAC;QAE1B,MAAM,kCAAkC,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YAC7F,WAAW,EAAE,cAAc;YAC3B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,cAAc,EAAE,SAAS,EAAC,CAAC;YAC5F,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,MAAM,eAAe,GAAG,0BAA0B,CAAC,kCAAkC,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;QAC1G,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAC3D,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YAE5F,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,+CAA+C,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAC3N,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAChE,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aAClK,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YACjG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAClN,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,eAAe;YAChF,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,qCAAqC,CAAC,CAAC;;YAElK,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,2CAA2C,CAAC,CAAC;IAChL,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,0BAA0B,WAAW,GAAG,CAAC,CAAC;AAC9D,CAAC"}
@@ -1,7 +1,8 @@
1
1
  import { LlamaModelOptions } from "../../../evaluator/LlamaModel/LlamaModel.js";
2
2
  import { BuildGpu } from "../../../bindings/types.js";
3
+ import type { GgmlType } from "../../types/GgufTensorInfoTypes.js";
3
4
  import type { GgufInsights } from "../GgufInsights.js";
4
- export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions["gpuLayers"], { ggufInsights, ignoreMemorySafetyChecks, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }: {
5
+ export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions["gpuLayers"], { ggufInsights, ignoreMemorySafetyChecks, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }: {
5
6
  ggufInsights: GgufInsights;
6
7
  ignoreMemorySafetyChecks?: boolean;
7
8
  getVramState(): Promise<{
@@ -12,6 +13,8 @@ export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions
12
13
  llamaGpu: BuildGpu;
13
14
  llamaSupportsGpuOffloading: boolean;
14
15
  defaultContextFlashAttention: boolean;
16
+ defaultContextKvCacheKeyType?: GgmlType;
17
+ defaultContextKvCacheValueType?: GgmlType;
15
18
  defaultContextSwaFullCache: boolean;
16
19
  useMmap?: boolean;
17
20
  }): Promise<number>;
@@ -4,7 +4,7 @@ import { getDefaultContextBatchSize, getDefaultModelContextSize } from "../../..
4
4
  import { minAllowedContextSizeInCalculations } from "../../../config.js";
5
5
  import { scoreLevels } from "./scoreLevels.js";
6
6
  const fitContextExtraMemoryPaddingPercentage = 0.5;
7
- export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ignoreMemorySafetyChecks = false, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }) {
7
+ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ignoreMemorySafetyChecks = false, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }) {
8
8
  if (gpuLayers == null)
9
9
  gpuLayers = "auto";
10
10
  if (!llamaSupportsGpuOffloading)
@@ -21,6 +21,8 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
21
21
  ggufInsights,
22
22
  currentVram: vramState.free,
23
23
  defaultContextFlashAttention,
24
+ defaultContextKvCacheKeyType,
25
+ defaultContextKvCacheValueType,
24
26
  defaultContextSwaFullCache,
25
27
  useMmap
26
28
  });
@@ -53,6 +55,8 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
53
55
  ? gpuLayers.max
54
56
  : undefined,
55
57
  defaultContextFlashAttention,
58
+ defaultContextKvCacheKeyType,
59
+ defaultContextKvCacheValueType,
56
60
  defaultContextSwaFullCache,
57
61
  useMmap
58
62
  });
@@ -64,7 +68,7 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
64
68
  }
65
69
  throw new Error(`Invalid gpuLayers value: ${gpuLayers}`);
66
70
  }
67
- function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGpuLayers, maxGpuLayers, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }) {
71
+ function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGpuLayers, maxGpuLayers, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }) {
68
72
  return findBestOption({
69
73
  *generator() {
70
74
  const minLayers = Math.floor(Math.max(0, minGpuLayers ?? 0));
@@ -83,6 +87,8 @@ function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGp
83
87
  fitContext,
84
88
  defaultContextFlashAttention,
85
89
  defaultContextSwaFullCache,
90
+ defaultContextKvCacheKeyType,
91
+ defaultContextKvCacheValueType,
86
92
  useMmap
87
93
  });
88
94
  if (layersRequirements == null)
@@ -130,7 +136,7 @@ function scoreGpuLayersAndContextCombination({ gpuLayers, contextSize }, { total
130
136
  }
131
137
  return scoreGpuLayers() + scoreContextSize();
132
138
  }
133
- function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fitContext, defaultContextFlashAttention = false, defaultContextSwaFullCache = false, useMmap }) {
139
+ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fitContext, defaultContextFlashAttention = false, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache = false, useMmap }) {
134
140
  const modelVram = ggufInsights.estimateModelResourceRequirements({
135
141
  gpuLayers,
136
142
  useMmap
@@ -145,6 +151,8 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
145
151
  sequences: 1,
146
152
  isEmbeddingContext: fitContext.embeddingContext ?? false,
147
153
  flashAttention: defaultContextFlashAttention,
154
+ kvCacheKeyType: defaultContextKvCacheKeyType,
155
+ kvCacheValueType: defaultContextKvCacheValueType,
148
156
  swaFullCache: defaultContextSwaFullCache
149
157
  }).gpuVram;
150
158
  const totalVram = modelVram + contextVram;
@@ -162,6 +170,8 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
162
170
  vram: currentVram - modelVram,
163
171
  isEmbeddingContext: fitContext?.embeddingContext ?? false,
164
172
  flashAttention: defaultContextFlashAttention,
173
+ kvCacheKeyType: defaultContextKvCacheKeyType,
174
+ kvCacheValueType: defaultContextKvCacheValueType,
165
175
  swaFullCache: defaultContextSwaFullCache
166
176
  });
167
177
  if (maxContext == null || modelVram + maxContext.vram > currentVram)
@@ -172,7 +182,7 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
172
182
  totalVram: modelVram + maxContext.vram
173
183
  };
174
184
  }
175
- function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEmbeddingContext, flashAttention, swaFullCache }) {
185
+ function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEmbeddingContext, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache }) {
176
186
  const maxContextSize = getDefaultModelContextSize({ trainContextSize: ggufInsights.trainContextSize });
177
187
  return findMaxValidValue({
178
188
  maxValue: maxContextSize,
@@ -186,6 +196,8 @@ function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEm
186
196
  sequences: 1,
187
197
  isEmbeddingContext,
188
198
  flashAttention,
199
+ kvCacheKeyType,
200
+ kvCacheValueType,
189
201
  swaFullCache
190
202
  }).gpuVram;
191
203
  if (contextVram <= vram)
@@ -1 +1 @@
1
- {"version":3,"file":"resolveModelGpuLayersOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveModelGpuLayersOption.ts"],"names":[],"mappings":"AAEA,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,cAAc,EAAC,MAAM,kCAAkC,CAAC;AAChE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,WAAW,EAAC,MAAM,kBAAkB,CAAC;AAG7C,MAAM,sCAAsC,GAAG,GAAG,CAAC;AAEnD,MAAM,CAAC,KAAK,UAAU,2BAA2B,CAAC,SAAyC,EAAE,EACzF,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,YAAY,EAAE,oBAAoB,EAClF,QAAQ,EAAE,0BAA0B,EAAE,4BAA4B,EAAE,0BAA0B,EAAE,OAAO,EAK1G;IACG,IAAI,SAAS,IAAI,IAAI;QACjB,SAAS,GAAG,MAAM,CAAC;IAEvB,IAAI,CAAC,0BAA0B;QAC3B,OAAO,CAAC,CAAC;IAEb,IAAI,SAAS,KAAK,KAAK,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QACvD,MAAM,iBAAiB,GAAG,OAAO,SAAS,KAAK,QAAQ;YACnD,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,SAAS,CAAC,CAAC;YAC5D,CAAC,CAAC,YAAY,CAAC,WAAW,CAAC;QAE/B,IAAI,wBAAwB;YACxB,OAAO,iBAAiB,CAAC;QAE7B,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,MAAM,qBAAqB,GAAG,2BAA2B,CAAC;YACtD,SAAS,EAAE,iBAAiB;YAC5B,YAAY;YACZ,WAAW,EAAE,SAAS,CAAC,IAAI;YAC3B,4BAA4B;YAC5B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,qBAAqB,IAAI,IAAI;YAC7B,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,iBAAiB,CAAC;IAC7B,CAAC;SAAM,IAAI,SAAS,KAAK,MAAM,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QAC/D,IAAI,QAAQ,KAAK,KAAK;YAClB,OAAO,CAAC,CAAC;QAEb,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,IAAI,SAAS,CAAC,KAAK,KAAK,CAAC;YACrB,OAAO,CAAC,CAAC;QAEb,IAAI,QAAQ,GAAG,SAAS,CAAC,IAAI,CAAC;QAC9B,IAAI,OAAO,SAAS,KAAK,QAAQ,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,EAAE,CAAC;YAC7E,QAAQ,IAAI,oBAAoB,GAAG,sCAAsC,CAAC;YAE1E,IAAI,QAAQ,GAAG,CAAC;gBACZ,QAAQ,GAAG,CAAC,CAAC;QACrB,CAAC;QAED,MAAM,mBAAmB,GAAG,2BAA2B,CAAC;YACpD,YAAY;YACZ,QAAQ;YACR,UAAU,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACrC,CAAC,CAAC,SAAS,CAAC,UAAU;gBACtB,CAAC,CAAC,SAAS;YACf,YAAY,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,YAAY,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,4BAA4B;YAC5B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,MAAM,wBAAwB,GAAG,OAAO,SAAS,KAAK,QAAQ;YAC1D,CAAC,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,CAAC,CAAC;QAElG,IAAI,CAAC,wBAAwB,IAAI,mBAAmB,IAAI,IAAI,IAAI,wBAAwB;YACpF,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,mBAAmB,IAAI,CAAC,CAAC;IACpC,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,4BAA4B,SAAS,EAAE,CAAC,CAAC;AAC7D,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,YAAY,EACZ,QAAQ,EACR,UAAU,EACV,YAAY,EACZ,YAAY,EACZ,4BAA4B,EAC5B,0BAA0B,EAC1B,OAAO,EAUV;IACG,OAAO,cAAc,CAAC;QAClB,CAAC,SAAS;YACN,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,IAAI,CAAC,CAAC,CAAC,CAAC;YAC7D,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,YAAY,IAAI,YAAY,CAAC,WAAW,CAAC,CAAC,CAAC;YAE3G,KAAK,IAAI,MAAM,GAAG,SAAS,EAAE,MAAM,IAAI,SAAS,EAAE,MAAM,EAAE,EAAE,CAAC;gBACzD,MAAM;oBACF,SAAS,EAAE,MAAM;iBACpB,CAAC;YACN,CAAC;QACL,CAAC;QACD,KAAK,CAAC,MAAM;YACR,MAAM,kBAAkB,GAAG,2BAA2B,CAAC;gBACnD,SAAS,EAAE,MAAM,CAAC,SAAS;gBAC3B,YAAY;gBACZ,WAAW,EAAE,QAAQ;gBACrB,UAAU;gBACV,4BAA4B;gBAC5B,0BAA0B;gBAC1B,OAAO;aACV,CAAC,CAAC;YAEH,IAAI,kBAAkB,IAAI,IAAI;gBAC1B,OAAO,IAAI,CAAC;YAEhB,OAAO,mCAAmC,CAAC,EAAC,SAAS,EAAE,MAAM,CAAC,SAAS,EAAE,WAAW,EAAE,kBAAkB,CAAC,WAAW,EAAC,EAAE;gBACnH,cAAc,EAAE,YAAY,CAAC,WAAW;gBACxC,gBAAgB,EAAE,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC;aAClG,CAAC,CAAC;QACP,CAAC;KACJ,CAAC,EAAE,SAAS,IAAI,IAAI,CAAC;AAC1B,CAAC;AAED,SAAS,mCAAmC,CAAC,EAAC,SAAS,EAAE,WAAW,EAA2C,EAAE,EAC7G,cAAc,EAAE,gBAAgB,EAGnC;IACG,SAAS,cAAc;QACnB,OAAO,WAAW,CAAC,SAAS,EAAE,CAAC;gBAC3B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,EAAE;aACb,EAAE;gBACC,KAAK,EAAE,cAAc;gBACrB,MAAM,EAAE,EAAE;gBACV,GAAG,EAAE,cAAc;aACtB,CAAC,CAAC,CAAC;IACR,CAAC;IAED,SAAS,gBAAgB;QACrB,MAAM,mBAAmB,GAAG,SAAS,GAAG,cAAc,CAAC;QAEvD,OAAO,WAAW,CAAC,WAAW,EAAE,CAAC;gBAC7B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;aAC5C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE;aAC7C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACzC,GAAG,EAAE,IAAI,CAAC,GAAG,CAAC,gBAAgB,EAAE,KAAK,CAAC;aACzC,CAAC,CAAC,CAAC;IACR,CAAC;IAED,OAAO,cAAc,EAAE,GAAG,gBAAgB,EAAE,CAAC;AACjD,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,SAAS,EAAE,YAAY,EAAE,WAAW,EAAE,UAAU,EAAE,4BAA4B,GAAG,KAAK,EAAE,0BAA0B,GAAG,KAAK,EAAE,OAAO,EAItI;IACG,MAAM,SAAS,GAAG,YAAY,CAAC,iCAAiC,CAAC;QAC7D,SAAS;QACT,OAAO;KACV,CAAC,CAAC,OAAO,CAAC;IAEX,IAAI,SAAS,GAAG,WAAW;QACvB,OAAO,IAAI,CAAC;IAEhB,IAAI,UAAU,IAAI,IAAI,IAAI,UAAU,CAAC,WAAW,IAAI,IAAI,EAAE,CAAC;QACvD,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;YACjE,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,UAAU,CAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;YAC1F,cAAc,EAAE,SAAS;YACzB,SAAS,EAAE,CAAC;YACZ,kBAAkB,EAAE,UAAU,CAAC,gBAAgB,IAAI,KAAK;YACxD,cAAc,EAAE,4BAA4B;YAC5C,YAAY,EAAE,0BAA0B;SAC3C,CAAC,CAAC,OAAO,CAAC;QAEX,MAAM,SAAS,GAAG,SAAS,GAAG,WAAW,CAAC;QAC1C,IAAI,SAAS,GAAG,WAAW;YACvB,OAAO,IAAI,CAAC;QAEhB,OAAO;YACH,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,WAAW;YACX,SAAS;SACZ,CAAC;IACN,CAAC;IAED,MAAM,UAAU,GAAG,iCAAiC,CAAC;QACjD,SAAS;QACT,YAAY;QACZ,IAAI,EAAE,WAAW,GAAG,SAAS;QAC7B,kBAAkB,EAAE,UAAU,EAAE,gBAAgB,IAAI,KAAK;QACzD,cAAc,EAAE,4BAA4B;QAC5C,YAAY,EAAE,0BAA0B;KAC3C,CAAC,CAAC;IAEH,IAAI,UAAU,IAAI,IAAI,IAAI,SAAS,GAAG,UAAU,CAAC,IAAI,GAAG,WAAW;QAC/D,OAAO,IAAI,CAAC;IAEhB,OAAO;QACH,WAAW,EAAE,UAAU,CAAC,WAAW;QACnC,WAAW,EAAE,UAAU,CAAC,IAAI;QAC5B,SAAS,EAAE,SAAS,GAAG,UAAU,CAAC,IAAI;KACzC,CAAC;AACN,CAAC;AAED,SAAS,iCAAiC,CAAC,EAAC,SAAS,EAAE,YAAY,EAAE,IAAI,EAAE,kBAAkB,EAAE,cAAc,EAAE,YAAY,EAE1H;IACG,MAAM,cAAc,GAAG,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC,CAAC;IAErG,OAAO,iBAAiB,CAAC;QACrB,QAAQ,EAAE,cAAc;QACxB,QAAQ,EAAE,mCAAmC;QAC7C,OAAO,EAAE,CAAC;QACV,IAAI,CAAC,WAAW;YACZ,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;gBACjE,WAAW;gBACX,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;gBAClE,cAAc,EAAE,SAAS;gBACzB,SAAS,EAAE,CAAC;gBACZ,kBAAkB;gBAClB,cAAc;gBACd,YAAY;aACf,CAAC,CAAC,OAAO,CAAC;YAEX,IAAI,WAAW,IAAI,IAAI;gBACnB,OAAO;oBACH,WAAW;oBACX,IAAI,EAAE,WAAW;iBACpB,CAAC;YAEN,OAAO,IAAI,CAAC;QAChB,CAAC;KACJ,CAAC,CAAC;AACP,CAAC;AAED,SAAS,iBAAiB,CAAI,EAC1B,QAAQ,EACR,QAAQ,EACR,OAAO,GAAG,CAAC,EACX,IAAI,EAMP;IACG,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,QAAQ,GAAG,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;IACrE,IAAI,SAAS,GAAsC,IAAI,CAAC;IAExD,KAAK,IAAI,KAAK,GAAG,QAAQ,EAAE,KAAK,IAAI,QAAQ,GAAG,CAAC;QAC5C,MAAM,MAAM,GAAa,CAAC,SAAS,IAAI,IAAI,IAAI,KAAK,KAAK,SAAS,CAAC,KAAK,CAAC;YACrE,CAAC,CAAC,SAAS,CAAC,MAAM;YAClB,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAElB,IAAI,MAAM,IAAI,IAAI,EAAE,CAAC;YACjB,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,IAAI,SAAS,CAAC,KAAK,EAAE,CAAC;gBAChD,SAAS,GAAG,EAAC,KAAK,EAAE,KAAK,EAAE,MAAM,EAAE,MAAM,EAAC,CAAC;gBAE3C,IAAI,IAAI,KAAK,CAAC,OAAO;oBACjB,MAAM;qBACL,IAAI,IAAI,GAAG,CAAC;oBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;aAAM,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,GAAG,SAAS,CAAC,KAAK,EAAE,CAAC;YACtD,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC;YACxB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACzD,SAAS;QACb,CAAC;aAAM,IAAI,IAAI,GAAG,CAAC;YACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;QAEpD,IAAI,KAAK,KAAK,QAAQ,IAAI,IAAI,KAAK,CAAC,OAAO;YACvC,MAAM;QAEV,KAAK,IAAI,IAAI,CAAC;QACd,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YACnB,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC7D,CAAC;aAAM,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YAC1B,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC9D,CAAC;IACL,CAAC;IAED,IAAI,SAAS,IAAI,IAAI;QACjB,OAAO,SAAS,CAAC,MAAM,CAAC;IAE5B,OAAO,IAAI,CAAC;AAChB,CAAC"}
1
+ {"version":3,"file":"resolveModelGpuLayersOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveModelGpuLayersOption.ts"],"names":[],"mappings":"AAEA,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,cAAc,EAAC,MAAM,kCAAkC,CAAC;AAChE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,WAAW,EAAC,MAAM,kBAAkB,CAAC;AAI7C,MAAM,sCAAsC,GAAG,GAAG,CAAC;AAEnD,MAAM,CAAC,KAAK,UAAU,2BAA2B,CAAC,SAAyC,EAAE,EACzF,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,YAAY,EAAE,oBAAoB,EAClF,QAAQ,EAAE,0BAA0B,EAAE,4BAA4B,EAClE,4BAA4B,EAAE,8BAA8B,EAAE,0BAA0B,EAAE,OAAO,EAOpG;IACG,IAAI,SAAS,IAAI,IAAI;QACjB,SAAS,GAAG,MAAM,CAAC;IAEvB,IAAI,CAAC,0BAA0B;QAC3B,OAAO,CAAC,CAAC;IAEb,IAAI,SAAS,KAAK,KAAK,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QACvD,MAAM,iBAAiB,GAAG,OAAO,SAAS,KAAK,QAAQ;YACnD,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,SAAS,CAAC,CAAC;YAC5D,CAAC,CAAC,YAAY,CAAC,WAAW,CAAC;QAE/B,IAAI,wBAAwB;YACxB,OAAO,iBAAiB,CAAC;QAE7B,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,MAAM,qBAAqB,GAAG,2BAA2B,CAAC;YACtD,SAAS,EAAE,iBAAiB;YAC5B,YAAY;YACZ,WAAW,EAAE,SAAS,CAAC,IAAI;YAC3B,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,qBAAqB,IAAI,IAAI;YAC7B,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,iBAAiB,CAAC;IAC7B,CAAC;SAAM,IAAI,SAAS,KAAK,MAAM,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QAC/D,IAAI,QAAQ,KAAK,KAAK;YAClB,OAAO,CAAC,CAAC;QAEb,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,IAAI,SAAS,CAAC,KAAK,KAAK,CAAC;YACrB,OAAO,CAAC,CAAC;QAEb,IAAI,QAAQ,GAAG,SAAS,CAAC,IAAI,CAAC;QAC9B,IAAI,OAAO,SAAS,KAAK,QAAQ,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,EAAE,CAAC;YAC7E,QAAQ,IAAI,oBAAoB,GAAG,sCAAsC,CAAC;YAE1E,IAAI,QAAQ,GAAG,CAAC;gBACZ,QAAQ,GAAG,CAAC,CAAC;QACrB,CAAC;QAED,MAAM,mBAAmB,GAAG,2BAA2B,CAAC;YACpD,YAAY;YACZ,QAAQ;YACR,UAAU,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACrC,CAAC,CAAC,SAAS,CAAC,UAAU;gBACtB,CAAC,CAAC,SAAS;YACf,YAAY,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,YAAY,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,MAAM,wBAAwB,GAAG,OAAO,SAAS,KAAK,QAAQ;YAC1D,CAAC,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,CAAC,CAAC;QAElG,IAAI,CAAC,wBAAwB,IAAI,mBAAmB,IAAI,IAAI,IAAI,wBAAwB;YACpF,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,mBAAmB,IAAI,CAAC,CAAC;IACpC,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,4BAA4B,SAAS,EAAE,CAAC,CAAC;AAC7D,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,YAAY,EACZ,QAAQ,EACR,UAAU,EACV,YAAY,EACZ,YAAY,EACZ,4BAA4B,EAC5B,4BAA4B,EAC5B,8BAA8B,EAC9B,0BAA0B,EAC1B,OAAO,EAYV;IACG,OAAO,cAAc,CAAC;QAClB,CAAC,SAAS;YACN,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,IAAI,CAAC,CAAC,CAAC,CAAC;YAC7D,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,YAAY,IAAI,YAAY,CAAC,WAAW,CAAC,CAAC,CAAC;YAE3G,KAAK,IAAI,MAAM,GAAG,SAAS,EAAE,MAAM,IAAI,SAAS,EAAE,MAAM,EAAE,EAAE,CAAC;gBACzD,MAAM;oBACF,SAAS,EAAE,MAAM;iBACpB,CAAC;YACN,CAAC;QACL,CAAC;QACD,KAAK,CAAC,MAAM;YACR,MAAM,kBAAkB,GAAG,2BAA2B,CAAC;gBACnD,SAAS,EAAE,MAAM,CAAC,SAAS;gBAC3B,YAAY;gBACZ,WAAW,EAAE,QAAQ;gBACrB,UAAU;gBACV,4BAA4B;gBAC5B,0BAA0B;gBAC1B,4BAA4B;gBAC5B,8BAA8B;gBAC9B,OAAO;aACV,CAAC,CAAC;YAEH,IAAI,kBAAkB,IAAI,IAAI;gBAC1B,OAAO,IAAI,CAAC;YAEhB,OAAO,mCAAmC,CAAC,EAAC,SAAS,EAAE,MAAM,CAAC,SAAS,EAAE,WAAW,EAAE,kBAAkB,CAAC,WAAW,EAAC,EAAE;gBACnH,cAAc,EAAE,YAAY,CAAC,WAAW;gBACxC,gBAAgB,EAAE,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC;aAClG,CAAC,CAAC;QACP,CAAC;KACJ,CAAC,EAAE,SAAS,IAAI,IAAI,CAAC;AAC1B,CAAC;AAED,SAAS,mCAAmC,CAAC,EAAC,SAAS,EAAE,WAAW,EAA2C,EAAE,EAC7G,cAAc,EAAE,gBAAgB,EAGnC;IACG,SAAS,cAAc;QACnB,OAAO,WAAW,CAAC,SAAS,EAAE,CAAC;gBAC3B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,EAAE;aACb,EAAE;gBACC,KAAK,EAAE,cAAc;gBACrB,MAAM,EAAE,EAAE;gBACV,GAAG,EAAE,cAAc;aACtB,CAAC,CAAC,CAAC;IACR,CAAC;IAED,SAAS,gBAAgB;QACrB,MAAM,mBAAmB,GAAG,SAAS,GAAG,cAAc,CAAC;QAEvD,OAAO,WAAW,CAAC,WAAW,EAAE,CAAC;gBAC7B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;aAC5C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE;aAC7C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACzC,GAAG,EAAE,IAAI,CAAC,GAAG,CAAC,gBAAgB,EAAE,KAAK,CAAC;aACzC,CAAC,CAAC,CAAC;IACR,CAAC;IAED,OAAO,cAAc,EAAE,GAAG,gBAAgB,EAAE,CAAC;AACjD,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,SAAS,EAAE,YAAY,EAAE,WAAW,EAAE,UAAU,EAAE,4BAA4B,GAAG,KAAK,EACtF,4BAA4B,EAAE,8BAA8B,EAAE,0BAA0B,GAAG,KAAK,EAAE,OAAO,EAK5G;IACG,MAAM,SAAS,GAAG,YAAY,CAAC,iCAAiC,CAAC;QAC7D,SAAS;QACT,OAAO;KACV,CAAC,CAAC,OAAO,CAAC;IAEX,IAAI,SAAS,GAAG,WAAW;QACvB,OAAO,IAAI,CAAC;IAEhB,IAAI,UAAU,IAAI,IAAI,IAAI,UAAU,CAAC,WAAW,IAAI,IAAI,EAAE,CAAC;QACvD,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;YACjE,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,UAAU,CAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;YAC1F,cAAc,EAAE,SAAS;YACzB,SAAS,EAAE,CAAC;YACZ,kBAAkB,EAAE,UAAU,CAAC,gBAAgB,IAAI,KAAK;YACxD,cAAc,EAAE,4BAA4B;YAC5C,cAAc,EAAE,4BAA4B;YAC5C,gBAAgB,EAAE,8BAA8B;YAChD,YAAY,EAAE,0BAA0B;SAC3C,CAAC,CAAC,OAAO,CAAC;QAEX,MAAM,SAAS,GAAG,SAAS,GAAG,WAAW,CAAC;QAC1C,IAAI,SAAS,GAAG,WAAW;YACvB,OAAO,IAAI,CAAC;QAEhB,OAAO;YACH,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,WAAW;YACX,SAAS;SACZ,CAAC;IACN,CAAC;IAED,MAAM,UAAU,GAAG,iCAAiC,CAAC;QACjD,SAAS;QACT,YAAY;QACZ,IAAI,EAAE,WAAW,GAAG,SAAS;QAC7B,kBAAkB,EAAE,UAAU,EAAE,gBAAgB,IAAI,KAAK;QACzD,cAAc,EAAE,4BAA4B;QAC5C,cAAc,EAAE,4BAA4B;QAC5C,gBAAgB,EAAE,8BAA8B;QAChD,YAAY,EAAE,0BAA0B;KAC3C,CAAC,CAAC;IAEH,IAAI,UAAU,IAAI,IAAI,IAAI,SAAS,GAAG,UAAU,CAAC,IAAI,GAAG,WAAW;QAC/D,OAAO,IAAI,CAAC;IAEhB,OAAO;QACH,WAAW,EAAE,UAAU,CAAC,WAAW;QACnC,WAAW,EAAE,UAAU,CAAC,IAAI;QAC5B,SAAS,EAAE,SAAS,GAAG,UAAU,CAAC,IAAI;KACzC,CAAC;AACN,CAAC;AAED,SAAS,iCAAiC,CAAC,EACvC,SAAS,EAAE,YAAY,EAAE,IAAI,EAAE,kBAAkB,EAAE,cAAc,EAAE,cAAc,EAAE,gBAAgB,EAAE,YAAY,EAIpH;IACG,MAAM,cAAc,GAAG,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC,CAAC;IAErG,OAAO,iBAAiB,CAAC;QACrB,QAAQ,EAAE,cAAc;QACxB,QAAQ,EAAE,mCAAmC;QAC7C,OAAO,EAAE,CAAC;QACV,IAAI,CAAC,WAAW;YACZ,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;gBACjE,WAAW;gBACX,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;gBAClE,cAAc,EAAE,SAAS;gBACzB,SAAS,EAAE,CAAC;gBACZ,kBAAkB;gBAClB,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;aACf,CAAC,CAAC,OAAO,CAAC;YAEX,IAAI,WAAW,IAAI,IAAI;gBACnB,OAAO;oBACH,WAAW;oBACX,IAAI,EAAE,WAAW;iBACpB,CAAC;YAEN,OAAO,IAAI,CAAC;QAChB,CAAC;KACJ,CAAC,CAAC;AACP,CAAC;AAED,SAAS,iBAAiB,CAAI,EAC1B,QAAQ,EACR,QAAQ,EACR,OAAO,GAAG,CAAC,EACX,IAAI,EAMP;IACG,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,QAAQ,GAAG,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;IACrE,IAAI,SAAS,GAAsC,IAAI,CAAC;IAExD,KAAK,IAAI,KAAK,GAAG,QAAQ,EAAE,KAAK,IAAI,QAAQ,GAAG,CAAC;QAC5C,MAAM,MAAM,GAAa,CAAC,SAAS,IAAI,IAAI,IAAI,KAAK,KAAK,SAAS,CAAC,KAAK,CAAC;YACrE,CAAC,CAAC,SAAS,CAAC,MAAM;YAClB,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAElB,IAAI,MAAM,IAAI,IAAI,EAAE,CAAC;YACjB,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,IAAI,SAAS,CAAC,KAAK,EAAE,CAAC;gBAChD,SAAS,GAAG,EAAC,KAAK,EAAE,KAAK,EAAE,MAAM,EAAE,MAAM,EAAC,CAAC;gBAE3C,IAAI,IAAI,KAAK,CAAC,OAAO;oBACjB,MAAM;qBACL,IAAI,IAAI,GAAG,CAAC;oBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;aAAM,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,GAAG,SAAS,CAAC,KAAK,EAAE,CAAC;YACtD,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC;YACxB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACzD,SAAS;QACb,CAAC;aAAM,IAAI,IAAI,GAAG,CAAC;YACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;QAEpD,IAAI,KAAK,KAAK,QAAQ,IAAI,IAAI,KAAK,CAAC,OAAO;YACvC,MAAM;QAEV,KAAK,IAAI,IAAI,CAAC;QACd,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YACnB,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC7D,CAAC;aAAM,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YAC1B,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC9D,CAAC;IACL,CAAC;IAED,IAAI,SAAS,IAAI,IAAI;QACjB,OAAO,SAAS,CAAC,MAAM,CAAC;IAE5B,OAAO,IAAI,CAAC;AAChB,CAAC"}
@@ -18,6 +18,7 @@ export declare const enum GgufArchitectureType {
18
18
  neoBert = "neo-bert",
19
19
  jinaBertV2 = "jina-bert-v2",
20
20
  jinaBertV3 = "jina-bert-v3",
21
+ eurobert = "eurobert",
21
22
  bloom = "bloom",
22
23
  stablelm = "stablelm",
23
24
  qwen = "qwen",
@@ -71,6 +72,7 @@ export declare const enum GgufArchitectureType {
71
72
  t5 = "t5",
72
73
  t5encoder = "t5encoder",
73
74
  jais = "jais",
75
+ jais2 = "jais2",
74
76
  nemotron = "nemotron",
75
77
  nemotronH = "nemotron_h",
76
78
  nemotronHMoe = "nemotron_h_moe",
@@ -112,10 +114,13 @@ export declare const enum GgufArchitectureType {
112
114
  rnd1 = "rnd1",
113
115
  panguEmbedded = "pangu-embedded",
114
116
  mistral3 = "mistral3",
117
+ mistral4 = "mistral4",
118
+ paddleocr = "paddleocr",
115
119
  mimo2 = "mimo2",
116
120
  step35 = "step35",
117
121
  llamaEmbed = "llama-embed",
118
122
  maincoder = "maincoder",
123
+ kimiLinear = "kimi-linear",
119
124
  clip = "clip",
120
125
  unknown = "(unknown)"
121
126
  }
@@ -176,7 +181,8 @@ export declare enum GgufFileType {
176
181
  MOSTLY_Q4_0_8_8 = 35,// deprecated
177
182
  MOSTLY_TQ1_0 = 36,
178
183
  MOSTLY_TQ2_0 = 37,
179
- MOSTLY_MXFP4_MOE = 38
184
+ MOSTLY_MXFP4_MOE = 38,
185
+ MOSTLY_NVFP4 = 39
180
186
  }
181
187
  export type GgufMetadataGeneral<A extends GgufArchitectureType = GgufArchitectureType> = {
182
188
  readonly architecture: A;
@@ -268,7 +274,7 @@ export declare const enum GgufMetadataTokenizerTokenType {
268
274
  export type GgufMetadataTokenizer = {
269
275
  readonly ggml: {
270
276
  readonly model: "no_vocab" | "none" | "llama" | "gpt2" | "bert" | "rwkv" | "t5" | "plamo2" | string;
271
- readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" | "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" | "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" | "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" | "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | "a.x-4.0" | "mellum" | string;
277
+ readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" | "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" | "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" | "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" | "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | "a.x-4.0" | "mellum" | "modern-bert" | "roberta-bpe" | "deepseek-r1-qwen" | "kormo" | "qwen35" | string;
272
278
  readonly tokens: readonly string[];
273
279
  readonly token_type: GgufMetadataTokenizerTokenType[];
274
280
  readonly token_type_count?: number;
@@ -319,6 +325,7 @@ export type GgufMetadataDefaultArchitectureType = {
319
325
  readonly context_length?: number;
320
326
  readonly embedding_length?: number;
321
327
  readonly block_count?: number;
328
+ readonly full_attention_interval?: number;
322
329
  readonly feed_forward_length?: number;
323
330
  readonly use_parallel_residual?: boolean;
324
331
  readonly tensor_data_layout?: string;
@@ -337,11 +344,13 @@ export type GgufMetadataDefaultArchitectureType = {
337
344
  readonly key_length?: number;
338
345
  readonly value_length?: number;
339
346
  readonly sliding_window?: number;
347
+ readonly sliding_window_pattern?: number | number[];
340
348
  readonly causal?: boolean;
341
349
  };
342
350
  readonly rope?: {
343
351
  readonly dimension_count?: number;
344
352
  readonly freq_base?: number;
353
+ readonly freq_base_swa?: number;
345
354
  readonly scale_linear?: number;
346
355
  readonly scaling?: {
347
356
  readonly type?: "none" | "linear" | "yarn" | string;
@@ -355,6 +364,13 @@ export type GgufMetadataDefaultArchitectureType = {
355
364
  readonly inner_size?: number;
356
365
  readonly state_size?: number;
357
366
  readonly time_step_rank?: number;
367
+ readonly group_count?: number;
368
+ };
369
+ readonly kda?: {
370
+ readonly head_dim?: number;
371
+ };
372
+ readonly shortconv?: {
373
+ readonly l_cache?: number;
358
374
  };
359
375
  readonly wkv?: {
360
376
  readonly head_size?: number;
@@ -19,6 +19,7 @@ export var GgufArchitectureType;
19
19
  GgufArchitectureType["neoBert"] = "neo-bert";
20
20
  GgufArchitectureType["jinaBertV2"] = "jina-bert-v2";
21
21
  GgufArchitectureType["jinaBertV3"] = "jina-bert-v3";
22
+ GgufArchitectureType["eurobert"] = "eurobert";
22
23
  GgufArchitectureType["bloom"] = "bloom";
23
24
  GgufArchitectureType["stablelm"] = "stablelm";
24
25
  GgufArchitectureType["qwen"] = "qwen";
@@ -72,6 +73,7 @@ export var GgufArchitectureType;
72
73
  GgufArchitectureType["t5"] = "t5";
73
74
  GgufArchitectureType["t5encoder"] = "t5encoder";
74
75
  GgufArchitectureType["jais"] = "jais";
76
+ GgufArchitectureType["jais2"] = "jais2";
75
77
  GgufArchitectureType["nemotron"] = "nemotron";
76
78
  GgufArchitectureType["nemotronH"] = "nemotron_h";
77
79
  GgufArchitectureType["nemotronHMoe"] = "nemotron_h_moe";
@@ -113,10 +115,13 @@ export var GgufArchitectureType;
113
115
  GgufArchitectureType["rnd1"] = "rnd1";
114
116
  GgufArchitectureType["panguEmbedded"] = "pangu-embedded";
115
117
  GgufArchitectureType["mistral3"] = "mistral3";
118
+ GgufArchitectureType["mistral4"] = "mistral4";
119
+ GgufArchitectureType["paddleocr"] = "paddleocr";
116
120
  GgufArchitectureType["mimo2"] = "mimo2";
117
121
  GgufArchitectureType["step35"] = "step35";
118
122
  GgufArchitectureType["llamaEmbed"] = "llama-embed";
119
123
  GgufArchitectureType["maincoder"] = "maincoder";
124
+ GgufArchitectureType["kimiLinear"] = "kimi-linear";
120
125
  GgufArchitectureType["clip"] = "clip";
121
126
  GgufArchitectureType["unknown"] = "(unknown)";
122
127
  })(GgufArchitectureType || (GgufArchitectureType = {}));
@@ -162,6 +167,7 @@ export var GgufFileType;
162
167
  GgufFileType[GgufFileType["MOSTLY_TQ1_0"] = 36] = "MOSTLY_TQ1_0";
163
168
  GgufFileType[GgufFileType["MOSTLY_TQ2_0"] = 37] = "MOSTLY_TQ2_0";
164
169
  GgufFileType[GgufFileType["MOSTLY_MXFP4_MOE"] = 38] = "MOSTLY_MXFP4_MOE";
170
+ GgufFileType[GgufFileType["MOSTLY_NVFP4"] = 39] = "MOSTLY_NVFP4";
165
171
  })(GgufFileType || (GgufFileType = {}));
166
172
  export var GgufMetadataTokenizerTokenType;
167
173
  (function (GgufMetadataTokenizerTokenType) {
@@ -1 +1 @@
1
- {"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,oBAwHjB;AAxHD,WAAkB,oBAAoB;IAClC,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,mCAAW,CAAA;IACX,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,kDAA0B,CAAA;IAC1B,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,4CAAoB,CAAA;IACpB,mDAA2B,CAAA;IAC3B,mDAA2B,CAAA;IAC3B,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,0DAAkC,CAAA;IAClC,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,yCAAiB,CAAA;IACjB,8CAAsB,CAAA;IACtB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,2CAAmB,CAAA;IACnB,yCAAiB,CAAA;IACjB,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,yCAAiB,CAAA;IACjB,iCAAS,CAAA;IACT,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,6CAAqB,CAAA;IACrB,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,uCAAe,CAAA;IACf,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,uDAA+B,CAAA;IAC/B,+CAAuB,CAAA;IACvB,4DAAoC,CAAA;IACpC,mCAAW,CAAA;IACX,iDAAyB,CAAA;IACzB,mDAA2B,CAAA;IAC3B,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,oDAA4B,CAAA;IAC5B,kDAA0B,CAAA;IAC1B,sDAA8B,CAAA;IAC9B,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,qDAA6B,CAAA;IAC7B,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,4CAAoB,CAAA;IACpB,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,wDAAgC,CAAA;IAChC,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,kDAA0B,CAAA;IAC1B,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,6CAAqB,CAAA;AACzB,CAAC,EAxHiB,oBAAoB,KAApB,oBAAoB,QAwHrC;AA+BD,yEAAyE;AACzE,MAAM,CAAN,IAAY,YAwCX;AAxCD,WAAY,YAAY;IACpB,qDAAW,CAAA;IACX,2DAAc,CAAA;IACd,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,+EAAwB,CAAA;IACxB,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,8DAAgB,CAAA;IAChB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,8DAAgB,CAAA;IAChB,oEAAmB,CAAA;IACnB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,oEAAmB,CAAA;IACnB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,8DAAgB,CAAA;IAChB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,wEAAqB,CAAA;AACzB,CAAC,EAxCW,YAAY,KAAZ,YAAY,QAwCvB;AA2FD,MAAM,CAAN,IAAkB,8BAQjB;AARD,WAAkB,8BAA8B;IAC5C,6FAAa,CAAA;IACb,uFAAU,CAAA;IACV,yFAAW,CAAA;IACX,yFAAW,CAAA;IACX,iGAAe,CAAA;IACf,uFAAU,CAAA;IACV,mFAAQ,CAAA;AACZ,CAAC,EARiB,8BAA8B,KAA9B,8BAA8B,QAQ/C;AAiDD,MAAM,CAAN,IAAkB,mCAOjB;AAPD,WAAkB,mCAAmC;IACjD,4GAAgB,CAAA;IAChB,6FAAQ,CAAA;IACR,6FAAQ,CAAA;IACR,2FAAO,CAAA;IACP,6FAAQ,CAAA;IACR,6FAAQ,CAAA;AACZ,CAAC,EAPiB,mCAAmC,KAAnC,mCAAmC,QAOpD;AAoND,MAAM,UAAU,gCAAgC,CAC5C,QAAsB,EAAE,IAAO;IAE/B,OAAO,QAAQ,EAAE,OAAO,EAAE,YAAY,KAAK,IAAI,CAAC;AACpD,CAAC"}
1
+ {"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,oBA6HjB;AA7HD,WAAkB,oBAAoB;IAClC,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,mCAAW,CAAA;IACX,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,kDAA0B,CAAA;IAC1B,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,4CAAoB,CAAA;IACpB,mDAA2B,CAAA;IAC3B,mDAA2B,CAAA;IAC3B,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,0DAAkC,CAAA;IAClC,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,yCAAiB,CAAA;IACjB,8CAAsB,CAAA;IACtB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,2CAAmB,CAAA;IACnB,yCAAiB,CAAA;IACjB,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,yCAAiB,CAAA;IACjB,iCAAS,CAAA;IACT,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,uCAAe,CAAA;IACf,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,uDAA+B,CAAA;IAC/B,+CAAuB,CAAA;IACvB,4DAAoC,CAAA;IACpC,mCAAW,CAAA;IACX,iDAAyB,CAAA;IACzB,mDAA2B,CAAA;IAC3B,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,oDAA4B,CAAA;IAC5B,kDAA0B,CAAA;IAC1B,sDAA8B,CAAA;IAC9B,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,qDAA6B,CAAA;IAC7B,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,4CAAoB,CAAA;IACpB,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,wDAAgC,CAAA;IAChC,6CAAqB,CAAA;IACrB,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,kDAA0B,CAAA;IAC1B,+CAAuB,CAAA;IACvB,kDAA0B,CAAA;IAC1B,qCAAa,CAAA;IACb,6CAAqB,CAAA;AACzB,CAAC,EA7HiB,oBAAoB,KAApB,oBAAoB,QA6HrC;AA+BD,yEAAyE;AACzE,MAAM,CAAN,IAAY,YAyCX;AAzCD,WAAY,YAAY;IACpB,qDAAW,CAAA;IACX,2DAAc,CAAA;IACd,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,+EAAwB,CAAA;IACxB,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,8DAAgB,CAAA;IAChB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,8DAAgB,CAAA;IAChB,oEAAmB,CAAA;IACnB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,oEAAmB,CAAA;IACnB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,8DAAgB,CAAA;IAChB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,wEAAqB,CAAA;IACrB,gEAAiB,CAAA;AACrB,CAAC,EAzCW,YAAY,KAAZ,YAAY,QAyCvB;AA2FD,MAAM,CAAN,IAAkB,8BAQjB;AARD,WAAkB,8BAA8B;IAC5C,6FAAa,CAAA;IACb,uFAAU,CAAA;IACV,yFAAW,CAAA;IACX,yFAAW,CAAA;IACX,iGAAe,CAAA;IACf,uFAAU,CAAA;IACV,mFAAQ,CAAA;AACZ,CAAC,EARiB,8BAA8B,KAA9B,8BAA8B,QAQ/C;AAkDD,MAAM,CAAN,IAAkB,mCAOjB;AAPD,WAAkB,mCAAmC;IACjD,4GAAgB,CAAA;IAChB,6FAAQ,CAAA;IACR,6FAAQ,CAAA;IACR,2FAAO,CAAA;IACP,6FAAQ,CAAA;IACR,6FAAQ,CAAA;AACZ,CAAC,EAPiB,mCAAmC,KAAnC,mCAAmC,QAOpD;AAgOD,MAAM,UAAU,gCAAgC,CAC5C,QAAsB,EAAE,IAAO;IAE/B,OAAO,QAAQ,EAAE,OAAO,EAAE,YAAY,KAAK,IAAI,CAAC;AACpD,CAAC"}
@@ -17,7 +17,7 @@ export type GgufTensorInfo = {
17
17
  */
18
18
  readonly filePart: number;
19
19
  };
20
- export declare const enum GgmlType {
20
+ export declare enum GgmlType {
21
21
  F32 = 0,
22
22
  F16 = 1,
23
23
  Q4_0 = 2,
@@ -57,5 +57,7 @@ export declare const enum GgmlType {
57
57
  IQ4_NL_4_4 = 36,
58
58
  IQ4_NL_4_8 = 37,
59
59
  IQ4_NL_8_8 = 38,
60
- MXFP4 = 39
60
+ MXFP4 = 39,// MXFP4 (1 block)
61
+ NVFP4 = 40
61
62
  }
63
+ export declare function resolveGgmlTypeOption(option?: keyof typeof GgmlType | GgmlType): GgmlType | undefined;
@@ -39,6 +39,16 @@ export var GgmlType;
39
39
  GgmlType[GgmlType["IQ4_NL_4_4"] = 36] = "IQ4_NL_4_4";
40
40
  GgmlType[GgmlType["IQ4_NL_4_8"] = 37] = "IQ4_NL_4_8";
41
41
  GgmlType[GgmlType["IQ4_NL_8_8"] = 38] = "IQ4_NL_8_8";
42
- GgmlType[GgmlType["MXFP4"] = 39] = "MXFP4"; // MXFP4 (1 block)
42
+ GgmlType[GgmlType["MXFP4"] = 39] = "MXFP4";
43
+ GgmlType[GgmlType["NVFP4"] = 40] = "NVFP4"; // NVFP4 (4 blocks, E4M3 scale)
43
44
  })(GgmlType || (GgmlType = {}));
45
+ export function resolveGgmlTypeOption(option) {
46
+ if (option == null)
47
+ return undefined;
48
+ if (typeof option === "number" && Object.hasOwn(GgmlType, option))
49
+ return option;
50
+ else if (typeof option === "string" && Object.hasOwn(GgmlType, option))
51
+ return GgmlType[option];
52
+ return undefined;
53
+ }
44
54
  //# sourceMappingURL=GgufTensorInfoTypes.js.map
@@ -1 +1 @@
1
- {"version":3,"file":"GgufTensorInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufTensorInfoTypes.ts"],"names":[],"mappings":"AAsBA,MAAM,CAAN,IAAkB,QAyCjB;AAzCD,WAAkB,QAAQ;IACtB,qCAAO,CAAA;IACP,qCAAO,CAAA;IACP,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,8CAAY,CAAA;IACZ,4CAAW,CAAA;IACX,8CAAY,CAAA;IACZ,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,oCAAO,CAAA;IACP,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,0CAAU,CAAA;IACV,wCAAS,CAAA;IACT,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,0CAAU,CAAA,CAAC,kBAAkB;AACjC,CAAC,EAzCiB,QAAQ,KAAR,QAAQ,QAyCzB"}
1
+ {"version":3,"file":"GgufTensorInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufTensorInfoTypes.ts"],"names":[],"mappings":"AAsBA,MAAM,CAAN,IAAY,QA0CX;AA1CD,WAAY,QAAQ;IAChB,qCAAO,CAAA;IACP,qCAAO,CAAA;IACP,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,8CAAY,CAAA;IACZ,4CAAW,CAAA;IACX,8CAAY,CAAA;IACZ,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,oCAAO,CAAA;IACP,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,0CAAU,CAAA;IACV,wCAAS,CAAA;IACT,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,0CAAU,CAAA;IACV,0CAAU,CAAA,CAAC,+BAA+B;AAC9C,CAAC,EA1CW,QAAQ,KAAR,QAAQ,QA0CnB;AAED,MAAM,UAAU,qBAAqB,CAAC,MAAyC;IAC3E,IAAI,MAAM,IAAI,IAAI;QACd,OAAO,SAAS,CAAC;IAErB,IAAI,OAAO,MAAM,KAAK,QAAQ,IAAI,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC;QAC7D,OAAO,MAAkB,CAAC;SACzB,IAAI,OAAO,MAAM,KAAK,QAAQ,IAAI,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC;QAClE,OAAO,QAAQ,CAAC,MAA+B,CAAC,CAAC;IAErD,OAAO,SAAS,CAAC;AACrB,CAAC"}
@@ -1,4 +1,4 @@
1
1
  /**
2
2
  * Convert a GGUF file type number to its corresponding type name
3
3
  */
4
- export declare function getGgufFileTypeName(fileType?: number): "ALL_F32" | "MOSTLY_F16" | "MOSTLY_Q4_0" | "MOSTLY_Q4_1" | "MOSTLY_Q4_1_SOME_F16" | "MOSTLY_Q4_2" | "MOSTLY_Q4_3" | "MOSTLY_Q8_0" | "MOSTLY_Q5_0" | "MOSTLY_Q5_1" | "MOSTLY_Q2_K" | "MOSTLY_Q3_K_S" | "MOSTLY_Q3_K_M" | "MOSTLY_Q3_K_L" | "MOSTLY_Q4_K_S" | "MOSTLY_Q4_K_M" | "MOSTLY_Q5_K_S" | "MOSTLY_Q5_K_M" | "MOSTLY_Q6_K" | "MOSTLY_IQ2_XXS" | "MOSTLY_IQ2_XS" | "MOSTLY_Q2_K_S" | "MOSTLY_IQ3_XS" | "MOSTLY_IQ3_XXS" | "MOSTLY_IQ1_S" | "MOSTLY_IQ4_NL" | "MOSTLY_IQ3_S" | "MOSTLY_IQ3_M" | "MOSTLY_IQ2_S" | "MOSTLY_IQ2_M" | "MOSTLY_IQ4_XS" | "MOSTLY_IQ1_M" | "MOSTLY_BF16" | "MOSTLY_Q4_0_4_4" | "MOSTLY_Q4_0_4_8" | "MOSTLY_Q4_0_8_8" | "MOSTLY_TQ1_0" | "MOSTLY_TQ2_0" | "MOSTLY_MXFP4_MOE" | undefined;
4
+ export declare function getGgufFileTypeName(fileType?: number): "ALL_F32" | "MOSTLY_F16" | "MOSTLY_Q4_0" | "MOSTLY_Q4_1" | "MOSTLY_Q4_1_SOME_F16" | "MOSTLY_Q4_2" | "MOSTLY_Q4_3" | "MOSTLY_Q8_0" | "MOSTLY_Q5_0" | "MOSTLY_Q5_1" | "MOSTLY_Q2_K" | "MOSTLY_Q3_K_S" | "MOSTLY_Q3_K_M" | "MOSTLY_Q3_K_L" | "MOSTLY_Q4_K_S" | "MOSTLY_Q4_K_M" | "MOSTLY_Q5_K_S" | "MOSTLY_Q5_K_M" | "MOSTLY_Q6_K" | "MOSTLY_IQ2_XXS" | "MOSTLY_IQ2_XS" | "MOSTLY_Q2_K_S" | "MOSTLY_IQ3_XS" | "MOSTLY_IQ3_XXS" | "MOSTLY_IQ1_S" | "MOSTLY_IQ4_NL" | "MOSTLY_IQ3_S" | "MOSTLY_IQ3_M" | "MOSTLY_IQ2_S" | "MOSTLY_IQ2_M" | "MOSTLY_IQ4_XS" | "MOSTLY_IQ1_M" | "MOSTLY_BF16" | "MOSTLY_Q4_0_4_4" | "MOSTLY_Q4_0_4_8" | "MOSTLY_Q4_0_8_8" | "MOSTLY_TQ1_0" | "MOSTLY_TQ2_0" | "MOSTLY_MXFP4_MOE" | "MOSTLY_NVFP4" | undefined;
@@ -3,6 +3,7 @@ export const ggufQuantNames = new Map([
3
3
  ["Q4_0", GgufFileType.MOSTLY_Q4_0],
4
4
  ["Q4_1", GgufFileType.MOSTLY_Q4_1],
5
5
  ["MXFP4", GgufFileType.MOSTLY_MXFP4_MOE],
6
+ ["NVFP4", GgufFileType.MOSTLY_MXFP4_MOE],
6
7
  ["Q5_0", GgufFileType.MOSTLY_Q5_0],
7
8
  ["Q5_1", GgufFileType.MOSTLY_Q5_1],
8
9
  ["IQ2_XXS", GgufFileType.MOSTLY_IQ2_XXS],
@@ -1 +1 @@
1
- {"version":3,"file":"ggufQuantNames.js","sourceRoot":"","sources":["../../../src/gguf/utils/ggufQuantNames.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,YAAY,EAAC,MAAM,+BAA+B,CAAC;AAE3D,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,GAAG,CAAuB;IACxD,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,UAAU,CAAC;IAChC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,OAAO,CAAC;IAC7B,CAAC,MAAM,EAAE,YAAY,CAAC,OAAO,CAAC;CACjC,CAAC,CAAC"}
1
+ {"version":3,"file":"ggufQuantNames.js","sourceRoot":"","sources":["../../../src/gguf/utils/ggufQuantNames.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,YAAY,EAAC,MAAM,+BAA+B,CAAC;AAE3D,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,GAAG,CAAuB;IACxD,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,UAAU,CAAC;IAChC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,OAAO,CAAC;IAC7B,CAAC,MAAM,EAAE,YAAY,CAAC,OAAO,CAAC;CACjC,CAAC,CAAC"}