node-llama-cpp 3.17.1 → 3.18.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/bindings/AddonTypes.d.ts +13 -0
- package/dist/bindings/Llama.js +20 -2
- package/dist/bindings/Llama.js.map +1 -1
- package/dist/bindings/getLlama.d.ts +1 -1
- package/dist/bindings/getLlama.js +19 -8
- package/dist/bindings/getLlama.js.map +1 -1
- package/dist/bindings/utils/compileLLamaCpp.d.ts +2 -1
- package/dist/bindings/utils/compileLLamaCpp.js +8 -0
- package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
- package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +1 -1
- package/dist/bindings/utils/getLlamaGpuTypes.js +2 -0
- package/dist/bindings/utils/getLlamaGpuTypes.js.map +1 -1
- package/dist/chatWrappers/QwenChatWrapper.d.ts +7 -0
- package/dist/chatWrappers/QwenChatWrapper.js +176 -56
- package/dist/chatWrappers/QwenChatWrapper.js.map +1 -1
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +127 -88
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -1
- package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.d.ts +16 -10
- package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.js +115 -5
- package/dist/chatWrappers/generic/utils/extractFunctionCallSettingsFromJinjaTemplate.js.map +1 -1
- package/dist/chatWrappers/generic/utils/extractSegmentSettingsFromTokenizerAndChatTemplate.js +1 -0
- package/dist/chatWrappers/generic/utils/extractSegmentSettingsFromTokenizerAndChatTemplate.js.map +1 -1
- package/dist/cli/commands/ChatCommand.d.ts +3 -0
- package/dist/cli/commands/ChatCommand.js +34 -5
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/cli/commands/CompleteCommand.d.ts +3 -0
- package/dist/cli/commands/CompleteCommand.js +34 -4
- package/dist/cli/commands/CompleteCommand.js.map +1 -1
- package/dist/cli/commands/InfillCommand.d.ts +3 -0
- package/dist/cli/commands/InfillCommand.js +34 -4
- package/dist/cli/commands/InfillCommand.js.map +1 -1
- package/dist/cli/commands/OnPostInstallCommand.js +31 -4
- package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.d.ts +3 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js +28 -1
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +5 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +51 -4
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +3 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +46 -5
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -1
- package/dist/cli/utils/interactivelyAskForModel.d.ts +4 -1
- package/dist/cli/utils/interactivelyAskForModel.js +21 -7
- package/dist/cli/utils/interactivelyAskForModel.js.map +1 -1
- package/dist/cli/utils/packageJsonConfig.d.ts +6 -0
- package/dist/cli/utils/packageJsonConfig.js +51 -0
- package/dist/cli/utils/packageJsonConfig.js.map +1 -0
- package/dist/cli/utils/packageManager.d.ts +1 -0
- package/dist/cli/utils/packageManager.js +15 -0
- package/dist/cli/utils/packageManager.js.map +1 -0
- package/dist/cli/utils/printCommonInfoLines.js +9 -0
- package/dist/cli/utils/printCommonInfoLines.js.map +1 -1
- package/dist/cli/utils/resolveCommandGgufPath.d.ts +4 -1
- package/dist/cli/utils/resolveCommandGgufPath.js +9 -2
- package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -1
- package/dist/cli/utils/resolveNpmrcConfig.d.ts +18 -0
- package/dist/cli/utils/resolveNpmrcConfig.js +129 -0
- package/dist/cli/utils/resolveNpmrcConfig.js.map +1 -0
- package/dist/config.d.ts +6 -1
- package/dist/config.js +12 -2
- package/dist/config.js.map +1 -1
- package/dist/evaluator/LlamaChat/LlamaChat.d.ts +8 -2
- package/dist/evaluator/LlamaChat/LlamaChat.js +99 -6
- package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +8 -2
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +8 -2
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaContext.d.ts +91 -0
- package/dist/evaluator/LlamaContext/LlamaContext.js +215 -19
- package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.d.ts +27 -0
- package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.js +130 -0
- package/dist/evaluator/LlamaContext/LlamaContextSequenceCheckpoints.js.map +1 -0
- package/dist/evaluator/LlamaContext/types.d.ts +32 -1
- package/dist/evaluator/LlamaModel/LlamaModel.d.ts +33 -0
- package/dist/evaluator/LlamaModel/LlamaModel.js +24 -3
- package/dist/evaluator/LlamaModel/LlamaModel.js.map +1 -1
- package/dist/gguf/insights/GgufInsights.d.ts +12 -1
- package/dist/gguf/insights/GgufInsights.js +246 -49
- package/dist/gguf/insights/GgufInsights.js.map +1 -1
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +13 -4
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +17 -5
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -1
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +4 -1
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +7 -1
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -1
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +4 -1
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +16 -4
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -1
- package/dist/gguf/types/GgufMetadataTypes.d.ts +18 -2
- package/dist/gguf/types/GgufMetadataTypes.js +6 -0
- package/dist/gguf/types/GgufMetadataTypes.js.map +1 -1
- package/dist/gguf/types/GgufTensorInfoTypes.d.ts +4 -2
- package/dist/gguf/types/GgufTensorInfoTypes.js +11 -1
- package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -1
- package/dist/gguf/utils/getGgufFileTypeName.d.ts +1 -1
- package/dist/gguf/utils/ggufQuantNames.js +1 -0
- package/dist/gguf/utils/ggufQuantNames.js.map +1 -1
- package/dist/tsconfig.tsbuildinfo +1 -1
- package/dist/types.d.ts +1 -0
- package/dist/utils/getBuildDefaults.d.ts +1 -1
- package/dist/utils/getFirstWritableDir.d.ts +8 -0
- package/dist/utils/getFirstWritableDir.js +60 -0
- package/dist/utils/getFirstWritableDir.js.map +1 -0
- package/dist/utils/getTempDir.d.ts +10 -0
- package/dist/utils/getTempDir.js +121 -0
- package/dist/utils/getTempDir.js.map +1 -0
- package/dist/utils/prettyPrintObject.js +1 -1
- package/dist/utils/prettyPrintObject.js.map +1 -1
- package/dist/utils/resolveModelFile.js +19 -8
- package/dist/utils/resolveModelFile.js.map +1 -1
- package/llama/addon/AddonContext.cpp +182 -0
- package/llama/addon/AddonContext.h +27 -0
- package/llama/addon/addon.cpp +1 -0
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/llama.cpp.info.json +1 -1
- package/package.json +24 -24
|
@@ -24,9 +24,11 @@ export class GgufInsightsConfigurationResolver {
|
|
|
24
24
|
* @param options
|
|
25
25
|
* @param hardwareOverrides
|
|
26
26
|
*/
|
|
27
|
-
async resolveAndScoreConfig({ targetGpuLayers, targetContextSize, embeddingContext = false, flashAttention = false, swaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
|
|
27
|
+
async resolveAndScoreConfig({ targetGpuLayers, targetContextSize, embeddingContext = false, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
|
|
28
28
|
const compatibilityScore = await this.scoreModelConfigurationCompatibility({
|
|
29
29
|
flashAttention,
|
|
30
|
+
kvCacheKeyType,
|
|
31
|
+
kvCacheValueType,
|
|
30
32
|
swaFullCache,
|
|
31
33
|
contextSize: targetContextSize,
|
|
32
34
|
embeddingContext,
|
|
@@ -64,7 +66,7 @@ export class GgufInsightsConfigurationResolver {
|
|
|
64
66
|
*
|
|
65
67
|
* `contextSize` defaults to `4096` (if the model train context size is lower than this, the model train context size is used instead).
|
|
66
68
|
*/
|
|
67
|
-
async scoreModelConfigurationCompatibility({ contextSize = Math.min(4096, this._ggufInsights.trainContextSize ?? 4096), embeddingContext = false, flashAttention = false, swaFullCache = false, maximumFittedContextSizeMultiplier = 100, maximumUnfitConfigurationResourceMultiplier = 100, forceStrictContextSize = false, forceGpuLayers, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
|
|
69
|
+
async scoreModelConfigurationCompatibility({ contextSize = Math.min(4096, this._ggufInsights.trainContextSize ?? 4096), embeddingContext = false, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, maximumFittedContextSizeMultiplier = 100, maximumUnfitConfigurationResourceMultiplier = 100, forceStrictContextSize = false, forceGpuLayers, useMmap = this._ggufInsights._llama.supportsMmap } = {}, { getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading } = {}) {
|
|
68
70
|
const [vramState, ramState, swapState] = await Promise.all([
|
|
69
71
|
getVramState(),
|
|
70
72
|
getRamState(),
|
|
@@ -95,6 +97,8 @@ export class GgufInsightsConfigurationResolver {
|
|
|
95
97
|
llamaSupportsGpuOffloading,
|
|
96
98
|
defaultContextFlashAttention: flashAttention,
|
|
97
99
|
defaultContextSwaFullCache: swaFullCache,
|
|
100
|
+
defaultContextKvCacheKeyType: kvCacheKeyType,
|
|
101
|
+
defaultContextKvCacheValueType: kvCacheValueType,
|
|
98
102
|
ignoreMemorySafetyChecks: forceGpuLayers != null,
|
|
99
103
|
useMmap
|
|
100
104
|
});
|
|
@@ -137,6 +141,8 @@ export class GgufInsightsConfigurationResolver {
|
|
|
137
141
|
modelTrainContextSize: this._ggufInsights.trainContextSize ?? defaultTrainContextSizeForEstimationPurposes,
|
|
138
142
|
ignoreMemorySafetyChecks: forceStrictContextSize,
|
|
139
143
|
flashAttention,
|
|
144
|
+
kvCacheKeyType,
|
|
145
|
+
kvCacheValueType,
|
|
140
146
|
swaFullCache
|
|
141
147
|
});
|
|
142
148
|
contextFitsMemory = true;
|
|
@@ -157,7 +163,9 @@ export class GgufInsightsConfigurationResolver {
|
|
|
157
163
|
isEmbeddingContext: embeddingContext,
|
|
158
164
|
modelGpuLayers: resolvedGpuLayers,
|
|
159
165
|
flashAttention,
|
|
160
|
-
swaFullCache
|
|
166
|
+
swaFullCache,
|
|
167
|
+
kvCacheKeyType,
|
|
168
|
+
kvCacheValueType
|
|
161
169
|
});
|
|
162
170
|
const rankPoints = {
|
|
163
171
|
gpuLayers: 60,
|
|
@@ -213,7 +221,7 @@ export class GgufInsightsConfigurationResolver {
|
|
|
213
221
|
}
|
|
214
222
|
};
|
|
215
223
|
}
|
|
216
|
-
async resolveModelGpuLayers(gpuLayers, { ignoreMemorySafetyChecks = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading, defaultContextFlashAttention = false, defaultContextSwaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}) {
|
|
224
|
+
async resolveModelGpuLayers(gpuLayers, { ignoreMemorySafetyChecks = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), llamaVramPaddingSize = this._ggufInsights._llama.vramPaddingSize, llamaGpu = this._ggufInsights._llama.gpu, llamaSupportsGpuOffloading = this._ggufInsights._llama.supportsGpuOffloading, defaultContextFlashAttention = false, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache = false, useMmap = this._ggufInsights._llama.supportsMmap } = {}) {
|
|
217
225
|
return resolveModelGpuLayersOption(gpuLayers, {
|
|
218
226
|
ggufInsights: this._ggufInsights,
|
|
219
227
|
ignoreMemorySafetyChecks,
|
|
@@ -222,6 +230,8 @@ export class GgufInsightsConfigurationResolver {
|
|
|
222
230
|
llamaGpu,
|
|
223
231
|
llamaSupportsGpuOffloading,
|
|
224
232
|
defaultContextFlashAttention,
|
|
233
|
+
defaultContextKvCacheKeyType,
|
|
234
|
+
defaultContextKvCacheValueType,
|
|
225
235
|
defaultContextSwaFullCache,
|
|
226
236
|
useMmap
|
|
227
237
|
});
|
|
@@ -231,7 +241,7 @@ export class GgufInsightsConfigurationResolver {
|
|
|
231
241
|
*
|
|
232
242
|
* If there's no context size that can fit the available resources, an `InsufficientMemoryError` is thrown.
|
|
233
243
|
*/
|
|
234
|
-
async resolveContextContextSize(contextSize, { modelGpuLayers, batchSize, modelTrainContextSize, flashAttention = false, swaFullCache = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaGpu = this._ggufInsights._llama.gpu, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, sequences = getDefaultContextSequences() }) {
|
|
244
|
+
async resolveContextContextSize(contextSize, { modelGpuLayers, batchSize, modelTrainContextSize, flashAttention = false, kvCacheKeyType, kvCacheValueType, swaFullCache = false, getVramState = (() => this._ggufInsights._llama._vramOrchestrator.getMemoryState()), getRamState = (async () => this._ggufInsights._llama._ramOrchestrator.getMemoryState()), getSwapState = (() => this._ggufInsights._llama._swapOrchestrator.getMemoryState()), llamaGpu = this._ggufInsights._llama.gpu, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, sequences = getDefaultContextSequences() }) {
|
|
235
245
|
return await resolveContextContextSizeOption({
|
|
236
246
|
contextSize,
|
|
237
247
|
batchSize,
|
|
@@ -240,6 +250,8 @@ export class GgufInsightsConfigurationResolver {
|
|
|
240
250
|
modelGpuLayers,
|
|
241
251
|
modelTrainContextSize,
|
|
242
252
|
flashAttention,
|
|
253
|
+
kvCacheKeyType,
|
|
254
|
+
kvCacheValueType,
|
|
243
255
|
swaFullCache,
|
|
244
256
|
getVramState,
|
|
245
257
|
getRamState,
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"GgufInsightsConfigurationResolver.js","sourceRoot":"","sources":["../../../src/gguf/insights/GgufInsightsConfigurationResolver.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,0BAA0B,EAAC,MAAM,8CAA8C,CAAC;AACxF,OAAO,EAAC,uBAAuB,EAAC,MAAM,wCAAwC,CAAC;AAC/E,OAAO,EAAC,2BAA2B,EAAC,MAAM,wCAAwC,CAAC;AACnF,OAAO,EAAC,+BAA+B,EAAC,MAAM,4CAA4C,CAAC;AAC3F,OAAO,EAAC,WAAW,EAAC,MAAM,wBAAwB,CAAC;AACnD,OAAO,EAAC,0BAA0B,EAAC,MAAM,uCAAuC,CAAC;AAGjF,MAAM,CAAC,MAAM,4CAA4C,GAAG,IAAI,CAAC;AACjE,MAAM,kDAAkD,GAAG,IAAI,CAAC;AAGhE,MAAM,OAAO,iCAAiC;IAC1C,gBAAgB,CAAkB,aAAa,CAAe;IAE9D,YAAoB,YAA0B;QAC1C,IAAI,CAAC,aAAa,GAAG,YAAY,CAAC;IACtC,CAAC;IAED,IAAW,YAAY;QACnB,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;;;;;;;;OASG;IACI,KAAK,CAAC,qBAAqB,CAAC,EAC/B,eAAe,EACf,iBAAiB,EACjB,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAQhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QACF,MAAM,kBAAkB,GAAG,MAAM,IAAI,CAAC,oCAAoC,CAAC;YACvE,cAAc;YACd,YAAY;YACZ,WAAW,EAAE,iBAAiB;YAC9B,gBAAgB;YAChB,cAAc,EAAE,eAAe;YAC/B,sBAAsB,EAAE,iBAAiB,IAAI,IAAI;YACjD,OAAO;SACV,EAAE;YACC,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;SAC7B,CAAC,CAAC;QAEH,OAAO,kBAAkB,CAAC;IAC9B,CAAC;IAED;;;;;;;;;;;;;;;;;;;;OAoBG;IACI,KAAK,CAAC,oCAAoC,CAAC,EAC9C,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,IAAI,CAAC,EACzE,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,kCAAkC,GAAG,GAAG,EACxC,2CAA2C,GAAG,GAAG,EACjD,sBAAsB,GAAG,KAAK,EAC9B,cAAc,EACd,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAkBhD,EAAE,EAAE,E
ACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QAiCF,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,IAAI,iBAAiB,GAAG,CAAC,cAAc,IAAI,IAAI,IAAI,cAAc,IAAI,KAAK,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,WAAW;YAC/B,CAAC,CAAC,cAAc,CAAC;QACrB,IAAI,kBAAkB,GAAG,KAAK,CAAC;QAE/B,IAAI,CAAC;YACD,iBAAiB,GAAG,MAAM,IAAI,CAAC,qBAAqB,CAChD,cAAc,IAAI,IAAI;gBAClB,CAAC,CAAC,cAAc;gBAChB,CAAC,CAAC,gBAAgB;oBACd,CAAC,CAAC;wBACE,UAAU,EAAE;4BACR,gBAAgB,EAAE,IAAI;4BACtB,WAAW,EAAE,sBAAsB;gCAC/B,CAAC,CAAC,WAAW;gCACb,CAAC,CAAC,SAAS;yBAClB;qBACJ;oBACD,CAAC,CAAC,sBAAsB,IAAI,IAAI;wBAC5B,CAAC,CAAC,EAAC,UAAU,EAAE,EAAC,WAAW,EAAC,EAAC;wBAC7B,CAAC,CAAC,MAAM,EACpB;gBACI,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,SAAS;gBACnC,oBAAoB;gBACpB,QAAQ;gBACR,0BAA0B;gBAC1B,4BAA4B,EAAE,cAAc;gBAC5C,0BAA0B,EAAE,YAAY;gBACxC,wBAAwB,EAAE,cAAc,IAAI,IAAI;gBAChD,OAAO;aACV,CACJ,CAAC;YACF,kBAAkB,GAAG,IAAI,CAAC;QAC9B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,SAAS,GAAG,0BAA0B,IAAI,QAAQ,KAAK,KAAK,CAAC;QACnE,MAAM,2BAA2B,GAAG,IAAI,CAAC,aAAa,CAAC,iCAAiC,CAAC;YACrF,SAAS,EAAE,iBAAiB;YAC5B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,mBAAmB,GAAG,sBAAsB;YAC5C,CAAC,CAAC,WAAW;YACb,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,IAAI,CAAC,YAAY,CAAC,gBAAgB,IAAI,kDAAkD,EACxF,kDAAkD,CACrD,CAAC;QACN,IAAI,iBAAiB,GAAG,KAAK,CAAC;QAE9B,IAAI,CAAC;YACD,mBAAmB,GAAG,MAAM,IAAI,CAAC,yBAAyB,CAAC,MAAM,EAAE;gBAC/D,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,SAAS,CAAC,IAAI,GAAG
,2BAA2B,CAAC,OAAO,CAAC;oBACvE,WAAW,EAAE,SAAS,CAAC,WAAW;iBACrC,CAAC;gBACF,WAAW,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACtB,KAAK,EAAE,QAAQ,CAAC,KAAK;oBACrB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,QAAQ,CAAC,IAAI,GAAG,2BAA2B,CAAC,MAAM;wBAClD,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC,CAChF;iBACJ,CAAC;gBACF,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,SAAS,CAAC,IAAI,GAAG,IAAI,CAAC,GAAG,CACrB,CAAC,EACD,2BAA2B,CAAC,MAAM;wBAClC,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;wBAC7E,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CACnB,CACJ;iBACJ,CAAC;gBACF,QAAQ;gBACR,kBAAkB,EAAE,gBAAgB;gBACpC,cAAc,EAAE,iBAAiB;gBACjC,qBAAqB,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,4CAA4C;gBAC1G,wBAAwB,EAAE,sBAAsB;gBAChD,cAAc;gBACd,YAAY;aACf,CAAC,CAAC;YACH,iBAAiB,GAAG,IAAI,CAAC;YAEzB,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBAC9D,iBAAiB,GAAG,KAAK,CAAC;gBAC1B,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;iBAAM,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBACrE,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;QACL,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,6BAA6B,GAAG,IAAI,CAAC,aAAa,CAAC,mCAAmC,CAAC;YACzF,WAAW,EAAE,mBAAmB;YAChC,kBAAkB,EAAE,gBAAgB;YACpC,cAAc,EAAE,iBAAiB;YACjC,cAAc;YACd,YAAY;SACf,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG;YACf,SAAS,EAAE,EAAE;YACb,qBAAqB,EAAE,EAAE;YACzB,WAAW,EAAE,EAAE;YACf,iBAAiB,EAAE,EAAE;YACrB,qBAAqB,EAAE,EAAE,EAAE,sDAAsD;YACjF,gBAAgB,EAAE,EAAE;SACd,CAAC;QAEX,MAAM,eAAe,GAAG,UAAU,CAAC,SAAS,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,iBAAiB,GAAG,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;QAC/G,MAAM,2BAA2B,GAAG,UAAU,CAAC,qBAAqB,GAAG,CACnE,iBAAiB,KAAK,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAC/D,CAAC;QACF,MAAM,iBAAiB,GAAG,iBAAiB;YACvC,CAAC,CAAC,UAAU,CAAC,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC;YACzE,CAAC,CAAC,CAAC,CAAC;QACR,MAAM,uBAAuB,GAAG,UAAU,CAAC,iBAAiB,GAAG,CAC3D,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI;YAC/C,CAAC,CAAC,CAAC;YACH,CAAC,C
AAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI;gBAClE,CAAC,CAAC,GAAG;gBACL,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,KAAK;oBAClD,CAAC,CAAC,GAAG;oBACL,CAAC,CAAC,CACE,GAAG,GAAG,IAAI,CAAC,GAAG,CACV,GAAG,EACH,GAAG,GAAG,CACF,CAAC,2BAA2B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,QAAQ,CAAC,KAAK,CACzE,CACJ,CACJ,CAChB,CAAC;QACF,MAAM,sBAAsB,GAAG,iBAAiB;YAC5C,CAAC,CAAC,CACE,EAAE,GAAG,IAAI,CAAC,GAAG,CACT,CAAC,EACD,CACI,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC,GAAG,WAAW,CAC/D,GAAG,kCAAkC,CACzC,CACJ;YACD,CAAC,CAAC,CAAC,CAAC;QAER,IAAI,kBAAkB,GAAG,SAAS;YAC9B,CAAC,CAAC,CACE,CAAC,eAAe,GAAG,2BAA2B,GAAG,iBAAiB,GAAG,uBAAuB,CAAC;gBAC7F,CAAC,UAAU,CAAC,SAAS,GAAG,UAAU,CAAC,qBAAqB,GAAG,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,CAAC,CACpH;YACD,CAAC,CAAC,CACE,CAAC,iBAAiB,GAAG,uBAAuB,GAAG,6BAA6B,CAAC,IAAI,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;gBAC3G,CAAC,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,GAAG,UAAU,CAAC,qBAAqB,CAAC,CAAC,CAAC;QACpG,IAAI,UAAU,GAAG,sBAAsB,GAAG,UAAU,CAAC,gBAAgB,CAAC;QAEtE,IAAI,CAAC,kBAAkB,IAAI,CAAC,iBAAiB;YACzC,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,GAAG,SAAS,CAAC,KAAK;YAC7F,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,EAC9G,CAAC;YACC,MAAM,oBAAoB,GAAG,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,CAAC;YACzG,MAAM,mBAAmB,GAAG,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,CAAC;YAEtG,kBAAkB,GAAG,CAAC,CAAC;YACvB,UAAU,GAAG,CACT,CAAC,CAAC,GAAG,CAAC,oBAAoB,GAAG,CAAC,SAAS,CAAC,KAAK,GAAG,2CAA2C,CAAC,CAAC,CAAC;gBAC9F,CAAC,CAAC,GAAG,CAAC,mBAAmB,GAAG,CAAC,CAAC,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,2CAA2C,CAAC,CAAC,CAAC,CACnH,GAAG,CAAC,CAAC;QACV,CAAC;QAED,OAAO;YACH,kBAAkB;YAClB,UAAU;YACV,UAAU,EAAE,kBAAkB,GAAG,UAAU;YAE3C,cAAc,EAAE;gBACZ,SAAS,EAAE,iBAAiB;gBAC5B,WAAW,EAAE,mBAAmB;gBAEhC,aAAa,EAAE,2BAA2B,CAAC,MAAM;gBACjD,eAAe,EAAE,6BAA6B,CAAC,MAAM;gBACrD,aAAa,EAAE,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM;gBAExF,cAAc,EAAE,2BAA2B,CAAC,OAAO;gBACnD,gBAAgB,EAAE,6BAA6B,CAAC,OAAO;gBACvD,cAAc,EAAE,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO;aAC9F;SACJ,CAAC;IACN,CAAC;IAEM,KAAK,
CAAC,qBAAqB,CAAC,SAA0C,EAAE,EAC3E,wBAAwB,GAAG,KAAK,EAChC,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAAE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EAC1G,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,EAC5E,4BAA4B,GAAG,KAAK,EACpC,0BAA0B,GAAG,KAAK,EAClC,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAKhD,EAAE;QACF,OAAO,2BAA2B,CAAC,SAAS,EAAE;YAC1C,YAAY,EAAE,IAAI,CAAC,aAAa;YAChC,wBAAwB;YACxB,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;YAC1B,4BAA4B;YAC5B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;IACP,CAAC;IAED;;;;OAIG;IACI,KAAK,CAAC,yBAAyB,CAAC,WAA+C,EAAE,EACpF,cAAc,EACd,SAAS,EACT,qBAAqB,EACrB,cAAc,GAAG,KAAK,EACtB,YAAY,GAAG,KAAK,EACpB,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,wBAAwB,GAAG,KAAK,EAChC,kBAAkB,GAAG,KAAK,EAC1B,SAAS,GAAG,0BAA0B,EAAE,EAc3C;QACG,OAAO,MAAM,+BAA+B,CAAC;YACzC,WAAW;YACX,SAAS;YACT,SAAS;YACT,iBAAiB,EAAE,IAAI,CAAC,aAAa;YACrC,cAAc;YACd,qBAAqB;YACrB,cAAc;YACd,YAAY;YACZ,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,QAAQ;YACR,wBAAwB;YACxB,kBAAkB;SACrB,CAAC,CAAC;IACP,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,YAA0B;QAC5C,OAAO,IAAI,iCAAiC,CAAC,YAAY,CAAC,CAAC;IAC/D,CAAC;CACJ;AAED,SAAS,6BAA6B,CAAC,SAAiB;IACpD,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;IAC/B,OAAO,EAAE,GAAG,WAAW,CAAC,SAAS,EAAE,CAAC;YAChC,KAAK,EAAE,IAAI;YACX,GAAG,EAAE,IAAI,GAAG,GAAG;YACf,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,GAAG;YACjB,GAAG,EAAE,IAAI,GAAG,CAAC;YACb,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,CAAC;YACf,MAAM,EAAE,CAAC;SACZ,CAAC,CAAC,CAAC;AACR,CAAC"}
|
|
1
|
+
{"version":3,"file":"GgufInsightsConfigurationResolver.js","sourceRoot":"","sources":["../../../src/gguf/insights/GgufInsightsConfigurationResolver.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,0BAA0B,EAAC,MAAM,8CAA8C,CAAC;AACxF,OAAO,EAAC,uBAAuB,EAAC,MAAM,wCAAwC,CAAC;AAE/E,OAAO,EAAC,2BAA2B,EAAC,MAAM,wCAAwC,CAAC;AACnF,OAAO,EAAC,+BAA+B,EAAC,MAAM,4CAA4C,CAAC;AAC3F,OAAO,EAAC,WAAW,EAAC,MAAM,wBAAwB,CAAC;AACnD,OAAO,EAAC,0BAA0B,EAAC,MAAM,uCAAuC,CAAC;AAGjF,MAAM,CAAC,MAAM,4CAA4C,GAAG,IAAI,CAAC;AACjE,MAAM,kDAAkD,GAAG,IAAI,CAAC;AAGhE,MAAM,OAAO,iCAAiC;IAC1C,gBAAgB,CAAkB,aAAa,CAAe;IAE9D,YAAoB,YAA0B;QAC1C,IAAI,CAAC,aAAa,GAAG,YAAY,CAAC;IACtC,CAAC;IAED,IAAW,YAAY;QACnB,OAAO,IAAI,CAAC,aAAa,CAAC;IAC9B,CAAC;IAED;;;;;;;;;OASG;IACI,KAAK,CAAC,qBAAqB,CAAC,EAC/B,eAAe,EACf,iBAAiB,EACjB,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAUhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QACF,MAAM,kBAAkB,GAAG,MAAM,IAAI,CAAC,oCAAoC,CAAC;YACvE,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,WAAW,EAAE,iBAAiB;YAC9B,gBAAgB;YAChB,cAAc,EAAE,eAAe;YAC/B,sBAAsB,EAAE,iBAAiB,IAAI,IAAI;YACjD,OAAO;SACV,EAAE;YACC,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;SAC7B,CAAC,CAAC;QAEH,OAAO,kBAAkB,CAAC;IAC9B,CAAC;IAED;;;;;;;;;;;;;;;;;;;;OAoBG;IACI,KAAK,CAAC,oCAAoC,CAAC,EAC9C,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,IAAI,CAAC,EACzE,gBAAgB,GAAG,KAAK,EACxB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,kCAAkC,GAAG,GAAG,EACxC,2CAA2C,GAAG,GAAG,EACjD,sBAAsB,GAAG,KAAK,EAC9B,cAAc
,EACd,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAoBhD,EAAE,EAAE,EACJ,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAChE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,KAQ5E,EAAE;QAiCF,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,IAAI,iBAAiB,GAAG,CAAC,cAAc,IAAI,IAAI,IAAI,cAAc,IAAI,KAAK,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,WAAW;YAC/B,CAAC,CAAC,cAAc,CAAC;QACrB,IAAI,kBAAkB,GAAG,KAAK,CAAC;QAE/B,IAAI,CAAC;YACD,iBAAiB,GAAG,MAAM,IAAI,CAAC,qBAAqB,CAChD,cAAc,IAAI,IAAI;gBAClB,CAAC,CAAC,cAAc;gBAChB,CAAC,CAAC,gBAAgB;oBACd,CAAC,CAAC;wBACE,UAAU,EAAE;4BACR,gBAAgB,EAAE,IAAI;4BACtB,WAAW,EAAE,sBAAsB;gCAC/B,CAAC,CAAC,WAAW;gCACb,CAAC,CAAC,SAAS;yBAClB;qBACJ;oBACD,CAAC,CAAC,sBAAsB,IAAI,IAAI;wBAC5B,CAAC,CAAC,EAAC,UAAU,EAAE,EAAC,WAAW,EAAC,EAAC;wBAC7B,CAAC,CAAC,MAAM,EACpB;gBACI,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,SAAS;gBACnC,oBAAoB;gBACpB,QAAQ;gBACR,0BAA0B;gBAC1B,4BAA4B,EAAE,cAAc;gBAC5C,0BAA0B,EAAE,YAAY;gBACxC,4BAA4B,EAAE,cAAc;gBAC5C,8BAA8B,EAAE,gBAAgB;gBAChD,wBAAwB,EAAE,cAAc,IAAI,IAAI;gBAChD,OAAO;aACV,CACJ,CAAC;YACF,kBAAkB,GAAG,IAAI,CAAC;QAC9B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,SAAS,GAAG,0BAA0B,IAAI,QAAQ,KAAK,KAAK,CAAC;QACnE,MAAM,2BAA2B,GAAG,IAAI,CAAC,aAAa,CAAC,iCAAiC,CAAC;YACrF,SAAS,EAAE,iBAAiB;YAC5B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,mBAAmB,GAAG,sBAAsB;YAC5C,CAAC,CAAC,WAAW;YACb,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,IAAI,CAAC,YAAY,CAAC,gBAAgB,IAAI,kDAAkD,EACxF,kDAAkD,CACrD,CAAC;QACN,IAAI,iBAAiB,GAAG,KAAK,CAAC;QAE9B,IAAI,CAAC;YACD,mBAAmB,GAAG,MAAM,IAAI,CAAC,yBAAyB,CAAC,MAAM,EAAE;gBAC/D,YAAY,EAAE,KAAK
,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,SAAS,CAAC,IAAI,GAAG,2BAA2B,CAAC,OAAO,CAAC;oBACvE,WAAW,EAAE,SAAS,CAAC,WAAW;iBACrC,CAAC;gBACF,WAAW,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACtB,KAAK,EAAE,QAAQ,CAAC,KAAK;oBACrB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,QAAQ,CAAC,IAAI,GAAG,2BAA2B,CAAC,MAAM;wBAClD,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC,CAChF;iBACJ,CAAC;gBACF,YAAY,EAAE,KAAK,IAAI,EAAE,CAAC,CAAC;oBACvB,KAAK,EAAE,SAAS,CAAC,KAAK;oBACtB,IAAI,EAAE,IAAI,CAAC,GAAG,CACV,CAAC,EACD,SAAS,CAAC,IAAI,GAAG,IAAI,CAAC,GAAG,CACrB,CAAC,EACD,2BAA2B,CAAC,MAAM;wBAClC,CAAC,CAAC,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;wBAC7E,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CACnB,CACJ;iBACJ,CAAC;gBACF,QAAQ;gBACR,kBAAkB,EAAE,gBAAgB;gBACpC,cAAc,EAAE,iBAAiB;gBACjC,qBAAqB,EAAE,IAAI,CAAC,aAAa,CAAC,gBAAgB,IAAI,4CAA4C;gBAC1G,wBAAwB,EAAE,sBAAsB;gBAChD,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;aACf,CAAC,CAAC;YACH,iBAAiB,GAAG,IAAI,CAAC;YAEzB,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBAC9D,iBAAiB,GAAG,KAAK,CAAC;gBAC1B,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;iBAAM,IAAI,sBAAsB,IAAI,mBAAmB,GAAG,WAAW,EAAE,CAAC;gBACrE,mBAAmB,GAAG,WAAW,CAAC;YACtC,CAAC;QACL,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,CAAC,GAAG,YAAY,uBAAuB,CAAC;gBACzC,MAAM,GAAG,CAAC;QAClB,CAAC;QAED,MAAM,6BAA6B,GAAG,IAAI,CAAC,aAAa,CAAC,mCAAmC,CAAC;YACzF,WAAW,EAAE,mBAAmB;YAChC,kBAAkB,EAAE,gBAAgB;YACpC,cAAc,EAAE,iBAAiB;YACjC,cAAc;YACd,YAAY;YACZ,cAAc;YACd,gBAAgB;SACnB,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG;YACf,SAAS,EAAE,EAAE;YACb,qBAAqB,EAAE,EAAE;YACzB,WAAW,EAAE,EAAE;YACf,iBAAiB,EAAE,EAAE;YACrB,qBAAqB,EAAE,EAAE,EAAE,sDAAsD;YACjF,gBAAgB,EAAE,EAAE;SACd,CAAC;QAEX,MAAM,eAAe,GAAG,UAAU,CAAC,SAAS,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,iBAAiB,GAAG,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC;QAC/G,MAAM,2BAA2B,GAAG,UAAU,CAAC,qBAAqB,GAAG,CACnE,iBAAiB,KAAK,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAC/D,CAAC;QACF,MAAM,iBAAiB,GAAG,iBAAiB;YACvC,CAAC,CAAC,UAAU,CAAC,WAAW,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,
mBAAmB,GAAG,WAAW,CAAC;YACzE,CAAC,CAAC,CAAC,CAAC;QACR,MAAM,uBAAuB,GAAG,UAAU,CAAC,iBAAiB,GAAG,CAC3D,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI;YAC/C,CAAC,CAAC,CAAC;YACH,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI;gBAClE,CAAC,CAAC,GAAG;gBACL,CAAC,CAAC,2BAA2B,CAAC,MAAM,IAAI,QAAQ,CAAC,KAAK;oBAClD,CAAC,CAAC,GAAG;oBACL,CAAC,CAAC,CACE,GAAG,GAAG,IAAI,CAAC,GAAG,CACV,GAAG,EACH,GAAG,GAAG,CACF,CAAC,2BAA2B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,QAAQ,CAAC,KAAK,CACzE,CACJ,CACJ,CAChB,CAAC;QACF,MAAM,sBAAsB,GAAG,iBAAiB;YAC5C,CAAC,CAAC,CACE,EAAE,GAAG,IAAI,CAAC,GAAG,CACT,CAAC,EACD,CACI,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,mBAAmB,GAAG,WAAW,CAAC,GAAG,WAAW,CAC/D,GAAG,kCAAkC,CACzC,CACJ;YACD,CAAC,CAAC,CAAC,CAAC;QAER,IAAI,kBAAkB,GAAG,SAAS;YAC9B,CAAC,CAAC,CACE,CAAC,eAAe,GAAG,2BAA2B,GAAG,iBAAiB,GAAG,uBAAuB,CAAC;gBAC7F,CAAC,UAAU,CAAC,SAAS,GAAG,UAAU,CAAC,qBAAqB,GAAG,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,CAAC,CACpH;YACD,CAAC,CAAC,CACE,CAAC,iBAAiB,GAAG,uBAAuB,GAAG,6BAA6B,CAAC,IAAI,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;gBAC3G,CAAC,UAAU,CAAC,WAAW,GAAG,UAAU,CAAC,iBAAiB,GAAG,UAAU,CAAC,qBAAqB,CAAC,CAAC,CAAC;QACpG,IAAI,UAAU,GAAG,sBAAsB,GAAG,UAAU,CAAC,gBAAgB,CAAC;QAEtE,IAAI,CAAC,kBAAkB,IAAI,CAAC,iBAAiB;YACzC,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,GAAG,SAAS,CAAC,KAAK;YAC7F,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,GAAG,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,EAC9G,CAAC;YACC,MAAM,oBAAoB,GAAG,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO,CAAC;YACzG,MAAM,mBAAmB,GAAG,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,MAAM,CAAC;YAEtG,kBAAkB,GAAG,CAAC,CAAC;YACvB,UAAU,GAAG,CACT,CAAC,CAAC,GAAG,CAAC,oBAAoB,GAAG,CAAC,SAAS,CAAC,KAAK,GAAG,2CAA2C,CAAC,CAAC,CAAC;gBAC9F,CAAC,CAAC,GAAG,CAAC,mBAAmB,GAAG,CAAC,CAAC,QAAQ,CAAC,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC,GAAG,2CAA2C,CAAC,CAAC,CAAC,CACnH,GAAG,CAAC,CAAC;QACV,CAAC;QAED,OAAO;YACH,kBAAkB;YAClB,UAAU;YACV,UAAU,EAAE,kBAAkB,GAAG,UAAU;YAE3C,cAAc,EAAE;gBACZ,SAAS,EAAE,iBAAiB;gBAC5B,WAAW,EAAE,mBAAmB;gBAEhC,aAAa,EAAE,2BAA2B,CAAC,MAAM;gBACjD,eAAe,EAAE,6BAA6B,CAAC,MAAM;gBACrD,aAAa,EAAE,2BAA2B,CAAC,MAAM,GAAG,6BAA6B,CAAC,
MAAM;gBAExF,cAAc,EAAE,2BAA2B,CAAC,OAAO;gBACnD,gBAAgB,EAAE,6BAA6B,CAAC,OAAO;gBACvD,cAAc,EAAE,2BAA2B,CAAC,OAAO,GAAG,6BAA6B,CAAC,OAAO;aAC9F;SACJ,CAAC;IACN,CAAC;IAEM,KAAK,CAAC,qBAAqB,CAAC,SAA0C,EAAE,EAC3E,wBAAwB,GAAG,KAAK,EAChC,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,oBAAoB,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,eAAe,EAAE,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EAC1G,0BAA0B,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,qBAAqB,EAC5E,4BAA4B,GAAG,KAAK,EACpC,4BAA4B,EAC5B,8BAA8B,EAC9B,0BAA0B,GAAG,KAAK,EAClC,OAAO,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,YAAY,KAMhD,EAAE;QACF,OAAO,2BAA2B,CAAC,SAAS,EAAE;YAC1C,YAAY,EAAE,IAAI,CAAC,aAAa;YAChC,wBAAwB;YACxB,YAAY;YACZ,oBAAoB;YACpB,QAAQ;YACR,0BAA0B;YAC1B,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;IACP,CAAC;IAED;;;;OAIG;IACI,KAAK,CAAC,yBAAyB,CAAC,WAA+C,EAAE,EACpF,cAAc,EACd,SAAS,EACT,qBAAqB,EACrB,cAAc,GAAG,KAAK,EACtB,cAAc,EACd,gBAAgB,EAChB,YAAY,GAAG,KAAK,EACpB,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,WAAW,GAAG,CAAC,KAAK,IAAI,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,gBAAgB,CAAC,cAAc,EAAE,CAAC,EACvF,YAAY,GAAG,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,iBAAiB,CAAC,cAAc,EAAE,CAAC,EACnF,QAAQ,GAAG,IAAI,CAAC,aAAa,CAAC,MAAM,CAAC,GAAG,EACxC,wBAAwB,GAAG,KAAK,EAChC,kBAAkB,GAAG,KAAK,EAC1B,SAAS,GAAG,0BAA0B,EAAE,EAgB3C;QACG,OAAO,MAAM,+BAA+B,CAAC;YACzC,WAAW;YACX,SAAS;YACT,SAAS;YACT,iBAAiB,EAAE,IAAI,CAAC,aAAa;YACrC,cAAc;YACd,qBAAqB;YACrB,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,YAAY;YACZ,WAAW;YACX,YAAY;YACZ,QAAQ;YACR,wBAAwB;YACxB,kBAAkB;SACrB,CAAC,CAAC;IACP,CAAC;IAED,gBAAgB;IACT,MAAM,CAAC,OAAO,CAAC,YAA0B;QAC5C,OAAO,IAAI,iCAAiC,CAAC,YAAY,CAAC,CAAC;IAC/D,CAAC;CACJ;AAED,SAAS,6BAA6B,CAAC,SAAiB;IACpD,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;IAC/B,OAAO,EAAE,GAAG,WAAW,CAAC,SAAS,EAAE,CAAC;YAChC,KAAK,EAAE,IAAI;YACX,GAAG,EAAE,IAAI,GAAG,GAAG;YACf,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,GAAG;YACjB,GAAG,EAAE,IAAI,
GAAG,CAAC;YACb,MAAM,EAAE,EAAE;SACb,EAAE;YACC,KAAK,EAAE,IAAI,GAAG,CAAC;YACf,MAAM,EAAE,CAAC;SACZ,CAAC,CAAC,CAAC;AACR,CAAC"}
|
|
@@ -1,7 +1,8 @@
|
|
|
1
1
|
import { LlamaContextOptions } from "../../../evaluator/LlamaContext/types.js";
|
|
2
2
|
import { GgufInsights } from "../GgufInsights.js";
|
|
3
3
|
import { BuildGpu } from "../../../bindings/types.js";
|
|
4
|
-
|
|
4
|
+
import type { GgmlType } from "../../types/GgufTensorInfoTypes.js";
|
|
5
|
+
export declare function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks, isEmbeddingContext, maxContextSizeSwapUse }: {
|
|
5
6
|
contextSize?: LlamaContextOptions["contextSize"];
|
|
6
7
|
batchSize?: LlamaContextOptions["batchSize"];
|
|
7
8
|
sequences: number;
|
|
@@ -9,6 +10,8 @@ export declare function resolveContextContextSizeOption({ contextSize, batchSize
|
|
|
9
10
|
modelGpuLayers: number;
|
|
10
11
|
modelTrainContextSize: number;
|
|
11
12
|
flashAttention: boolean;
|
|
13
|
+
kvCacheKeyType?: GgmlType;
|
|
14
|
+
kvCacheValueType?: GgmlType;
|
|
12
15
|
swaFullCache: boolean;
|
|
13
16
|
getVramState(): Promise<{
|
|
14
17
|
total: number;
|
|
@@ -3,7 +3,7 @@ import { getDefaultContextBatchSize, getDefaultModelContextSize } from "../../..
|
|
|
3
3
|
import { InsufficientMemoryError } from "../../../utils/InsufficientMemoryError.js";
|
|
4
4
|
import { getRamUsageFromUnifiedVram } from "./getRamUsageFromUnifiedVram.js";
|
|
5
5
|
const defaultMaxContextSizeSwapUse = 2048;
|
|
6
|
-
export async function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, maxContextSizeSwapUse = defaultMaxContextSizeSwapUse }) {
|
|
6
|
+
export async function resolveContextContextSizeOption({ contextSize, batchSize, sequences, modelFileInsights, modelGpuLayers, modelTrainContextSize, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache, getVramState, getRamState, getSwapState, ignoreMemorySafetyChecks = false, isEmbeddingContext = false, maxContextSizeSwapUse = defaultMaxContextSizeSwapUse }) {
|
|
7
7
|
if (contextSize == null)
|
|
8
8
|
contextSize = "auto";
|
|
9
9
|
if (typeof contextSize === "number") {
|
|
@@ -21,6 +21,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
|
|
|
21
21
|
modelGpuLayers: modelGpuLayers,
|
|
22
22
|
sequences,
|
|
23
23
|
flashAttention,
|
|
24
|
+
kvCacheKeyType,
|
|
25
|
+
kvCacheValueType,
|
|
24
26
|
swaFullCache,
|
|
25
27
|
isEmbeddingContext
|
|
26
28
|
});
|
|
@@ -51,6 +53,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
|
|
|
51
53
|
modelGpuLayers: modelGpuLayers,
|
|
52
54
|
sequences,
|
|
53
55
|
flashAttention,
|
|
56
|
+
kvCacheKeyType,
|
|
57
|
+
kvCacheValueType,
|
|
54
58
|
swaFullCache,
|
|
55
59
|
isEmbeddingContext
|
|
56
60
|
});
|
|
@@ -90,6 +94,8 @@ export async function resolveContextContextSizeOption({ contextSize, batchSize,
|
|
|
90
94
|
modelGpuLayers: modelGpuLayers,
|
|
91
95
|
sequences,
|
|
92
96
|
flashAttention,
|
|
97
|
+
kvCacheKeyType,
|
|
98
|
+
kvCacheValueType,
|
|
93
99
|
swaFullCache,
|
|
94
100
|
isEmbeddingContext
|
|
95
101
|
});
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"resolveContextContextSizeOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveContextContextSizeOption.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,0BAA0B,EAAC,MAAM,iCAAiC,CAAC;
|
|
1
|
+
{"version":3,"file":"resolveContextContextSizeOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveContextContextSizeOption.ts"],"names":[],"mappings":"AAGA,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,0BAA0B,EAAC,MAAM,iCAAiC,CAAC;AAG3E,MAAM,4BAA4B,GAAG,IAAI,CAAC;AAE1C,MAAM,CAAC,KAAK,UAAU,+BAA+B,CAAC,EAClD,WAAW,EAAE,SAAS,EAAE,SAAS,EAAE,iBAAiB,EAAE,cAAc,EAAE,qBAAqB,EAAE,cAAc,EAC3G,cAAc,EAAE,gBAAgB,EAAE,YAAY,EAC9C,YAAY,EAAE,WAAW,EAAE,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,kBAAkB,GAAG,KAAK,EACrG,qBAAqB,GAAG,4BAA4B,EAmBvD;IACG,IAAI,WAAW,IAAI,IAAI;QACnB,WAAW,GAAG,MAAM,CAAC;IAEzB,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QAClC,MAAM,mBAAmB,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,CAAC,CAAC;QAEjE,IAAI,wBAAwB;YACxB,OAAO,mBAAmB,CAAC;QAE/B,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB,CAAC,CAAC;QACH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YACtF,WAAW,EAAE,mBAAmB;YAChC,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,mBAAmB,EAAE,SAAS,EAAC,CAAC;YACjG,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,IAAI,2BAA2B,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YACpD,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aACvK,IAAI,2BAA2B,CAAC,MAAM,GAAG,CAC1C,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,CAC9G;YACG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,mBAAmB,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;QAE5N,OAAO,mBAAmB,CAAC;IAC/B,CAAC;SAAM,IAAI,WAAW,KAAK,MAAM,IAAI,OAAO,WAAW,KAAK,QAAQ,EAAE,CAAC;QACnE,MAAM,CACF,SAAS,EACT,QAAQ,EACR,SAAS,CACZ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAClB,YAAY,EAAE;YACd,WAAW,EAAE;YACb,YAAY,EAAE;SACjB
,CAAC,CAAC;QAEH,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC;YACvE,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,EACxF,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,qBAAqB,EAAC,CAAC,CACxE,CAAC;QAEN,MAAM,cAAc,GAAG,WAAW,KAAK,MAAM;YACzC,CAAC,CAAC,mCAAmC;YACrC,CAAC,CAAC,IAAI,CAAC,GAAG,CACN,WAAW,CAAC,GAAG,IAAI,mCAAmC,EACtD,mCAAmC,CACtC,CAAC;QAEN,IAAI,4BAA4B,GAAkB,IAAI,CAAC;QACvD,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,cAAc,GAAG,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC3E,KAAK,IAAI,eAAe,GAAG,cAAc,EAAE,eAAe,IAAI,cAAc,IAAI,eAAe,IAAI,cAAc,GAAG,CAAC;YACjH,MAAM,2BAA2B,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;gBACtF,WAAW,EAAE,eAAe;gBAC5B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,eAAe,EAAE,SAAS,EAAC,CAAC;gBAC7F,cAAc,EAAE,cAAc;gBAC9B,SAAS;gBACT,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;gBACZ,kBAAkB;aACrB,CAAC,CAAC;YAEH,IAAI,2BAA2B,CAAC,OAAO,IAAI,SAAS,CAAC,IAAI;gBACrD,2BAA2B,CAAC,MAAM,IAAI,CAClC,QAAQ,CAAC,IAAI,GAAG,0BAA0B,CAAC,2BAA2B,CAAC,OAAO,EAAE,SAAS,CAAC,GAAG,CACzF,eAAe,IAAI,qBAAqB;oBACpC,CAAC,CAAC,SAAS,CAAC,IAAI;oBAChB,CAAC,CAAC,CAAC,CACV,CACJ,EACH,CAAC;gBACC,IAAI,4BAA4B,IAAI,IAAI,IAAI,eAAe,IAAI,4BAA4B,EAAE,CAAC;oBAC1F,4BAA4B,GAAG,eAAe,CAAC;oBAE/C,IAAI,IAAI,KAAK,CAAC,CAAC;wBACX,MAAM;yBACL,IAAI,IAAI,GAAG,CAAC;wBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;gBAClD,CAAC;YACL,CAAC;iBAAM,IAAI,IAAI,GAAG,CAAC;gBACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YAE9C,IAAI,eAAe,IAAI,cAAc,IAAI,IAAI,KAAK,CAAC,CAAC;gBAChD,MAAM;YAEV,eAAe,IAAI,IAAI,CAAC;YACxB,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBACnC,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACvD,CAAC;iBAAM,IAAI,eAAe,GAAG,cAAc,EAAE,CAAC;gBAC1C,eAAe,GAAG,cAAc,CAAC;gBACjC,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC
,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;QAED,IAAI,4BAA4B,IAAI,IAAI;YACpC,OAAO,4BAA4B,CAAC;QAExC,IAAI,wBAAwB;YACxB,OAAO,cAAc,CAAC;QAE1B,MAAM,kCAAkC,GAAG,iBAAiB,CAAC,mCAAmC,CAAC;YAC7F,WAAW,EAAE,cAAc;YAC3B,SAAS,EAAE,SAAS,IAAI,0BAA0B,CAAC,EAAC,WAAW,EAAE,cAAc,EAAE,SAAS,EAAC,CAAC;YAC5F,cAAc,EAAE,cAAc;YAC9B,SAAS;YACT,cAAc;YACd,cAAc;YACd,gBAAgB;YAChB,YAAY;YACZ,kBAAkB;SACrB,CAAC,CAAC;QAEH,MAAM,eAAe,GAAG,0BAA0B,CAAC,kCAAkC,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC;QAC1G,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAC3D,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YAE5F,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,+CAA+C,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAC3N,IAAI,kCAAkC,CAAC,OAAO,GAAG,SAAS,CAAC,IAAI;YAChE,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,CAAC,CAAC;aAClK,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,SAAS,CAAC,IAAI,GAAG,eAAe;YACjG,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,sCAAsC,SAAS,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,mBAAmB,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;aAClN,IAAI,kCAAkC,CAAC,MAAM,GAAG,QAAQ,CAAC,IAAI,GAAG,eAAe;YAChF,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,qCAAqC,CAAC,CAAC;;YAElK,MAAM,IAAI,uBAAuB,CAAC,qBAAqB,cAAc,GAAG,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,SAAS,YAAY,CAAC,CAAC,CAAC,EAAE,2CAA2C,CAAC,CAAC;IAChL,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,0BAA0B,WAAW,GAAG,CAAC,CAAC;AAC9D,CAAC"}
|
|
@@ -1,7 +1,8 @@
|
|
|
1
1
|
import { LlamaModelOptions } from "../../../evaluator/LlamaModel/LlamaModel.js";
|
|
2
2
|
import { BuildGpu } from "../../../bindings/types.js";
|
|
3
|
+
import type { GgmlType } from "../../types/GgufTensorInfoTypes.js";
|
|
3
4
|
import type { GgufInsights } from "../GgufInsights.js";
|
|
4
|
-
export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions["gpuLayers"], { ggufInsights, ignoreMemorySafetyChecks, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }: {
|
|
5
|
+
export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions["gpuLayers"], { ggufInsights, ignoreMemorySafetyChecks, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }: {
|
|
5
6
|
ggufInsights: GgufInsights;
|
|
6
7
|
ignoreMemorySafetyChecks?: boolean;
|
|
7
8
|
getVramState(): Promise<{
|
|
@@ -12,6 +13,8 @@ export declare function resolveModelGpuLayersOption(gpuLayers: LlamaModelOptions
|
|
|
12
13
|
llamaGpu: BuildGpu;
|
|
13
14
|
llamaSupportsGpuOffloading: boolean;
|
|
14
15
|
defaultContextFlashAttention: boolean;
|
|
16
|
+
defaultContextKvCacheKeyType?: GgmlType;
|
|
17
|
+
defaultContextKvCacheValueType?: GgmlType;
|
|
15
18
|
defaultContextSwaFullCache: boolean;
|
|
16
19
|
useMmap?: boolean;
|
|
17
20
|
}): Promise<number>;
|
|
@@ -4,7 +4,7 @@ import { getDefaultContextBatchSize, getDefaultModelContextSize } from "../../..
|
|
|
4
4
|
import { minAllowedContextSizeInCalculations } from "../../../config.js";
|
|
5
5
|
import { scoreLevels } from "./scoreLevels.js";
|
|
6
6
|
const fitContextExtraMemoryPaddingPercentage = 0.5;
|
|
7
|
-
export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ignoreMemorySafetyChecks = false, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }) {
|
|
7
|
+
export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ignoreMemorySafetyChecks = false, getVramState, llamaVramPaddingSize, llamaGpu, llamaSupportsGpuOffloading, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }) {
|
|
8
8
|
if (gpuLayers == null)
|
|
9
9
|
gpuLayers = "auto";
|
|
10
10
|
if (!llamaSupportsGpuOffloading)
|
|
@@ -21,6 +21,8 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
|
|
|
21
21
|
ggufInsights,
|
|
22
22
|
currentVram: vramState.free,
|
|
23
23
|
defaultContextFlashAttention,
|
|
24
|
+
defaultContextKvCacheKeyType,
|
|
25
|
+
defaultContextKvCacheValueType,
|
|
24
26
|
defaultContextSwaFullCache,
|
|
25
27
|
useMmap
|
|
26
28
|
});
|
|
@@ -53,6 +55,8 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
|
|
|
53
55
|
? gpuLayers.max
|
|
54
56
|
: undefined,
|
|
55
57
|
defaultContextFlashAttention,
|
|
58
|
+
defaultContextKvCacheKeyType,
|
|
59
|
+
defaultContextKvCacheValueType,
|
|
56
60
|
defaultContextSwaFullCache,
|
|
57
61
|
useMmap
|
|
58
62
|
});
|
|
@@ -64,7 +68,7 @@ export async function resolveModelGpuLayersOption(gpuLayers, { ggufInsights, ign
|
|
|
64
68
|
}
|
|
65
69
|
throw new Error(`Invalid gpuLayers value: ${gpuLayers}`);
|
|
66
70
|
}
|
|
67
|
-
function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGpuLayers, maxGpuLayers, defaultContextFlashAttention, defaultContextSwaFullCache, useMmap }) {
|
|
71
|
+
function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGpuLayers, maxGpuLayers, defaultContextFlashAttention, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache, useMmap }) {
|
|
68
72
|
return findBestOption({
|
|
69
73
|
*generator() {
|
|
70
74
|
const minLayers = Math.floor(Math.max(0, minGpuLayers ?? 0));
|
|
@@ -83,6 +87,8 @@ function getBestGpuLayersForFreeVram({ ggufInsights, freeVram, fitContext, minGp
|
|
|
83
87
|
fitContext,
|
|
84
88
|
defaultContextFlashAttention,
|
|
85
89
|
defaultContextSwaFullCache,
|
|
90
|
+
defaultContextKvCacheKeyType,
|
|
91
|
+
defaultContextKvCacheValueType,
|
|
86
92
|
useMmap
|
|
87
93
|
});
|
|
88
94
|
if (layersRequirements == null)
|
|
@@ -130,7 +136,7 @@ function scoreGpuLayersAndContextCombination({ gpuLayers, contextSize }, { total
|
|
|
130
136
|
}
|
|
131
137
|
return scoreGpuLayers() + scoreContextSize();
|
|
132
138
|
}
|
|
133
|
-
function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fitContext, defaultContextFlashAttention = false, defaultContextSwaFullCache = false, useMmap }) {
|
|
139
|
+
function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fitContext, defaultContextFlashAttention = false, defaultContextKvCacheKeyType, defaultContextKvCacheValueType, defaultContextSwaFullCache = false, useMmap }) {
|
|
134
140
|
const modelVram = ggufInsights.estimateModelResourceRequirements({
|
|
135
141
|
gpuLayers,
|
|
136
142
|
useMmap
|
|
@@ -145,6 +151,8 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
|
|
|
145
151
|
sequences: 1,
|
|
146
152
|
isEmbeddingContext: fitContext.embeddingContext ?? false,
|
|
147
153
|
flashAttention: defaultContextFlashAttention,
|
|
154
|
+
kvCacheKeyType: defaultContextKvCacheKeyType,
|
|
155
|
+
kvCacheValueType: defaultContextKvCacheValueType,
|
|
148
156
|
swaFullCache: defaultContextSwaFullCache
|
|
149
157
|
}).gpuVram;
|
|
150
158
|
const totalVram = modelVram + contextVram;
|
|
@@ -162,6 +170,8 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
|
|
|
162
170
|
vram: currentVram - modelVram,
|
|
163
171
|
isEmbeddingContext: fitContext?.embeddingContext ?? false,
|
|
164
172
|
flashAttention: defaultContextFlashAttention,
|
|
173
|
+
kvCacheKeyType: defaultContextKvCacheKeyType,
|
|
174
|
+
kvCacheValueType: defaultContextKvCacheValueType,
|
|
165
175
|
swaFullCache: defaultContextSwaFullCache
|
|
166
176
|
});
|
|
167
177
|
if (maxContext == null || modelVram + maxContext.vram > currentVram)
|
|
@@ -172,7 +182,7 @@ function getVramRequiredForGpuLayers({ gpuLayers, ggufInsights, currentVram, fit
|
|
|
172
182
|
totalVram: modelVram + maxContext.vram
|
|
173
183
|
};
|
|
174
184
|
}
|
|
175
|
-
function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEmbeddingContext, flashAttention, swaFullCache }) {
|
|
185
|
+
function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEmbeddingContext, flashAttention, kvCacheKeyType, kvCacheValueType, swaFullCache }) {
|
|
176
186
|
const maxContextSize = getDefaultModelContextSize({ trainContextSize: ggufInsights.trainContextSize });
|
|
177
187
|
return findMaxValidValue({
|
|
178
188
|
maxValue: maxContextSize,
|
|
@@ -186,6 +196,8 @@ function findMaxPossibleContextSizeForVram({ gpuLayers, ggufInsights, vram, isEm
|
|
|
186
196
|
sequences: 1,
|
|
187
197
|
isEmbeddingContext,
|
|
188
198
|
flashAttention,
|
|
199
|
+
kvCacheKeyType,
|
|
200
|
+
kvCacheValueType,
|
|
189
201
|
swaFullCache
|
|
190
202
|
}).gpuVram;
|
|
191
203
|
if (contextVram <= vram)
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"resolveModelGpuLayersOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveModelGpuLayersOption.ts"],"names":[],"mappings":"AAEA,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,cAAc,EAAC,MAAM,kCAAkC,CAAC;AAChE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,WAAW,EAAC,MAAM,kBAAkB,CAAC;
|
|
1
|
+
{"version":3,"file":"resolveModelGpuLayersOption.js","sourceRoot":"","sources":["../../../../src/gguf/insights/utils/resolveModelGpuLayersOption.ts"],"names":[],"mappings":"AAEA,OAAO,EAAC,uBAAuB,EAAC,MAAM,2CAA2C,CAAC;AAClF,OAAO,EAAC,cAAc,EAAC,MAAM,kCAAkC,CAAC;AAChE,OAAO,EAAC,0BAA0B,EAAE,0BAA0B,EAAC,MAAM,iDAAiD,CAAC;AACvH,OAAO,EAAC,mCAAmC,EAAC,MAAM,oBAAoB,CAAC;AACvE,OAAO,EAAC,WAAW,EAAC,MAAM,kBAAkB,CAAC;AAI7C,MAAM,sCAAsC,GAAG,GAAG,CAAC;AAEnD,MAAM,CAAC,KAAK,UAAU,2BAA2B,CAAC,SAAyC,EAAE,EACzF,YAAY,EAAE,wBAAwB,GAAG,KAAK,EAAE,YAAY,EAAE,oBAAoB,EAClF,QAAQ,EAAE,0BAA0B,EAAE,4BAA4B,EAClE,4BAA4B,EAAE,8BAA8B,EAAE,0BAA0B,EAAE,OAAO,EAOpG;IACG,IAAI,SAAS,IAAI,IAAI;QACjB,SAAS,GAAG,MAAM,CAAC;IAEvB,IAAI,CAAC,0BAA0B;QAC3B,OAAO,CAAC,CAAC;IAEb,IAAI,SAAS,KAAK,KAAK,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QACvD,MAAM,iBAAiB,GAAG,OAAO,SAAS,KAAK,QAAQ;YACnD,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,SAAS,CAAC,CAAC;YAC5D,CAAC,CAAC,YAAY,CAAC,WAAW,CAAC;QAE/B,IAAI,wBAAwB;YACxB,OAAO,iBAAiB,CAAC;QAE7B,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,MAAM,qBAAqB,GAAG,2BAA2B,CAAC;YACtD,SAAS,EAAE,iBAAiB;YAC5B,YAAY;YACZ,WAAW,EAAE,SAAS,CAAC,IAAI;YAC3B,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,IAAI,qBAAqB,IAAI,IAAI;YAC7B,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,iBAAiB,CAAC;IAC7B,CAAC;SAAM,IAAI,SAAS,KAAK,MAAM,IAAI,OAAO,SAAS,KAAK,QAAQ,EAAE,CAAC;QAC/D,IAAI,QAAQ,KAAK,KAAK;YAClB,OAAO,CAAC,CAAC;QAEb,MAAM,SAAS,GAAG,MAAM,YAAY,EAAE,CAAC;QACvC,IAAI,SAAS,CAAC,KAAK,KAAK,CAAC;YACrB,OAAO,CAAC,CAAC;QAEb,IAAI,QAAQ,GAAG,SAAS,CAAC,IAAI,CAAC;QAC9B,IAAI,OAAO,SAAS,KAAK,QAAQ,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,EAAE,CAAC;YAC7E,QAAQ,IAAI,oBAAoB,GAAG,sCAAsC,CAAC;YAE1E,IAAI,QAAQ,GAAG,CAAC;gBACZ,QAAQ,GAAG,CAAC,CAAC;QACrB,CAAC;QAED,MAAM,mBAAmB,GAAG,2BAA2B,CAAC;YACpD,YAAY;YACZ,QAAQ;YACR,UAAU,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACrC,CAAC,CAAC,SAAS,CAAC,UAAU;gBACtB,CAAC,CAAC,SAAS;YACf,YAAY,EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,YAAY,
EAAE,OAAO,SAAS,KAAK,QAAQ;gBACvC,CAAC,CAAC,SAAS,CAAC,GAAG;gBACf,CAAC,CAAC,SAAS;YACf,4BAA4B;YAC5B,4BAA4B;YAC5B,8BAA8B;YAC9B,0BAA0B;YAC1B,OAAO;SACV,CAAC,CAAC;QAEH,MAAM,wBAAwB,GAAG,OAAO,SAAS,KAAK,QAAQ;YAC1D,CAAC,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,GAAG,IAAI,IAAI,IAAI,SAAS,CAAC,UAAU,EAAE,WAAW,IAAI,IAAI,CAAC,CAAC;QAElG,IAAI,CAAC,wBAAwB,IAAI,mBAAmB,IAAI,IAAI,IAAI,wBAAwB;YACpF,MAAM,IAAI,uBAAuB,CAAC,8DAA8D,CAAC,CAAC;QAEtG,OAAO,mBAAmB,IAAI,CAAC,CAAC;IACpC,CAAC;IAED,MAAM,IAAI,KAAK,CAAC,4BAA4B,SAAS,EAAE,CAAC,CAAC;AAC7D,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,YAAY,EACZ,QAAQ,EACR,UAAU,EACV,YAAY,EACZ,YAAY,EACZ,4BAA4B,EAC5B,4BAA4B,EAC5B,8BAA8B,EAC9B,0BAA0B,EAC1B,OAAO,EAYV;IACG,OAAO,cAAc,CAAC;QAClB,CAAC,SAAS;YACN,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,IAAI,CAAC,CAAC,CAAC,CAAC;YAC7D,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,YAAY,CAAC,WAAW,EAAE,YAAY,IAAI,YAAY,CAAC,WAAW,CAAC,CAAC,CAAC;YAE3G,KAAK,IAAI,MAAM,GAAG,SAAS,EAAE,MAAM,IAAI,SAAS,EAAE,MAAM,EAAE,EAAE,CAAC;gBACzD,MAAM;oBACF,SAAS,EAAE,MAAM;iBACpB,CAAC;YACN,CAAC;QACL,CAAC;QACD,KAAK,CAAC,MAAM;YACR,MAAM,kBAAkB,GAAG,2BAA2B,CAAC;gBACnD,SAAS,EAAE,MAAM,CAAC,SAAS;gBAC3B,YAAY;gBACZ,WAAW,EAAE,QAAQ;gBACrB,UAAU;gBACV,4BAA4B;gBAC5B,0BAA0B;gBAC1B,4BAA4B;gBAC5B,8BAA8B;gBAC9B,OAAO;aACV,CAAC,CAAC;YAEH,IAAI,kBAAkB,IAAI,IAAI;gBAC1B,OAAO,IAAI,CAAC;YAEhB,OAAO,mCAAmC,CAAC,EAAC,SAAS,EAAE,MAAM,CAAC,SAAS,EAAE,WAAW,EAAE,kBAAkB,CAAC,WAAW,EAAC,EAAE;gBACnH,cAAc,EAAE,YAAY,CAAC,WAAW;gBACxC,gBAAgB,EAAE,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC;aAClG,CAAC,CAAC;QACP,CAAC;KACJ,CAAC,EAAE,SAAS,IAAI,IAAI,CAAC;AAC1B,CAAC;AAED,SAAS,mCAAmC,CAAC,EAAC,SAAS,EAAE,WAAW,EAA2C,EAAE,EAC7G,cAAc,EAAE,gBAAgB,EAGnC;IACG,SAAS,cAAc;QACnB,OAAO,WAAW,CAAC,SAAS,EAAE,CAAC;gBAC3B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,EAAE;aACb,EAAE;gBACC,KAAK,EAAE,cAAc;gBACrB,MAAM,EAAE,EAAE;gBACV,GAAG,EAAE,cAAc;aACtB,CAAC,CAAC,CAAC;IACR,CAAC;IAED,SAAS,gBAAgB;QACrB,MAAM,mBAAmB,GAAG,SAAS,GAAG,cAAc,CAAC;QAEvD,OAAO,
WAAW,CAAC,WAAW,EAAE,CAAC;gBAC7B,KAAK,EAAE,CAAC;gBACR,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,CAAC;aACZ,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;aAC5C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE;aAC7C,EAAE;gBACC,KAAK,EAAE,IAAI;gBACX,MAAM,EAAE,mBAAmB,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;gBACzC,GAAG,EAAE,IAAI,CAAC,GAAG,CAAC,gBAAgB,EAAE,KAAK,CAAC;aACzC,CAAC,CAAC,CAAC;IACR,CAAC;IAED,OAAO,cAAc,EAAE,GAAG,gBAAgB,EAAE,CAAC;AACjD,CAAC;AAED,SAAS,2BAA2B,CAAC,EACjC,SAAS,EAAE,YAAY,EAAE,WAAW,EAAE,UAAU,EAAE,4BAA4B,GAAG,KAAK,EACtF,4BAA4B,EAAE,8BAA8B,EAAE,0BAA0B,GAAG,KAAK,EAAE,OAAO,EAK5G;IACG,MAAM,SAAS,GAAG,YAAY,CAAC,iCAAiC,CAAC;QAC7D,SAAS;QACT,OAAO;KACV,CAAC,CAAC,OAAO,CAAC;IAEX,IAAI,SAAS,GAAG,WAAW;QACvB,OAAO,IAAI,CAAC;IAEhB,IAAI,UAAU,IAAI,IAAI,IAAI,UAAU,CAAC,WAAW,IAAI,IAAI,EAAE,CAAC;QACvD,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;YACjE,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,UAAU,CAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;YAC1F,cAAc,EAAE,SAAS;YACzB,SAAS,EAAE,CAAC;YACZ,kBAAkB,EAAE,UAAU,CAAC,gBAAgB,IAAI,KAAK;YACxD,cAAc,EAAE,4BAA4B;YAC5C,cAAc,EAAE,4BAA4B;YAC5C,gBAAgB,EAAE,8BAA8B;YAChD,YAAY,EAAE,0BAA0B;SAC3C,CAAC,CAAC,OAAO,CAAC;QAEX,MAAM,SAAS,GAAG,SAAS,GAAG,WAAW,CAAC;QAC1C,IAAI,SAAS,GAAG,WAAW;YACvB,OAAO,IAAI,CAAC;QAEhB,OAAO;YACH,WAAW,EAAE,UAAU,CAAC,WAAW;YACnC,WAAW;YACX,SAAS;SACZ,CAAC;IACN,CAAC;IAED,MAAM,UAAU,GAAG,iCAAiC,CAAC;QACjD,SAAS;QACT,YAAY;QACZ,IAAI,EAAE,WAAW,GAAG,SAAS;QAC7B,kBAAkB,EAAE,UAAU,EAAE,gBAAgB,IAAI,KAAK;QACzD,cAAc,EAAE,4BAA4B;QAC5C,cAAc,EAAE,4BAA4B;QAC5C,gBAAgB,EAAE,8BAA8B;QAChD,YAAY,EAAE,0BAA0B;KAC3C,CAAC,CAAC;IAEH,IAAI,UAAU,IAAI,IAAI,IAAI,SAAS,GAAG,UAAU,CAAC,IAAI,GAAG,WAAW;QAC/D,OAAO,IAAI,CAAC;IAEhB,OAAO;QACH,WAAW,EAAE,UAAU,CAAC,WAAW;QACnC,WAAW,EAAE,UAAU,CAAC,IAAI;QAC5B,SAAS,EAAE,SAAS,GAAG,UAAU,CAAC,IAAI;KACzC,CAAC;AACN,CAAC;AAED,SAAS,iCAAiC,CAAC,EACvC,SAAS,EAAE,YAAY,EAAE,IAAI,EAAE,kBAAkB,EAAE,cAAc,EAAE,
cAAc,EAAE,gBAAgB,EAAE,YAAY,EAIpH;IACG,MAAM,cAAc,GAAG,0BAA0B,CAAC,EAAC,gBAAgB,EAAE,YAAY,CAAC,gBAAgB,EAAC,CAAC,CAAC;IAErG,OAAO,iBAAiB,CAAC;QACrB,QAAQ,EAAE,cAAc;QACxB,QAAQ,EAAE,mCAAmC;QAC7C,OAAO,EAAE,CAAC;QACV,IAAI,CAAC,WAAW;YACZ,MAAM,WAAW,GAAG,YAAY,CAAC,mCAAmC,CAAC;gBACjE,WAAW;gBACX,SAAS,EAAE,0BAA0B,CAAC,EAAC,WAAW,EAAE,SAAS,EAAE,CAAC,EAAC,CAAC;gBAClE,cAAc,EAAE,SAAS;gBACzB,SAAS,EAAE,CAAC;gBACZ,kBAAkB;gBAClB,cAAc;gBACd,cAAc;gBACd,gBAAgB;gBAChB,YAAY;aACf,CAAC,CAAC,OAAO,CAAC;YAEX,IAAI,WAAW,IAAI,IAAI;gBACnB,OAAO;oBACH,WAAW;oBACX,IAAI,EAAE,WAAW;iBACpB,CAAC;YAEN,OAAO,IAAI,CAAC;QAChB,CAAC;KACJ,CAAC,CAAC;AACP,CAAC;AAED,SAAS,iBAAiB,CAAI,EAC1B,QAAQ,EACR,QAAQ,EACR,OAAO,GAAG,CAAC,EACX,IAAI,EAMP;IACG,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,QAAQ,GAAG,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;IACrE,IAAI,SAAS,GAAsC,IAAI,CAAC;IAExD,KAAK,IAAI,KAAK,GAAG,QAAQ,EAAE,KAAK,IAAI,QAAQ,GAAG,CAAC;QAC5C,MAAM,MAAM,GAAa,CAAC,SAAS,IAAI,IAAI,IAAI,KAAK,KAAK,SAAS,CAAC,KAAK,CAAC;YACrE,CAAC,CAAC,SAAS,CAAC,MAAM;YAClB,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAElB,IAAI,MAAM,IAAI,IAAI,EAAE,CAAC;YACjB,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,IAAI,SAAS,CAAC,KAAK,EAAE,CAAC;gBAChD,SAAS,GAAG,EAAC,KAAK,EAAE,KAAK,EAAE,MAAM,EAAE,MAAM,EAAC,CAAC;gBAE3C,IAAI,IAAI,KAAK,CAAC,OAAO;oBACjB,MAAM;qBACL,IAAI,IAAI,GAAG,CAAC;oBACb,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;YACxD,CAAC;QACL,CAAC;aAAM,IAAI,SAAS,IAAI,IAAI,IAAI,KAAK,GAAG,SAAS,CAAC,KAAK,EAAE,CAAC;YACtD,KAAK,GAAG,SAAS,CAAC,KAAK,CAAC;YACxB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACzD,SAAS;QACb,CAAC;aAAM,IAAI,IAAI,GAAG,CAAC;YACf,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC,CAAC;QAEpD,IAAI,KAAK,KAAK,QAAQ,IAAI,IAAI,KAAK,CAAC,OAAO;YACvC,MAAM;QAEV,KAAK,IAAI,IAAI,CAAC;QACd,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YACnB,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IA
AI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC7D,CAAC;aAAM,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;YAC1B,KAAK,GAAG,QAAQ,CAAC;YACjB,IAAI,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAC9D,CAAC;IACL,CAAC;IAED,IAAI,SAAS,IAAI,IAAI;QACjB,OAAO,SAAS,CAAC,MAAM,CAAC;IAE5B,OAAO,IAAI,CAAC;AAChB,CAAC"}
|
|
@@ -18,6 +18,7 @@ export declare const enum GgufArchitectureType {
|
|
|
18
18
|
neoBert = "neo-bert",
|
|
19
19
|
jinaBertV2 = "jina-bert-v2",
|
|
20
20
|
jinaBertV3 = "jina-bert-v3",
|
|
21
|
+
eurobert = "eurobert",
|
|
21
22
|
bloom = "bloom",
|
|
22
23
|
stablelm = "stablelm",
|
|
23
24
|
qwen = "qwen",
|
|
@@ -71,6 +72,7 @@ export declare const enum GgufArchitectureType {
|
|
|
71
72
|
t5 = "t5",
|
|
72
73
|
t5encoder = "t5encoder",
|
|
73
74
|
jais = "jais",
|
|
75
|
+
jais2 = "jais2",
|
|
74
76
|
nemotron = "nemotron",
|
|
75
77
|
nemotronH = "nemotron_h",
|
|
76
78
|
nemotronHMoe = "nemotron_h_moe",
|
|
@@ -112,10 +114,13 @@ export declare const enum GgufArchitectureType {
|
|
|
112
114
|
rnd1 = "rnd1",
|
|
113
115
|
panguEmbedded = "pangu-embedded",
|
|
114
116
|
mistral3 = "mistral3",
|
|
117
|
+
mistral4 = "mistral4",
|
|
118
|
+
paddleocr = "paddleocr",
|
|
115
119
|
mimo2 = "mimo2",
|
|
116
120
|
step35 = "step35",
|
|
117
121
|
llamaEmbed = "llama-embed",
|
|
118
122
|
maincoder = "maincoder",
|
|
123
|
+
kimiLinear = "kimi-linear",
|
|
119
124
|
clip = "clip",
|
|
120
125
|
unknown = "(unknown)"
|
|
121
126
|
}
|
|
@@ -176,7 +181,8 @@ export declare enum GgufFileType {
|
|
|
176
181
|
MOSTLY_Q4_0_8_8 = 35,// deprecated
|
|
177
182
|
MOSTLY_TQ1_0 = 36,
|
|
178
183
|
MOSTLY_TQ2_0 = 37,
|
|
179
|
-
MOSTLY_MXFP4_MOE = 38
|
|
184
|
+
MOSTLY_MXFP4_MOE = 38,
|
|
185
|
+
MOSTLY_NVFP4 = 39
|
|
180
186
|
}
|
|
181
187
|
export type GgufMetadataGeneral<A extends GgufArchitectureType = GgufArchitectureType> = {
|
|
182
188
|
readonly architecture: A;
|
|
@@ -268,7 +274,7 @@ export declare const enum GgufMetadataTokenizerTokenType {
|
|
|
268
274
|
export type GgufMetadataTokenizer = {
|
|
269
275
|
readonly ggml: {
|
|
270
276
|
readonly model: "no_vocab" | "none" | "llama" | "gpt2" | "bert" | "rwkv" | "t5" | "plamo2" | string;
|
|
271
|
-
readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" | "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" | "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" | "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" | "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | "a.x-4.0" | "mellum" | string;
|
|
277
|
+
readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" | "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" | "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" | "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" | "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | "a.x-4.0" | "mellum" | "modern-bert" | "roberta-bpe" | "deepseek-r1-qwen" | "kormo" | "qwen35" | string;
|
|
272
278
|
readonly tokens: readonly string[];
|
|
273
279
|
readonly token_type: GgufMetadataTokenizerTokenType[];
|
|
274
280
|
readonly token_type_count?: number;
|
|
@@ -319,6 +325,7 @@ export type GgufMetadataDefaultArchitectureType = {
|
|
|
319
325
|
readonly context_length?: number;
|
|
320
326
|
readonly embedding_length?: number;
|
|
321
327
|
readonly block_count?: number;
|
|
328
|
+
readonly full_attention_interval?: number;
|
|
322
329
|
readonly feed_forward_length?: number;
|
|
323
330
|
readonly use_parallel_residual?: boolean;
|
|
324
331
|
readonly tensor_data_layout?: string;
|
|
@@ -337,11 +344,13 @@ export type GgufMetadataDefaultArchitectureType = {
|
|
|
337
344
|
readonly key_length?: number;
|
|
338
345
|
readonly value_length?: number;
|
|
339
346
|
readonly sliding_window?: number;
|
|
347
|
+
readonly sliding_window_pattern?: number | number[];
|
|
340
348
|
readonly causal?: boolean;
|
|
341
349
|
};
|
|
342
350
|
readonly rope?: {
|
|
343
351
|
readonly dimension_count?: number;
|
|
344
352
|
readonly freq_base?: number;
|
|
353
|
+
readonly freq_base_swa?: number;
|
|
345
354
|
readonly scale_linear?: number;
|
|
346
355
|
readonly scaling?: {
|
|
347
356
|
readonly type?: "none" | "linear" | "yarn" | string;
|
|
@@ -355,6 +364,13 @@ export type GgufMetadataDefaultArchitectureType = {
|
|
|
355
364
|
readonly inner_size?: number;
|
|
356
365
|
readonly state_size?: number;
|
|
357
366
|
readonly time_step_rank?: number;
|
|
367
|
+
readonly group_count?: number;
|
|
368
|
+
};
|
|
369
|
+
readonly kda?: {
|
|
370
|
+
readonly head_dim?: number;
|
|
371
|
+
};
|
|
372
|
+
readonly shortconv?: {
|
|
373
|
+
readonly l_cache?: number;
|
|
358
374
|
};
|
|
359
375
|
readonly wkv?: {
|
|
360
376
|
readonly head_size?: number;
|
|
@@ -19,6 +19,7 @@ export var GgufArchitectureType;
|
|
|
19
19
|
GgufArchitectureType["neoBert"] = "neo-bert";
|
|
20
20
|
GgufArchitectureType["jinaBertV2"] = "jina-bert-v2";
|
|
21
21
|
GgufArchitectureType["jinaBertV3"] = "jina-bert-v3";
|
|
22
|
+
GgufArchitectureType["eurobert"] = "eurobert";
|
|
22
23
|
GgufArchitectureType["bloom"] = "bloom";
|
|
23
24
|
GgufArchitectureType["stablelm"] = "stablelm";
|
|
24
25
|
GgufArchitectureType["qwen"] = "qwen";
|
|
@@ -72,6 +73,7 @@ export var GgufArchitectureType;
|
|
|
72
73
|
GgufArchitectureType["t5"] = "t5";
|
|
73
74
|
GgufArchitectureType["t5encoder"] = "t5encoder";
|
|
74
75
|
GgufArchitectureType["jais"] = "jais";
|
|
76
|
+
GgufArchitectureType["jais2"] = "jais2";
|
|
75
77
|
GgufArchitectureType["nemotron"] = "nemotron";
|
|
76
78
|
GgufArchitectureType["nemotronH"] = "nemotron_h";
|
|
77
79
|
GgufArchitectureType["nemotronHMoe"] = "nemotron_h_moe";
|
|
@@ -113,10 +115,13 @@ export var GgufArchitectureType;
|
|
|
113
115
|
GgufArchitectureType["rnd1"] = "rnd1";
|
|
114
116
|
GgufArchitectureType["panguEmbedded"] = "pangu-embedded";
|
|
115
117
|
GgufArchitectureType["mistral3"] = "mistral3";
|
|
118
|
+
GgufArchitectureType["mistral4"] = "mistral4";
|
|
119
|
+
GgufArchitectureType["paddleocr"] = "paddleocr";
|
|
116
120
|
GgufArchitectureType["mimo2"] = "mimo2";
|
|
117
121
|
GgufArchitectureType["step35"] = "step35";
|
|
118
122
|
GgufArchitectureType["llamaEmbed"] = "llama-embed";
|
|
119
123
|
GgufArchitectureType["maincoder"] = "maincoder";
|
|
124
|
+
GgufArchitectureType["kimiLinear"] = "kimi-linear";
|
|
120
125
|
GgufArchitectureType["clip"] = "clip";
|
|
121
126
|
GgufArchitectureType["unknown"] = "(unknown)";
|
|
122
127
|
})(GgufArchitectureType || (GgufArchitectureType = {}));
|
|
@@ -162,6 +167,7 @@ export var GgufFileType;
|
|
|
162
167
|
GgufFileType[GgufFileType["MOSTLY_TQ1_0"] = 36] = "MOSTLY_TQ1_0";
|
|
163
168
|
GgufFileType[GgufFileType["MOSTLY_TQ2_0"] = 37] = "MOSTLY_TQ2_0";
|
|
164
169
|
GgufFileType[GgufFileType["MOSTLY_MXFP4_MOE"] = 38] = "MOSTLY_MXFP4_MOE";
|
|
170
|
+
GgufFileType[GgufFileType["MOSTLY_NVFP4"] = 39] = "MOSTLY_NVFP4";
|
|
165
171
|
})(GgufFileType || (GgufFileType = {}));
|
|
166
172
|
export var GgufMetadataTokenizerTokenType;
|
|
167
173
|
(function (GgufMetadataTokenizerTokenType) {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,
|
|
1
|
+
{"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,oBA6HjB;AA7HD,WAAkB,oBAAoB;IAClC,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,mCAAW,CAAA;IACX,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,kDAA0B,CAAA;IAC1B,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,4CAAoB,CAAA;IACpB,mDAA2B,CAAA;IAC3B,mDAA2B,CAAA;IAC3B,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,0DAAkC,CAAA;IAClC,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,yCAAiB,CAAA;IACjB,8CAAsB,CAAA;IACtB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,2CAAmB,CAAA;IACnB,yCAAiB,CAAA;IACjB,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,yCAAiB,CAAA;IACjB,iCAAS,CAAA;IACT,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,gDAAwB,CAAA;IACxB,uDAA+B,CAAA;IAC/B,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,uCAAe,CAAA;IACf,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,2CAAmB,CAAA;IACnB,iDAAyB,CAAA;IACzB,uDAA+B,CAAA;IAC/B,+CAAuB,CAAA;IACvB,4DAAoC,CAAA;IACpC,mCAAW,CAAA;IACX,iDAAyB,CAAA;IACzB,mDAA2B,CAAA;IAC3B,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,oDAA4B,CAAA;IAC5B,kDAA0B,CAAA;IAC1B,sDAA8B,CAAA;IAC9B,2CAAmB,CAAA;IACnB,0CAAkB,CAAA;IAClB,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,uCAAe,CAAA;IACf,q
DAA6B,CAAA;IAC7B,uCAAe,CAAA;IACf,8CAAsB,CAAA;IACtB,4CAAoB,CAAA;IACpB,6CAAqB,CAAA;IACrB,2CAAmB,CAAA;IACnB,gDAAwB,CAAA;IACxB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,wDAAgC,CAAA;IAChC,6CAAqB,CAAA;IACrB,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,kDAA0B,CAAA;IAC1B,+CAAuB,CAAA;IACvB,kDAA0B,CAAA;IAC1B,qCAAa,CAAA;IACb,6CAAqB,CAAA;AACzB,CAAC,EA7HiB,oBAAoB,KAApB,oBAAoB,QA6HrC;AA+BD,yEAAyE;AACzE,MAAM,CAAN,IAAY,YAyCX;AAzCD,WAAY,YAAY;IACpB,qDAAW,CAAA;IACX,2DAAc,CAAA;IACd,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,+EAAwB,CAAA;IACxB,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,8DAAgB,CAAA;IAChB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,8DAAgB,CAAA;IAChB,oEAAmB,CAAA;IACnB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,oEAAmB,CAAA;IACnB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,8DAAgB,CAAA;IAChB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,wEAAqB,CAAA;IACrB,gEAAiB,CAAA;AACrB,CAAC,EAzCW,YAAY,KAAZ,YAAY,QAyCvB;AA2FD,MAAM,CAAN,IAAkB,8BAQjB;AARD,WAAkB,8BAA8B;IAC5C,6FAAa,CAAA;IACb,uFAAU,CAAA;IACV,yFAAW,CAAA;IACX,yFAAW,CAAA;IACX,iGAAe,CAAA;IACf,uFAAU,CAAA;IACV,mFAAQ,CAAA;AACZ,CAAC,EARiB,8BAA8B,KAA9B,8BAA8B,QAQ/C;AAkDD,MAAM,CAAN,IAAkB,mCAOjB;AAPD,WAAkB,mCAAmC;IACjD,4GAAgB,CAAA;IAChB,6FAAQ,CAAA;IACR,6FAAQ,CAAA;IACR,2FAAO,CAAA;IACP,6FAAQ,CAAA;IACR,6FAAQ,CAAA;AACZ,CAAC,EAPiB,mCAAmC,KAAnC,mCAAmC,QAOpD;AAgOD,MAAM,UAAU,gCAAgC,CAC5C,QAAsB,EAAE,IAAO;IAE/B,OAAO,QAAQ,EAAE,OAAO,EAAE,YAAY,KAAK,IAAI,CAAC;AACpD,CAAC"}
|
|
@@ -17,7 +17,7 @@ export type GgufTensorInfo = {
|
|
|
17
17
|
*/
|
|
18
18
|
readonly filePart: number;
|
|
19
19
|
};
|
|
20
|
-
export declare
|
|
20
|
+
export declare enum GgmlType {
|
|
21
21
|
F32 = 0,
|
|
22
22
|
F16 = 1,
|
|
23
23
|
Q4_0 = 2,
|
|
@@ -57,5 +57,7 @@ export declare const enum GgmlType {
|
|
|
57
57
|
IQ4_NL_4_4 = 36,
|
|
58
58
|
IQ4_NL_4_8 = 37,
|
|
59
59
|
IQ4_NL_8_8 = 38,
|
|
60
|
-
MXFP4 = 39
|
|
60
|
+
MXFP4 = 39,// MXFP4 (1 block)
|
|
61
|
+
NVFP4 = 40
|
|
61
62
|
}
|
|
63
|
+
/**
 * Resolve a GGML type option, given either as a `GgmlType` member name or as a `GgmlType` value.
 *
 * Returns `undefined` when `option` is `null`/`undefined`, or when it is not an own key of the `GgmlType` enum object.
 */
export declare function resolveGgmlTypeOption(option?: keyof typeof GgmlType | GgmlType): GgmlType | undefined;
|
|
@@ -39,6 +39,16 @@ export var GgmlType;
|
|
|
39
39
|
GgmlType[GgmlType["IQ4_NL_4_4"] = 36] = "IQ4_NL_4_4";
|
|
40
40
|
GgmlType[GgmlType["IQ4_NL_4_8"] = 37] = "IQ4_NL_4_8";
|
|
41
41
|
GgmlType[GgmlType["IQ4_NL_8_8"] = 38] = "IQ4_NL_8_8";
|
|
42
|
-
GgmlType[GgmlType["MXFP4"] = 39] = "MXFP4";
|
|
42
|
+
GgmlType[GgmlType["MXFP4"] = 39] = "MXFP4";
|
|
43
|
+
GgmlType[GgmlType["NVFP4"] = 40] = "NVFP4"; // NVFP4 (4 blocks, E4M3 scale)
|
|
43
44
|
})(GgmlType || (GgmlType = {}));
|
|
45
|
+
/**
 * Resolve a GGML type option to a numeric `GgmlType` enum value.
 *
 * The option may be given either as an enum value (a number) or as an enum member name (a string).
 * `GgmlType` is a numeric enum, so the compiled enum object holds both directions of the mapping:
 * `name -> value` and `value -> name`. Both lookups below check the type of the mapped entry so that
 * only the intended direction is accepted.
 *
 * @param {string | number | null | undefined} [option] - an enum member name or an enum value
 * @returns {number | undefined} the matching enum value, or `undefined` when `option` is nullish
 * or does not identify an enum member
 */
export function resolveGgmlTypeOption(option) {
    if (option == null)
        return undefined;

    if (typeof option === "number") {
        // a valid enum value is a reverse-mapping key, which maps to the member's name (a string)
        if (Object.hasOwn(GgmlType, option) && typeof GgmlType[option] === "string")
            return option;

        return undefined;
    }

    if (typeof option === "string" && Object.hasOwn(GgmlType, option)) {
        const resolvedValue = GgmlType[option];

        // reverse-mapping keys such as "0" map to a name string rather than to an enum value,
        // so they must not be returned as if they were a `GgmlType`
        if (typeof resolvedValue === "number")
            return resolvedValue;
    }

    return undefined;
}
|
|
44
54
|
//# sourceMappingURL=GgufTensorInfoTypes.js.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"GgufTensorInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufTensorInfoTypes.ts"],"names":[],"mappings":"AAsBA,MAAM,CAAN,
|
|
1
|
+
{"version":3,"file":"GgufTensorInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufTensorInfoTypes.ts"],"names":[],"mappings":"AAsBA,MAAM,CAAN,IAAY,QA0CX;AA1CD,WAAY,QAAQ;IAChB,qCAAO,CAAA;IACP,qCAAO,CAAA;IACP,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,8CAAY,CAAA;IACZ,4CAAW,CAAA;IACX,8CAAY,CAAA;IACZ,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,oCAAO,CAAA;IACP,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,0CAAU,CAAA;IACV,wCAAS,CAAA;IACT,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,gDAAa,CAAA;IACb,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,oDAAe,CAAA;IACf,0CAAU,CAAA;IACV,0CAAU,CAAA,CAAC,+BAA+B;AAC9C,CAAC,EA1CW,QAAQ,KAAR,QAAQ,QA0CnB;AAED,MAAM,UAAU,qBAAqB,CAAC,MAAyC;IAC3E,IAAI,MAAM,IAAI,IAAI;QACd,OAAO,SAAS,CAAC;IAErB,IAAI,OAAO,MAAM,KAAK,QAAQ,IAAI,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC;QAC7D,OAAO,MAAkB,CAAC;SACzB,IAAI,OAAO,MAAM,KAAK,QAAQ,IAAI,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC;QAClE,OAAO,QAAQ,CAAC,MAA+B,CAAC,CAAC;IAErD,OAAO,SAAS,CAAC;AACrB,CAAC"}
|
|
@@ -1,4 +1,4 @@
|
|
|
1
1
|
/**
|
|
2
2
|
* Convert a GGUF file type number to its corresponding type name
|
|
3
3
|
*/
|
|
4
|
-
export declare function getGgufFileTypeName(fileType?: number): "ALL_F32" | "MOSTLY_F16" | "MOSTLY_Q4_0" | "MOSTLY_Q4_1" | "MOSTLY_Q4_1_SOME_F16" | "MOSTLY_Q4_2" | "MOSTLY_Q4_3" | "MOSTLY_Q8_0" | "MOSTLY_Q5_0" | "MOSTLY_Q5_1" | "MOSTLY_Q2_K" | "MOSTLY_Q3_K_S" | "MOSTLY_Q3_K_M" | "MOSTLY_Q3_K_L" | "MOSTLY_Q4_K_S" | "MOSTLY_Q4_K_M" | "MOSTLY_Q5_K_S" | "MOSTLY_Q5_K_M" | "MOSTLY_Q6_K" | "MOSTLY_IQ2_XXS" | "MOSTLY_IQ2_XS" | "MOSTLY_Q2_K_S" | "MOSTLY_IQ3_XS" | "MOSTLY_IQ3_XXS" | "MOSTLY_IQ1_S" | "MOSTLY_IQ4_NL" | "MOSTLY_IQ3_S" | "MOSTLY_IQ3_M" | "MOSTLY_IQ2_S" | "MOSTLY_IQ2_M" | "MOSTLY_IQ4_XS" | "MOSTLY_IQ1_M" | "MOSTLY_BF16" | "MOSTLY_Q4_0_4_4" | "MOSTLY_Q4_0_4_8" | "MOSTLY_Q4_0_8_8" | "MOSTLY_TQ1_0" | "MOSTLY_TQ2_0" | "MOSTLY_MXFP4_MOE" | undefined;
|
|
4
|
+
export declare function getGgufFileTypeName(fileType?: number): "ALL_F32" | "MOSTLY_F16" | "MOSTLY_Q4_0" | "MOSTLY_Q4_1" | "MOSTLY_Q4_1_SOME_F16" | "MOSTLY_Q4_2" | "MOSTLY_Q4_3" | "MOSTLY_Q8_0" | "MOSTLY_Q5_0" | "MOSTLY_Q5_1" | "MOSTLY_Q2_K" | "MOSTLY_Q3_K_S" | "MOSTLY_Q3_K_M" | "MOSTLY_Q3_K_L" | "MOSTLY_Q4_K_S" | "MOSTLY_Q4_K_M" | "MOSTLY_Q5_K_S" | "MOSTLY_Q5_K_M" | "MOSTLY_Q6_K" | "MOSTLY_IQ2_XXS" | "MOSTLY_IQ2_XS" | "MOSTLY_Q2_K_S" | "MOSTLY_IQ3_XS" | "MOSTLY_IQ3_XXS" | "MOSTLY_IQ1_S" | "MOSTLY_IQ4_NL" | "MOSTLY_IQ3_S" | "MOSTLY_IQ3_M" | "MOSTLY_IQ2_S" | "MOSTLY_IQ2_M" | "MOSTLY_IQ4_XS" | "MOSTLY_IQ1_M" | "MOSTLY_BF16" | "MOSTLY_Q4_0_4_4" | "MOSTLY_Q4_0_4_8" | "MOSTLY_Q4_0_8_8" | "MOSTLY_TQ1_0" | "MOSTLY_TQ2_0" | "MOSTLY_MXFP4_MOE" | "MOSTLY_NVFP4" | undefined;
|
|
@@ -3,6 +3,7 @@ export const ggufQuantNames = new Map([
|
|
|
3
3
|
["Q4_0", GgufFileType.MOSTLY_Q4_0],
|
|
4
4
|
["Q4_1", GgufFileType.MOSTLY_Q4_1],
|
|
5
5
|
["MXFP4", GgufFileType.MOSTLY_MXFP4_MOE],
|
|
6
|
+
["NVFP4", GgufFileType.MOSTLY_MXFP4_MOE],
|
|
6
7
|
["Q5_0", GgufFileType.MOSTLY_Q5_0],
|
|
7
8
|
["Q5_1", GgufFileType.MOSTLY_Q5_1],
|
|
8
9
|
["IQ2_XXS", GgufFileType.MOSTLY_IQ2_XXS],
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"ggufQuantNames.js","sourceRoot":"","sources":["../../../src/gguf/utils/ggufQuantNames.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,YAAY,EAAC,MAAM,+BAA+B,CAAC;AAE3D,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,GAAG,CAAuB;IACxD,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,UAAU,CAAC;IAChC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,OAAO,CAAC;IAC7B,CAAC,MAAM,EAAE,YAAY,CAAC,OAAO,CAAC;CACjC,CAAC,CAAC"}
|
|
1
|
+
{"version":3,"file":"ggufQuantNames.js","sourceRoot":"","sources":["../../../src/gguf/utils/ggufQuantNames.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,YAAY,EAAC,MAAM,+BAA+B,CAAC;AAE3D,MAAM,CAAC,MAAM,cAAc,GAAG,IAAI,GAAG,CAAuB;IACxD,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,gBAAgB,CAAC;IACxC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,SAAS,EAAE,YAAY,CAAC,cAAc,CAAC;IACxC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,OAAO,EAAE,YAAY,CAAC,YAAY,CAAC;IACpC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,aAAa,CAAC;IACpC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,QAAQ,EAAE,YAAY,CAAC,aAAa,CAAC;IACtC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,UAAU,CAAC;IAChC,CAAC,MAAM,EAAE,YAAY,CAAC,WAAW,CAAC;IAClC,CAAC,KAAK,EAAE,YAAY,CAAC,OAAO,CAAC;IAC7B,CAAC,MAAM,EAAE,YAAY,CAAC,OAAO,CAAC;CACjC,CAAC,CAAC"}
|