node-llama-cpp 3.0.0-beta.9 → 3.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +42 -27
- package/bins/_linux-arm64.moved.txt +1 -0
- package/bins/_linux-armv7l.moved.txt +1 -0
- package/bins/_linux-x64-cuda.moved.txt +1 -0
- package/bins/_linux-x64-vulkan.moved.txt +1 -0
- package/bins/_linux-x64.moved.txt +1 -0
- package/bins/_mac-arm64-metal.moved.txt +1 -0
- package/bins/_mac-x64.moved.txt +1 -0
- package/bins/_win-arm64.moved.txt +1 -0
- package/bins/_win-x64-cuda.moved.txt +1 -0
- package/bins/_win-x64-vulkan.moved.txt +1 -0
- package/bins/_win-x64.moved.txt +1 -0
- package/dist/ChatWrapper.d.ts +19 -39
- package/dist/ChatWrapper.js +129 -72
- package/dist/ChatWrapper.js.map +1 -1
- package/dist/apiDocsIndex.d.ts +1 -0
- package/dist/apiDocsIndex.js +7 -0
- package/dist/apiDocsIndex.js.map +1 -0
- package/dist/bindings/AddonTypes.d.ts +88 -20
- package/dist/bindings/Llama.d.ts +43 -3
- package/dist/bindings/Llama.js +193 -23
- package/dist/bindings/Llama.js.map +1 -1
- package/dist/bindings/consts.d.ts +2 -0
- package/dist/bindings/consts.js +13 -0
- package/dist/bindings/consts.js.map +1 -0
- package/dist/bindings/getLlama.d.ts +123 -18
- package/dist/bindings/getLlama.js +264 -75
- package/dist/bindings/getLlama.js.map +1 -1
- package/dist/bindings/types.d.ts +29 -5
- package/dist/bindings/types.js +51 -2
- package/dist/bindings/types.js.map +1 -1
- package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
- package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
- package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
- package/dist/bindings/utils/asyncEvery.d.ts +5 -0
- package/dist/bindings/utils/asyncEvery.js +15 -0
- package/dist/bindings/utils/asyncEvery.js.map +1 -0
- package/dist/bindings/utils/asyncSome.d.ts +5 -0
- package/dist/bindings/utils/asyncSome.js +27 -0
- package/dist/bindings/utils/asyncSome.js.map +1 -0
- package/dist/bindings/utils/clearAllLocalBuilds.js.map +1 -1
- package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +1 -1
- package/dist/bindings/utils/cloneLlamaCppRepo.js +39 -28
- package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -1
- package/dist/bindings/utils/compileLLamaCpp.d.ts +11 -3
- package/dist/bindings/utils/compileLLamaCpp.js +250 -81
- package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
- package/dist/bindings/utils/detectAvailableComputeLayers.d.ts +14 -0
- package/dist/bindings/utils/detectAvailableComputeLayers.js +305 -0
- package/dist/bindings/utils/detectAvailableComputeLayers.js.map +1 -0
- package/dist/bindings/utils/detectGlibc.d.ts +4 -0
- package/dist/bindings/utils/detectGlibc.js +46 -0
- package/dist/bindings/utils/detectGlibc.js.map +1 -0
- package/dist/bindings/utils/getBestComputeLayersAvailable.d.ts +9 -0
- package/dist/bindings/utils/getBestComputeLayersAvailable.js +29 -0
- package/dist/bindings/utils/getBestComputeLayersAvailable.js.map +1 -0
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js +14 -6
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js.map +1 -1
- package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js.map +1 -1
- package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +12 -0
- package/dist/bindings/utils/getGpuTypesToUseForOption.js +39 -0
- package/dist/bindings/utils/getGpuTypesToUseForOption.js.map +1 -0
- package/dist/bindings/utils/getLinuxDistroInfo.d.ts +9 -0
- package/dist/bindings/utils/getLinuxDistroInfo.js +46 -0
- package/dist/bindings/utils/getLinuxDistroInfo.js.map +1 -0
- package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
- package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
- package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
- package/dist/bindings/utils/getPlatform.js.map +1 -1
- package/dist/bindings/utils/getPlatformInfo.d.ts +5 -0
- package/dist/bindings/utils/getPlatformInfo.js +28 -0
- package/dist/bindings/utils/getPlatformInfo.js.map +1 -0
- package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.d.ts +3 -0
- package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js +27 -0
- package/dist/bindings/utils/hasBuildingFromSourceDependenciesInstalled.js.map +1 -0
- package/dist/bindings/utils/hasFileInPath.d.ts +2 -0
- package/dist/bindings/utils/hasFileInPath.js +34 -0
- package/dist/bindings/utils/hasFileInPath.js.map +1 -0
- package/dist/bindings/utils/lastBuildInfo.js.map +1 -1
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.d.ts +1 -1
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.js +3 -9
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.js.map +1 -1
- package/dist/bindings/utils/logDistroInstallInstruction.d.ts +14 -0
- package/dist/bindings/utils/logDistroInstallInstruction.js +48 -0
- package/dist/bindings/utils/logDistroInstallInstruction.js.map +1 -0
- package/dist/bindings/utils/resolveCustomCmakeOptions.js +26 -26
- package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -1
- package/dist/bindings/utils/testBindingBinary.d.ts +1 -0
- package/dist/bindings/utils/testBindingBinary.js +100 -0
- package/dist/bindings/utils/testBindingBinary.js.map +1 -0
- package/dist/bindings/utils/testCmakeBinary.d.ts +5 -0
- package/dist/bindings/utils/testCmakeBinary.js +32 -0
- package/dist/bindings/utils/testCmakeBinary.js.map +1 -0
- package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
- package/dist/chatWrappers/AlpacaChatWrapper.js +10 -2
- package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/ChatMLChatWrapper.d.ts +2 -14
- package/dist/chatWrappers/ChatMLChatWrapper.js +23 -21
- package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FalconChatWrapper.d.ts +4 -10
- package/dist/chatWrappers/FalconChatWrapper.js +39 -21
- package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FunctionaryChatWrapper.d.ts +8 -32
- package/dist/chatWrappers/FunctionaryChatWrapper.js +514 -118
- package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
- package/dist/chatWrappers/GemmaChatWrapper.d.ts +7 -0
- package/dist/chatWrappers/GemmaChatWrapper.js +96 -0
- package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -0
- package/dist/chatWrappers/GeneralChatWrapper.d.ts +4 -10
- package/dist/chatWrappers/GeneralChatWrapper.js +46 -22
- package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
- package/dist/chatWrappers/Llama2ChatWrapper.d.ts +12 -0
- package/dist/chatWrappers/{LlamaChatWrapper.js → Llama2ChatWrapper.js} +37 -20
- package/dist/chatWrappers/Llama2ChatWrapper.js.map +1 -0
- package/dist/chatWrappers/Llama3ChatWrapper.d.ts +16 -0
- package/dist/chatWrappers/Llama3ChatWrapper.js +173 -0
- package/dist/chatWrappers/Llama3ChatWrapper.js.map +1 -0
- package/dist/chatWrappers/Llama3_1ChatWrapper.d.ts +35 -0
- package/dist/chatWrappers/Llama3_1ChatWrapper.js +277 -0
- package/dist/chatWrappers/Llama3_1ChatWrapper.js.map +1 -0
- package/dist/chatWrappers/MistralChatWrapper.d.ts +15 -0
- package/dist/chatWrappers/MistralChatWrapper.js +169 -0
- package/dist/chatWrappers/MistralChatWrapper.js.map +1 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +100 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +409 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
- package/dist/chatWrappers/generic/TemplateChatWrapper.d.ts +60 -0
- package/dist/chatWrappers/generic/TemplateChatWrapper.js +204 -0
- package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +23 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
- package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.d.ts +57 -0
- package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js +119 -0
- package/dist/chatWrappers/utils/ChatModelFunctionsDocumentationGenerator.js.map +1 -0
- package/dist/chatWrappers/utils/chunkChatItems.d.ts +10 -0
- package/dist/chatWrappers/utils/chunkChatItems.js +44 -0
- package/dist/chatWrappers/utils/chunkChatItems.js.map +1 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +221 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
- package/dist/chatWrappers/utils/jsonDumps.d.ts +7 -0
- package/dist/chatWrappers/utils/jsonDumps.js +18 -0
- package/dist/chatWrappers/utils/jsonDumps.js.map +1 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +95 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.js +335 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
- package/dist/cli/cli.js +19 -11
- package/dist/cli/cli.js.map +1 -1
- package/dist/cli/commands/ChatCommand.d.ts +16 -7
- package/dist/cli/commands/ChatCommand.js +321 -190
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/cli/commands/CompleteCommand.d.ts +31 -0
- package/dist/cli/commands/CompleteCommand.js +402 -0
- package/dist/cli/commands/CompleteCommand.js.map +1 -0
- package/dist/cli/commands/DebugCommand.d.ts +7 -0
- package/dist/cli/commands/DebugCommand.js +54 -0
- package/dist/cli/commands/DebugCommand.js.map +1 -0
- package/dist/cli/commands/InfillCommand.d.ts +33 -0
- package/dist/cli/commands/InfillCommand.js +438 -0
- package/dist/cli/commands/InfillCommand.js.map +1 -0
- package/dist/cli/commands/InitCommand.d.ts +11 -0
- package/dist/cli/commands/InitCommand.js +195 -0
- package/dist/cli/commands/InitCommand.js.map +1 -0
- package/dist/cli/commands/OnPostInstallCommand.js +6 -2
- package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
- package/dist/cli/commands/PullCommand.d.ts +13 -0
- package/dist/cli/commands/PullCommand.js +158 -0
- package/dist/cli/commands/PullCommand.js.map +1 -0
- package/dist/cli/commands/inspect/InspectCommand.d.ts +4 -0
- package/dist/cli/commands/inspect/InspectCommand.js +21 -0
- package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.d.ts +12 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js +225 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +12 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +149 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +202 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +18 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +629 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
- package/dist/cli/commands/source/SourceCommand.d.ts +4 -0
- package/dist/cli/commands/source/SourceCommand.js +19 -0
- package/dist/cli/commands/source/SourceCommand.js.map +1 -0
- package/dist/cli/commands/source/commands/BuildCommand.d.ts +16 -0
- package/dist/cli/commands/source/commands/BuildCommand.js +148 -0
- package/dist/cli/commands/source/commands/BuildCommand.js.map +1 -0
- package/dist/cli/commands/{ClearCommand.d.ts → source/commands/ClearCommand.d.ts} +1 -1
- package/dist/cli/commands/{ClearCommand.js → source/commands/ClearCommand.js} +11 -10
- package/dist/cli/commands/source/commands/ClearCommand.js.map +1 -0
- package/dist/cli/commands/{DownloadCommand.d.ts → source/commands/DownloadCommand.d.ts} +5 -4
- package/dist/cli/commands/source/commands/DownloadCommand.js +217 -0
- package/dist/cli/commands/source/commands/DownloadCommand.js.map +1 -0
- package/dist/cli/projectTemplates.d.ts +7 -0
- package/dist/cli/projectTemplates.js +10 -0
- package/dist/cli/projectTemplates.js.map +1 -0
- package/dist/cli/recommendedModels.d.ts +2 -0
- package/dist/cli/recommendedModels.js +585 -0
- package/dist/cli/recommendedModels.js.map +1 -0
- package/dist/cli/startCreateCli.d.ts +2 -0
- package/dist/cli/startCreateCli.js +26 -0
- package/dist/cli/startCreateCli.js.map +1 -0
- package/dist/cli/utils/ConsoleInteraction.d.ts +22 -0
- package/dist/cli/utils/ConsoleInteraction.js +122 -0
- package/dist/cli/utils/ConsoleInteraction.js.map +1 -0
- package/dist/cli/utils/ConsoleTable.d.ts +23 -0
- package/dist/cli/utils/ConsoleTable.js +86 -0
- package/dist/cli/utils/ConsoleTable.js.map +1 -0
- package/dist/cli/utils/basicChooseFromListConsoleInteraction.d.ts +13 -0
- package/dist/cli/utils/basicChooseFromListConsoleInteraction.js +111 -0
- package/dist/cli/utils/basicChooseFromListConsoleInteraction.js.map +1 -0
- package/dist/cli/utils/consolePromptQuestion.d.ts +6 -0
- package/dist/cli/utils/consolePromptQuestion.js +82 -0
- package/dist/cli/utils/consolePromptQuestion.js.map +1 -0
- package/dist/cli/utils/getReadablePath.d.ts +1 -0
- package/dist/cli/utils/getReadablePath.js +14 -0
- package/dist/cli/utils/getReadablePath.js.map +1 -0
- package/dist/cli/utils/interactivelyAskForModel.d.ts +8 -0
- package/dist/cli/utils/interactivelyAskForModel.js +450 -0
- package/dist/cli/utils/interactivelyAskForModel.js.map +1 -0
- package/dist/cli/utils/logUsedGpuTypeOption.d.ts +2 -0
- package/dist/cli/utils/logUsedGpuTypeOption.js +9 -0
- package/dist/cli/utils/logUsedGpuTypeOption.js.map +1 -0
- package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
- package/dist/cli/utils/printCommonInfoLines.js +82 -0
- package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
- package/dist/cli/utils/printInfoLine.d.ts +12 -0
- package/dist/cli/utils/printInfoLine.js +54 -0
- package/dist/cli/utils/printInfoLine.js.map +1 -0
- package/dist/cli/utils/projectTemplates.d.ts +19 -0
- package/dist/cli/utils/projectTemplates.js +47 -0
- package/dist/cli/utils/projectTemplates.js.map +1 -0
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.d.ts +6 -0
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.js +14 -0
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.js.map +1 -0
- package/dist/cli/utils/resolveCommandGgufPath.d.ts +5 -0
- package/dist/cli/utils/resolveCommandGgufPath.js +72 -0
- package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
- package/dist/cli/utils/resolveHeaderFlag.d.ts +1 -0
- package/dist/cli/utils/resolveHeaderFlag.js +21 -0
- package/dist/cli/utils/resolveHeaderFlag.js.map +1 -0
- package/dist/cli/utils/resolveModelRecommendationFileOptions.d.ts +19 -0
- package/dist/cli/utils/resolveModelRecommendationFileOptions.js +7 -0
- package/dist/cli/utils/resolveModelRecommendationFileOptions.js.map +1 -0
- package/dist/cli/utils/splitAnsiToLines.d.ts +1 -0
- package/dist/cli/utils/splitAnsiToLines.js +32 -0
- package/dist/cli/utils/splitAnsiToLines.js.map +1 -0
- package/dist/cli/utils/withCliCommandDescriptionDocsUrl.d.ts +2 -0
- package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js +23 -0
- package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js.map +1 -0
- package/dist/commands.d.ts +4 -3
- package/dist/commands.js +6 -3
- package/dist/commands.js.map +1 -1
- package/dist/config.d.ts +35 -4
- package/dist/config.js +58 -17
- package/dist/config.js.map +1 -1
- package/dist/consts.d.ts +4 -0
- package/dist/consts.js +11 -0
- package/dist/consts.js.map +1 -0
- package/dist/evaluator/LlamaChat/LlamaChat.d.ts +151 -41
- package/dist/evaluator/LlamaChat/LlamaChat.js +1289 -437
- package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
- package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.d.ts +11 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.js +55 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallNameGrammar.js.map +1 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.d.ts +16 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.js +45 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallParamsGrammar.js.map +1 -0
- package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.d.ts +8 -0
- package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.js +12 -0
- package/dist/evaluator/LlamaChat/utils/LlamaFunctionCallValidationError.js.map +1 -0
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +27 -17
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +187 -13
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js +280 -53
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.d.ts +40 -0
- package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js +186 -0
- package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js.map +1 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.d.ts +10 -2
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js +8 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +1 -1
- package/dist/evaluator/LlamaCompletion.d.ts +168 -0
- package/dist/evaluator/LlamaCompletion.js +470 -0
- package/dist/evaluator/LlamaCompletion.js.map +1 -0
- package/dist/evaluator/LlamaContext/LlamaContext.d.ts +62 -21
- package/dist/evaluator/LlamaContext/LlamaContext.js +501 -120
- package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaSampler.d.ts +1 -0
- package/dist/evaluator/LlamaContext/LlamaSampler.js +31 -0
- package/dist/evaluator/LlamaContext/LlamaSampler.js.map +1 -0
- package/dist/evaluator/LlamaContext/types.d.ts +177 -16
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
- package/dist/evaluator/LlamaContext/utils/{resolveBatchItemsPrioritizingStrategy.js → resolveBatchItemsPrioritizationStrategy.js} +5 -5
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
- package/dist/evaluator/LlamaEmbedding.d.ts +21 -0
- package/dist/evaluator/LlamaEmbedding.js +53 -0
- package/dist/evaluator/LlamaEmbedding.js.map +1 -0
- package/dist/evaluator/LlamaEmbeddingContext.d.ts +29 -19
- package/dist/evaluator/LlamaEmbeddingContext.js +36 -43
- package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -1
- package/dist/evaluator/LlamaGrammar.d.ts +16 -13
- package/dist/evaluator/LlamaGrammar.js +17 -10
- package/dist/evaluator/LlamaGrammar.js.map +1 -1
- package/dist/evaluator/LlamaGrammarEvaluationState.d.ts +7 -3
- package/dist/evaluator/LlamaGrammarEvaluationState.js +8 -4
- package/dist/evaluator/LlamaGrammarEvaluationState.js.map +1 -1
- package/dist/evaluator/LlamaJsonSchemaGrammar.d.ts +3 -0
- package/dist/evaluator/LlamaJsonSchemaGrammar.js +5 -3
- package/dist/evaluator/LlamaJsonSchemaGrammar.js.map +1 -1
- package/dist/evaluator/LlamaModel/LlamaModel.d.ts +255 -0
- package/dist/evaluator/LlamaModel/LlamaModel.js +780 -0
- package/dist/evaluator/LlamaModel/LlamaModel.js.map +1 -0
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.d.ts +29 -0
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.js +65 -0
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.js.map +1 -0
- package/dist/evaluator/TokenBias.d.ts +34 -0
- package/dist/evaluator/TokenBias.js +65 -0
- package/dist/evaluator/TokenBias.js.map +1 -0
- package/dist/evaluator/TokenMeter.d.ts +45 -0
- package/dist/evaluator/TokenMeter.js +74 -0
- package/dist/evaluator/TokenMeter.js.map +1 -0
- package/dist/gguf/consts.d.ts +4 -0
- package/dist/gguf/consts.js +12 -0
- package/dist/gguf/consts.js.map +1 -0
- package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
- package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
- package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
- package/dist/gguf/fileReaders/GgufFileReader.d.ts +36 -0
- package/dist/gguf/fileReaders/GgufFileReader.js +109 -0
- package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +16 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.js +62 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +25 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +92 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
- package/dist/gguf/insights/GgufInsights.d.ts +50 -0
- package/dist/gguf/insights/GgufInsights.js +401 -0
- package/dist/gguf/insights/GgufInsights.js.map +1 -0
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +146 -0
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +226 -0
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -0
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.d.ts +19 -0
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.js +78 -0
- package/dist/gguf/insights/utils/resolveContextContextSizeOption.js.map +1 -0
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.d.ts +15 -0
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js +183 -0
- package/dist/gguf/insights/utils/resolveModelGpuLayersOption.js.map +1 -0
- package/dist/gguf/insights/utils/scoreLevels.d.ts +5 -0
- package/dist/gguf/insights/utils/scoreLevels.js +16 -0
- package/dist/gguf/insights/utils/scoreLevels.js.map +1 -0
- package/dist/gguf/parser/GgufV2Parser.d.ts +20 -0
- package/dist/gguf/parser/GgufV2Parser.js +156 -0
- package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
- package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
- package/dist/gguf/parser/GgufV3Parser.js +4 -0
- package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
- package/dist/gguf/parser/parseGguf.d.ts +8 -0
- package/dist/gguf/parser/parseGguf.js +61 -0
- package/dist/gguf/parser/parseGguf.js.map +1 -0
- package/dist/gguf/readGgufFileInfo.d.ts +45 -0
- package/dist/gguf/readGgufFileInfo.js +71 -0
- package/dist/gguf/readGgufFileInfo.js.map +1 -0
- package/dist/gguf/types/GgufFileInfoTypes.d.ts +84 -0
- package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
- package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
- package/dist/gguf/types/GgufMetadataTypes.d.ts +372 -0
- package/dist/gguf/types/GgufMetadataTypes.js +114 -0
- package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
- package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
- package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
- package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
- package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
- package/dist/gguf/utils/GgufReadOffset.js +18 -0
- package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +6 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +76 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
- package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
- package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
- package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
- package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.d.ts +2 -0
- package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js +39 -0
- package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js.map +1 -0
- package/dist/gguf/utils/resolveSplitGgufParts.d.ts +7 -0
- package/dist/gguf/utils/resolveSplitGgufParts.js +55 -0
- package/dist/gguf/utils/resolveSplitGgufParts.js.map +1 -0
- package/dist/index.d.ts +39 -14
- package/dist/index.js +29 -8
- package/dist/index.js.map +1 -1
- package/dist/state.d.ts +2 -0
- package/dist/state.js +7 -0
- package/dist/state.js.map +1 -1
- package/dist/tsconfig.tsbuildinfo +1 -0
- package/dist/types.d.ts +131 -5
- package/dist/types.js.map +1 -1
- package/dist/utils/DisposeGuard.d.ts +13 -0
- package/dist/utils/DisposeGuard.js +120 -0
- package/dist/utils/DisposeGuard.js.map +1 -0
- package/dist/utils/InsufficientMemoryError.d.ts +3 -0
- package/dist/utils/InsufficientMemoryError.js +6 -0
- package/dist/utils/InsufficientMemoryError.js.map +1 -0
- package/dist/utils/LlamaText.d.ts +73 -26
- package/dist/utils/LlamaText.js +475 -157
- package/dist/utils/LlamaText.js.map +1 -1
- package/dist/utils/LruCache.d.ts +12 -0
- package/dist/utils/LruCache.js +44 -0
- package/dist/utils/LruCache.js.map +1 -0
- package/dist/utils/OverridesObject.d.ts +7 -0
- package/dist/utils/OverridesObject.js +2 -0
- package/dist/utils/OverridesObject.js.map +1 -0
- package/dist/utils/ReplHistory.js +5 -1
- package/dist/utils/ReplHistory.js.map +1 -1
- package/dist/utils/StopGenerationDetector.d.ts +27 -8
- package/dist/utils/StopGenerationDetector.js +108 -22
- package/dist/utils/StopGenerationDetector.js.map +1 -1
- package/dist/utils/ThreadsSplitter.d.ts +32 -0
- package/dist/utils/ThreadsSplitter.js +177 -0
- package/dist/utils/ThreadsSplitter.js.map +1 -0
- package/dist/utils/TokenStreamRegulator.d.ts +10 -4
- package/dist/utils/TokenStreamRegulator.js +102 -10
- package/dist/utils/TokenStreamRegulator.js.map +1 -1
- package/dist/utils/UnsupportedError.d.ts +2 -0
- package/dist/utils/UnsupportedError.js +7 -0
- package/dist/utils/UnsupportedError.js.map +1 -0
- package/dist/utils/appendUserMessageToChatHistory.d.ts +4 -0
- package/dist/utils/appendUserMessageToChatHistory.js +4 -0
- package/dist/utils/appendUserMessageToChatHistory.js.map +1 -1
- package/dist/utils/clearTempFolder.js.map +1 -1
- package/dist/utils/cmake.js +23 -10
- package/dist/utils/cmake.js.map +1 -1
- package/dist/utils/compareTokens.d.ts +1 -1
- package/dist/utils/compareTokens.js.map +1 -1
- package/dist/utils/createModelDownloader.d.ts +199 -0
- package/dist/utils/createModelDownloader.js +405 -0
- package/dist/utils/createModelDownloader.js.map +1 -0
- package/dist/utils/findBestOption.d.ts +4 -0
- package/dist/utils/findBestOption.js +15 -0
- package/dist/utils/findBestOption.js.map +1 -0
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.d.ts +1 -0
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js +23 -12
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js.map +1 -1
- package/dist/utils/gbnfJson/GbnfGrammarGenerator.js.map +1 -1
- package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.d.ts +5 -0
- package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js +11 -0
- package/dist/utils/gbnfJson/getGbnfGrammarForGbnfJsonSchema.js.map +1 -0
- package/dist/utils/gbnfJson/terminals/GbnfArray.d.ts +3 -1
- package/dist/utils/gbnfJson/terminals/GbnfArray.js +10 -5
- package/dist/utils/gbnfJson/terminals/GbnfArray.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfBoolean.d.ts +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfBoolean.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfBooleanValue.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfGrammar.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfNull.d.ts +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfNull.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfNumber.d.ts +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfNumber.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfNumberValue.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfObjectMap.d.ts +3 -1
- package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js +9 -4
- package/dist/utils/gbnfJson/terminals/GbnfObjectMap.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfOr.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfRepetition.d.ts +9 -0
- package/dist/utils/gbnfJson/terminals/GbnfRepetition.js +37 -0
- package/dist/utils/gbnfJson/terminals/GbnfRepetition.js.map +1 -0
- package/dist/utils/gbnfJson/terminals/GbnfString.d.ts +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfString.js +23 -5
- package/dist/utils/gbnfJson/terminals/GbnfString.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfStringValue.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfWhitespace.d.ts +7 -4
- package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js +37 -9
- package/dist/utils/gbnfJson/terminals/GbnfWhitespace.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/gbnfConsts.d.ts +5 -4
- package/dist/utils/gbnfJson/terminals/gbnfConsts.js +14 -3
- package/dist/utils/gbnfJson/terminals/gbnfConsts.js.map +1 -1
- package/dist/utils/gbnfJson/types.d.ts +3 -0
- package/dist/utils/gbnfJson/types.js.map +1 -1
- package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.d.ts +10 -0
- package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js +15 -0
- package/dist/utils/gbnfJson/utils/GbnfJsonScopeState.js.map +1 -0
- package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.d.ts +2 -1
- package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js +6 -5
- package/dist/utils/gbnfJson/utils/getGbnfJsonTerminalForGbnfJsonSchema.js.map +1 -1
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js +3 -3
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js.map +1 -1
- package/dist/utils/getBuildDefaults.d.ts +1 -2
- package/dist/utils/getBuildDefaults.js +2 -3
- package/dist/utils/getBuildDefaults.js.map +1 -1
- package/dist/utils/getConsoleLogPrefix.d.ts +1 -1
- package/dist/utils/getConsoleLogPrefix.js +5 -4
- package/dist/utils/getConsoleLogPrefix.js.map +1 -1
- package/dist/utils/getGrammarsFolder.js +1 -1
- package/dist/utils/getGrammarsFolder.js.map +1 -1
- package/dist/utils/getQueuedTokensBeforeStopTrigger.d.ts +6 -0
- package/dist/utils/getQueuedTokensBeforeStopTrigger.js +22 -0
- package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -0
- package/dist/utils/getReadableContextSize.d.ts +1 -0
- package/dist/utils/getReadableContextSize.js +7 -0
- package/dist/utils/getReadableContextSize.js.map +1 -0
- package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js +15 -11
- package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js.map +1 -1
- package/dist/utils/gitReleaseBundles.js +68 -1
- package/dist/utils/gitReleaseBundles.js.map +1 -1
- package/dist/utils/isToken.d.ts +2 -0
- package/dist/utils/isToken.js +4 -0
- package/dist/utils/isToken.js.map +1 -0
- package/dist/utils/isUrl.d.ts +1 -0
- package/dist/utils/isUrl.js +15 -0
- package/dist/utils/isUrl.js.map +1 -0
- package/dist/utils/mergeUnionTypes.d.ts +10 -0
- package/dist/utils/mergeUnionTypes.js +2 -0
- package/dist/utils/mergeUnionTypes.js.map +1 -0
- package/dist/utils/modelFileAccesTokens.d.ts +4 -0
- package/dist/utils/modelFileAccesTokens.js +40 -0
- package/dist/utils/modelFileAccesTokens.js.map +1 -0
- package/dist/utils/parseModelFileName.d.ts +1 -0
- package/dist/utils/parseModelFileName.js +6 -1
- package/dist/utils/parseModelFileName.js.map +1 -1
- package/dist/utils/parseTextTemplate.d.ts +66 -0
- package/dist/utils/parseTextTemplate.js +116 -0
- package/dist/utils/parseTextTemplate.js.map +1 -0
- package/dist/utils/prettyPrintObject.d.ts +10 -1
- package/dist/utils/prettyPrintObject.js +61 -15
- package/dist/utils/prettyPrintObject.js.map +1 -1
- package/dist/utils/pushAll.d.ts +6 -0
- package/dist/utils/pushAll.js +11 -0
- package/dist/utils/pushAll.js.map +1 -0
- package/dist/utils/removeNullFields.d.ts +2 -2
- package/dist/utils/removeNullFields.js.map +1 -1
- package/dist/utils/resolveGithubRelease.d.ts +2 -2
- package/dist/utils/resolveGithubRelease.js.map +1 -1
- package/dist/utils/resolveLastTokens.d.ts +2 -0
- package/dist/utils/resolveLastTokens.js +12 -0
- package/dist/utils/resolveLastTokens.js.map +1 -0
- package/dist/utils/runtime.d.ts +4 -0
- package/dist/utils/runtime.js +8 -0
- package/dist/utils/runtime.js.map +1 -0
- package/dist/utils/safeEventCallback.d.ts +6 -0
- package/dist/utils/safeEventCallback.js +29 -0
- package/dist/utils/safeEventCallback.js.map +1 -0
- package/dist/utils/spawnCommand.d.ts +11 -2
- package/dist/utils/spawnCommand.js +55 -7
- package/dist/utils/spawnCommand.js.map +1 -1
- package/dist/utils/tokenizeInput.d.ts +1 -1
- package/dist/utils/tokenizeInput.js +6 -3
- package/dist/utils/tokenizeInput.js.map +1 -1
- package/dist/utils/transformPromisable.d.ts +40 -0
- package/dist/utils/transformPromisable.js +64 -0
- package/dist/utils/transformPromisable.js.map +1 -0
- package/dist/utils/truncateTextAndRoundToWords.d.ts +2 -0
- package/dist/utils/truncateTextAndRoundToWords.js +32 -0
- package/dist/utils/truncateTextAndRoundToWords.js.map +1 -1
- package/dist/utils/utilTypes.d.ts +3 -0
- package/dist/utils/utilTypes.js +2 -0
- package/dist/utils/utilTypes.js.map +1 -0
- package/dist/utils/waitForLockfileRelease.js.map +1 -1
- package/dist/utils/withLockfile.js.map +1 -1
- package/dist/utils/withOra.d.ts +2 -0
- package/dist/utils/withOra.js +16 -6
- package/dist/utils/withOra.js.map +1 -1
- package/dist/utils/withProgressLog.d.ts +22 -0
- package/dist/utils/withProgressLog.js +211 -0
- package/dist/utils/withProgressLog.js.map +1 -0
- package/dist/utils/withStatusLogs.js +1 -1
- package/dist/utils/withStatusLogs.js.map +1 -1
- package/dist/utils/wrapAbortSignal.d.ts +1 -0
- package/dist/utils/wrapAbortSignal.js +9 -0
- package/dist/utils/wrapAbortSignal.js.map +1 -0
- package/llama/CMakeLists.txt +134 -5
- package/llama/addon/AddonContext.cpp +629 -0
- package/llama/addon/AddonContext.h +52 -0
- package/llama/addon/AddonGrammar.cpp +39 -0
- package/llama/addon/AddonGrammar.h +19 -0
- package/llama/addon/AddonGrammarEvaluationState.cpp +25 -0
- package/llama/addon/AddonGrammarEvaluationState.h +17 -0
- package/llama/addon/AddonModel.cpp +672 -0
- package/llama/addon/AddonModel.h +61 -0
- package/llama/addon/AddonModelData.cpp +25 -0
- package/llama/addon/AddonModelData.h +15 -0
- package/llama/addon/AddonModelLora.cpp +105 -0
- package/llama/addon/AddonModelLora.h +28 -0
- package/llama/addon/AddonSampler.cpp +513 -0
- package/llama/addon/AddonSampler.h +65 -0
- package/llama/addon/RingBuffer.h +109 -0
- package/llama/addon/addon.cpp +223 -0
- package/llama/addon/addonGlobals.cpp +22 -0
- package/llama/addon/addonGlobals.h +12 -0
- package/llama/addon/globals/addonLog.cpp +136 -0
- package/llama/addon/globals/addonLog.h +21 -0
- package/llama/addon/globals/addonProgress.cpp +15 -0
- package/llama/addon/globals/addonProgress.h +15 -0
- package/llama/addon/globals/getGpuInfo.cpp +108 -0
- package/llama/addon/globals/getGpuInfo.h +6 -0
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/gpuInfo/cuda-gpu-info.cu +120 -0
- package/llama/gpuInfo/cuda-gpu-info.h +10 -0
- package/llama/gpuInfo/metal-gpu-info.h +8 -0
- package/llama/gpuInfo/metal-gpu-info.mm +30 -0
- package/llama/gpuInfo/vulkan-gpu-info.cpp +83 -0
- package/llama/gpuInfo/vulkan-gpu-info.h +9 -0
- package/llama/grammars/README.md +297 -6
- package/llama/grammars/json.gbnf +4 -4
- package/llama/grammars/json_arr.gbnf +4 -4
- package/llama/llama.cpp.info.json +1 -1
- package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
- package/package.json +109 -59
- package/templates/packed/electron-typescript-react.json +1 -0
- package/templates/packed/node-typescript.json +1 -0
- package/dist/AbortError.d.ts +0 -2
- package/dist/AbortError.js +0 -7
- package/dist/AbortError.js.map +0 -1
- package/dist/chatWrappers/LlamaChatWrapper.d.ts +0 -13
- package/dist/chatWrappers/LlamaChatWrapper.js.map +0 -1
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -57
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
- package/dist/cli/commands/BuildCommand.d.ts +0 -11
- package/dist/cli/commands/BuildCommand.js +0 -106
- package/dist/cli/commands/BuildCommand.js.map +0 -1
- package/dist/cli/commands/ClearCommand.js.map +0 -1
- package/dist/cli/commands/DownloadCommand.js +0 -169
- package/dist/cli/commands/DownloadCommand.js.map +0 -1
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.d.ts +0 -22
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.js +0 -121
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
- package/dist/evaluator/LlamaModel.d.ts +0 -120
- package/dist/evaluator/LlamaModel.js +0 -320
- package/dist/evaluator/LlamaModel.js.map +0 -1
- package/dist/utils/getGbnfGrammarForGbnfJsonSchema.d.ts +0 -2
- package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js +0 -9
- package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js.map +0 -1
- package/dist/utils/parseModelTypeDescription.d.ts +0 -6
- package/dist/utils/parseModelTypeDescription.js +0 -9
- package/dist/utils/parseModelTypeDescription.js.map +0 -1
- package/dist/utils/resolveChatWrapper.d.ts +0 -4
- package/dist/utils/resolveChatWrapper.js +0 -16
- package/dist/utils/resolveChatWrapper.js.map +0 -1
- package/llama/addon.cpp +0 -950
- package/llamaBins/linux-arm64/.buildMetadata.json +0 -1
- package/llamaBins/linux-arm64/llama-addon.node +0 -0
- package/llamaBins/linux-armv7l/.buildMetadata.json +0 -1
- package/llamaBins/linux-armv7l/llama-addon.node +0 -0
- package/llamaBins/linux-x64/.buildMetadata.json +0 -1
- package/llamaBins/linux-x64/llama-addon.node +0 -0
- package/llamaBins/linux-x64-cuda/.buildMetadata.json +0 -1
- package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
- package/llamaBins/mac-arm64-metal/.buildMetadata.json +0 -1
- package/llamaBins/mac-arm64-metal/ggml-metal.metal +0 -6119
- package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
- package/llamaBins/mac-x64/.buildMetadata.json +0 -1
- package/llamaBins/mac-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64/.buildMetadata.json +0 -1
- package/llamaBins/win-x64/llama-addon.exp +0 -0
- package/llamaBins/win-x64/llama-addon.lib +0 -0
- package/llamaBins/win-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64-cuda/.buildMetadata.json +0 -1
- package/llamaBins/win-x64-cuda/llama-addon.exp +0 -0
- package/llamaBins/win-x64-cuda/llama-addon.lib +0 -0
- package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
|
@@ -0,0 +1,84 @@
|
|
|
1
|
+
import type { GgufReadOffset } from "../utils/GgufReadOffset.js";
|
|
2
|
+
import type { GgufFileReader } from "../fileReaders/GgufFileReader.js";
|
|
3
|
+
import type { MergeOptionalUnionTypes } from "../../utils/mergeUnionTypes.js";
|
|
4
|
+
import type { GgufArchitectureType, GgufMetadata } from "./GgufMetadataTypes.js";
|
|
5
|
+
import type { GgufTensorInfo } from "./GgufTensorInfoTypes.js";
|
|
6
|
+
export type MetadataValue = string | number | bigint | boolean | MetadataValue[];
|
|
7
|
+
export type MetadataKeyValueRecord = Record<string, MetadataValue>;
|
|
8
|
+
export type MetadataNestedObject = {
|
|
9
|
+
[key: string]: MetadataValue | MetadataNestedObject;
|
|
10
|
+
};
|
|
11
|
+
export type GgufFileInfo = {
|
|
12
|
+
readonly version: 2 | 3 | number;
|
|
13
|
+
readonly tensorCount: number | bigint;
|
|
14
|
+
readonly metadata: GgufMetadata;
|
|
15
|
+
readonly metadataSize: number;
|
|
16
|
+
/** Same value as `metadata[metadata.general.architecture]`, but with merged types for convenience */
|
|
17
|
+
readonly architectureMetadata: MergeOptionalUnionTypes<Exclude<GgufMetadata[GgufArchitectureType], undefined>>;
|
|
18
|
+
/** can be `undefined` if `readTensorInfo` is set to `false` */
|
|
19
|
+
readonly tensorInfo?: GgufTensorInfo[];
|
|
20
|
+
/** can be `undefined` if `readTensorInfo` is set to `false` */
|
|
21
|
+
readonly tensorInfoSize?: number;
|
|
22
|
+
/**
|
|
23
|
+
* For spliced metadata of multiple file parts,
|
|
24
|
+
* this will be the number of file parts read and spliced into this metadata.
|
|
25
|
+
*
|
|
26
|
+
* When no splicing is done, this will be `1`.
|
|
27
|
+
*/
|
|
28
|
+
readonly splicedParts: number;
|
|
29
|
+
/**
|
|
30
|
+
* For spliced metadata of multiple file parts, this will be the total tensor count from all the parts
|
|
31
|
+
*
|
|
32
|
+
* When no splicing is done, this will be the same as `tensorCount`.
|
|
33
|
+
*/
|
|
34
|
+
readonly totalTensorCount: number | bigint;
|
|
35
|
+
/**
|
|
36
|
+
* For spliced metadata of multiple file parts, this will be the total metadata size from all the parts
|
|
37
|
+
*
|
|
38
|
+
* When no splicing is done, this will be the same as `metadataSize`.
|
|
39
|
+
*/
|
|
40
|
+
readonly totalMetadataSize: number;
|
|
41
|
+
/**
|
|
42
|
+
* For spliced metadata of multiple file parts, this will be the spliced tensorInfo from all the parts.
|
|
43
|
+
* Can be `undefined` if `readTensorInfo` is set to `false`
|
|
44
|
+
*
|
|
45
|
+
* When no splicing is done, this will be the same as `tensorInfo`.
|
|
46
|
+
*/
|
|
47
|
+
readonly fullTensorInfo?: GgufTensorInfo[];
|
|
48
|
+
/**
|
|
49
|
+
* For spliced metadata of multiple file parts, this will be the total tensor info size from all the parts
|
|
50
|
+
*
|
|
51
|
+
* When no splicing is done, this will be the same as `tensorInfoSize`.
|
|
52
|
+
*/
|
|
53
|
+
readonly totalTensorInfoSize?: number;
|
|
54
|
+
};
|
|
55
|
+
export declare const enum GgufValueType {
|
|
56
|
+
Uint8 = 0,
|
|
57
|
+
Int8 = 1,
|
|
58
|
+
Uint16 = 2,
|
|
59
|
+
Int16 = 3,
|
|
60
|
+
Uint32 = 4,
|
|
61
|
+
Int32 = 5,
|
|
62
|
+
Float32 = 6,
|
|
63
|
+
Bool = 7,
|
|
64
|
+
String = 8,
|
|
65
|
+
Array = 9,
|
|
66
|
+
Uint64 = 10,
|
|
67
|
+
Int64 = 11,
|
|
68
|
+
Float64 = 12
|
|
69
|
+
}
|
|
70
|
+
export type GgufVersionParserOptions = {
|
|
71
|
+
fileReader: GgufFileReader;
|
|
72
|
+
readTensorInfo?: boolean;
|
|
73
|
+
ignoreKeys?: string[];
|
|
74
|
+
version: number;
|
|
75
|
+
readOffset: GgufReadOffset;
|
|
76
|
+
logWarnings: boolean;
|
|
77
|
+
};
|
|
78
|
+
export type GgufVersionParserResult = {
|
|
79
|
+
tensorCount: number | bigint;
|
|
80
|
+
metadata: GgufMetadata;
|
|
81
|
+
tensorInfo?: GgufTensorInfo[];
|
|
82
|
+
metadataSize: number;
|
|
83
|
+
tensorInfoSize?: number;
|
|
84
|
+
};
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
// source: `enum gguf_type` in `ggml.h` in the `llama.cpp` source code
|
|
2
|
+
export var GgufValueType;
|
|
3
|
+
(function (GgufValueType) {
|
|
4
|
+
GgufValueType[GgufValueType["Uint8"] = 0] = "Uint8";
|
|
5
|
+
GgufValueType[GgufValueType["Int8"] = 1] = "Int8";
|
|
6
|
+
GgufValueType[GgufValueType["Uint16"] = 2] = "Uint16";
|
|
7
|
+
GgufValueType[GgufValueType["Int16"] = 3] = "Int16";
|
|
8
|
+
GgufValueType[GgufValueType["Uint32"] = 4] = "Uint32";
|
|
9
|
+
GgufValueType[GgufValueType["Int32"] = 5] = "Int32";
|
|
10
|
+
GgufValueType[GgufValueType["Float32"] = 6] = "Float32";
|
|
11
|
+
GgufValueType[GgufValueType["Bool"] = 7] = "Bool";
|
|
12
|
+
GgufValueType[GgufValueType["String"] = 8] = "String";
|
|
13
|
+
GgufValueType[GgufValueType["Array"] = 9] = "Array";
|
|
14
|
+
GgufValueType[GgufValueType["Uint64"] = 10] = "Uint64";
|
|
15
|
+
GgufValueType[GgufValueType["Int64"] = 11] = "Int64";
|
|
16
|
+
GgufValueType[GgufValueType["Float64"] = 12] = "Float64";
|
|
17
|
+
})(GgufValueType || (GgufValueType = {}));
|
|
18
|
+
//# sourceMappingURL=GgufFileInfoTypes.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"GgufFileInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufFileInfoTypes.ts"],"names":[],"mappings":"AAkEA,sEAAsE;AACtE,MAAM,CAAN,IAAkB,aAcjB;AAdD,WAAkB,aAAa;IAC3B,mDAAS,CAAA;IACT,iDAAQ,CAAA;IACR,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,uDAAW,CAAA;IACX,iDAAQ,CAAA;IACR,qDAAU,CAAA;IACV,mDAAS,CAAA;IACT,sDAAW,CAAA;IACX,oDAAU,CAAA;IACV,wDAAY,CAAA;AAChB,CAAC,EAdiB,aAAa,KAAb,aAAa,QAc9B"}
|
|
@@ -0,0 +1,372 @@
|
|
|
1
|
+
export declare const enum GgufArchitectureType {
|
|
2
|
+
llama = "llama",
|
|
3
|
+
falcon = "falcon",
|
|
4
|
+
grok = "grok",
|
|
5
|
+
gpt2 = "gpt2",
|
|
6
|
+
gptj = "gptj",
|
|
7
|
+
gptneox = "gptneox",
|
|
8
|
+
mpt = "mpt",
|
|
9
|
+
baichuan = "baichuan",
|
|
10
|
+
starcoder = "starcoder",
|
|
11
|
+
refact = "refact",
|
|
12
|
+
bert = "bert",
|
|
13
|
+
nomicBert = "nomic-bert",
|
|
14
|
+
jinaBertV2 = "jina-bert-v2",
|
|
15
|
+
bloom = "bloom",
|
|
16
|
+
stablelm = "stablelm",
|
|
17
|
+
qwen = "qwen",
|
|
18
|
+
qwen2 = "qwen2",
|
|
19
|
+
qwen2moe = "qwen2moe",
|
|
20
|
+
phi2 = "phi2",
|
|
21
|
+
phi3 = "phi3",
|
|
22
|
+
plamo = "plamo",
|
|
23
|
+
codeshell = "codeshell",
|
|
24
|
+
orion = "orion",
|
|
25
|
+
internlm2 = "internlm2",
|
|
26
|
+
minicpm = "minicpm",
|
|
27
|
+
minicpm3 = "minicpm3",
|
|
28
|
+
gemma = "gemma",
|
|
29
|
+
gemma2 = "gemma2",
|
|
30
|
+
starcoder2 = "starcoder2",
|
|
31
|
+
mamba = "mamba",
|
|
32
|
+
xverse = "xverse",
|
|
33
|
+
commandR = "command-r",
|
|
34
|
+
dbrx = "dbrx",
|
|
35
|
+
olmo = "olmo",
|
|
36
|
+
olmoe = "olmoe",
|
|
37
|
+
openelm = "openelm",
|
|
38
|
+
arctic = "arctic",
|
|
39
|
+
deepseek2 = "deepseek2",
|
|
40
|
+
chatglm = "chatglm",
|
|
41
|
+
bitnet = "bitnet",
|
|
42
|
+
t5 = "t5",
|
|
43
|
+
t5encoder = "t5encoder",
|
|
44
|
+
jais = "jais",
|
|
45
|
+
nemotron = "nemotron",
|
|
46
|
+
exaone = "exaone",
|
|
47
|
+
rwkv6 = "rwkv6",
|
|
48
|
+
unknown = "(unknown)"
|
|
49
|
+
}
|
|
50
|
+
export type GgufMetadata<A extends GgufArchitectureType = GgufArchitectureType> = {
|
|
51
|
+
readonly general: GgufMetadataGeneral<A>;
|
|
52
|
+
readonly tokenizer: GgufMetadataTokenizer;
|
|
53
|
+
} & (GgufArchitectureType extends A ? {
|
|
54
|
+
readonly [key in GgufArchitectureType]?: key extends keyof GgufMetadataLlmToType ? GgufMetadataLlmToType[key] : GgufMetadataDefaultArchitectureType;
|
|
55
|
+
} : {
|
|
56
|
+
readonly [key in A]: key extends keyof GgufMetadataLlmToType ? GgufMetadataLlmToType[key] : GgufMetadataDefaultArchitectureType;
|
|
57
|
+
});
|
|
58
|
+
export type GgufMetadataLlmToType = {
|
|
59
|
+
[GgufArchitectureType.llama]: GgufMetadataLlmLLaMA;
|
|
60
|
+
[GgufArchitectureType.mpt]: GgufMetadataMPT;
|
|
61
|
+
[GgufArchitectureType.gptneox]: GgufMetadataGPTNeoX;
|
|
62
|
+
[GgufArchitectureType.gptj]: GgufMetadataGPTJ;
|
|
63
|
+
[GgufArchitectureType.gpt2]: GgufMetadataGPT2;
|
|
64
|
+
[GgufArchitectureType.bloom]: GgufMetadataBloom;
|
|
65
|
+
[GgufArchitectureType.falcon]: GgufMetadataFalcon;
|
|
66
|
+
[GgufArchitectureType.mamba]: GgufMetadataMamba;
|
|
67
|
+
};
|
|
68
|
+
export declare enum GgufFileType {
|
|
69
|
+
ALL_F32 = 0,
|
|
70
|
+
MOSTLY_F16 = 1,
|
|
71
|
+
MOSTLY_Q4_0 = 2,
|
|
72
|
+
MOSTLY_Q4_1 = 3,
|
|
73
|
+
MOSTLY_Q4_1_SOME_F16 = 4,
|
|
74
|
+
MOSTLY_Q4_2 = 5,
|
|
75
|
+
MOSTLY_Q4_3 = 6,
|
|
76
|
+
MOSTLY_Q8_0 = 7,
|
|
77
|
+
MOSTLY_Q5_0 = 8,
|
|
78
|
+
MOSTLY_Q5_1 = 9,
|
|
79
|
+
MOSTLY_Q2_K = 10,
|
|
80
|
+
MOSTLY_Q3_K_S = 11,
|
|
81
|
+
MOSTLY_Q3_K_M = 12,
|
|
82
|
+
MOSTLY_Q3_K_L = 13,
|
|
83
|
+
MOSTLY_Q4_K_S = 14,
|
|
84
|
+
MOSTLY_Q4_K_M = 15,
|
|
85
|
+
MOSTLY_Q5_K_S = 16,
|
|
86
|
+
MOSTLY_Q5_K_M = 17,
|
|
87
|
+
MOSTLY_Q6_K = 18,
|
|
88
|
+
MOSTLY_IQ2_XXS = 19,
|
|
89
|
+
MOSTLY_IQ2_XS = 20,
|
|
90
|
+
MOSTLY_Q2_K_S = 21,
|
|
91
|
+
MOSTLY_IQ3_XS = 22,
|
|
92
|
+
MOSTLY_IQ3_XXS = 23,
|
|
93
|
+
MOSTLY_IQ1_S = 24,
|
|
94
|
+
MOSTLY_IQ4_NL = 25,
|
|
95
|
+
MOSTLY_IQ3_S = 26,
|
|
96
|
+
MOSTLY_IQ3_M = 27,
|
|
97
|
+
MOSTLY_IQ2_S = 28,
|
|
98
|
+
MOSTLY_IQ2_M = 29,
|
|
99
|
+
MOSTLY_IQ4_XS = 30,
|
|
100
|
+
MOSTLY_IQ1_M = 31,
|
|
101
|
+
MOSTLY_BF16 = 32,
|
|
102
|
+
MOSTLY_Q4_0_4_4 = 33,
|
|
103
|
+
MOSTLY_Q4_0_4_8 = 34,
|
|
104
|
+
MOSTLY_Q4_0_8_8 = 35,
|
|
105
|
+
LLAMA_FTYPE_MOSTLY_TQ1_0 = 36,
|
|
106
|
+
LLAMA_FTYPE_MOSTLY_TQ2_0 = 37
|
|
107
|
+
}
|
|
108
|
+
export type GgufMetadataGeneral<A extends GgufArchitectureType = GgufArchitectureType> = {
|
|
109
|
+
readonly architecture: A;
|
|
110
|
+
/**
|
|
111
|
+
* The version of the quantization format. Not required if the model is not
|
|
112
|
+
* quantized (i.e. no tensors are quantized). If any tensors are quantized,
|
|
113
|
+
* this must be present. This is separate to the quantization scheme of the
|
|
114
|
+
* tensors itself; the quantization version may change without changing the
|
|
115
|
+
* scheme's name (e.g. the quantization scheme is Q5_K, and the quantization
|
|
116
|
+
* version is 4).
|
|
117
|
+
*/
|
|
118
|
+
readonly quantization_version: string;
|
|
119
|
+
/**
|
|
120
|
+
* the global alignment to use, as described above. This can vary to allow
|
|
121
|
+
* for different alignment schemes, but it must be a multiple of 8. Some
|
|
122
|
+
* writers may not write the alignment. If the alignment is not specified,
|
|
123
|
+
* assume it is `32`.
|
|
124
|
+
*/
|
|
125
|
+
readonly alignment?: string;
|
|
126
|
+
/**
|
|
127
|
+
* The name of the model. This should be a human-readable name that can be
|
|
128
|
+
* used to identify the model. It should be unique within the community
|
|
129
|
+
* that the model is defined in.
|
|
130
|
+
*/
|
|
131
|
+
readonly name?: string;
|
|
132
|
+
readonly basename?: string;
|
|
133
|
+
readonly size_label?: string;
|
|
134
|
+
readonly author?: string;
|
|
135
|
+
/**
|
|
136
|
+
* URL to the model's homepage. This can be a GitHub repo, a paper, etc.
|
|
137
|
+
*/
|
|
138
|
+
readonly url?: string;
|
|
139
|
+
/**
|
|
140
|
+
* free-form description of the model including anything that isn't
|
|
141
|
+
* covered by the other fields
|
|
142
|
+
*/
|
|
143
|
+
readonly description?: string;
|
|
144
|
+
/**
|
|
145
|
+
* License of the model, expressed as a SPDX license expression
|
|
146
|
+
* (e.g. `MIT OR Apache-2.0`). *Should not* include any other information,
|
|
147
|
+
* such as the license text or the URL to the license.
|
|
148
|
+
*/
|
|
149
|
+
readonly license?: string;
|
|
150
|
+
readonly "license.name"?: string;
|
|
151
|
+
readonly "license.link"?: string;
|
|
152
|
+
/**
|
|
153
|
+
* Information about where this model came from. This is useful for tracking
|
|
154
|
+
* the provenance of the model, and for finding the original source if the
|
|
155
|
+
* model is modified. For a model that was converted from GGML, for
|
|
156
|
+
* example, these keys would point to the model that was converted from.
|
|
157
|
+
*/
|
|
158
|
+
readonly source?: {
|
|
159
|
+
/**
|
|
160
|
+
* URL to the source of the model. Can be a GitHub repo, a paper, etc.
|
|
161
|
+
*/
|
|
162
|
+
readonly url?: string;
|
|
163
|
+
readonly huggingface?: {
|
|
164
|
+
readonly repository?: string;
|
|
165
|
+
};
|
|
166
|
+
};
|
|
167
|
+
/**
|
|
168
|
+
* An enumerated value describing the type of the majority of the tensors
|
|
169
|
+
* in the file. Optional; can be inferred from the tensor types.
|
|
170
|
+
*/
|
|
171
|
+
readonly file_type?: GgufFileType | undefined;
|
|
172
|
+
readonly base_model?: {
|
|
173
|
+
readonly count: number;
|
|
174
|
+
readonly [key: `${bigint}`]: {
|
|
175
|
+
readonly name?: string;
|
|
176
|
+
readonly author?: string;
|
|
177
|
+
readonly version?: string;
|
|
178
|
+
readonly organization?: string;
|
|
179
|
+
readonly url?: string;
|
|
180
|
+
readonly doi?: string;
|
|
181
|
+
readonly uuid?: string;
|
|
182
|
+
readonly repo_url?: string;
|
|
183
|
+
};
|
|
184
|
+
};
|
|
185
|
+
};
|
|
186
|
+
export declare const enum GgufMetadataTokenizerTokenType {
|
|
187
|
+
undefined = 0,
|
|
188
|
+
normal = 1,
|
|
189
|
+
unknown = 2,
|
|
190
|
+
control = 3,
|
|
191
|
+
userDefined = 4,
|
|
192
|
+
unused = 5,
|
|
193
|
+
byte = 6
|
|
194
|
+
}
|
|
195
|
+
export type GgufMetadataTokenizer = {
|
|
196
|
+
readonly ggml: {
|
|
197
|
+
readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
|
|
198
|
+
readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "mpt" | "starcoder" | "gpt-2" | "jina-es" | "jina-de" | "jina-v2-es" | "jina-v2-de" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | string;
|
|
199
|
+
readonly tokens: readonly string[];
|
|
200
|
+
readonly token_type: GgufMetadataTokenizerTokenType[];
|
|
201
|
+
readonly token_type_count?: number;
|
|
202
|
+
readonly scores?: readonly number[];
|
|
203
|
+
readonly merges?: readonly string[];
|
|
204
|
+
readonly bos_token_id?: number;
|
|
205
|
+
readonly eos_token_id?: number;
|
|
206
|
+
readonly unknown_token_id?: number;
|
|
207
|
+
readonly separator_token_id?: number;
|
|
208
|
+
readonly padding_token_id?: number;
|
|
209
|
+
readonly add_bos_token?: boolean;
|
|
210
|
+
readonly add_eos_token?: boolean;
|
|
211
|
+
readonly add_space_prefix?: boolean;
|
|
212
|
+
readonly added_tokens?: readonly string[];
|
|
213
|
+
readonly prefix_token_id?: number;
|
|
214
|
+
readonly suffix_token_id?: number;
|
|
215
|
+
readonly middle_token_id?: number;
|
|
216
|
+
readonly eot_token_id?: number;
|
|
217
|
+
};
|
|
218
|
+
readonly huggingface?: {
|
|
219
|
+
readonly json?: string;
|
|
220
|
+
};
|
|
221
|
+
readonly chat_template?: string;
|
|
222
|
+
};
|
|
223
|
+
export declare const enum GgufMetadataArchitecturePoolingType {
|
|
224
|
+
unspecified = -1,
|
|
225
|
+
none = 0,
|
|
226
|
+
mean = 1,
|
|
227
|
+
cls = 2,
|
|
228
|
+
last = 3
|
|
229
|
+
}
|
|
230
|
+
export type GgufMetadataDefaultArchitectureType = {
|
|
231
|
+
readonly vocab_size?: number;
|
|
232
|
+
readonly context_length?: number;
|
|
233
|
+
readonly embedding_length?: number;
|
|
234
|
+
readonly block_count?: number;
|
|
235
|
+
readonly feed_forward_length?: number;
|
|
236
|
+
readonly use_parallel_residual?: boolean;
|
|
237
|
+
readonly tensor_data_layout?: string;
|
|
238
|
+
readonly expert_count?: number;
|
|
239
|
+
readonly expert_used_count?: number;
|
|
240
|
+
readonly pooling_type?: GgufMetadataArchitecturePoolingType;
|
|
241
|
+
readonly logit_scale?: number;
|
|
242
|
+
readonly attention?: {
|
|
243
|
+
readonly head_count?: number;
|
|
244
|
+
readonly head_count_kv?: number;
|
|
245
|
+
readonly max_alibi_bias?: number;
|
|
246
|
+
readonly clamp_kqv?: number;
|
|
247
|
+
readonly layer_norm_epsilon?: number;
|
|
248
|
+
readonly layer_norm_rms_epsilon?: number;
|
|
249
|
+
readonly key_length?: number;
|
|
250
|
+
readonly value_length?: number;
|
|
251
|
+
readonly causal?: boolean;
|
|
252
|
+
};
|
|
253
|
+
readonly rope?: {
|
|
254
|
+
readonly dimension_count?: number;
|
|
255
|
+
readonly freq_base?: number;
|
|
256
|
+
readonly scale_linear?: number;
|
|
257
|
+
readonly scaling?: {
|
|
258
|
+
readonly type?: "none" | "linear" | "yarn" | string;
|
|
259
|
+
readonly factor?: number;
|
|
260
|
+
readonly original_context_length?: number;
|
|
261
|
+
readonly finetuned?: boolean;
|
|
262
|
+
};
|
|
263
|
+
};
|
|
264
|
+
readonly ssm?: {
|
|
265
|
+
readonly conv_kernel?: number;
|
|
266
|
+
readonly inner_size?: number;
|
|
267
|
+
readonly state_size?: number;
|
|
268
|
+
readonly time_step_rank?: number;
|
|
269
|
+
};
|
|
270
|
+
};
|
|
271
|
+
export type GgufMetadataLlmLLaMA = {
|
|
272
|
+
readonly context_length: number;
|
|
273
|
+
readonly embedding_length: number;
|
|
274
|
+
readonly block_count: number;
|
|
275
|
+
readonly feed_forward_length: number;
|
|
276
|
+
readonly attention: {
|
|
277
|
+
readonly head_count: number;
|
|
278
|
+
readonly layer_norm_rms_epsilon: number;
|
|
279
|
+
readonly head_count_kv?: number;
|
|
280
|
+
};
|
|
281
|
+
readonly rope: {
|
|
282
|
+
readonly dimension_count: number;
|
|
283
|
+
readonly scale?: number;
|
|
284
|
+
};
|
|
285
|
+
readonly expert_count?: number;
|
|
286
|
+
readonly expert_used_count?: number;
|
|
287
|
+
readonly tensor_data_layout?: string;
|
|
288
|
+
};
|
|
289
|
+
export type GgufMetadataMPT = {
|
|
290
|
+
readonly context_length: number;
|
|
291
|
+
readonly embedding_length: number;
|
|
292
|
+
readonly block_count: number;
|
|
293
|
+
readonly attention: {
|
|
294
|
+
readonly head_count: number;
|
|
295
|
+
readonly alibi_bias_max: number;
|
|
296
|
+
readonly clip_kqv: number;
|
|
297
|
+
readonly layer_norm_epsilon: number;
|
|
298
|
+
};
|
|
299
|
+
};
|
|
300
|
+
export type GgufMetadataGPTNeoX = {
|
|
301
|
+
readonly context_length: number;
|
|
302
|
+
readonly embedding_length: number;
|
|
303
|
+
readonly block_count: number;
|
|
304
|
+
readonly use_parallel_residual: boolean;
|
|
305
|
+
readonly rope: {
|
|
306
|
+
readonly dimension_count: number;
|
|
307
|
+
readonly scale?: number;
|
|
308
|
+
};
|
|
309
|
+
readonly attention: {
|
|
310
|
+
readonly head_count: number;
|
|
311
|
+
readonly layer_norm_epsilon: number;
|
|
312
|
+
};
|
|
313
|
+
};
|
|
314
|
+
export type GgufMetadataGPTJ = {
|
|
315
|
+
readonly context_length: number;
|
|
316
|
+
readonly embedding_length: number;
|
|
317
|
+
readonly block_count: number;
|
|
318
|
+
readonly rope: {
|
|
319
|
+
readonly dimension_count: number;
|
|
320
|
+
readonly scale?: number;
|
|
321
|
+
};
|
|
322
|
+
readonly attention: {
|
|
323
|
+
readonly head_count: number;
|
|
324
|
+
readonly layer_norm_epsilon: number;
|
|
325
|
+
};
|
|
326
|
+
};
|
|
327
|
+
export type GgufMetadataGPT2 = {
|
|
328
|
+
readonly context_length: number;
|
|
329
|
+
readonly embedding_length: number;
|
|
330
|
+
readonly block_count: number;
|
|
331
|
+
readonly attention: {
|
|
332
|
+
readonly head_count: number;
|
|
333
|
+
readonly layer_norm_epsilon: number;
|
|
334
|
+
};
|
|
335
|
+
};
|
|
336
|
+
export type GgufMetadataBloom = {
|
|
337
|
+
readonly context_length: number;
|
|
338
|
+
readonly embedding_length: number;
|
|
339
|
+
readonly block_count: number;
|
|
340
|
+
readonly feed_forward_length: number;
|
|
341
|
+
readonly attention: {
|
|
342
|
+
readonly head_count: number;
|
|
343
|
+
readonly layer_norm_epsilon: number;
|
|
344
|
+
};
|
|
345
|
+
};
|
|
346
|
+
export type GgufMetadataFalcon = {
|
|
347
|
+
readonly context_length: number;
|
|
348
|
+
readonly embedding_length: number;
|
|
349
|
+
readonly block_count: number;
|
|
350
|
+
readonly attention: {
|
|
351
|
+
readonly head_count: number;
|
|
352
|
+
readonly head_count_kv: number;
|
|
353
|
+
readonly use_norm: boolean;
|
|
354
|
+
readonly layer_norm_epsilon: number;
|
|
355
|
+
};
|
|
356
|
+
readonly tensor_data_layout?: string;
|
|
357
|
+
};
|
|
358
|
+
export type GgufMetadataMamba = {
|
|
359
|
+
readonly context_length: number;
|
|
360
|
+
readonly embedding_length: number;
|
|
361
|
+
readonly block_count: number;
|
|
362
|
+
readonly ssm: {
|
|
363
|
+
readonly conv_kernel: number;
|
|
364
|
+
readonly inner_size: number;
|
|
365
|
+
readonly state_size: number;
|
|
366
|
+
readonly time_step_rank: number;
|
|
367
|
+
};
|
|
368
|
+
readonly attention: {
|
|
369
|
+
readonly layer_norm_rms_epsilon: number;
|
|
370
|
+
};
|
|
371
|
+
};
|
|
372
|
+
export declare function isGgufMetadataOfArchitectureType<A extends GgufArchitectureType>(metadata: GgufMetadata, type: A): metadata is GgufMetadata<A>;
|
|
@@ -0,0 +1,114 @@
|
|
|
1
|
+
export var GgufArchitectureType;
|
|
2
|
+
(function (GgufArchitectureType) {
|
|
3
|
+
GgufArchitectureType["llama"] = "llama";
|
|
4
|
+
GgufArchitectureType["falcon"] = "falcon";
|
|
5
|
+
GgufArchitectureType["grok"] = "grok";
|
|
6
|
+
GgufArchitectureType["gpt2"] = "gpt2";
|
|
7
|
+
GgufArchitectureType["gptj"] = "gptj";
|
|
8
|
+
GgufArchitectureType["gptneox"] = "gptneox";
|
|
9
|
+
GgufArchitectureType["mpt"] = "mpt";
|
|
10
|
+
GgufArchitectureType["baichuan"] = "baichuan";
|
|
11
|
+
GgufArchitectureType["starcoder"] = "starcoder";
|
|
12
|
+
GgufArchitectureType["refact"] = "refact";
|
|
13
|
+
GgufArchitectureType["bert"] = "bert";
|
|
14
|
+
GgufArchitectureType["nomicBert"] = "nomic-bert";
|
|
15
|
+
GgufArchitectureType["jinaBertV2"] = "jina-bert-v2";
|
|
16
|
+
GgufArchitectureType["bloom"] = "bloom";
|
|
17
|
+
GgufArchitectureType["stablelm"] = "stablelm";
|
|
18
|
+
GgufArchitectureType["qwen"] = "qwen";
|
|
19
|
+
GgufArchitectureType["qwen2"] = "qwen2";
|
|
20
|
+
GgufArchitectureType["qwen2moe"] = "qwen2moe";
|
|
21
|
+
GgufArchitectureType["phi2"] = "phi2";
|
|
22
|
+
GgufArchitectureType["phi3"] = "phi3";
|
|
23
|
+
GgufArchitectureType["plamo"] = "plamo";
|
|
24
|
+
GgufArchitectureType["codeshell"] = "codeshell";
|
|
25
|
+
GgufArchitectureType["orion"] = "orion";
|
|
26
|
+
GgufArchitectureType["internlm2"] = "internlm2";
|
|
27
|
+
GgufArchitectureType["minicpm"] = "minicpm";
|
|
28
|
+
GgufArchitectureType["minicpm3"] = "minicpm3";
|
|
29
|
+
GgufArchitectureType["gemma"] = "gemma";
|
|
30
|
+
GgufArchitectureType["gemma2"] = "gemma2";
|
|
31
|
+
GgufArchitectureType["starcoder2"] = "starcoder2";
|
|
32
|
+
GgufArchitectureType["mamba"] = "mamba";
|
|
33
|
+
GgufArchitectureType["xverse"] = "xverse";
|
|
34
|
+
GgufArchitectureType["commandR"] = "command-r";
|
|
35
|
+
GgufArchitectureType["dbrx"] = "dbrx";
|
|
36
|
+
GgufArchitectureType["olmo"] = "olmo";
|
|
37
|
+
GgufArchitectureType["olmoe"] = "olmoe";
|
|
38
|
+
GgufArchitectureType["openelm"] = "openelm";
|
|
39
|
+
GgufArchitectureType["arctic"] = "arctic";
|
|
40
|
+
GgufArchitectureType["deepseek2"] = "deepseek2";
|
|
41
|
+
GgufArchitectureType["chatglm"] = "chatglm";
|
|
42
|
+
GgufArchitectureType["bitnet"] = "bitnet";
|
|
43
|
+
GgufArchitectureType["t5"] = "t5";
|
|
44
|
+
GgufArchitectureType["t5encoder"] = "t5encoder";
|
|
45
|
+
GgufArchitectureType["jais"] = "jais";
|
|
46
|
+
GgufArchitectureType["nemotron"] = "nemotron";
|
|
47
|
+
GgufArchitectureType["exaone"] = "exaone";
|
|
48
|
+
GgufArchitectureType["rwkv6"] = "rwkv6";
|
|
49
|
+
GgufArchitectureType["unknown"] = "(unknown)";
|
|
50
|
+
})(GgufArchitectureType || (GgufArchitectureType = {}));
|
|
51
|
+
// source: `enum llama_ftype` in `llama.h` in the `llama.cpp` source code
|
|
52
|
+
// Numeric enum object for GGUF file types.
// Each statement inside the function below writes two properties on the same
// object: the member name mapped to its number (GgufFileType.ALL_F32 === 0)
// and the number mapped back to the member name (GgufFileType[0] === "ALL_F32"),
// so lookups work in both directions.
export var GgufFileType;
|
|
53
|
+
(function (GgufFileType) {
|
|
54
|
+
GgufFileType[GgufFileType["ALL_F32"] = 0] = "ALL_F32";
|
|
55
|
+
GgufFileType[GgufFileType["MOSTLY_F16"] = 1] = "MOSTLY_F16";
|
|
56
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_0"] = 2] = "MOSTLY_Q4_0";
|
|
57
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_1"] = 3] = "MOSTLY_Q4_1";
|
|
58
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_1_SOME_F16"] = 4] = "MOSTLY_Q4_1_SOME_F16";
|
|
59
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_2"] = 5] = "MOSTLY_Q4_2";
|
|
60
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_3"] = 6] = "MOSTLY_Q4_3";
|
|
61
|
+
GgufFileType[GgufFileType["MOSTLY_Q8_0"] = 7] = "MOSTLY_Q8_0";
|
|
62
|
+
GgufFileType[GgufFileType["MOSTLY_Q5_0"] = 8] = "MOSTLY_Q5_0";
|
|
63
|
+
GgufFileType[GgufFileType["MOSTLY_Q5_1"] = 9] = "MOSTLY_Q5_1";
|
|
64
|
+
GgufFileType[GgufFileType["MOSTLY_Q2_K"] = 10] = "MOSTLY_Q2_K";
|
|
65
|
+
GgufFileType[GgufFileType["MOSTLY_Q3_K_S"] = 11] = "MOSTLY_Q3_K_S";
|
|
66
|
+
GgufFileType[GgufFileType["MOSTLY_Q3_K_M"] = 12] = "MOSTLY_Q3_K_M";
|
|
67
|
+
GgufFileType[GgufFileType["MOSTLY_Q3_K_L"] = 13] = "MOSTLY_Q3_K_L";
|
|
68
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_K_S"] = 14] = "MOSTLY_Q4_K_S";
|
|
69
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_K_M"] = 15] = "MOSTLY_Q4_K_M";
|
|
70
|
+
GgufFileType[GgufFileType["MOSTLY_Q5_K_S"] = 16] = "MOSTLY_Q5_K_S";
|
|
71
|
+
GgufFileType[GgufFileType["MOSTLY_Q5_K_M"] = 17] = "MOSTLY_Q5_K_M";
|
|
72
|
+
GgufFileType[GgufFileType["MOSTLY_Q6_K"] = 18] = "MOSTLY_Q6_K";
|
|
73
|
+
GgufFileType[GgufFileType["MOSTLY_IQ2_XXS"] = 19] = "MOSTLY_IQ2_XXS";
|
|
74
|
+
GgufFileType[GgufFileType["MOSTLY_IQ2_XS"] = 20] = "MOSTLY_IQ2_XS";
|
|
75
|
+
GgufFileType[GgufFileType["MOSTLY_Q2_K_S"] = 21] = "MOSTLY_Q2_K_S";
|
|
76
|
+
GgufFileType[GgufFileType["MOSTLY_IQ3_XS"] = 22] = "MOSTLY_IQ3_XS";
|
|
77
|
+
GgufFileType[GgufFileType["MOSTLY_IQ3_XXS"] = 23] = "MOSTLY_IQ3_XXS";
|
|
78
|
+
GgufFileType[GgufFileType["MOSTLY_IQ1_S"] = 24] = "MOSTLY_IQ1_S";
|
|
79
|
+
GgufFileType[GgufFileType["MOSTLY_IQ4_NL"] = 25] = "MOSTLY_IQ4_NL";
|
|
80
|
+
GgufFileType[GgufFileType["MOSTLY_IQ3_S"] = 26] = "MOSTLY_IQ3_S";
|
|
81
|
+
GgufFileType[GgufFileType["MOSTLY_IQ3_M"] = 27] = "MOSTLY_IQ3_M";
|
|
82
|
+
GgufFileType[GgufFileType["MOSTLY_IQ2_S"] = 28] = "MOSTLY_IQ2_S";
|
|
83
|
+
GgufFileType[GgufFileType["MOSTLY_IQ2_M"] = 29] = "MOSTLY_IQ2_M";
|
|
84
|
+
GgufFileType[GgufFileType["MOSTLY_IQ4_XS"] = 30] = "MOSTLY_IQ4_XS";
|
|
85
|
+
GgufFileType[GgufFileType["MOSTLY_IQ1_M"] = 31] = "MOSTLY_IQ1_M";
|
|
86
|
+
GgufFileType[GgufFileType["MOSTLY_BF16"] = 32] = "MOSTLY_BF16";
|
|
87
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_0_4_4"] = 33] = "MOSTLY_Q4_0_4_4";
|
|
88
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_0_4_8"] = 34] = "MOSTLY_Q4_0_4_8";
|
|
89
|
+
GgufFileType[GgufFileType["MOSTLY_Q4_0_8_8"] = 35] = "MOSTLY_Q4_0_8_8";
|
|
90
|
+
// NOTE(review): the two members below keep an `LLAMA_FTYPE_` prefix that the
// other members do not have. The names are part of the exported object, so
// they are left as-is here; confirm whether the prefix is intentional.
GgufFileType[GgufFileType["LLAMA_FTYPE_MOSTLY_TQ1_0"] = 36] = "LLAMA_FTYPE_MOSTLY_TQ1_0";
|
|
91
|
+
GgufFileType[GgufFileType["LLAMA_FTYPE_MOSTLY_TQ2_0"] = 37] = "LLAMA_FTYPE_MOSTLY_TQ2_0";
|
|
92
|
+
// The argument assigns a fresh object to the exported variable when it is
// still unset, then passes that object in to be populated.
})(GgufFileType || (GgufFileType = {}));
|
|
93
|
+
// Numeric enum object for tokenizer token types (values 0 through 6).
// Each statement stores both directions of the mapping on the same object:
// member name -> number and number -> member name.
// NOTE(review): presumably mirrors the token type values used by llama.cpp;
// confirm against the upstream definition.
export var GgufMetadataTokenizerTokenType;
|
|
94
|
+
(function (GgufMetadataTokenizerTokenType) {
|
|
95
|
+
// "undefined" here is an ordinary string key, not the JavaScript `undefined` value.
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["undefined"] = 0] = "undefined";
|
|
96
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["normal"] = 1] = "normal";
|
|
97
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["unknown"] = 2] = "unknown";
|
|
98
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["control"] = 3] = "control";
|
|
99
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["userDefined"] = 4] = "userDefined";
|
|
100
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["unused"] = 5] = "unused";
|
|
101
|
+
GgufMetadataTokenizerTokenType[GgufMetadataTokenizerTokenType["byte"] = 6] = "byte";
|
|
102
|
+
// Creates the enum object on first use, then hands it to the function above.
})(GgufMetadataTokenizerTokenType || (GgufMetadataTokenizerTokenType = {}));
|
|
103
|
+
// Numeric enum object for pooling types.
// Values start at -1 ("unspecified") rather than 0, so the reverse mapping
// for that member lives under the property key "-1".
// Every statement stores both name -> number and number -> name.
export var GgufMetadataArchitecturePoolingType;
|
|
104
|
+
(function (GgufMetadataArchitecturePoolingType) {
|
|
105
|
+
GgufMetadataArchitecturePoolingType[GgufMetadataArchitecturePoolingType["unspecified"] = -1] = "unspecified";
|
|
106
|
+
GgufMetadataArchitecturePoolingType[GgufMetadataArchitecturePoolingType["none"] = 0] = "none";
|
|
107
|
+
GgufMetadataArchitecturePoolingType[GgufMetadataArchitecturePoolingType["mean"] = 1] = "mean";
|
|
108
|
+
GgufMetadataArchitecturePoolingType[GgufMetadataArchitecturePoolingType["cls"] = 2] = "cls";
|
|
109
|
+
GgufMetadataArchitecturePoolingType[GgufMetadataArchitecturePoolingType["last"] = 3] = "last";
|
|
110
|
+
// Creates the enum object on first use, then hands it to the function above.
})(GgufMetadataArchitecturePoolingType || (GgufMetadataArchitecturePoolingType = {}));
|
|
111
|
+
/**
 * Checks whether the architecture recorded in the given metadata equals `type`.
 *
 * @param metadata - Object whose `general.architecture` property is read.
 *   May be null/undefined or lack `general`; the lookup then yields `undefined`.
 * @param type - Value to compare against, using strict equality.
 * @returns `true` when `metadata.general.architecture === type`, otherwise `false`.
 *   Note that a missing architecture compares equal to a `type` of `undefined`.
 */
export function isGgufMetadataOfArchitectureType(metadata, type) {
|
|
112
|
+
// Optional chaining keeps this from throwing on absent metadata or `general`.
return metadata?.general?.architecture === type;
|
|
113
|
+
}
|
|
114
|
+
//# sourceMappingURL=GgufMetadataTypes.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"GgufMetadataTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufMetadataTypes.ts"],"names":[],"mappings":"AAAA,MAAM,CAAN,IAAkB,oBAgDjB;AAhDD,WAAkB,oBAAoB;IAClC,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,2CAAmB,CAAA;IACnB,mCAAW,CAAA;IACX,6CAAqB,CAAA;IACrB,+CAAuB,CAAA;IACvB,yCAAiB,CAAA;IACjB,qCAAa,CAAA;IACb,gDAAwB,CAAA;IACxB,mDAA2B,CAAA;IAC3B,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,6CAAqB,CAAA;IACrB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,uCAAe,CAAA;IACf,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,6CAAqB,CAAA;IACrB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,iDAAyB,CAAA;IACzB,uCAAe,CAAA;IACf,yCAAiB,CAAA;IACjB,8CAAsB,CAAA;IACtB,qCAAa,CAAA;IACb,qCAAa,CAAA;IACb,uCAAe,CAAA;IACf,2CAAmB,CAAA;IACnB,yCAAiB,CAAA;IACjB,+CAAuB,CAAA;IACvB,2CAAmB,CAAA;IACnB,yCAAiB,CAAA;IACjB,iCAAS,CAAA;IACT,+CAAuB,CAAA;IACvB,qCAAa,CAAA;IACb,6CAAqB,CAAA;IACrB,yCAAiB,CAAA;IACjB,uCAAe,CAAA;IACf,6CAAqB,CAAA;AACzB,CAAC,EAhDiB,oBAAoB,KAApB,oBAAoB,QAgDrC;AA8BD,yEAAyE;AACzE,MAAM,CAAN,IAAY,YAuCX;AAvCD,WAAY,YAAY;IACpB,qDAAW,CAAA;IACX,2DAAc,CAAA;IACd,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,+EAAwB,CAAA;IACxB,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,6DAAe,CAAA;IACf,8DAAgB,CAAA;IAChB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,8DAAgB,CAAA;IAChB,oEAAmB,CAAA;IACnB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,kEAAkB,CAAA;IAClB,oEAAmB,CAAA;IACnB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,gEAAiB,CAAA;IACjB,kEAAkB,CAAA;IAClB,gEAAiB,CAAA;IACjB,8DAAgB,CAAA;IAChB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,sEAAoB,CAAA;IACpB,wFAA6B,CAAA;IAC7B,wFAA6B,CAAA;AACjC,CAAC,EAvCW,YAAY,KAAZ,YAAY,QAuCvB;AA2FD,MAAM,CAAN,IAAkB,8BAQjB;AARD,WAAkB,8BAA8B;IAC5C,6FAAa,CAAA;IACb,uFAAU,CAAA;IACV,yFAAW,CAAA;IACX,yFAAW,CAAA;IACX,iGAAe,CAAA;IACf,uFAAU,CAAA;IACV,mFAAQ,CAAA;AACZ,CAAC,EARiB,8BAA8B,KAA9B,8BAA8B,QAQ/C
;AAiCD,MAAM,CAAN,IAAkB,mCAMjB;AAND,WAAkB,mCAAmC;IACjD,4GAAgB,CAAA;IAChB,6FAAQ,CAAA;IACR,6FAAQ,CAAA;IACR,2FAAO,CAAA;IACP,6FAAQ,CAAA;AACZ,CAAC,EANiB,mCAAmC,KAAnC,mCAAmC,QAMpD;AA8MD,MAAM,UAAU,gCAAgC,CAC5C,QAAsB,EAAE,IAAO;IAE/B,OAAO,QAAQ,EAAE,OAAO,EAAE,YAAY,KAAK,IAAI,CAAC;AACpD,CAAC"}
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
/**
 * Read-only description of a single tensor entry.
 * All four properties are `readonly`; numeric fields accept `number` or `bigint`.
 */
export type GgufTensorInfo = {
|
|
2
|
+
/** Tensor name. */
readonly name: string;
|
|
3
|
+
/** Size of each dimension; every entry may be a `number` or a `bigint`. */
readonly dimensions: readonly (number | bigint)[];
|
|
4
|
+
/** Element type of the tensor, as a `GgmlType` enum member. */
readonly ggmlType: GgmlType;
|
|
5
|
+
/** Tensor offset. NOTE(review): presumably a byte offset into the file's tensor data - confirm. */
readonly offset: number | bigint;
|
|
6
|
+
};
|
|
7
|
+
/**
 * Tensor element types, numbered 0 through 28 with no gaps.
 * NOTE(review): presumably mirrors ggml's `ggml_type` numbering - confirm against upstream.
 */
export declare const enum GgmlType {
|
|
8
|
+
F32 = 0,
|
|
9
|
+
F16 = 1,
|
|
10
|
+
Q4_0 = 2,
|
|
11
|
+
Q4_1 = 3,
|
|
12
|
+
Q4_2 = 4,
|
|
13
|
+
Q4_3 = 5,
|
|
14
|
+
Q5_0 = 6,
|
|
15
|
+
Q5_1 = 7,
|
|
16
|
+
Q8_0 = 8,
|
|
17
|
+
Q8_1 = 9,
|
|
18
|
+
Q2_K = 10,
|
|
19
|
+
Q3_K = 11,
|
|
20
|
+
Q4_K = 12,
|
|
21
|
+
Q5_K = 13,
|
|
22
|
+
Q6_K = 14,
|
|
23
|
+
Q8_K = 15,
|
|
24
|
+
IQ2_XXS = 16,
|
|
25
|
+
IQ2_XS = 17,
|
|
26
|
+
IQ3_XXS = 18,
|
|
27
|
+
IQ1_S = 19,
|
|
28
|
+
IQ4_NL = 20,
|
|
29
|
+
IQ3_S = 21,
|
|
30
|
+
IQ2_S = 22,
|
|
31
|
+
IQ4_XS = 23,
|
|
32
|
+
I8 = 24,
|
|
33
|
+
I16 = 25,
|
|
34
|
+
I32 = 26,
|
|
35
|
+
I64 = 27,
|
|
36
|
+
F64 = 28
|
|
37
|
+
}
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
// Runtime enum object for tensor element types (values 0 through 28).
// Each statement stores both directions of the mapping on the same object:
// member name -> number (GgmlType.F32 === 0) and number -> member name
// (GgmlType[0] === "F32").
export var GgmlType;
|
|
2
|
+
(function (GgmlType) {
|
|
3
|
+
GgmlType[GgmlType["F32"] = 0] = "F32";
|
|
4
|
+
GgmlType[GgmlType["F16"] = 1] = "F16";
|
|
5
|
+
GgmlType[GgmlType["Q4_0"] = 2] = "Q4_0";
|
|
6
|
+
GgmlType[GgmlType["Q4_1"] = 3] = "Q4_1";
|
|
7
|
+
GgmlType[GgmlType["Q4_2"] = 4] = "Q4_2";
|
|
8
|
+
GgmlType[GgmlType["Q4_3"] = 5] = "Q4_3";
|
|
9
|
+
GgmlType[GgmlType["Q5_0"] = 6] = "Q5_0";
|
|
10
|
+
GgmlType[GgmlType["Q5_1"] = 7] = "Q5_1";
|
|
11
|
+
GgmlType[GgmlType["Q8_0"] = 8] = "Q8_0";
|
|
12
|
+
GgmlType[GgmlType["Q8_1"] = 9] = "Q8_1";
|
|
13
|
+
GgmlType[GgmlType["Q2_K"] = 10] = "Q2_K";
|
|
14
|
+
GgmlType[GgmlType["Q3_K"] = 11] = "Q3_K";
|
|
15
|
+
GgmlType[GgmlType["Q4_K"] = 12] = "Q4_K";
|
|
16
|
+
GgmlType[GgmlType["Q5_K"] = 13] = "Q5_K";
|
|
17
|
+
GgmlType[GgmlType["Q6_K"] = 14] = "Q6_K";
|
|
18
|
+
GgmlType[GgmlType["Q8_K"] = 15] = "Q8_K";
|
|
19
|
+
GgmlType[GgmlType["IQ2_XXS"] = 16] = "IQ2_XXS";
|
|
20
|
+
GgmlType[GgmlType["IQ2_XS"] = 17] = "IQ2_XS";
|
|
21
|
+
GgmlType[GgmlType["IQ3_XXS"] = 18] = "IQ3_XXS";
|
|
22
|
+
GgmlType[GgmlType["IQ1_S"] = 19] = "IQ1_S";
|
|
23
|
+
GgmlType[GgmlType["IQ4_NL"] = 20] = "IQ4_NL";
|
|
24
|
+
GgmlType[GgmlType["IQ3_S"] = 21] = "IQ3_S";
|
|
25
|
+
GgmlType[GgmlType["IQ2_S"] = 22] = "IQ2_S";
|
|
26
|
+
GgmlType[GgmlType["IQ4_XS"] = 23] = "IQ4_XS";
|
|
27
|
+
GgmlType[GgmlType["I8"] = 24] = "I8";
|
|
28
|
+
GgmlType[GgmlType["I16"] = 25] = "I16";
|
|
29
|
+
GgmlType[GgmlType["I32"] = 26] = "I32";
|
|
30
|
+
GgmlType[GgmlType["I64"] = 27] = "I64";
|
|
31
|
+
GgmlType[GgmlType["F64"] = 28] = "F64";
|
|
32
|
+
// Creates the enum object on first use, then hands it to the function above.
})(GgmlType || (GgmlType = {}));
|
|
33
|
+
//# sourceMappingURL=GgufTensorInfoTypes.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"GgufTensorInfoTypes.js","sourceRoot":"","sources":["../../../src/gguf/types/GgufTensorInfoTypes.ts"],"names":[],"mappings":"AAOA,MAAM,CAAN,IAAkB,QA8BjB;AA9BD,WAAkB,QAAQ;IACtB,qCAAO,CAAA;IACP,qCAAO,CAAA;IACP,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,uCAAQ,CAAA;IACR,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,wCAAS,CAAA;IACT,8CAAY,CAAA;IACZ,4CAAW,CAAA;IACX,8CAAY,CAAA;IACZ,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,0CAAU,CAAA;IACV,0CAAU,CAAA;IACV,4CAAW,CAAA;IACX,oCAAO,CAAA;IACP,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;IACR,sCAAQ,CAAA;AACZ,CAAC,EA9BiB,QAAQ,KAAR,QAAQ,QA8BzB"}
|