node-llama-cpp 3.0.0-beta.14 → 3.0.0-beta.15
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/dist/ChatWrapper.js +4 -0
- package/dist/ChatWrapper.js.map +1 -1
- package/dist/bindings/AddonTypes.d.ts +21 -0
- package/dist/bindings/Llama.d.ts +4 -0
- package/dist/bindings/Llama.js +45 -4
- package/dist/bindings/Llama.js.map +1 -1
- package/dist/bindings/getLlama.d.ts +19 -1
- package/dist/bindings/getLlama.js +15 -5
- package/dist/bindings/getLlama.js.map +1 -1
- package/dist/bindings/types.d.ts +15 -0
- package/dist/bindings/types.js +27 -2
- package/dist/bindings/types.js.map +1 -1
- package/dist/bindings/utils/MemoryOrchestrator.d.ts +21 -0
- package/dist/bindings/utils/MemoryOrchestrator.js +49 -0
- package/dist/bindings/utils/MemoryOrchestrator.js.map +1 -0
- package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +1 -1
- package/dist/bindings/utils/cloneLlamaCppRepo.js +3 -2
- package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -1
- package/dist/bindings/utils/compileLLamaCpp.js +2 -2
- package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
- package/dist/bindings/utils/getLlamaWithoutBackend.d.ts +5 -0
- package/dist/bindings/utils/getLlamaWithoutBackend.js +27 -0
- package/dist/bindings/utils/getLlamaWithoutBackend.js.map +1 -0
- package/dist/bindings/utils/resolveCustomCmakeOptions.js +2 -2
- package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -1
- package/dist/chatWrappers/AlpacaChatWrapper.d.ts +2 -1
- package/dist/chatWrappers/AlpacaChatWrapper.js +9 -2
- package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/ChatMLChatWrapper.js +12 -10
- package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FalconChatWrapper.d.ts +2 -1
- package/dist/chatWrappers/FalconChatWrapper.js +28 -11
- package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FunctionaryChatWrapper.js +59 -45
- package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
- package/dist/chatWrappers/GemmaChatWrapper.js +9 -7
- package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/GeneralChatWrapper.d.ts +2 -1
- package/dist/chatWrappers/GeneralChatWrapper.js +35 -12
- package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
- package/dist/chatWrappers/LlamaChatWrapper.d.ts +7 -0
- package/dist/chatWrappers/LlamaChatWrapper.js +26 -8
- package/dist/chatWrappers/LlamaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +73 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +355 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -0
- package/dist/{TemplateChatWrapper.d.ts → chatWrappers/generic/TemplateChatWrapper.d.ts} +6 -9
- package/dist/{TemplateChatWrapper.js → chatWrappers/generic/TemplateChatWrapper.js} +31 -69
- package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +33 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js +45 -0
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.js.map +1 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.d.ts +4 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +206 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +67 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.js +206 -0
- package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -0
- package/dist/cli/cli.js +1 -1
- package/dist/cli/cli.js.map +1 -1
- package/dist/cli/commands/ChatCommand.d.ts +7 -4
- package/dist/cli/commands/ChatCommand.js +150 -60
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/cli/commands/ClearCommand.d.ts +1 -1
- package/dist/cli/commands/ClearCommand.js +5 -5
- package/dist/cli/commands/ClearCommand.js.map +1 -1
- package/dist/cli/commands/CompleteCommand.d.ts +3 -2
- package/dist/cli/commands/CompleteCommand.js +88 -41
- package/dist/cli/commands/CompleteCommand.js.map +1 -1
- package/dist/cli/commands/InfillCommand.d.ts +3 -2
- package/dist/cli/commands/InfillCommand.js +88 -41
- package/dist/cli/commands/InfillCommand.js.map +1 -1
- package/dist/cli/commands/{InspectCommand.d.ts → inspect/InspectCommand.d.ts} +1 -4
- package/dist/cli/commands/inspect/InspectCommand.js +17 -0
- package/dist/cli/commands/inspect/InspectCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.d.ts +10 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +108 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.d.ts +4 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +98 -0
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.d.ts +14 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +577 -0
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -0
- package/dist/cli/utils/ConsoleTable.d.ts +23 -0
- package/dist/cli/utils/ConsoleTable.js +86 -0
- package/dist/cli/utils/ConsoleTable.js.map +1 -0
- package/dist/cli/utils/printCommonInfoLines.d.ts +9 -0
- package/dist/cli/utils/printCommonInfoLines.js +70 -0
- package/dist/cli/utils/printCommonInfoLines.js.map +1 -0
- package/dist/cli/utils/printInfoLine.d.ts +10 -0
- package/dist/cli/utils/printInfoLine.js +45 -0
- package/dist/cli/utils/printInfoLine.js.map +1 -0
- package/dist/cli/utils/resolveCommandGgufPath.d.ts +1 -0
- package/dist/cli/utils/resolveCommandGgufPath.js +6 -0
- package/dist/cli/utils/resolveCommandGgufPath.js.map +1 -0
- package/dist/config.d.ts +2 -0
- package/dist/config.js +6 -0
- package/dist/config.js.map +1 -1
- package/dist/evaluator/LlamaChat/LlamaChat.js +13 -5
- package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
- package/dist/evaluator/LlamaCompletion.js +5 -3
- package/dist/evaluator/LlamaCompletion.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaContext.d.ts +40 -3
- package/dist/evaluator/LlamaContext/LlamaContext.js +245 -100
- package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
- package/dist/evaluator/LlamaContext/types.d.ts +57 -6
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/firstInFirstOutStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.d.ts +2 -0
- package/dist/evaluator/LlamaContext/utils/{resolveBatchItemsPrioritizingStrategy.js → resolveBatchItemsPrioritizationStrategy.js} +4 -4
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -0
- package/dist/evaluator/LlamaEmbeddingContext.d.ts +23 -2
- package/dist/evaluator/LlamaEmbeddingContext.js +4 -5
- package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -1
- package/dist/evaluator/LlamaModel.d.ts +64 -6
- package/dist/evaluator/LlamaModel.js +297 -8
- package/dist/evaluator/LlamaModel.js.map +1 -1
- package/dist/evaluator/TokenMeter.d.ts +54 -0
- package/dist/evaluator/TokenMeter.js +86 -0
- package/dist/evaluator/TokenMeter.js.map +1 -0
- package/dist/gguf/GgufInsights.d.ts +40 -0
- package/dist/gguf/GgufInsights.js +350 -0
- package/dist/gguf/GgufInsights.js.map +1 -0
- package/dist/gguf/consts.d.ts +3 -0
- package/dist/gguf/consts.js +8 -0
- package/dist/gguf/consts.js.map +1 -0
- package/dist/gguf/errors/InvalidGgufMagicError.d.ts +3 -0
- package/dist/gguf/errors/InvalidGgufMagicError.js +6 -0
- package/dist/gguf/errors/InvalidGgufMagicError.js.map +1 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.d.ts +4 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.js +9 -0
- package/dist/gguf/errors/UnsupportedGgufValueTypeError.js.map +1 -0
- package/dist/gguf/fileReaders/GgufFileReader.d.ts +33 -0
- package/dist/gguf/fileReaders/GgufFileReader.js +76 -0
- package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +17 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.js +45 -0
- package/dist/gguf/fileReaders/GgufFsFileReader.js.map +1 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +22 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +63 -0
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -0
- package/dist/gguf/parser/GgufV2Parser.d.ts +19 -0
- package/dist/gguf/parser/GgufV2Parser.js +115 -0
- package/dist/gguf/parser/GgufV2Parser.js.map +1 -0
- package/dist/gguf/parser/GgufV3Parser.d.ts +3 -0
- package/dist/gguf/parser/GgufV3Parser.js +4 -0
- package/dist/gguf/parser/GgufV3Parser.js.map +1 -0
- package/dist/gguf/parser/parseGguf.d.ts +8 -0
- package/dist/gguf/parser/parseGguf.js +58 -0
- package/dist/gguf/parser/parseGguf.js.map +1 -0
- package/dist/gguf/readGgufFileInfo.d.ts +30 -0
- package/dist/gguf/readGgufFileInfo.js +37 -0
- package/dist/gguf/readGgufFileInfo.js.map +1 -0
- package/dist/gguf/types/GgufFileInfoTypes.d.ts +52 -0
- package/dist/gguf/types/GgufFileInfoTypes.js +18 -0
- package/dist/gguf/types/GgufFileInfoTypes.js.map +1 -0
- package/dist/gguf/types/GgufMetadataTypes.d.ts +330 -0
- package/dist/gguf/types/GgufMetadataTypes.js +86 -0
- package/dist/gguf/types/GgufMetadataTypes.js.map +1 -0
- package/dist/gguf/types/GgufTensorInfoTypes.d.ts +37 -0
- package/dist/gguf/types/GgufTensorInfoTypes.js +33 -0
- package/dist/gguf/types/GgufTensorInfoTypes.js.map +1 -0
- package/dist/gguf/utils/GgufReadOffset.d.ts +6 -0
- package/dist/gguf/utils/GgufReadOffset.js +18 -0
- package/dist/gguf/utils/GgufReadOffset.js.map +1 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.d.ts +5 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +38 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -0
- package/dist/gguf/utils/getGgufFileTypeName.d.ts +4 -0
- package/dist/gguf/utils/getGgufFileTypeName.js +13 -0
- package/dist/gguf/utils/getGgufFileTypeName.js.map +1 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.d.ts +3 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.js +4 -0
- package/dist/gguf/utils/getGgufMetadataArchitectureData.js.map +1 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.d.ts +1 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.js +16 -0
- package/dist/gguf/utils/normalizeGgufDownloadUrl.js.map +1 -0
- package/dist/index.d.ts +13 -7
- package/dist/index.js +11 -6
- package/dist/index.js.map +1 -1
- package/dist/types.d.ts +1 -1
- package/dist/utils/InsufficientMemoryError.d.ts +3 -0
- package/dist/utils/InsufficientMemoryError.js +6 -0
- package/dist/utils/InsufficientMemoryError.js.map +1 -0
- package/dist/utils/LlamaText.d.ts +25 -10
- package/dist/utils/LlamaText.js +205 -23
- package/dist/utils/LlamaText.js.map +1 -1
- package/dist/utils/StopGenerationDetector.js +3 -1
- package/dist/utils/StopGenerationDetector.js.map +1 -1
- package/dist/utils/findBestOption.d.ts +4 -0
- package/dist/utils/findBestOption.js +15 -0
- package/dist/utils/findBestOption.js.map +1 -0
- package/dist/utils/getQueuedTokensBeforeStopTrigger.js +3 -3
- package/dist/utils/getQueuedTokensBeforeStopTrigger.js.map +1 -1
- package/dist/utils/gitReleaseBundles.js +68 -1
- package/dist/utils/gitReleaseBundles.js.map +1 -1
- package/dist/utils/mergeUnionTypes.d.ts +4 -0
- package/dist/utils/parseModelFileName.d.ts +1 -0
- package/dist/utils/parseModelFileName.js +6 -1
- package/dist/utils/parseModelFileName.js.map +1 -1
- package/dist/utils/prettyPrintObject.d.ts +10 -1
- package/dist/utils/prettyPrintObject.js +57 -13
- package/dist/utils/prettyPrintObject.js.map +1 -1
- package/dist/utils/spawnCommand.js.map +1 -1
- package/dist/utils/tokenizeInput.d.ts +1 -1
- package/dist/utils/tokenizeInput.js +3 -3
- package/dist/utils/tokenizeInput.js.map +1 -1
- package/dist/utils/withOra.d.ts +1 -0
- package/dist/utils/withOra.js +2 -2
- package/dist/utils/withOra.js.map +1 -1
- package/llama/CMakeLists.txt +5 -5
- package/llama/addon.cpp +117 -5
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/gpuInfo/cuda-gpu-info.cu +21 -0
- package/llama/gpuInfo/cuda-gpu-info.h +3 -0
- package/llama/gpuInfo/metal-gpu-info.h +4 -1
- package/llama/gpuInfo/metal-gpu-info.mm +14 -1
- package/llama/gpuInfo/vulkan-gpu-info.cpp +20 -2
- package/llama/gpuInfo/vulkan-gpu-info.h +2 -0
- package/llama/llama.cpp.info.json +1 -1
- package/llama/toolchains/win32.host-x64.target-arm64.cmake +41 -0
- package/llamaBins/linux-arm64/_nlcBuildMetadata.json +1 -1
- package/llamaBins/linux-arm64/llama-addon.node +0 -0
- package/llamaBins/linux-armv7l/_nlcBuildMetadata.json +1 -1
- package/llamaBins/linux-armv7l/llama-addon.node +0 -0
- package/llamaBins/linux-x64/_nlcBuildMetadata.json +1 -1
- package/llamaBins/linux-x64/llama-addon.node +0 -0
- package/llamaBins/linux-x64-cuda/_nlcBuildMetadata.json +1 -1
- package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
- package/llamaBins/linux-x64-vulkan/_nlcBuildMetadata.json +1 -1
- package/llamaBins/linux-x64-vulkan/llama-addon.node +0 -0
- package/llamaBins/mac-arm64-metal/_nlcBuildMetadata.json +1 -1
- package/llamaBins/mac-arm64-metal/default.metallib +0 -0
- package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
- package/llamaBins/mac-x64/_nlcBuildMetadata.json +1 -1
- package/llamaBins/mac-x64/llama-addon.node +0 -0
- package/llamaBins/win-arm64/_nlcBuildMetadata.json +1 -0
- package/llamaBins/win-arm64/llama-addon.exp +0 -0
- package/llamaBins/win-arm64/llama-addon.lib +0 -0
- package/llamaBins/win-arm64/llama-addon.node +0 -0
- package/llamaBins/win-x64/_nlcBuildMetadata.json +1 -1
- package/llamaBins/win-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64-cuda/_nlcBuildMetadata.json +1 -1
- package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
- package/llamaBins/win-x64-vulkan/_nlcBuildMetadata.json +1 -1
- package/llamaBins/win-x64-vulkan/llama-addon.node +0 -0
- package/package.json +8 -6
- package/dist/TemplateChatWrapper.js.map +0 -1
- package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.d.ts +0 -33
- package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js +0 -49
- package/dist/bindings/utils/resolveChatWrapperBasedOnWrapperTypeName.js.map +0 -1
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +0 -13
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +0 -63
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +0 -1
- package/dist/cli/commands/InspectCommand.js +0 -113
- package/dist/cli/commands/InspectCommand.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +0 -1
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +0 -2
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +0 -1
- package/dist/gguf/GGUFInsights.d.ts +0 -28
- package/dist/gguf/GGUFInsights.js +0 -58
- package/dist/gguf/GGUFInsights.js.map +0 -1
- package/dist/gguf/GGUFMetadata.d.ts +0 -19
- package/dist/gguf/GGUFMetadata.js +0 -38
- package/dist/gguf/GGUFMetadata.js.map +0 -1
- package/dist/gguf/errors/InvalidGGUFMagicError.d.ts +0 -3
- package/dist/gguf/errors/InvalidGGUFMagicError.js +0 -6
- package/dist/gguf/errors/InvalidGGUFMagicError.js.map +0 -1
- package/dist/gguf/errors/MetadataNotParsedYetError.d.ts +0 -3
- package/dist/gguf/errors/MetadataNotParsedYetError.js +0 -6
- package/dist/gguf/errors/MetadataNotParsedYetError.js.map +0 -1
- package/dist/gguf/errors/MissingNodeLlamaError.d.ts +0 -3
- package/dist/gguf/errors/MissingNodeLlamaError.js +0 -6
- package/dist/gguf/errors/MissingNodeLlamaError.js.map +0 -1
- package/dist/gguf/errors/ModelScore/NotEnoughVRamError.d.ts +0 -5
- package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js +0 -11
- package/dist/gguf/errors/ModelScore/NotEnoughVRamError.js.map +0 -1
- package/dist/gguf/errors/UnsupportedMetadataTypeError.d.ts +0 -4
- package/dist/gguf/errors/UnsupportedMetadataTypeError.js +0 -8
- package/dist/gguf/errors/UnsupportedMetadataTypeError.js.map +0 -1
- package/dist/gguf/ggufParser/GGUFParser.d.ts +0 -18
- package/dist/gguf/ggufParser/GGUFParser.js +0 -123
- package/dist/gguf/ggufParser/GGUFParser.js.map +0 -1
- package/dist/gguf/ggufParser/GGUFTypes.d.ts +0 -257
- package/dist/gguf/ggufParser/GGUFTypes.js +0 -2
- package/dist/gguf/ggufParser/GGUFTypes.js.map +0 -1
- package/dist/gguf/ggufParser/checkArchitecture.d.ts +0 -14
- package/dist/gguf/ggufParser/checkArchitecture.js +0 -74
- package/dist/gguf/ggufParser/checkArchitecture.js.map +0 -1
- package/dist/gguf/ggufParser/stream/GGUFBaseStream.d.ts +0 -38
- package/dist/gguf/ggufParser/stream/GGUFBaseStream.js +0 -83
- package/dist/gguf/ggufParser/stream/GGUFBaseStream.js.map +0 -1
- package/dist/gguf/ggufParser/stream/GGUFFetchStream.d.ts +0 -14
- package/dist/gguf/ggufParser/stream/GGUFFetchStream.js +0 -35
- package/dist/gguf/ggufParser/stream/GGUFFetchStream.js.map +0 -1
- package/dist/gguf/ggufParser/stream/GGUFReadStream.d.ts +0 -15
- package/dist/gguf/ggufParser/stream/GGUFReadStream.js +0 -40
- package/dist/gguf/ggufParser/stream/GGUFReadStream.js.map +0 -1
- package/dist/utils/parseModelTypeDescription.d.ts +0 -6
- package/dist/utils/parseModelTypeDescription.js +0 -9
- package/dist/utils/parseModelTypeDescription.js.map +0 -1
- package/dist/utils/resolveChatWrapper.d.ts +0 -4
- package/dist/utils/resolveChatWrapper.js +0 -16
- package/dist/utils/resolveChatWrapper.js.map +0 -1
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.d.ts +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/firstInFirstOutStrategy.js +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.d.ts +0 -0
- /package/dist/evaluator/LlamaContext/utils/{batchItemsPrioritizingStrategies → batchItemsPrioritizationStrategies}/maximumParallelismStrategy.js +0 -0
package/llama/addon.cpp
CHANGED
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
#include "llama.h"
|
|
10
10
|
#include "napi.h"
|
|
11
11
|
|
|
12
|
-
#ifdef
|
|
12
|
+
#ifdef GPU_INFO_USE_CUDA
|
|
13
13
|
# include "gpuInfo/cuda-gpu-info.h"
|
|
14
14
|
#endif
|
|
15
15
|
#ifdef GPU_INFO_USE_VULKAN
|
|
@@ -121,7 +121,7 @@ std::string addon_model_token_to_piece(const struct llama_model* model, llama_to
|
|
|
121
121
|
return std::string(result.data(), result.size());
|
|
122
122
|
}
|
|
123
123
|
|
|
124
|
-
#ifdef
|
|
124
|
+
#ifdef GPU_INFO_USE_CUDA
|
|
125
125
|
void logCudaError(const char* message) {
|
|
126
126
|
addonLlamaCppLogCallback(GGML_LOG_LEVEL_ERROR, (std::string("CUDA error: ") + std::string(message)).c_str(), nullptr);
|
|
127
127
|
}
|
|
@@ -136,7 +136,7 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
|
|
|
136
136
|
uint64_t total = 0;
|
|
137
137
|
uint64_t used = 0;
|
|
138
138
|
|
|
139
|
-
#ifdef
|
|
139
|
+
#ifdef GPU_INFO_USE_CUDA
|
|
140
140
|
size_t cudaDeviceTotal = 0;
|
|
141
141
|
size_t cudaDeviceUsed = 0;
|
|
142
142
|
bool cudeGetInfoSuccess = gpuInfoGetTotalCudaDevicesInfo(&cudaDeviceTotal, &cudaDeviceUsed, logCudaError);
|
|
@@ -161,7 +161,7 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
|
|
|
161
161
|
#ifdef GPU_INFO_USE_METAL
|
|
162
162
|
uint64_t metalDeviceTotal = 0;
|
|
163
163
|
uint64_t metalDeviceUsed = 0;
|
|
164
|
-
|
|
164
|
+
getMetalGpuInfo(&metalDeviceTotal, &metalDeviceUsed);
|
|
165
165
|
|
|
166
166
|
total += metalDeviceTotal;
|
|
167
167
|
used += metalDeviceUsed;
|
|
@@ -174,8 +174,34 @@ Napi::Value getGpuVramInfo(const Napi::CallbackInfo& info) {
|
|
|
174
174
|
return result;
|
|
175
175
|
}
|
|
176
176
|
|
|
177
|
+
// Builds a JS object of the shape `{deviceNames: string[]}`.
// The names are gathered from every GPU info backend that was compiled in
// (CUDA, then Vulkan, then Metal), in that order.
Napi::Value getGpuDeviceInfo(const Napi::CallbackInfo& info) {
    Napi::Env env = info.Env();
    std::vector<std::string> deviceNames;

#ifdef GPU_INFO_USE_CUDA
    gpuInfoGetCudaDeviceNames(&deviceNames, logCudaError);
#endif

#ifdef GPU_INFO_USE_VULKAN
    gpuInfoGetVulkanDeviceNames(&deviceNames, logVulkanWarning);
#endif

#ifdef GPU_INFO_USE_METAL
    getMetalGpuDeviceNames(&deviceNames);
#endif

    Napi::Object result = Napi::Object::New(env);
    Napi::Array deviceNamesNapiArray = Napi::Array::New(env, deviceNames.size());

    // Copy each collected name into the JS array at the same position
    uint32_t nextIndex = 0;
    for (const std::string& deviceName : deviceNames) {
        deviceNamesNapiArray.Set(nextIndex, Napi::String::New(env, deviceName));
        ++nextIndex;
    }

    result.Set("deviceNames", deviceNamesNapiArray);
    return result;
}
|
|
202
|
+
|
|
177
203
|
Napi::Value getGpuType(const Napi::CallbackInfo& info) {
|
|
178
|
-
#ifdef
|
|
204
|
+
#ifdef GPU_INFO_USE_CUDA
|
|
179
205
|
return Napi::String::New(info.Env(), "cuda");
|
|
180
206
|
#endif
|
|
181
207
|
|
|
@@ -507,6 +533,16 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
|
|
|
507
533
|
|
|
508
534
|
return Napi::Number::From(info.Env(), int32_t(tokenType));
|
|
509
535
|
}
|
|
536
|
+
// Returns the result of `llama_vocab_type(model)` as a JS number (int32).
// Throws a JS error ("Model is disposed") and returns undefined when the model was disposed.
Napi::Value GetVocabularyType(const Napi::CallbackInfo& info) {
    Napi::Env env = info.Env();

    if (disposed) {
        Napi::Error::New(env, "Model is disposed").ThrowAsJavaScriptException();
        return env.Undefined();
    }

    const int32_t vocabularyTypeNumber = int32_t(llama_vocab_type(model));
    return Napi::Number::From(env, vocabularyTypeNumber);
}
|
|
510
546
|
Napi::Value ShouldPrependBosToken(const Napi::CallbackInfo& info) {
|
|
511
547
|
const int addBos = llama_add_bos_token(model);
|
|
512
548
|
|
|
@@ -515,6 +551,10 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
|
|
|
515
551
|
return Napi::Boolean::New(info.Env(), shouldPrependBos);
|
|
516
552
|
}
|
|
517
553
|
|
|
554
|
+
// Returns the result of `llama_model_size(model)` as a JS number.
// Throws a JS error ("Model is disposed") and returns undefined when the model was disposed,
// matching the guard used by GetVocabularyType, so a disposed model is never passed to llama.cpp.
// NOTE(review): assumes `model` is no longer valid once `disposed` is set - confirm in Dispose().
Napi::Value GetModelSize(const Napi::CallbackInfo& info) {
    if (disposed) {
        Napi::Error::New(info.Env(), "Model is disposed").ThrowAsJavaScriptException();
        return info.Env().Undefined();
    }

    return Napi::Number::From(info.Env(), llama_model_size(model));
}
|
|
557
|
+
|
|
518
558
|
static void init(Napi::Object exports) {
|
|
519
559
|
exports.Set(
|
|
520
560
|
"AddonModel",
|
|
@@ -540,7 +580,9 @@ class AddonModel : public Napi::ObjectWrap<AddonModel> {
|
|
|
540
580
|
InstanceMethod("eotToken", &AddonModel::EotToken),
|
|
541
581
|
InstanceMethod("getTokenString", &AddonModel::GetTokenString),
|
|
542
582
|
InstanceMethod("getTokenType", &AddonModel::GetTokenType),
|
|
583
|
+
InstanceMethod("getVocabularyType", &AddonModel::GetVocabularyType),
|
|
543
584
|
InstanceMethod("shouldPrependBosToken", &AddonModel::ShouldPrependBosToken),
|
|
585
|
+
InstanceMethod("getModelSize", &AddonModel::GetModelSize),
|
|
544
586
|
InstanceMethod("dispose", &AddonModel::Dispose),
|
|
545
587
|
}
|
|
546
588
|
)
|
|
@@ -822,6 +864,10 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
|
|
|
822
864
|
context_params.n_ubatch = context_params.n_batch; // the batch queue is managed in the JS side, so there's no need for managing it on the C++ side
|
|
823
865
|
}
|
|
824
866
|
|
|
867
|
+
if (options.Has("sequences")) {
|
|
868
|
+
context_params.n_seq_max = options.Get("sequences").As<Napi::Number>().Uint32Value();
|
|
869
|
+
}
|
|
870
|
+
|
|
825
871
|
if (options.Has("embeddings")) {
|
|
826
872
|
context_params.embeddings = options.Get("embeddings").As<Napi::Boolean>().Value();
|
|
827
873
|
}
|
|
@@ -1039,6 +1085,15 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
|
|
|
1039
1085
|
return result;
|
|
1040
1086
|
}
|
|
1041
1087
|
|
|
1088
|
+
// Returns the result of `llama_get_state_size(ctx)` as a JS number.
// Throws a JS error ("Context is disposed") and returns undefined when the context was disposed.
Napi::Value GetStateSize(const Napi::CallbackInfo& info) {
    Napi::Env env = info.Env();

    if (!disposed) {
        return Napi::Number::From(env, llama_get_state_size(ctx));
    }

    Napi::Error::New(env, "Context is disposed").ThrowAsJavaScriptException();
    return env.Undefined();
}
|
|
1096
|
+
|
|
1042
1097
|
Napi::Value PrintTimings(const Napi::CallbackInfo& info) {
|
|
1043
1098
|
llama_print_timings(ctx);
|
|
1044
1099
|
llama_reset_timings(ctx);
|
|
@@ -1063,6 +1118,7 @@ class AddonContext : public Napi::ObjectWrap<AddonContext> {
|
|
|
1063
1118
|
InstanceMethod("sampleToken", &AddonContext::SampleToken),
|
|
1064
1119
|
InstanceMethod("acceptGrammarEvaluationStateToken", &AddonContext::AcceptGrammarEvaluationStateToken),
|
|
1065
1120
|
InstanceMethod("getEmbedding", &AddonContext::GetEmbedding),
|
|
1121
|
+
InstanceMethod("getStateSize", &AddonContext::GetStateSize),
|
|
1066
1122
|
InstanceMethod("printTimings", &AddonContext::PrintTimings),
|
|
1067
1123
|
InstanceMethod("dispose", &AddonContext::Dispose),
|
|
1068
1124
|
}
|
|
@@ -1444,6 +1500,55 @@ Napi::Value systemInfo(const Napi::CallbackInfo& info) {
|
|
|
1444
1500
|
return Napi::String::From(info.Env(), llama_print_system_info());
|
|
1445
1501
|
}
|
|
1446
1502
|
|
|
1503
|
+
// Exposes `llama_supports_gpu_offload()` to JS as a boolean.
Napi::Value addonGetSupportsGpuOffloading(const Napi::CallbackInfo& info) {
    const bool supportsGpuOffloading = llama_supports_gpu_offload();

    return Napi::Boolean::New(info.Env(), supportsGpuOffloading);
}
|
|
1506
|
+
|
|
1507
|
+
// Exposes `llama_supports_mmap()` to JS as a boolean.
Napi::Value addonGetSupportsMmap(const Napi::CallbackInfo& info) {
    const bool supportsMmap = llama_supports_mmap();

    return Napi::Boolean::New(info.Env(), supportsMmap);
}
|
|
1510
|
+
|
|
1511
|
+
// Exposes `llama_supports_mlock()` to JS as a boolean.
Napi::Value addonGetSupportsMlock(const Napi::CallbackInfo& info) {
    const bool supportsMlock = llama_supports_mlock();

    return Napi::Boolean::New(info.Env(), supportsMlock);
}
|
|
1514
|
+
|
|
1515
|
+
// Returns `ggml_blck_size()` for the ggml type number passed as the first JS argument,
// or undefined when the number is outside the `ggml_type` enum range.
Napi::Value addonGetBlockSizeForGgmlType(const Napi::CallbackInfo& info) {
    const int ggmlType = info[0].As<Napi::Number>().Int32Value();

    // GGML_TYPE_COUNT is the enum's terminator (one past the last real type),
    // so it must be rejected as well; valid values are [0, GGML_TYPE_COUNT)
    if (ggmlType < 0 || ggmlType >= GGML_TYPE_COUNT) {
        return info.Env().Undefined();
    }

    const auto blockSize = ggml_blck_size(static_cast<ggml_type>(ggmlType));

    return Napi::Number::New(info.Env(), blockSize);
}
|
|
1526
|
+
|
|
1527
|
+
// Returns `ggml_type_size()` for the ggml type number passed as the first JS argument,
// or undefined when the number is outside the `ggml_type` enum range.
Napi::Value addonGetTypeSizeForGgmlType(const Napi::CallbackInfo& info) {
    const int ggmlType = info[0].As<Napi::Number>().Int32Value();

    // GGML_TYPE_COUNT is the enum's terminator (one past the last real type),
    // so it must be rejected as well; valid values are [0, GGML_TYPE_COUNT)
    if (ggmlType < 0 || ggmlType >= GGML_TYPE_COUNT) {
        return info.Env().Undefined();
    }

    const auto typeSize = ggml_type_size(static_cast<ggml_type>(ggmlType));

    return Napi::Number::New(info.Env(), typeSize);
}
|
|
1538
|
+
|
|
1539
|
+
// Returns a JS object with numeric constants taken from ggml / llama.cpp:
// ggmlMaxDims, ggmlTypeF16Size, ggmlTypeF32Size, ggmlTensorOverhead,
// llamaMaxRngState, llamaPosSize and llamaSeqIdSize.
Napi::Value addonGetConsts(const Napi::CallbackInfo& info) {
    Napi::Env env = info.Env();
    Napi::Object consts = Napi::Object::New(env);

    // ggml values
    consts.Set("ggmlMaxDims", Napi::Number::New(env, GGML_MAX_DIMS));
    consts.Set("ggmlTypeF16Size", Napi::Number::New(env, ggml_type_size(GGML_TYPE_F16)));
    consts.Set("ggmlTypeF32Size", Napi::Number::New(env, ggml_type_size(GGML_TYPE_F32)));
    consts.Set("ggmlTensorOverhead", Napi::Number::New(env, ggml_tensor_overhead()));

    // llama.cpp values
    consts.Set("llamaMaxRngState", Napi::Number::New(env, LLAMA_MAX_RNG_STATE));
    consts.Set("llamaPosSize", Napi::Number::New(env, sizeof(llama_pos)));
    consts.Set("llamaSeqIdSize", Napi::Number::New(env, sizeof(llama_seq_id)));

    return consts;
}
|
|
1551
|
+
|
|
1447
1552
|
int addonGetGgmlLogLevelNumber(ggml_log_level level) {
|
|
1448
1553
|
switch (level) {
|
|
1449
1554
|
case GGML_LOG_LEVEL_ERROR: return 2;
|
|
@@ -1693,9 +1798,16 @@ static void addonFreeLlamaBackend(Napi::Env env, int* data) {
|
|
|
1693
1798
|
Napi::Object registerCallback(Napi::Env env, Napi::Object exports) {
|
|
1694
1799
|
exports.DefineProperties({
|
|
1695
1800
|
Napi::PropertyDescriptor::Function("systemInfo", systemInfo),
|
|
1801
|
+
Napi::PropertyDescriptor::Function("getSupportsGpuOffloading", addonGetSupportsGpuOffloading),
|
|
1802
|
+
Napi::PropertyDescriptor::Function("getSupportsMmap", addonGetSupportsMmap),
|
|
1803
|
+
Napi::PropertyDescriptor::Function("getSupportsMlock", addonGetSupportsMlock),
|
|
1804
|
+
Napi::PropertyDescriptor::Function("getBlockSizeForGgmlType", addonGetBlockSizeForGgmlType),
|
|
1805
|
+
Napi::PropertyDescriptor::Function("getTypeSizeForGgmlType", addonGetTypeSizeForGgmlType),
|
|
1806
|
+
Napi::PropertyDescriptor::Function("getConsts", addonGetConsts),
|
|
1696
1807
|
Napi::PropertyDescriptor::Function("setLogger", setLogger),
|
|
1697
1808
|
Napi::PropertyDescriptor::Function("setLoggerLogLevel", setLoggerLogLevel),
|
|
1698
1809
|
Napi::PropertyDescriptor::Function("getGpuVramInfo", getGpuVramInfo),
|
|
1810
|
+
Napi::PropertyDescriptor::Function("getGpuDeviceInfo", getGpuDeviceInfo),
|
|
1699
1811
|
Napi::PropertyDescriptor::Function("getGpuType", getGpuType),
|
|
1700
1812
|
Napi::PropertyDescriptor::Function("init", addonInit),
|
|
1701
1813
|
Napi::PropertyDescriptor::Function("dispose", addonDispose),
|
package/llama/gitRelease.bundle
CHANGED
|
Binary file
|
|
@@ -1,4 +1,6 @@
|
|
|
1
1
|
#include <stddef.h>
|
|
2
|
+
#include <vector>
|
|
3
|
+
#include <string>
|
|
2
4
|
|
|
3
5
|
#if defined(GPU_INFO_USE_HIPBLAS)
|
|
4
6
|
#include <hip/hip_runtime.h>
|
|
@@ -97,3 +99,22 @@ bool gpuInfoGetTotalCudaDevicesInfo(size_t * total, size_t * used, gpuInfoCudaEr
|
|
|
97
99
|
|
|
98
100
|
return true;
|
|
99
101
|
}
|
|
102
|
+
|
|
103
|
+
void gpuInfoGetCudaDeviceNames(std::vector<std::string> * deviceNames, gpuInfoCudaErrorLogCallback_t errorLogCallback) {
|
|
104
|
+
int deviceCount = gpuInfoGetCudaDeviceCount(errorLogCallback);
|
|
105
|
+
|
|
106
|
+
if (deviceCount < 0) {
|
|
107
|
+
return;
|
|
108
|
+
}
|
|
109
|
+
|
|
110
|
+
for (int i = 0; i < deviceCount; i++) {
|
|
111
|
+
cudaDeviceProp prop;
|
|
112
|
+
auto getDevicePropertiesResult = cudaGetDeviceProperties(&prop, i);
|
|
113
|
+
|
|
114
|
+
if (getDevicePropertiesResult != cudaSuccess) {
|
|
115
|
+
errorLogCallback(cudaGetErrorString(getDevicePropertiesResult));
|
|
116
|
+
} else {
|
|
117
|
+
(*deviceNames).push_back(std::string(prop.name));
|
|
118
|
+
}
|
|
119
|
+
}
|
|
120
|
+
}
|
|
@@ -1,7 +1,10 @@
|
|
|
1
1
|
#pragma once
|
|
2
2
|
|
|
3
3
|
#include <stddef.h>
|
|
4
|
+
#include <vector>
|
|
5
|
+
#include <string>
|
|
4
6
|
|
|
5
7
|
typedef void (*gpuInfoCudaErrorLogCallback_t)(const char* message);
|
|
6
8
|
|
|
7
9
|
bool gpuInfoGetTotalCudaDevicesInfo(size_t * total, size_t * used, gpuInfoCudaErrorLogCallback_t errorLogCallback);
|
|
10
|
+
void gpuInfoGetCudaDeviceNames(std::vector<std::string> * deviceNames, gpuInfoCudaErrorLogCallback_t errorLogCallback);
|
|
@@ -1,5 +1,8 @@
|
|
|
1
1
|
#pragma once
|
|
2
2
|
|
|
3
3
|
#include <stdint.h>
|
|
4
|
+
#include <string>
|
|
5
|
+
#include <vector>
|
|
4
6
|
|
|
5
|
-
void
|
|
7
|
+
void getMetalGpuInfo(uint64_t * total, uint64_t * used);
|
|
8
|
+
void getMetalGpuDeviceNames(std::vector<std::string> * deviceNames);
|
|
@@ -1,7 +1,9 @@
|
|
|
1
1
|
#include <stdint.h>
|
|
2
|
+
#include <vector>
|
|
3
|
+
#include <string>
|
|
2
4
|
#import <Metal/Metal.h>
|
|
3
5
|
|
|
4
|
-
void get_metal_gpu_info(uint64_t * total, uint64_t * used) {
|
|
6
|
+
void getMetalGpuInfo(uint64_t * total, uint64_t * used) {
|
|
5
7
|
id<MTLDevice> device = MTLCreateSystemDefaultDevice();
|
|
6
8
|
|
|
7
9
|
if (device) {
|
|
@@ -15,3 +17,14 @@ void get_metal_gpu_info(uint64_t * total, uint64_t * used) {
|
|
|
15
17
|
[device release];
|
|
16
18
|
device = nil;
|
|
17
19
|
}
|
|
20
|
+
|
|
21
|
+
void getMetalGpuDeviceNames(std::vector<std::string> * deviceNames) {
|
|
22
|
+
NSArray<id<MTLDevice>> *devices = MTLCopyAllDevices();
|
|
23
|
+
|
|
24
|
+
for (id<MTLDevice> device in devices) {
|
|
25
|
+
(*deviceNames).push_back(std::string(([NSString stringWithUTF8String:device.name.UTF8String]).UTF8String));
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
[devices release];
|
|
29
|
+
devices = nil;
|
|
30
|
+
}
|
|
@@ -1,10 +1,11 @@
|
|
|
1
1
|
#include <stddef.h>
|
|
2
|
+
#include <vector>
|
|
2
3
|
|
|
3
4
|
#include <vulkan/vulkan.hpp>
|
|
4
5
|
|
|
5
6
|
typedef void (*gpuInfoVulkanWarningLogCallback_t)(const char* message);
|
|
6
7
|
|
|
7
|
-
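bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {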
|
|
8
|
+
static bool enumerateVulkanDevices(size_t* total, size_t* used, bool addDeviceNames, std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
|
|
8
9
|
vk::ApplicationInfo appInfo("node-llama-cpp GPU info", 1, "llama.cpp", 1, VK_API_VERSION_1_2);
|
|
9
10
|
vk::InstanceCreateInfo createInfo(vk::InstanceCreateFlags(), &appInfo, {}, {});
|
|
10
11
|
vk::Instance instance = vk::createInstance(createInfo);
|
|
@@ -41,8 +42,14 @@ bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkan
|
|
|
41
42
|
|
|
42
43
|
for (uint32_t i = 0; i < memProps.memoryHeapCount; ++i) {
|
|
43
44
|
if (memProps.memoryHeaps[i].flags & vk::MemoryHeapFlagBits::eDeviceLocal) {
|
|
44
|
-
|
|
45
|
+
const auto size = memProps.memoryHeaps[i].size;
|
|
46
|
+
totalMem += size;
|
|
45
47
|
usedMem += memoryBudgetProperties.heapUsage[i];
|
|
48
|
+
|
|
49
|
+
if (size > 0 && addDeviceNames) {
|
|
50
|
+
(*deviceNames).push_back(std::string(deviceProps.deviceName.data()));
|
|
51
|
+
}
|
|
52
|
+
|
|
46
53
|
break;
|
|
47
54
|
}
|
|
48
55
|
}
|
|
@@ -63,3 +70,14 @@ bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkan
|
|
|
63
70
|
*used = usedMem;
|
|
64
71
|
return true;
|
|
65
72
|
}
|
|
73
|
+
|
|
74
|
+
bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
|
|
75
|
+
return enumerateVulkanDevices(total, used, false, nullptr, warningLogCallback);
|
|
76
|
+
}
|
|
77
|
+
|
|
78
|
+
bool gpuInfoGetVulkanDeviceNames(std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback) {
|
|
79
|
+
size_t vulkanDeviceTotal = 0;
|
|
80
|
+
size_t vulkanDeviceUsed = 0;
|
|
81
|
+
|
|
82
|
+
return enumerateVulkanDevices(&vulkanDeviceTotal, &vulkanDeviceUsed, true, deviceNames, warningLogCallback);
|
|
83
|
+
}
|
|
@@ -1,7 +1,9 @@
|
|
|
1
1
|
#pragma once
|
|
2
2
|
|
|
3
3
|
#include <stddef.h>
|
|
4
|
+
#include <vector>
|
|
4
5
|
|
|
5
6
|
typedef void (*gpuInfoVulkanWarningLogCallback_t)(const char* message);
|
|
6
7
|
|
|
7
8
|
bool gpuInfoGetTotalVulkanDevicesInfo(size_t* total, size_t* used, gpuInfoVulkanWarningLogCallback_t warningLogCallback);
|
|
9
|
+
bool gpuInfoGetVulkanDeviceNames(std::vector<std::string> * deviceNames, gpuInfoVulkanWarningLogCallback_t warningLogCallback);
|
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
set(CMAKE_SYSTEM_NAME Windows)
|
|
2
|
+
set(CMAKE_SYSTEM_PROCESSOR ARM64)
|
|
3
|
+
|
|
4
|
+
# Look for cl.exe in the Visual Studio installation directories
|
|
5
|
+
set(PROGRAMFILES "$ENV{ProgramFiles}")
|
|
6
|
+
set(PROGRAMFILES_X86 "$ENV{ProgramFiles\(x86\)}")
|
|
7
|
+
|
|
8
|
+
set(VS_INSTALL_PATHS
|
|
9
|
+
"${PROGRAMFILES_X86}/Microsoft Visual Studio"
|
|
10
|
+
"${PROGRAMFILES}/Microsoft Visual Studio"
|
|
11
|
+
"C:/Program Files (x86)/Microsoft Visual Studio"
|
|
12
|
+
"C:/Program Files/Microsoft Visual Studio"
|
|
13
|
+
)
|
|
14
|
+
foreach(PATH IN LISTS VS_INSTALL_PATHS)
|
|
15
|
+
if(CL_EXE_PATH)
|
|
16
|
+
break()
|
|
17
|
+
endif()
|
|
18
|
+
|
|
19
|
+
file(GLOB_RECURSE FOUND_CL_EXE "${PATH}/*/VC/Tools/MSVC/*/bin/Hostx64/arm64/cl.exe")
|
|
20
|
+
if(FOUND_CL_EXE)
|
|
21
|
+
list(GET FOUND_CL_EXE 0 CL_EXE_PATH)
|
|
22
|
+
break()
|
|
23
|
+
endif()
|
|
24
|
+
|
|
25
|
+
if(CL_EXE_PATH)
|
|
26
|
+
break()
|
|
27
|
+
endif()
|
|
28
|
+
|
|
29
|
+
file(GLOB_RECURSE FOUND_CL_EXE "${PATH}/**/*/VC/Tools/MSVC/*/bin/Hostx64/arm64/cl.exe")
|
|
30
|
+
if(FOUND_CL_EXE)
|
|
31
|
+
list(GET FOUND_CL_EXE 0 CL_EXE_PATH)
|
|
32
|
+
break()
|
|
33
|
+
endif()
|
|
34
|
+
endforeach()
|
|
35
|
+
|
|
36
|
+
if(NOT CL_EXE_PATH)
|
|
37
|
+
message(FATAL_ERROR "cl.exe not found for ARM architecture.")
|
|
38
|
+
else()
|
|
39
|
+
set(CMAKE_C_COMPILER "${CL_EXE_PATH}")
|
|
40
|
+
set(CMAKE_CXX_COMPILER "${CL_EXE_PATH}")
|
|
41
|
+
endif()
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"armv7l","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"armv7l","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"linux","platformInfo":{"name":"Ubuntu","version":"22.04"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"arm64","gpu":"metal","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"arm64","gpu":"metal","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"mac","platformInfo":{"name":"macOS","version":"21.6.0"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"arm64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":false,"llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"cuda","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"
|
|
1
|
+
{"buildOptions":{"customCmakeOptions":{},"progressLogs":true,"platform":"win","platformInfo":{"name":"Windows","version":"10.0.20348"},"arch":"x64","gpu":"vulkan","llamaCpp":{"repo":"ggerganov/llama.cpp","release":"b2608"}}}
|
|
Binary file
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "node-llama-cpp",
|
|
3
|
-
"version": "3.0.0-beta.14",
|
|
3
|
+
"version": "3.0.0-beta.15",
|
|
4
4
|
"description": "Run AI models locally on your machine with node.js bindings for llama.cpp. Force a JSON schema on the model output on the generation level",
|
|
5
5
|
"main": "dist/index.js",
|
|
6
6
|
"type": "module",
|
|
@@ -120,7 +120,7 @@
|
|
|
120
120
|
"@types/cli-progress": "^3.11.0",
|
|
121
121
|
"@types/cross-spawn": "^6.0.2",
|
|
122
122
|
"@types/fs-extra": "^11.0.4",
|
|
123
|
-
"@types/node": "^20.
|
|
123
|
+
"@types/node": "^20.11.29",
|
|
124
124
|
"@types/proper-lockfile": "^4.1.4",
|
|
125
125
|
"@types/semver": "^7.5.8",
|
|
126
126
|
"@types/uuid": "^9.0.2",
|
|
@@ -128,8 +128,8 @@
|
|
|
128
128
|
"@types/yargs": "^17.0.24",
|
|
129
129
|
"@typescript-eslint/eslint-plugin": "^6.3.0",
|
|
130
130
|
"@typescript-eslint/parser": "^6.3.0",
|
|
131
|
-
"@vitest/coverage-v8": "^1.
|
|
132
|
-
"@vitest/ui": "^1.
|
|
131
|
+
"@vitest/coverage-v8": "^1.4.0",
|
|
132
|
+
"@vitest/ui": "^1.4.0",
|
|
133
133
|
"eslint": "^8.46.0",
|
|
134
134
|
"eslint-plugin-import": "^2.28.0",
|
|
135
135
|
"eslint-plugin-jsdoc": "^46.9.0",
|
|
@@ -146,10 +146,11 @@
|
|
|
146
146
|
"typescript": "^5.2.2",
|
|
147
147
|
"vite-node": "^1.4.0",
|
|
148
148
|
"vitepress": "1.0.0-rc.22",
|
|
149
|
-
"vitest": "^1.
|
|
149
|
+
"vitest": "^1.4.0",
|
|
150
150
|
"zx": "^7.2.3"
|
|
151
151
|
},
|
|
152
152
|
"dependencies": {
|
|
153
|
+
"@huggingface/jinja": "^0.2.2",
|
|
153
154
|
"async-retry": "^1.3.3",
|
|
154
155
|
"bytes": "^3.1.2",
|
|
155
156
|
"chalk": "^5.3.0",
|
|
@@ -160,7 +161,7 @@
|
|
|
160
161
|
"cross-spawn": "^7.0.3",
|
|
161
162
|
"env-var": "^7.3.1",
|
|
162
163
|
"fs-extra": "^11.2.0",
|
|
163
|
-
"lifecycle-utils": "^1.4.
|
|
164
|
+
"lifecycle-utils": "^1.4.1",
|
|
164
165
|
"log-symbols": "^5.1.0",
|
|
165
166
|
"node-addon-api": "^7.0.0",
|
|
166
167
|
"octokit": "^3.1.0",
|
|
@@ -168,6 +169,7 @@
|
|
|
168
169
|
"proper-lockfile": "^4.1.2",
|
|
169
170
|
"semver": "^7.6.0",
|
|
170
171
|
"simple-git": "^3.19.1",
|
|
172
|
+
"slice-ansi": "^7.1.0",
|
|
171
173
|
"strip-ansi": "^7.1.0",
|
|
172
174
|
"uuid": "^9.0.0",
|
|
173
175
|
"which": "^4.0.0",
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"TemplateChatWrapper.js","sourceRoot":"","sources":["../src/TemplateChatWrapper.ts"],"names":[],"mappings":"AACA,OAAO,EAAC,mBAAmB,EAAE,SAAS,EAAkB,YAAY,EAAC,MAAM,sBAAsB,CAAC;AAClG,OAAO,EAAC,WAAW,EAAsB,MAAM,kBAAkB,CAAC;AAClE,OAAO,EAAC,iBAAiB,EAAC,MAAM,8BAA8B,CAAC;AAY/D;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,MAAM,OAAO,mBAAoB,SAAQ,WAAW;IAChC,WAAW,GAAG,UAAU,CAAC;IAChB,QAAQ,CAAsB;IAEvC,QAAQ,CAAe;IACvB,eAAe,CAAsB;IACrC,aAAa,CAAS;IACtB,YAAY,CAAS;IACrB,cAAc,CAAS;IACvB,iCAAiC,CAAU;IAE3D,gBAAgB,CAAkB,mBAAmB,CAAuC;IAC5F,gBAAgB,CAAkB,0BAA0B,CAA8C;IAE1G,YAAmB,EACf,QAAQ,EACR,eAAe,EACf,aAAa,EACb,YAAY,EACZ,cAAc,GAAG,QAAQ,EACzB,2BAA2B,EAC3B,iCAAiC,GAAG,IAAI,EACf;QACzB,KAAK,EAAE,CAAC;QAER,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,eAAe,GAAG,eAAe,CAAC;QACvC,IAAI,CAAC,aAAa,GAAG,aAAa,CAAC;QACnC,IAAI,CAAC,YAAY,GAAG,YAAY,CAAC;QACjC,IAAI,CAAC,cAAc,GAAG,cAAc,CAAC;QACrC,IAAI,CAAC,iCAAiC,GAAG,iCAAiC,CAAC;QAE3E,IAAI,CAAC,mBAAmB,GAAG,iBAAiB,CAAC,QAAQ,CAAC,CAAC;QACvD,IAAI,CAAC,0BAA0B,GAAG,wBAAwB,CAAC,eAAe,CAAC,CAAC;QAE5E,IAAI,CAAC,QAAQ,GAAG;YACZ,GAAG,KAAK,CAAC,QAAQ;YACjB,SAAS,EAAE,gCAAgC,CAAC,2BAA2B,CAAC,IAAI,WAAW,CAAC,cAAc,CAAC,SAAS;SACnH,CAAC;IACN,CAAC;IAEe,mBAAmB,CAAC,OAAmC,EAAE,EAAC,kBAAkB,EAAE,sBAAsB,KAGhH,EAAE;QAIF,MAAM,oBAAoB,GAAG,IAAI,CAAC,2CAA2C,CAAC,OAAO,EAAE,kBAAkB,EAAE;YACvG,cAAc,EAAE,sBAAsB;SACzC,CAAC,CAAC;QAEH,MAAM,WAAW,GAIZ,EAAE,CAAC;QAER,IAAI,WAAW,GAAa,EAAE,CAAC;QAC/B,IAAI,SAAS,GAAa,EAAE,CAAC;QAC7B,IAAI,UAAU,GAAa,EAAE,CAAC;QAC9B,IAAI,qBAAqB,GAAuC,IAAI,CAAC;QAErE,SAAS,KAAK;YACV,IAAI,WAAW,CAAC,MAAM,GAAG,CAAC,IAAI,SAAS,CAAC,MAAM,GAAG,CAAC,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC;gBACvE,WAAW,CAAC,IAAI,CAAC;oBACb,MAAM,EAAE,WAAW,CAAC,IAAI,CAAC,MAAM,CAAC;oBAChC,IAAI,EAAE,SAAS,CAAC,IAAI,CAAC,MAAM,CAAC;oBAC5B,KAAK,EAAE,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC;iBACjC,CAAC,CAAC;YAEP,WAAW,GAAG,EAAE,CAAC;YACjB,SAAS,GAAG,EAAE,CAAC;YACf,UAAU,GAAG,EAAE,CAAC;QACpB,CAAC;QAED,MAAM,cAAc,GAAG,CAAC,IAAiC,EAAE,IAAY,EAAE,MAAsB,EAAE,EAAE;YAC/F,MAAM,EAAC,cAAc,EAAE,aAAa,EAAE,aAAa,EAAC,GAAG,IAAI,CAAC,0BAA0
B,CAAC;YACvF,OAAO,SAAS,CAAC;gBACb,IAAI,YAAY,CAAC,CAAC,MAAM,IAAI,EAAE,CAAC,GAAG,cAAc,GAAG,IAAI,GAAG,aAAa,CAAC;gBACxE,IAAI;gBACJ,IAAI,YAAY,CAAC,aAAa,CAAC;aAClC,CAAC,CAAC;QACP,CAAC,CAAC;QAEF,KAAK,MAAM,IAAI,IAAI,oBAAoB,EAAE;YACrC,IAAI,IAAI,CAAC,IAAI,KAAK,QAAQ,EAAE;gBACxB,IAAI,CAAC,IAAI,CAAC,iCAAiC,IAAI,qBAAqB,KAAK,QAAQ;oBAC7E,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,QAAQ,CAAC;gBACjC,WAAW,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;aAC/B;iBAAM,IAAI,IAAI,CAAC,IAAI,KAAK,MAAM,EAAE;gBAC7B,IAAI,CAAC,IAAI,CAAC,iCAAiC,IAAI,CAAC,qBAAqB,KAAK,QAAQ,IAAI,qBAAqB,KAAK,MAAM,CAAC;oBACnH,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,MAAM,CAAC;gBAC/B,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;aAC7B;iBAAM,IAAI,IAAI,CAAC,IAAI,KAAK,OAAO,EAAE;gBAC9B,IAAI,CAAC,IAAI,CAAC,iCAAiC;oBACvC,KAAK,EAAE,CAAC;gBAEZ,qBAAqB,GAAG,OAAO,CAAC;gBAChC,UAAU,CAAC,IAAI,CAAC,IAAI,CAAC,yBAAyB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC,CAAC;aAClE;SACJ;QAED,KAAK,EAAE,CAAC;QAER,MAAM,WAAW,GAAG,SAAS,CACzB,WAAW,CAAC,GAAG,CAAC,CAAC,EAAC,MAAM,EAAE,IAAI,EAAE,KAAK,EAAC,EAAE,KAAK,EAAE,EAAE;YAC7C,MAAM,WAAW,GAAG,KAAK,KAAK,CAAC,CAAC;YAChC,MAAM,UAAU,GAAG,KAAK,KAAK,WAAW,CAAC,MAAM,GAAG,CAAC,CAAC;YAEpD,MAAM,GAAG,GAAG,SAAS,CAAC;gBAClB,WAAW;oBACP,CAAC,CAAC,MAAM,CAAC,MAAM,KAAK,CAAC;wBACjB,CAAC,CAAC,IAAI,YAAY,CAAC,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,IAAI,EAAE,CAAC,GAAG,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;wBAChH,CAAC,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,IAAI,IAAI;4BACjD,CAAC,CAAC,SAAS,CAAC;gCACR,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,kBAAkB,CAAC;gCAC7D,MAAM;gCACN,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;6BAC3D,CAAC;4BACF,CAAC,CAAC,cAAc,CAAC,QAAQ,EAAE,MAAM,EAAE,IAAI,CAAC,mBAAmB,CAAC,aAAa,CAAC;oBAClF,CAAC,CAAC,MAAM,CAAC,MAAM,KAAK,CAAC;wBACjB,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;wBACf,CAAC,CAAC,cAAc,CAAC,QAAQ,EAAE,MAAM,CAAC;gBAG1C,IAAI,CAAC,MAAM,KAAK,CAAC;oBACb,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;oBACf,CAAC,CAAC,cAAc,CAAC,MAAM,EAAE,IAAI,CAAC;gBAElC,KAAK,CAAC,MAAM,KAAK,CAAC;oBACd,CAAC,CAAC,SAAS,CAAC,EAAE,CAAC;oBACf,CAAC,CAAC,CAAC,UAAU;wBACT,CAAC,CAAC,cAAc,CAAC,OAAO,EAAE,KAAK,CAAC;wBAChC,CAAC,CAAC
,SAAS,CAAC;4BACR,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC;4BAC3D,KAAK;yBACR,CAAC;aACb,CAAC,CAAC;YAEH,OAAO,SAAS,CACZ,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE;gBAC7B,IAAI,KAAK,YAAY,YAAY,EAAE;oBAC/B,MAAM,QAAQ,GAAG,GAAG,CAAC,GAAG,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;oBAErC,IAAI,QAAQ,IAAI,IAAI,IAAI,CAAC,CAAC,QAAQ,YAAY,YAAY,CAAC;wBACvD,OAAO,GAAG,CAAC,MAAM,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC;oBAE/B,OAAO,GAAG,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC;wBAC3B,IAAI,YAAY,CAAC,QAAQ,CAAC,KAAK,GAAG,KAAK,CAAC,KAAK,CAAC;qBACjD,CAAC,CAAC;iBACN;gBAED,OAAO,GAAG,CAAC,MAAM,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC;YAC/B,CAAC,EAAE,EAAsB,CAAC,CAC7B,CAAC;QACN,CAAC,CAAC,CACL,CAAC;QAEF,OAAO;YACH,WAAW;YACX,sBAAsB,EAAE;gBACpB,SAAS,CAAC,IAAI,mBAAmB,CAAC,KAAK,CAAC,CAAC;gBACzC,SAAS,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC;gBACpD,SAAS,CAAC,IAAI,YAAY,CAAC,IAAI,CAAC,mBAAmB,CAAC,gBAAgB,CAAC,CAAC;aACzE;SACJ,CAAC;IACN,CAAC;CACJ;AAUD,SAAS,gCAAgC,CAAC,QAAiD;IACvF,IAAI,QAAQ,IAAI,IAAI;QAChB,OAAO,IAAI,CAAC;IAEhB,MAAM,CAAC,oBAAoB,EAAE,0BAA0B,CAAC,GAAG,QAAQ,CAAC;IAEpE,IAAI,oBAAoB,IAAI,IAAI,IAAI,0BAA0B,IAAI,IAAI;QAClE,MAAM,IAAI,KAAK,CAAC,oEAAoE,CAAC,CAAC;IAE1F,MAAM,0BAA0B,GAAG,iBAAiB,CAAC,oBAAoB,EAAE,CAAC;YACxE,IAAI,EAAE,kBAAkB;YACxB,GAAG,EAAE,cAAc;SACtB,EAAE;YACC,IAAI,EAAE,oBAAoB;YAC1B,GAAG,EAAE,gBAAgB;SACxB,CAAC,CAAC,CAAC;IACJ,MAAM,gCAAgC,GAAG,iBAAiB,CAAC,0BAA0B,EAAE,CAAC;YACpF,IAAI,EAAE,wBAAwB;YAC9B,GAAG,EAAE,oBAAoB;SAC5B,CAAC,CAAC,CAAC;IAEJ,MAAM,UAAU,GAAG,0BAA0B,CAAC,YAAY,CAAC,MAAM,CAAC;IAClE,MAAM,gBAAgB,GAAG,0BAA0B,CAAC,cAAc,CAAC,MAAM,CAAC;IAC1E,MAAM,UAAU,GAAG,0BAA0B,CAAC,cAAc,CAAC,MAAM,CAAC;IAEpE,MAAM,YAAY,GAAG,gCAAgC,CAAC,kBAAkB,CAAC,MAAM,CAAC;IAChF,MAAM,YAAY,GAAG,gCAAgC,CAAC,kBAAkB,CAAC,MAAM,CAAC;IAEhF,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QACvB,MAAM,IAAI,KAAK,CAAC,iEAAiE,CAAC,CAAC;IAEvF,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QACvB,MAAM,IAAI,KAAK,CAAC,kEAAkE,CAAC,CAAC;IAExF,IAAI,YAAY,CAAC,MAAM,KAAK,CAAC;QACzB,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;IAEpG,IAAI,YAAY,CAAC,MAAM,KAAK,CAAC;QACzB,MAAM,IAAI,KAAK,CAAC,
6EAA6E,CAAC,CAAC;IAEnG,OAAO;QACH,IAAI,EAAE;YACF,mBAAmB,EAAE,IAAI;YACzB,MAAM,EAAE,UAAU;YAClB,YAAY,EAAE,gBAAgB;YAC9B,MAAM,EAAE,UAAU;SACrB;QACD,MAAM,EAAE;YACJ,MAAM,EAAE,YAAY;YACpB,MAAM,EAAE,YAAY;SACvB;KACJ,CAAC;AACN,CAAC;AAED,SAAS,iBAAiB,CAAC,QAAsB;IAM7C,MAAM,cAAc,GAAG,iBAAiB,CAAC,QAAQ,EAAE,CAAC;YAChD,IAAI,EAAE,kBAAkB;YACxB,GAAG,EAAE,cAAc;YACnB,QAAQ,EAAE,IAAI;SACjB,EAAE;YACC,IAAI,EAAE,aAAa;YACnB,GAAG,EAAE,SAAS;SACjB,EAAE;YACC,IAAI,EAAE,gBAAgB;YACtB,GAAG,EAAE,YAAY;SACpB,CAAC,CAAC,CAAC;IAEJ,IAAI,cAAc,CAAC,UAAU,CAAC,MAAM,CAAC,MAAM,IAAI,CAAC;QAC5C,MAAM,IAAI,KAAK,CAAC,qDAAqD,CAAC,CAAC;IAE3E,OAAO;QACH,kBAAkB,EAAE,cAAc,CAAC,YAAY,EAAE,MAAM,IAAI,IAAI;QAC/D,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;QAC5C,gBAAgB,EAAE,cAAc,CAAC,UAAU,CAAC,MAAM;QAClD,gBAAgB,EAAE,cAAc,CAAC,UAAU,CAAC,MAAM;KACrD,CAAC;AACN,CAAC;AAED,SAAS,wBAAwB,CAAC,QAA6B;IAK3D,MAAM,cAAc,GAAG,iBAAiB,CAAC,QAAQ,EAAE,CAAC;YAChD,IAAI,EAAE,cAAc;YACpB,GAAG,EAAE,UAAU;SAClB,EAAE;YACC,IAAI,EAAE,aAAa;YACnB,GAAG,EAAE,SAAS;SACjB,CAAC,CAAC,CAAC;IAEJ,OAAO;QACH,cAAc,EAAE,cAAc,CAAC,QAAQ,CAAC,MAAM;QAC9C,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;QAC5C,aAAa,EAAE,cAAc,CAAC,OAAO,CAAC,MAAM;KAC/C,CAAC;AACN,CAAC"}
|
|
@@ -1,33 +0,0 @@
|
|
|
1
|
-
import { ModelTypeDescription } from "../AddonTypes.js";
|
|
2
|
-
import { GeneralChatWrapper } from "../../chatWrappers/GeneralChatWrapper.js";
|
|
3
|
-
import { LlamaChatWrapper } from "../../chatWrappers/LlamaChatWrapper.js";
|
|
4
|
-
import { AlpacaChatWrapper } from "../../chatWrappers/AlpacaChatWrapper.js";
|
|
5
|
-
import { FunctionaryChatWrapper } from "../../chatWrappers/FunctionaryChatWrapper.js";
|
|
6
|
-
import { ChatMLChatWrapper } from "../../chatWrappers/ChatMLChatWrapper.js";
|
|
7
|
-
import { FalconChatWrapper } from "../../chatWrappers/FalconChatWrapper.js";
|
|
8
|
-
import { GemmaChatWrapper } from "../../chatWrappers/GemmaChatWrapper.js";
|
|
9
|
-
export declare const chatWrapperTypeNames: readonly ["auto", "general", "llamaChat", "alpacaChat", "functionary", "chatML", "falconChat", "gemma"];
|
|
10
|
-
export type ChatWrapperTypeName = (typeof chatWrapperTypeNames)[number];
|
|
11
|
-
declare const chatWrappers: {
|
|
12
|
-
readonly general: typeof GeneralChatWrapper;
|
|
13
|
-
readonly llamaChat: typeof LlamaChatWrapper;
|
|
14
|
-
readonly alpacaChat: typeof AlpacaChatWrapper;
|
|
15
|
-
readonly functionary: typeof FunctionaryChatWrapper;
|
|
16
|
-
readonly chatML: typeof ChatMLChatWrapper;
|
|
17
|
-
readonly falconChat: typeof FalconChatWrapper;
|
|
18
|
-
readonly gemma: typeof GemmaChatWrapper;
|
|
19
|
-
};
|
|
20
|
-
/**
|
|
21
|
-
* @param configType
|
|
22
|
-
* @param options
|
|
23
|
-
*/
|
|
24
|
-
export declare function resolveChatWrapperBasedOnWrapperTypeName(configType: ChatWrapperTypeName, { bosString, filename, typeDescription, customWrapperSettings }?: {
|
|
25
|
-
bosString?: string | null;
|
|
26
|
-
filename?: string;
|
|
27
|
-
/** @hidden this type alias is too long in the documentation */
|
|
28
|
-
typeDescription?: ModelTypeDescription;
|
|
29
|
-
customWrapperSettings?: {
|
|
30
|
-
[wrapper in keyof typeof chatWrappers]?: ConstructorParameters<(typeof chatWrappers)[wrapper]>[0];
|
|
31
|
-
};
|
|
32
|
-
}): LlamaChatWrapper | ChatMLChatWrapper | GeneralChatWrapper | FalconChatWrapper | FunctionaryChatWrapper | GemmaChatWrapper;
|
|
33
|
-
export {};
|