node-llama-cpp 3.0.0-beta.43 → 3.0.0-beta.45
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +33 -21
- package/bins/_linux-arm64.moved.txt +1 -0
- package/bins/_linux-armv7l.moved.txt +1 -0
- package/bins/_linux-x64-vulkan.moved.txt +1 -0
- package/bins/_linux-x64.moved.txt +1 -0
- package/bins/_mac-arm64-metal.moved.txt +1 -0
- package/bins/_mac-x64.moved.txt +1 -0
- package/bins/_win-arm64.moved.txt +1 -0
- package/bins/_win-x64-vulkan.moved.txt +1 -0
- package/bins/_win-x64.moved.txt +1 -0
- package/dist/ChatWrapper.d.ts +11 -1
- package/dist/ChatWrapper.js +1 -1
- package/dist/ChatWrapper.js.map +1 -1
- package/dist/bindings/AddonTypes.d.ts +30 -19
- package/dist/bindings/Llama.d.ts +9 -0
- package/dist/bindings/Llama.js +33 -6
- package/dist/bindings/Llama.js.map +1 -1
- package/dist/bindings/consts.d.ts +1 -1
- package/dist/bindings/consts.js +2 -0
- package/dist/bindings/consts.js.map +1 -1
- package/dist/bindings/getLlama.d.ts +33 -5
- package/dist/bindings/getLlama.js +14 -3
- package/dist/bindings/getLlama.js.map +1 -1
- package/dist/bindings/types.d.ts +2 -2
- package/dist/bindings/types.js +2 -0
- package/dist/bindings/types.js.map +1 -1
- package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -1
- package/dist/bindings/utils/compileLLamaCpp.d.ts +0 -1
- package/dist/bindings/utils/compileLLamaCpp.js +45 -7
- package/dist/bindings/utils/compileLLamaCpp.js.map +1 -1
- package/dist/bindings/utils/getBestComputeLayersAvailable.d.ts +0 -1
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js +2 -2
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js.map +1 -1
- package/dist/bindings/utils/getGpuTypesToUseForOption.d.ts +0 -1
- package/dist/bindings/utils/testCmakeBinary.d.ts +0 -1
- package/dist/chatWrappers/AlpacaChatWrapper.js +4 -3
- package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/ChatMLChatWrapper.js +1 -1
- package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FalconChatWrapper.js +5 -4
- package/dist/chatWrappers/FalconChatWrapper.js.map +1 -1
- package/dist/chatWrappers/FunctionaryChatWrapper.d.ts +2 -2
- package/dist/chatWrappers/FunctionaryChatWrapper.js +200 -12
- package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -1
- package/dist/chatWrappers/GemmaChatWrapper.js +1 -1
- package/dist/chatWrappers/GemmaChatWrapper.js.map +1 -1
- package/dist/chatWrappers/GeneralChatWrapper.js +5 -4
- package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -1
- package/dist/chatWrappers/Llama2ChatWrapper.js +5 -6
- package/dist/chatWrappers/Llama2ChatWrapper.js.map +1 -1
- package/dist/chatWrappers/Llama3ChatWrapper.js +1 -1
- package/dist/chatWrappers/Llama3ChatWrapper.js.map +1 -1
- package/dist/chatWrappers/Llama3_1ChatWrapper.d.ts +13 -9
- package/dist/chatWrappers/Llama3_1ChatWrapper.js +92 -38
- package/dist/chatWrappers/Llama3_1ChatWrapper.js.map +1 -1
- package/dist/chatWrappers/MistralChatWrapper.d.ts +15 -0
- package/dist/chatWrappers/MistralChatWrapper.js +169 -0
- package/dist/chatWrappers/MistralChatWrapper.js.map +1 -0
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.d.ts +25 -1
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js +50 -12
- package/dist/chatWrappers/generic/JinjaTemplateChatWrapper.js.map +1 -1
- package/dist/chatWrappers/generic/TemplateChatWrapper.d.ts +22 -16
- package/dist/chatWrappers/generic/TemplateChatWrapper.js +28 -24
- package/dist/chatWrappers/generic/TemplateChatWrapper.js.map +1 -1
- package/dist/chatWrappers/generic/utils/chatHistoryFunctionCallMessageTemplate.d.ts +1 -1
- package/dist/chatWrappers/utils/chunkChatItems.d.ts +10 -0
- package/dist/chatWrappers/utils/chunkChatItems.js +44 -0
- package/dist/chatWrappers/utils/chunkChatItems.js.map +1 -0
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js +37 -26
- package/dist/chatWrappers/utils/isJinjaTemplateEquivalentToSpecializedChatWrapper.js.map +1 -1
- package/dist/chatWrappers/utils/jsonDumps.d.ts +1 -1
- package/dist/chatWrappers/utils/jsonDumps.js +2 -2
- package/dist/chatWrappers/utils/jsonDumps.js.map +1 -1
- package/dist/chatWrappers/utils/resolveChatWrapper.d.ts +30 -6
- package/dist/chatWrappers/utils/resolveChatWrapper.js +71 -25
- package/dist/chatWrappers/utils/resolveChatWrapper.js.map +1 -1
- package/dist/cli/cli.js +2 -6
- package/dist/cli/cli.js.map +1 -1
- package/dist/cli/commands/ChatCommand.d.ts +2 -1
- package/dist/cli/commands/ChatCommand.js +83 -53
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/cli/commands/CompleteCommand.d.ts +2 -1
- package/dist/cli/commands/CompleteCommand.js +58 -30
- package/dist/cli/commands/CompleteCommand.js.map +1 -1
- package/dist/cli/commands/DebugCommand.js +1 -1
- package/dist/cli/commands/DebugCommand.js.map +1 -1
- package/dist/cli/commands/InfillCommand.d.ts +2 -1
- package/dist/cli/commands/InfillCommand.js +58 -30
- package/dist/cli/commands/InfillCommand.js.map +1 -1
- package/dist/cli/commands/InitCommand.js +1 -1
- package/dist/cli/commands/PullCommand.d.ts +2 -1
- package/dist/cli/commands/PullCommand.js +85 -44
- package/dist/cli/commands/PullCommand.js.map +1 -1
- package/dist/cli/commands/inspect/InspectCommand.js +5 -3
- package/dist/cli/commands/inspect/InspectCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.d.ts +12 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js +225 -0
- package/dist/cli/commands/inspect/commands/InspectEstimateCommand.js.map +1 -0
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js +17 -4
- package/dist/cli/commands/inspect/commands/InspectGgufCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js +31 -9
- package/dist/cli/commands/inspect/commands/InspectGpuCommand.js.map +1 -1
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js +7 -4
- package/dist/cli/commands/inspect/commands/InspectMeasureCommand.js.map +1 -1
- package/dist/cli/commands/source/SourceCommand.d.ts +4 -0
- package/dist/cli/commands/source/SourceCommand.js +19 -0
- package/dist/cli/commands/source/SourceCommand.js.map +1 -0
- package/dist/cli/commands/{BuildCommand.d.ts → source/commands/BuildCommand.d.ts} +1 -2
- package/dist/cli/commands/{BuildCommand.js → source/commands/BuildCommand.js} +21 -19
- package/dist/cli/commands/source/commands/BuildCommand.js.map +1 -0
- package/dist/cli/commands/{ClearCommand.js → source/commands/ClearCommand.js} +6 -6
- package/dist/cli/commands/source/commands/ClearCommand.js.map +1 -0
- package/dist/cli/commands/{DownloadCommand.d.ts → source/commands/DownloadCommand.d.ts} +1 -2
- package/dist/cli/commands/{DownloadCommand.js → source/commands/DownloadCommand.js} +26 -22
- package/dist/cli/commands/source/commands/DownloadCommand.js.map +1 -0
- package/dist/cli/recommendedModels.js +192 -23
- package/dist/cli/recommendedModels.js.map +1 -1
- package/dist/cli/utils/ConsoleInteraction.d.ts +0 -1
- package/dist/cli/utils/ConsoleTable.js.map +1 -1
- package/dist/cli/utils/basicChooseFromListConsoleInteraction.js.map +1 -1
- package/dist/cli/utils/interactivelyAskForModel.js +6 -17
- package/dist/cli/utils/interactivelyAskForModel.js.map +1 -1
- package/dist/cli/utils/printCommonInfoLines.js +3 -0
- package/dist/cli/utils/printCommonInfoLines.js.map +1 -1
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.d.ts +6 -0
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.js +14 -0
- package/dist/cli/utils/renderModelCompatibilityPercentageWithColors.js.map +1 -0
- package/dist/cli/utils/resolveModelRecommendationFileOptions.d.ts +1 -1
- package/dist/cli/utils/withCliCommandDescriptionDocsUrl.js.map +1 -1
- package/dist/commands.d.ts +3 -3
- package/dist/commands.js +3 -3
- package/dist/commands.js.map +1 -1
- package/dist/config.d.ts +7 -3
- package/dist/config.js +10 -6
- package/dist/config.js.map +1 -1
- package/dist/evaluator/LlamaChat/LlamaChat.d.ts +17 -2
- package/dist/evaluator/LlamaChat/LlamaChat.js +24 -12
- package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -1
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +3 -1
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +21 -13
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js +15 -14
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.d.ts +1 -0
- package/dist/evaluator/LlamaChatSession/utils/LlamaChatSessionPromptCompletionEngine.js.map +1 -1
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.d.ts +3 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js +3 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +1 -1
- package/dist/evaluator/LlamaCompletion.d.ts +18 -4
- package/dist/evaluator/LlamaCompletion.js +51 -22
- package/dist/evaluator/LlamaCompletion.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaContext.d.ts +21 -0
- package/dist/evaluator/LlamaContext/LlamaContext.js +256 -133
- package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -1
- package/dist/evaluator/LlamaContext/LlamaSampler.d.ts +1 -0
- package/dist/evaluator/LlamaContext/LlamaSampler.js +31 -0
- package/dist/evaluator/LlamaContext/LlamaSampler.js.map +1 -0
- package/dist/evaluator/LlamaContext/types.d.ts +71 -9
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizationStrategies/maximumParallelismStrategy.js.map +1 -1
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js +1 -1
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizationStrategy.js.map +1 -1
- package/dist/evaluator/LlamaEmbedding.d.ts +21 -0
- package/dist/evaluator/LlamaEmbedding.js +53 -0
- package/dist/evaluator/LlamaEmbedding.js.map +1 -0
- package/dist/evaluator/LlamaEmbeddingContext.d.ts +1 -5
- package/dist/evaluator/LlamaEmbeddingContext.js +6 -8
- package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -1
- package/dist/evaluator/LlamaGrammar.d.ts +9 -10
- package/dist/evaluator/LlamaGrammar.js +10 -5
- package/dist/evaluator/LlamaGrammar.js.map +1 -1
- package/dist/evaluator/LlamaGrammarEvaluationState.d.ts +7 -3
- package/dist/evaluator/LlamaGrammarEvaluationState.js +8 -4
- package/dist/evaluator/LlamaGrammarEvaluationState.js.map +1 -1
- package/dist/evaluator/LlamaJsonSchemaGrammar.d.ts +3 -0
- package/dist/evaluator/LlamaJsonSchemaGrammar.js +3 -0
- package/dist/evaluator/LlamaJsonSchemaGrammar.js.map +1 -1
- package/dist/evaluator/LlamaModel/LlamaModel.d.ts +28 -15
- package/dist/evaluator/LlamaModel/LlamaModel.js +66 -51
- package/dist/evaluator/LlamaModel/LlamaModel.js.map +1 -1
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.d.ts +10 -10
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.js +10 -10
- package/dist/evaluator/LlamaModel/utils/TokenAttributes.js.map +1 -1
- package/dist/evaluator/TokenBias.d.ts +20 -8
- package/dist/evaluator/TokenBias.js +44 -12
- package/dist/evaluator/TokenBias.js.map +1 -1
- package/dist/evaluator/TokenMeter.d.ts +3 -12
- package/dist/evaluator/TokenMeter.js +4 -16
- package/dist/evaluator/TokenMeter.js.map +1 -1
- package/dist/gguf/fileReaders/GgufFileReader.d.ts +0 -1
- package/dist/gguf/fileReaders/GgufFileReader.js.map +1 -1
- package/dist/gguf/fileReaders/GgufFsFileReader.d.ts +0 -2
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.d.ts +5 -3
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js +26 -13
- package/dist/gguf/fileReaders/GgufNetworkFetchFileReader.js.map +1 -1
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.d.ts +57 -1
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js +86 -4
- package/dist/gguf/insights/GgufInsightsConfigurationResolver.js.map +1 -1
- package/dist/gguf/insights/utils/scoreLevels.js.map +1 -1
- package/dist/gguf/readGgufFileInfo.d.ts +18 -6
- package/dist/gguf/readGgufFileInfo.js +8 -3
- package/dist/gguf/readGgufFileInfo.js.map +1 -1
- package/dist/gguf/types/GgufMetadataTypes.d.ts +18 -2
- package/dist/gguf/types/GgufMetadataTypes.js +16 -1
- package/dist/gguf/types/GgufMetadataTypes.js.map +1 -1
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js +2 -0
- package/dist/gguf/utils/convertMetadataKeyValueRecordToNestedObject.js.map +1 -1
- package/dist/gguf/utils/getGgufFileTypeName.d.ts +1 -1
- package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js +1 -1
- package/dist/gguf/utils/resolveBinarySplitGgufPartUrls.js.map +1 -1
- package/dist/index.d.ts +8 -4
- package/dist/index.js +5 -3
- package/dist/index.js.map +1 -1
- package/dist/tsconfig.tsbuildinfo +1 -0
- package/dist/types.d.ts +1 -0
- package/dist/types.js.map +1 -1
- package/dist/utils/LlamaText.d.ts +3 -0
- package/dist/utils/LlamaText.js +7 -4
- package/dist/utils/LlamaText.js.map +1 -1
- package/dist/utils/LruCache.d.ts +2 -2
- package/dist/utils/LruCache.js.map +1 -1
- package/dist/utils/OverridesObject.d.ts +7 -0
- package/dist/utils/OverridesObject.js +2 -0
- package/dist/utils/OverridesObject.js.map +1 -0
- package/dist/utils/StopGenerationDetector.js.map +1 -1
- package/dist/utils/ThreadsSplitter.d.ts +26 -0
- package/dist/utils/ThreadsSplitter.js +164 -0
- package/dist/utils/ThreadsSplitter.js.map +1 -0
- package/dist/utils/TokenStreamRegulator.js.map +1 -1
- package/dist/utils/appendUserMessageToChatHistory.d.ts +4 -0
- package/dist/utils/appendUserMessageToChatHistory.js +4 -0
- package/dist/utils/appendUserMessageToChatHistory.js.map +1 -1
- package/dist/utils/compareTokens.d.ts +1 -1
- package/dist/utils/compareTokens.js.map +1 -1
- package/dist/utils/createModelDownloader.d.ts +94 -6
- package/dist/utils/createModelDownloader.js +174 -46
- package/dist/utils/createModelDownloader.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfOr.js.map +1 -1
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js +1 -1
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js.map +1 -1
- package/dist/utils/getGrammarsFolder.js +1 -1
- package/dist/utils/getGrammarsFolder.js.map +1 -1
- package/dist/utils/gitReleaseBundles.js.map +1 -1
- package/dist/utils/modelFileAccesTokens.d.ts +4 -0
- package/dist/utils/modelFileAccesTokens.js +40 -0
- package/dist/utils/modelFileAccesTokens.js.map +1 -0
- package/dist/utils/parseModelFileName.js.map +1 -1
- package/dist/utils/parseTextTemplate.js.map +1 -1
- package/dist/utils/resolveGithubRelease.d.ts +1 -1
- package/dist/utils/resolveLastTokens.js.map +1 -1
- package/dist/utils/spawnCommand.d.ts +0 -1
- package/dist/utils/truncateTextAndRoundToWords.js +3 -1
- package/dist/utils/truncateTextAndRoundToWords.js.map +1 -1
- package/dist/utils/withOra.js +1 -1
- package/dist/utils/withOra.js.map +1 -1
- package/dist/utils/withProgressLog.d.ts +0 -1
- package/dist/utils/wrapAbortSignal.d.ts +0 -1
- package/llama/CMakeLists.txt +20 -12
- package/llama/addon/AddonContext.cpp +69 -202
- package/llama/addon/AddonContext.h +4 -5
- package/llama/addon/AddonGrammar.cpp +8 -11
- package/llama/addon/AddonGrammar.h +4 -3
- package/llama/addon/AddonGrammarEvaluationState.cpp +9 -10
- package/llama/addon/AddonGrammarEvaluationState.h +3 -1
- package/llama/addon/AddonModel.cpp +6 -5
- package/llama/addon/AddonSampler.cpp +513 -0
- package/llama/addon/AddonSampler.h +65 -0
- package/llama/addon/RingBuffer.h +109 -0
- package/llama/addon/addon.cpp +7 -0
- package/llama/addon/globals/addonLog.cpp +2 -1
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/grammars/README.md +1 -1
- package/llama/llama.cpp.info.json +1 -1
- package/package.json +71 -46
- package/templates/packed/electron-typescript-react.json +1 -1
- package/templates/packed/node-typescript.json +1 -1
- package/bins/linux-arm64/_nlcBuildMetadata.json +0 -1
- package/bins/linux-arm64/libggml.so +0 -0
- package/bins/linux-arm64/libllama.so +0 -0
- package/bins/linux-arm64/llama-addon.node +0 -0
- package/bins/linux-armv7l/_nlcBuildMetadata.json +0 -1
- package/bins/linux-armv7l/libggml.so +0 -0
- package/bins/linux-armv7l/libllama.so +0 -0
- package/bins/linux-armv7l/llama-addon.node +0 -0
- package/bins/linux-x64/_nlcBuildMetadata.json +0 -1
- package/bins/linux-x64/libggml.so +0 -0
- package/bins/linux-x64/libllama.so +0 -0
- package/bins/linux-x64/llama-addon.node +0 -0
- package/bins/linux-x64-vulkan/_nlcBuildMetadata.json +0 -1
- package/bins/linux-x64-vulkan/libggml.so +0 -0
- package/bins/linux-x64-vulkan/libllama.so +0 -0
- package/bins/linux-x64-vulkan/llama-addon.node +0 -0
- package/bins/linux-x64-vulkan/vulkan-shaders-gen +0 -0
- package/bins/mac-arm64-metal/_nlcBuildMetadata.json +0 -1
- package/bins/mac-arm64-metal/ggml-common.h +0 -1833
- package/bins/mac-arm64-metal/ggml-metal.metal +0 -6168
- package/bins/mac-arm64-metal/libggml.dylib +0 -0
- package/bins/mac-arm64-metal/libllama.dylib +0 -0
- package/bins/mac-arm64-metal/llama-addon.node +0 -0
- package/bins/mac-x64/_nlcBuildMetadata.json +0 -1
- package/bins/mac-x64/libggml.dylib +0 -0
- package/bins/mac-x64/libllama.dylib +0 -0
- package/bins/mac-x64/llama-addon.node +0 -0
- package/bins/win-arm64/_nlcBuildMetadata.json +0 -1
- package/bins/win-arm64/ggml.dll +0 -0
- package/bins/win-arm64/llama-addon.exp +0 -0
- package/bins/win-arm64/llama-addon.lib +0 -0
- package/bins/win-arm64/llama-addon.node +0 -0
- package/bins/win-arm64/llama.dll +0 -0
- package/bins/win-x64/_nlcBuildMetadata.json +0 -1
- package/bins/win-x64/ggml.dll +0 -0
- package/bins/win-x64/llama-addon.exp +0 -0
- package/bins/win-x64/llama-addon.lib +0 -0
- package/bins/win-x64/llama-addon.node +0 -0
- package/bins/win-x64/llama.dll +0 -0
- package/bins/win-x64-vulkan/_nlcBuildMetadata.json +0 -1
- package/bins/win-x64-vulkan/ggml.dll +0 -0
- package/bins/win-x64-vulkan/llama-addon.exp +0 -0
- package/bins/win-x64-vulkan/llama-addon.lib +0 -0
- package/bins/win-x64-vulkan/llama-addon.node +0 -0
- package/bins/win-x64-vulkan/llama.dll +0 -0
- package/bins/win-x64-vulkan/vulkan-shaders-gen.exe +0 -0
- package/dist/cli/commands/BuildCommand.js.map +0 -1
- package/dist/cli/commands/ClearCommand.js.map +0 -1
- package/dist/cli/commands/DownloadCommand.js.map +0 -1
- package/dist/utils/DeepPartialObject.d.ts +0 -3
- package/dist/utils/DeepPartialObject.js +0 -2
- package/dist/utils/DeepPartialObject.js.map +0 -1
- /package/dist/cli/commands/{ClearCommand.d.ts → source/commands/ClearCommand.d.ts} +0 -0
package/llama/addon/addon.cpp
CHANGED
|
@@ -3,6 +3,7 @@
|
|
|
3
3
|
#include "AddonModelLora.h"
|
|
4
4
|
#include "AddonGrammar.h"
|
|
5
5
|
#include "AddonGrammarEvaluationState.h"
|
|
6
|
+
#include "AddonSampler.h"
|
|
6
7
|
#include "AddonContext.h"
|
|
7
8
|
#include "globals/addonLog.h"
|
|
8
9
|
#include "globals/addonProgress.h"
|
|
@@ -27,6 +28,10 @@ Napi::Value addonGetSupportsMlock(const Napi::CallbackInfo& info) {
|
|
|
27
28
|
return Napi::Boolean::New(info.Env(), llama_supports_mlock());
|
|
28
29
|
}
|
|
29
30
|
|
|
31
|
+
Napi::Value addonGetMathCores(const Napi::CallbackInfo& info) {
|
|
32
|
+
return Napi::Number::New(info.Env(), cpu_get_num_math());
|
|
33
|
+
}
|
|
34
|
+
|
|
30
35
|
Napi::Value addonGetBlockSizeForGgmlType(const Napi::CallbackInfo& info) {
|
|
31
36
|
const int ggmlType = info[0].As<Napi::Number>().Int32Value();
|
|
32
37
|
|
|
@@ -189,6 +194,7 @@ Napi::Object registerCallback(Napi::Env env, Napi::Object exports) {
|
|
|
189
194
|
Napi::PropertyDescriptor::Function("getSupportsGpuOffloading", addonGetSupportsGpuOffloading),
|
|
190
195
|
Napi::PropertyDescriptor::Function("getSupportsMmap", addonGetSupportsMmap),
|
|
191
196
|
Napi::PropertyDescriptor::Function("getSupportsMlock", addonGetSupportsMlock),
|
|
197
|
+
Napi::PropertyDescriptor::Function("getMathCores", addonGetMathCores),
|
|
192
198
|
Napi::PropertyDescriptor::Function("getBlockSizeForGgmlType", addonGetBlockSizeForGgmlType),
|
|
193
199
|
Napi::PropertyDescriptor::Function("getTypeSizeForGgmlType", addonGetTypeSizeForGgmlType),
|
|
194
200
|
Napi::PropertyDescriptor::Function("getConsts", addonGetConsts),
|
|
@@ -205,6 +211,7 @@ Napi::Object registerCallback(Napi::Env env, Napi::Object exports) {
|
|
|
205
211
|
AddonGrammar::init(exports);
|
|
206
212
|
AddonGrammarEvaluationState::init(exports);
|
|
207
213
|
AddonContext::init(exports);
|
|
214
|
+
AddonSampler::init(exports);
|
|
208
215
|
|
|
209
216
|
llama_log_set(addonLlamaCppLogCallback, nullptr);
|
|
210
217
|
|
|
@@ -11,7 +11,8 @@ static int addonGetGgmlLogLevelNumber(ggml_log_level level) {
|
|
|
11
11
|
case GGML_LOG_LEVEL_ERROR: return 2;
|
|
12
12
|
case GGML_LOG_LEVEL_WARN: return 3;
|
|
13
13
|
case GGML_LOG_LEVEL_INFO: return 4;
|
|
14
|
-
case
|
|
14
|
+
case GGML_LOG_LEVEL_NONE: return 5;
|
|
15
|
+
case GGML_LOG_LEVEL_DEBUG: return 6;
|
|
15
16
|
}
|
|
16
17
|
|
|
17
18
|
return 1;
|
package/llama/gitRelease.bundle
CHANGED
|
Binary file
|
package/llama/grammars/README.md
CHANGED
|
@@ -120,7 +120,7 @@ You can use GBNF grammars:
|
|
|
120
120
|
|
|
121
121
|
- In [llama-server](../examples/server):
|
|
122
122
|
- For any completion endpoints, passed as the `json_schema` body field
|
|
123
|
-
- For the `/chat/completions` endpoint, passed inside the `
|
|
123
|
+
- For the `/chat/completions` endpoint, passed inside the `response_format` body field (e.g. `{"type": "json_object", "schema": {"items": {}}}` or `{ type: "json_schema", json_schema: {"schema": ...} }`)
|
|
124
124
|
- In [llama-cli](../examples/main), passed as the `--json` / `-j` flag
|
|
125
125
|
- To convert to a grammar ahead of time:
|
|
126
126
|
- in CLI, with [examples/json_schema_to_grammar.py](../examples/json_schema_to_grammar.py)
|
package/package.json
CHANGED
|
@@ -1,12 +1,13 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "node-llama-cpp",
|
|
3
|
-
"version": "3.0.0-beta.43",
|
|
3
|
+
"version": "3.0.0-beta.45",
|
|
4
4
|
"description": "Run AI models locally on your machine with node.js bindings for llama.cpp. Force a JSON schema on the model output on the generation level",
|
|
5
5
|
"main": "./dist/index.js",
|
|
6
6
|
"type": "module",
|
|
7
7
|
"types": "./dist/index.d.ts",
|
|
8
8
|
"bin": {
|
|
9
|
-
"node-llama-cpp": "dist/cli/cli.js"
|
|
9
|
+
"node-llama-cpp": "dist/cli/cli.js",
|
|
10
|
+
"nlc": "dist/cli/cli.js"
|
|
10
11
|
},
|
|
11
12
|
"files": [
|
|
12
13
|
"dist/",
|
|
@@ -57,15 +58,15 @@
|
|
|
57
58
|
"test:standalone:interactive": "vitest watch ./test/standalone",
|
|
58
59
|
"test:modelDependent": "vitest run ./test/modelDependent",
|
|
59
60
|
"test:modelDependent:interactive": "vitest watch ./test/modelDependent",
|
|
60
|
-
"test:typescript": "tsc --
|
|
61
|
+
"test:typescript": "tsc --noEmit --project tsconfig.json",
|
|
61
62
|
"lint": "npm run lint:eslint",
|
|
62
63
|
"lint:eslint": "eslint --ext .js --ext .ts --report-unused-disable-directives .",
|
|
63
64
|
"format": "npm run lint:eslint -- --fix",
|
|
64
65
|
"dev:setup:downloadAllTestModels": "vite-node test/utils/scripts/downloadAllTestModels.ts",
|
|
65
|
-
"dev:setup": "npm run build && node ./dist/cli/cli.js download --noUsageExample && npm run docs:generateTypedoc && npm run dev:setup:downloadAllTestModels",
|
|
66
|
-
"dev:build": "npm run build && node ./dist/cli/cli.js build --noUsageExample",
|
|
66
|
+
"dev:setup": "npm run build && node ./dist/cli/cli.js source download --noUsageExample && npm run docs:generateTypedoc && npm run dev:setup:downloadAllTestModels",
|
|
67
|
+
"dev:build": "npm run build && node ./dist/cli/cli.js source build --noUsageExample",
|
|
67
68
|
"clean": "rm -rf ./node_modules ./dist ./tsconfig.tsbuildinfo ./test/.models ./docs/api ./docs/api-overrides ./templates/packed",
|
|
68
|
-
"docs:generateTypedoc": "typedoc
|
|
69
|
+
"docs:generateTypedoc": "typedoc && rimraf ./docs/api/index.md ./docs/api/globals.md ./docs/api/functions/LlamaText.md",
|
|
69
70
|
"docs:dev": "npm run docs:generateTypedoc && vitepress dev",
|
|
70
71
|
"docs:build": "npm run docs:generateTypedoc && vitepress build",
|
|
71
72
|
"docs:preview": "npm run docs:generateTypedoc && vitepress preview"
|
|
@@ -89,6 +90,7 @@
|
|
|
89
90
|
"cuda",
|
|
90
91
|
"vulkan",
|
|
91
92
|
"grammar",
|
|
93
|
+
"embedding",
|
|
92
94
|
"json-grammar",
|
|
93
95
|
"json-schema-grammar",
|
|
94
96
|
"functions",
|
|
@@ -98,11 +100,17 @@
|
|
|
98
100
|
"minP",
|
|
99
101
|
"topK",
|
|
100
102
|
"topP",
|
|
103
|
+
"seed",
|
|
101
104
|
"json-schema",
|
|
102
105
|
"raspberry-pi",
|
|
103
106
|
"self-hosted",
|
|
104
107
|
"local",
|
|
105
|
-
"catai"
|
|
108
|
+
"catai",
|
|
109
|
+
"mistral",
|
|
110
|
+
"typescript",
|
|
111
|
+
"lora",
|
|
112
|
+
"batching",
|
|
113
|
+
"gpu"
|
|
106
114
|
],
|
|
107
115
|
"author": "Gilad S.",
|
|
108
116
|
"license": "MIT",
|
|
@@ -114,46 +122,54 @@
|
|
|
114
122
|
"type": "github",
|
|
115
123
|
"url": "https://github.com/sponsors/giladgd"
|
|
116
124
|
},
|
|
117
|
-
"homepage": "https://
|
|
125
|
+
"homepage": "https://node-llama-cpp.withcat.ai",
|
|
118
126
|
"devDependencies": {
|
|
119
|
-
"@commitlint/cli": "^19.
|
|
120
|
-
"@commitlint/config-conventional": "^19.
|
|
127
|
+
"@commitlint/cli": "^19.5.0",
|
|
128
|
+
"@commitlint/config-conventional": "^19.5.0",
|
|
129
|
+
"@fontsource/inter": "^5.1.0",
|
|
130
|
+
"@nolebase/vitepress-plugin-git-changelog": "^2.5.0",
|
|
131
|
+
"@nolebase/vitepress-plugin-og-image": "^2.5.0",
|
|
132
|
+
"@resvg/resvg-js": "^2.6.2",
|
|
121
133
|
"@semantic-release/exec": "^6.0.3",
|
|
122
|
-
"@
|
|
134
|
+
"@semantic-release/npm": "12.0.1",
|
|
135
|
+
"@shikijs/vitepress-twoslash": "^1.17.7",
|
|
123
136
|
"@types/async-retry": "^1.4.8",
|
|
124
137
|
"@types/bytes": "^3.1.4",
|
|
125
138
|
"@types/cross-spawn": "^6.0.2",
|
|
126
139
|
"@types/fs-extra": "^11.0.4",
|
|
127
|
-
"@types/node": "^
|
|
140
|
+
"@types/node": "^22.5.5",
|
|
128
141
|
"@types/proper-lockfile": "^4.1.4",
|
|
129
142
|
"@types/semver": "^7.5.8",
|
|
130
143
|
"@types/validate-npm-package-name": "^4.0.2",
|
|
131
144
|
"@types/which": "^3.0.4",
|
|
132
|
-
"@types/yargs": "^17.0.
|
|
133
|
-
"@typescript-eslint/eslint-plugin": "^7.
|
|
134
|
-
"@typescript-eslint/parser": "^7.
|
|
135
|
-
"@vitest/coverage-v8": "^1.
|
|
136
|
-
"@vitest/ui": "^1.
|
|
145
|
+
"@types/yargs": "^17.0.33",
|
|
146
|
+
"@typescript-eslint/eslint-plugin": "^7.15.0",
|
|
147
|
+
"@typescript-eslint/parser": "^7.15.0",
|
|
148
|
+
"@vitest/coverage-v8": "^2.1.1",
|
|
149
|
+
"@vitest/ui": "^2.1.1",
|
|
137
150
|
"eslint": "^8.46.0",
|
|
138
|
-
"eslint-plugin-import": "^2.
|
|
139
|
-
"eslint-plugin-jsdoc": "^
|
|
140
|
-
"eslint-plugin-n": "^17.
|
|
141
|
-
"
|
|
142
|
-
"
|
|
143
|
-
"
|
|
144
|
-
"
|
|
145
|
-
"
|
|
146
|
-
"
|
|
147
|
-
"
|
|
148
|
-
"typedoc
|
|
149
|
-
"
|
|
150
|
-
"
|
|
151
|
-
"vitepress": "^1.
|
|
152
|
-
"
|
|
153
|
-
"
|
|
151
|
+
"eslint-plugin-import": "^2.30.0",
|
|
152
|
+
"eslint-plugin-jsdoc": "^50.2.3",
|
|
153
|
+
"eslint-plugin-n": "^17.10.2",
|
|
154
|
+
"feed": "^4.2.2",
|
|
155
|
+
"husky": "^9.1.6",
|
|
156
|
+
"rehype": "^13.0.1",
|
|
157
|
+
"rimraf": "^6.0.1",
|
|
158
|
+
"semantic-release": "24.1.1",
|
|
159
|
+
"sharp": "^0.33.5",
|
|
160
|
+
"tslib": "^2.7.0",
|
|
161
|
+
"typedoc": "^0.26.7",
|
|
162
|
+
"typedoc-plugin-markdown": "^4.2.7",
|
|
163
|
+
"typedoc-plugin-mdn-links": "^3.2.12",
|
|
164
|
+
"typedoc-vitepress-theme": "^1.0.1",
|
|
165
|
+
"typescript": "^5.6.2",
|
|
166
|
+
"vite-node": "^2.1.1",
|
|
167
|
+
"vitepress": "^1.3.4",
|
|
168
|
+
"vitest": "^2.1.1",
|
|
169
|
+
"zx": "^8.1.7"
|
|
154
170
|
},
|
|
155
171
|
"dependencies": {
|
|
156
|
-
"@huggingface/jinja": "^0.
|
|
172
|
+
"@huggingface/jinja": "^0.3.1",
|
|
157
173
|
"async-retry": "^1.3.3",
|
|
158
174
|
"bytes": "^3.1.2",
|
|
159
175
|
"chalk": "^5.3.0",
|
|
@@ -164,19 +180,19 @@
|
|
|
164
180
|
"env-var": "^7.5.0",
|
|
165
181
|
"filenamify": "^6.0.0",
|
|
166
182
|
"fs-extra": "^11.2.0",
|
|
167
|
-
"ignore": "^5.3.
|
|
168
|
-
"ipull": "^3.6.
|
|
169
|
-
"is-unicode-supported": "^2.
|
|
170
|
-
"lifecycle-utils": "^1.
|
|
171
|
-
"log-symbols": "^
|
|
183
|
+
"ignore": "^5.3.2",
|
|
184
|
+
"ipull": "^3.6.2",
|
|
185
|
+
"is-unicode-supported": "^2.1.0",
|
|
186
|
+
"lifecycle-utils": "^1.7.0",
|
|
187
|
+
"log-symbols": "^7.0.0",
|
|
172
188
|
"nanoid": "^5.0.7",
|
|
173
|
-
"node-addon-api": "^8.
|
|
189
|
+
"node-addon-api": "^8.1.0",
|
|
174
190
|
"octokit": "^4.0.2",
|
|
175
|
-
"ora": "^8.0
|
|
176
|
-
"pretty-ms": "^9.
|
|
191
|
+
"ora": "^8.1.0",
|
|
192
|
+
"pretty-ms": "^9.1.0",
|
|
177
193
|
"proper-lockfile": "^4.1.2",
|
|
178
|
-
"semver": "^7.6.
|
|
179
|
-
"simple-git": "^3.
|
|
194
|
+
"semver": "^7.6.3",
|
|
195
|
+
"simple-git": "^3.26.0",
|
|
180
196
|
"slice-ansi": "^7.1.0",
|
|
181
197
|
"stdout-update": "^4.0.1",
|
|
182
198
|
"strip-ansi": "^7.1.0",
|
|
@@ -193,7 +209,16 @@
|
|
|
193
209
|
}
|
|
194
210
|
},
|
|
195
211
|
"optionalDependencies": {
|
|
196
|
-
"@node-llama-cpp/linux-
|
|
197
|
-
"@node-llama-cpp/
|
|
212
|
+
"@node-llama-cpp/linux-arm64": "3.0.0-beta.45",
|
|
213
|
+
"@node-llama-cpp/linux-armv7l": "3.0.0-beta.45",
|
|
214
|
+
"@node-llama-cpp/linux-x64": "3.0.0-beta.45",
|
|
215
|
+
"@node-llama-cpp/linux-x64-cuda": "3.0.0-beta.45",
|
|
216
|
+
"@node-llama-cpp/linux-x64-vulkan": "3.0.0-beta.45",
|
|
217
|
+
"@node-llama-cpp/mac-arm64-metal": "3.0.0-beta.45",
|
|
218
|
+
"@node-llama-cpp/mac-x64": "3.0.0-beta.45",
|
|
219
|
+
"@node-llama-cpp/win-arm64": "3.0.0-beta.45",
|
|
220
|
+
"@node-llama-cpp/win-x64": "3.0.0-beta.45",
|
|
221
|
+
"@node-llama-cpp/win-x64-cuda": "3.0.0-beta.45",
|
|
222
|
+
"@node-llama-cpp/win-x64-vulkan": "3.0.0-beta.45"
|
|
198
223
|
}
|
|
199
224
|
}
|