node-llama-cpp 2.8.6 → 3.0.0-beta.10
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -2
- package/dist/ChatWrapper.d.ts +49 -0
- package/dist/ChatWrapper.js +120 -0
- package/dist/ChatWrapper.js.map +1 -0
- package/dist/bindings/AddonTypes.d.ts +92 -0
- package/dist/bindings/AddonTypes.js +2 -0
- package/dist/bindings/AddonTypes.js.map +1 -0
- package/dist/bindings/Llama.d.ts +23 -0
- package/dist/bindings/Llama.js +225 -0
- package/dist/bindings/Llama.js.map +1 -0
- package/dist/bindings/getLlama.d.ts +86 -0
- package/dist/bindings/getLlama.js +225 -0
- package/dist/bindings/getLlama.js.map +1 -0
- package/dist/bindings/types.d.ts +33 -0
- package/dist/bindings/types.js +30 -0
- package/dist/bindings/types.js.map +1 -0
- package/dist/bindings/utils/NoBinaryFoundError.d.ts +2 -0
- package/dist/bindings/utils/NoBinaryFoundError.js +7 -0
- package/dist/bindings/utils/NoBinaryFoundError.js.map +1 -0
- package/dist/{utils → bindings/utils}/binariesGithubRelease.js +1 -1
- package/dist/bindings/utils/binariesGithubRelease.js.map +1 -0
- package/dist/bindings/utils/clearAllLocalBuilds.d.ts +1 -0
- package/dist/bindings/utils/clearAllLocalBuilds.js +47 -0
- package/dist/bindings/utils/clearAllLocalBuilds.js.map +1 -0
- package/dist/bindings/utils/cloneLlamaCppRepo.d.ts +11 -0
- package/dist/bindings/utils/cloneLlamaCppRepo.js +155 -0
- package/dist/bindings/utils/cloneLlamaCppRepo.js.map +1 -0
- package/dist/bindings/utils/compileLLamaCpp.d.ts +12 -0
- package/dist/bindings/utils/compileLLamaCpp.js +157 -0
- package/dist/bindings/utils/compileLLamaCpp.js.map +1 -0
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.d.ts +5 -0
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js +85 -0
- package/dist/bindings/utils/getBuildFolderNameForBuildOptions.js.map +1 -0
- package/dist/bindings/utils/getCanUsePrebuiltBinaries.d.ts +1 -0
- package/dist/bindings/utils/getCanUsePrebuiltBinaries.js +8 -0
- package/dist/bindings/utils/getCanUsePrebuiltBinaries.js.map +1 -0
- package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.d.ts +2 -0
- package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js +21 -0
- package/dist/bindings/utils/getExampleUsageCodeOfGetLlama.js.map +1 -0
- package/dist/bindings/utils/getPlatform.d.ts +2 -0
- package/dist/bindings/utils/getPlatform.js +15 -0
- package/dist/bindings/utils/getPlatform.js.map +1 -0
- package/dist/bindings/utils/lastBuildInfo.d.ts +6 -0
- package/dist/bindings/utils/lastBuildInfo.js +17 -0
- package/dist/bindings/utils/lastBuildInfo.js.map +1 -0
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.d.ts +2 -0
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.js +28 -0
- package/dist/bindings/utils/logBinaryUsageExampleToConsole.js.map +1 -0
- package/dist/bindings/utils/resolveCustomCmakeOptions.d.ts +1 -0
- package/dist/bindings/utils/resolveCustomCmakeOptions.js +43 -0
- package/dist/bindings/utils/resolveCustomCmakeOptions.js.map +1 -0
- package/dist/chatWrappers/AlpacaChatWrapper.d.ts +12 -0
- package/dist/chatWrappers/AlpacaChatWrapper.js +21 -0
- package/dist/chatWrappers/AlpacaChatWrapper.js.map +1 -0
- package/dist/chatWrappers/ChatMLChatWrapper.d.ts +18 -0
- package/dist/chatWrappers/ChatMLChatWrapper.js +83 -0
- package/dist/chatWrappers/ChatMLChatWrapper.js.map +1 -0
- package/dist/chatWrappers/EmptyChatWrapper.d.ts +4 -0
- package/dist/chatWrappers/EmptyChatWrapper.js +5 -0
- package/dist/chatWrappers/EmptyChatWrapper.js.map +1 -0
- package/dist/chatWrappers/FalconChatWrapper.d.ts +21 -0
- package/dist/chatWrappers/FalconChatWrapper.js +104 -0
- package/dist/chatWrappers/FalconChatWrapper.js.map +1 -0
- package/dist/chatWrappers/FunctionaryChatWrapper.d.ts +41 -0
- package/dist/chatWrappers/FunctionaryChatWrapper.js +200 -0
- package/dist/chatWrappers/FunctionaryChatWrapper.js.map +1 -0
- package/dist/chatWrappers/GeneralChatWrapper.d.ts +21 -0
- package/dist/chatWrappers/GeneralChatWrapper.js +112 -0
- package/dist/chatWrappers/GeneralChatWrapper.js.map +1 -0
- package/dist/chatWrappers/LlamaChatWrapper.d.ts +13 -0
- package/dist/chatWrappers/LlamaChatWrapper.js +78 -0
- package/dist/chatWrappers/LlamaChatWrapper.js.map +1 -0
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.d.ts +13 -0
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js +60 -0
- package/dist/chatWrappers/resolveChatWrapperBasedOnModel.js.map +1 -0
- package/dist/cli/cli.js +5 -1
- package/dist/cli/cli.js.map +1 -1
- package/dist/cli/commands/BuildCommand.d.ts +2 -1
- package/dist/cli/commands/BuildCommand.js +50 -10
- package/dist/cli/commands/BuildCommand.js.map +1 -1
- package/dist/cli/commands/ChatCommand.d.ts +10 -4
- package/dist/cli/commands/ChatCommand.js +169 -57
- package/dist/cli/commands/ChatCommand.js.map +1 -1
- package/dist/cli/commands/ClearCommand.js +4 -6
- package/dist/cli/commands/ClearCommand.js.map +1 -1
- package/dist/cli/commands/DebugCommand.d.ts +7 -0
- package/dist/cli/commands/DebugCommand.js +59 -0
- package/dist/cli/commands/DebugCommand.js.map +1 -0
- package/dist/cli/commands/DownloadCommand.d.ts +2 -1
- package/dist/cli/commands/DownloadCommand.js +47 -40
- package/dist/cli/commands/DownloadCommand.js.map +1 -1
- package/dist/cli/commands/OnPostInstallCommand.js +7 -10
- package/dist/cli/commands/OnPostInstallCommand.js.map +1 -1
- package/dist/config.d.ts +10 -3
- package/dist/config.js +18 -7
- package/dist/config.js.map +1 -1
- package/dist/evaluator/LlamaChat/LlamaChat.d.ts +185 -0
- package/dist/evaluator/LlamaChat/LlamaChat.js +705 -0
- package/dist/evaluator/LlamaChat/LlamaChat.js.map +1 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.d.ts +22 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.js +121 -0
- package/dist/evaluator/LlamaChat/utils/FunctionCallGrammar.js.map +1 -0
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.d.ts +16 -0
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js +135 -0
- package/dist/evaluator/LlamaChat/utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js.map +1 -0
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.d.ts +157 -0
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js +219 -0
- package/dist/evaluator/LlamaChatSession/LlamaChatSession.js.map +1 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.d.ts +7 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js +8 -0
- package/dist/evaluator/LlamaChatSession/utils/defineChatSessionFunction.js.map +1 -0
- package/dist/evaluator/LlamaContext/LlamaContext.d.ts +109 -0
- package/dist/evaluator/LlamaContext/LlamaContext.js +606 -0
- package/dist/evaluator/LlamaContext/LlamaContext.js.map +1 -0
- package/dist/evaluator/LlamaContext/types.d.ts +82 -0
- package/dist/evaluator/LlamaContext/types.js +2 -0
- package/dist/evaluator/LlamaContext/types.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.d.ts +5 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js +16 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/firstInFirstOutStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.d.ts +5 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js +42 -0
- package/dist/evaluator/LlamaContext/utils/batchItemsPrioritizingStrategies/maximumParallelismStrategy.js.map +1 -0
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.d.ts +2 -0
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js +13 -0
- package/dist/evaluator/LlamaContext/utils/resolveBatchItemsPrioritizingStrategy.js.map +1 -0
- package/dist/evaluator/LlamaEmbeddingContext.d.ts +37 -0
- package/dist/evaluator/LlamaEmbeddingContext.js +78 -0
- package/dist/evaluator/LlamaEmbeddingContext.js.map +1 -0
- package/dist/evaluator/LlamaGrammar.d.ts +30 -0
- package/dist/{llamaEvaluator → evaluator}/LlamaGrammar.js +15 -19
- package/dist/evaluator/LlamaGrammar.js.map +1 -0
- package/dist/evaluator/LlamaGrammarEvaluationState.d.ts +15 -0
- package/dist/evaluator/LlamaGrammarEvaluationState.js +17 -0
- package/dist/evaluator/LlamaGrammarEvaluationState.js.map +1 -0
- package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.d.ts +2 -1
- package/dist/{llamaEvaluator → evaluator}/LlamaJsonSchemaGrammar.js +4 -2
- package/dist/evaluator/LlamaJsonSchemaGrammar.js.map +1 -0
- package/dist/evaluator/LlamaModel.d.ts +120 -0
- package/dist/evaluator/LlamaModel.js +320 -0
- package/dist/evaluator/LlamaModel.js.map +1 -0
- package/dist/index.d.ts +29 -16
- package/dist/index.js +28 -15
- package/dist/index.js.map +1 -1
- package/dist/state.d.ts +2 -0
- package/dist/state.js +7 -0
- package/dist/state.js.map +1 -1
- package/dist/types.d.ts +44 -4
- package/dist/types.js +5 -1
- package/dist/types.js.map +1 -1
- package/dist/utils/LlamaText.d.ts +42 -0
- package/dist/utils/LlamaText.js +207 -0
- package/dist/utils/LlamaText.js.map +1 -0
- package/dist/utils/ReplHistory.js +1 -1
- package/dist/utils/ReplHistory.js.map +1 -1
- package/dist/utils/StopGenerationDetector.d.ts +28 -0
- package/dist/utils/StopGenerationDetector.js +205 -0
- package/dist/utils/StopGenerationDetector.js.map +1 -0
- package/dist/utils/TokenStreamRegulator.d.ts +30 -0
- package/dist/utils/TokenStreamRegulator.js +96 -0
- package/dist/utils/TokenStreamRegulator.js.map +1 -0
- package/dist/utils/appendUserMessageToChatHistory.d.ts +2 -0
- package/dist/utils/appendUserMessageToChatHistory.js +18 -0
- package/dist/utils/appendUserMessageToChatHistory.js.map +1 -0
- package/dist/utils/cmake.js +16 -11
- package/dist/utils/cmake.js.map +1 -1
- package/dist/utils/compareTokens.d.ts +2 -0
- package/dist/utils/compareTokens.js +4 -0
- package/dist/utils/compareTokens.js.map +1 -0
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.d.ts +18 -0
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js +61 -0
- package/dist/utils/findCharacterRemovalCountToFitChatHistoryInContext.js.map +1 -0
- package/dist/utils/gbnfJson/GbnfGrammarGenerator.d.ts +1 -0
- package/dist/utils/gbnfJson/GbnfGrammarGenerator.js +17 -0
- package/dist/utils/gbnfJson/GbnfGrammarGenerator.js.map +1 -1
- package/dist/utils/gbnfJson/GbnfTerminal.d.ts +1 -1
- package/dist/utils/gbnfJson/GbnfTerminal.js.map +1 -1
- package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.d.ts +6 -0
- package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.js +21 -0
- package/dist/utils/gbnfJson/terminals/GbnfVerbatimText.js.map +1 -0
- package/dist/utils/gbnfJson/types.d.ts +1 -1
- package/dist/utils/gbnfJson/types.js.map +1 -1
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.d.ts +1 -0
- package/dist/utils/gbnfJson/utils/validateObjectAgainstGbnfSchema.js.map +1 -1
- package/dist/utils/getConsoleLogPrefix.d.ts +1 -0
- package/dist/utils/getConsoleLogPrefix.js +9 -0
- package/dist/utils/getConsoleLogPrefix.js.map +1 -0
- package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js +1 -15
- package/dist/utils/getGbnfGrammarForGbnfJsonSchema.js.map +1 -1
- package/dist/utils/getGrammarsFolder.d.ts +2 -1
- package/dist/utils/getGrammarsFolder.js +8 -7
- package/dist/utils/getGrammarsFolder.js.map +1 -1
- package/dist/utils/getModuleVersion.d.ts +1 -0
- package/dist/utils/getModuleVersion.js +13 -0
- package/dist/utils/getModuleVersion.js.map +1 -0
- package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.d.ts +2 -0
- package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js +49 -0
- package/dist/utils/getTypeScriptTypeStringForGbnfJsonSchema.js.map +1 -0
- package/dist/utils/gitReleaseBundles.js +6 -5
- package/dist/utils/gitReleaseBundles.js.map +1 -1
- package/dist/utils/hashString.d.ts +1 -0
- package/dist/utils/hashString.js +8 -0
- package/dist/utils/hashString.js.map +1 -0
- package/dist/utils/isLockfileActive.d.ts +4 -0
- package/dist/utils/isLockfileActive.js +12 -0
- package/dist/utils/isLockfileActive.js.map +1 -0
- package/dist/utils/parseModelFileName.d.ts +9 -0
- package/dist/utils/parseModelFileName.js +68 -0
- package/dist/utils/parseModelFileName.js.map +1 -0
- package/dist/utils/parseModelTypeDescription.d.ts +6 -0
- package/dist/utils/parseModelTypeDescription.js +9 -0
- package/dist/utils/parseModelTypeDescription.js.map +1 -0
- package/dist/utils/prettyPrintObject.d.ts +1 -0
- package/dist/utils/prettyPrintObject.js +40 -0
- package/dist/utils/prettyPrintObject.js.map +1 -0
- package/dist/utils/removeNullFields.d.ts +1 -0
- package/dist/utils/removeNullFields.js +8 -0
- package/dist/utils/removeNullFields.js.map +1 -1
- package/dist/utils/resolveChatWrapper.d.ts +4 -0
- package/dist/utils/resolveChatWrapper.js +16 -0
- package/dist/utils/resolveChatWrapper.js.map +1 -0
- package/dist/utils/resolveGithubRelease.d.ts +2 -0
- package/dist/utils/resolveGithubRelease.js +36 -0
- package/dist/utils/resolveGithubRelease.js.map +1 -0
- package/dist/utils/spawnCommand.d.ts +1 -1
- package/dist/utils/spawnCommand.js +4 -2
- package/dist/utils/spawnCommand.js.map +1 -1
- package/dist/utils/tokenizeInput.d.ts +3 -0
- package/dist/utils/tokenizeInput.js +9 -0
- package/dist/utils/tokenizeInput.js.map +1 -0
- package/dist/utils/truncateTextAndRoundToWords.d.ts +8 -0
- package/dist/utils/truncateTextAndRoundToWords.js +27 -0
- package/dist/utils/truncateTextAndRoundToWords.js.map +1 -0
- package/dist/utils/waitForLockfileRelease.d.ts +5 -0
- package/dist/utils/waitForLockfileRelease.js +20 -0
- package/dist/utils/waitForLockfileRelease.js.map +1 -0
- package/dist/utils/withLockfile.d.ts +7 -0
- package/dist/utils/withLockfile.js +44 -0
- package/dist/utils/withLockfile.js.map +1 -0
- package/dist/utils/withOra.js +11 -1
- package/dist/utils/withOra.js.map +1 -1
- package/dist/utils/withStatusLogs.d.ts +2 -1
- package/dist/utils/withStatusLogs.js +11 -8
- package/dist/utils/withStatusLogs.js.map +1 -1
- package/llama/.clang-format +11 -11
- package/llama/CMakeLists.txt +87 -2
- package/llama/addon.cpp +915 -352
- package/llama/binariesGithubRelease.json +1 -1
- package/llama/gitRelease.bundle +0 -0
- package/llama/gpuInfo/cuda-gpu-info.cu +99 -0
- package/llama/gpuInfo/cuda-gpu-info.h +7 -0
- package/llama/gpuInfo/metal-gpu-info.h +5 -0
- package/llama/gpuInfo/metal-gpu-info.mm +17 -0
- package/llama/llama.cpp.info.json +4 -0
- package/llamaBins/linux-arm64/.buildMetadata.json +1 -0
- package/llamaBins/linux-arm64/llama-addon.node +0 -0
- package/llamaBins/linux-armv7l/.buildMetadata.json +1 -0
- package/llamaBins/linux-armv7l/llama-addon.node +0 -0
- package/llamaBins/linux-x64/.buildMetadata.json +1 -0
- package/llamaBins/linux-x64/llama-addon.node +0 -0
- package/llamaBins/linux-x64-cuda/.buildMetadata.json +1 -0
- package/llamaBins/linux-x64-cuda/llama-addon.node +0 -0
- package/llamaBins/mac-arm64-metal/.buildMetadata.json +1 -0
- package/llamaBins/mac-arm64-metal/llama-addon.node +0 -0
- package/llamaBins/mac-x64/.buildMetadata.json +1 -0
- package/llamaBins/mac-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64/.buildMetadata.json +1 -0
- package/llamaBins/win-x64/llama-addon.exp +0 -0
- package/llamaBins/win-x64/llama-addon.node +0 -0
- package/llamaBins/win-x64-cuda/.buildMetadata.json +1 -0
- package/llamaBins/win-x64-cuda/llama-addon.exp +0 -0
- package/llamaBins/win-x64-cuda/llama-addon.lib +0 -0
- package/llamaBins/win-x64-cuda/llama-addon.node +0 -0
- package/package.json +39 -19
- package/dist/ChatPromptWrapper.d.ts +0 -11
- package/dist/ChatPromptWrapper.js +0 -20
- package/dist/ChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/ChatMLChatPromptWrapper.d.ts +0 -12
- package/dist/chatWrappers/ChatMLChatPromptWrapper.js +0 -22
- package/dist/chatWrappers/ChatMLChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/EmptyChatPromptWrapper.d.ts +0 -4
- package/dist/chatWrappers/EmptyChatPromptWrapper.js +0 -5
- package/dist/chatWrappers/EmptyChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/FalconChatPromptWrapper.d.ts +0 -19
- package/dist/chatWrappers/FalconChatPromptWrapper.js +0 -33
- package/dist/chatWrappers/FalconChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/GeneralChatPromptWrapper.d.ts +0 -19
- package/dist/chatWrappers/GeneralChatPromptWrapper.js +0 -38
- package/dist/chatWrappers/GeneralChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/LlamaChatPromptWrapper.d.ts +0 -12
- package/dist/chatWrappers/LlamaChatPromptWrapper.js +0 -23
- package/dist/chatWrappers/LlamaChatPromptWrapper.js.map +0 -1
- package/dist/chatWrappers/createChatWrapperByBos.d.ts +0 -2
- package/dist/chatWrappers/createChatWrapperByBos.js +0 -14
- package/dist/chatWrappers/createChatWrapperByBos.js.map +0 -1
- package/dist/chatWrappers/generateContextTextFromConversationHistory.d.ts +0 -23
- package/dist/chatWrappers/generateContextTextFromConversationHistory.js +0 -47
- package/dist/chatWrappers/generateContextTextFromConversationHistory.js.map +0 -1
- package/dist/llamaEvaluator/LlamaBins.d.ts +0 -4
- package/dist/llamaEvaluator/LlamaBins.js +0 -5
- package/dist/llamaEvaluator/LlamaBins.js.map +0 -1
- package/dist/llamaEvaluator/LlamaChatSession.d.ts +0 -122
- package/dist/llamaEvaluator/LlamaChatSession.js +0 -236
- package/dist/llamaEvaluator/LlamaChatSession.js.map +0 -1
- package/dist/llamaEvaluator/LlamaContext.d.ts +0 -99
- package/dist/llamaEvaluator/LlamaContext.js +0 -143
- package/dist/llamaEvaluator/LlamaContext.js.map +0 -1
- package/dist/llamaEvaluator/LlamaGrammar.d.ts +0 -32
- package/dist/llamaEvaluator/LlamaGrammar.js.map +0 -1
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.d.ts +0 -14
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js +0 -16
- package/dist/llamaEvaluator/LlamaGrammarEvaluationState.js.map +0 -1
- package/dist/llamaEvaluator/LlamaJsonSchemaGrammar.js.map +0 -1
- package/dist/llamaEvaluator/LlamaModel.d.ts +0 -123
- package/dist/llamaEvaluator/LlamaModel.js +0 -74
- package/dist/llamaEvaluator/LlamaModel.js.map +0 -1
- package/dist/utils/binariesGithubRelease.js.map +0 -1
- package/dist/utils/clearLlamaBuild.d.ts +0 -1
- package/dist/utils/clearLlamaBuild.js +0 -12
- package/dist/utils/clearLlamaBuild.js.map +0 -1
- package/dist/utils/cloneLlamaCppRepo.d.ts +0 -2
- package/dist/utils/cloneLlamaCppRepo.js +0 -102
- package/dist/utils/cloneLlamaCppRepo.js.map +0 -1
- package/dist/utils/compileLLamaCpp.d.ts +0 -8
- package/dist/utils/compileLLamaCpp.js +0 -132
- package/dist/utils/compileLLamaCpp.js.map +0 -1
- package/dist/utils/getBin.d.ts +0 -53
- package/dist/utils/getBin.js +0 -78
- package/dist/utils/getBin.js.map +0 -1
- package/dist/utils/getReleaseInfo.d.ts +0 -7
- package/dist/utils/getReleaseInfo.js +0 -30
- package/dist/utils/getReleaseInfo.js.map +0 -1
- package/dist/utils/getTextCompletion.d.ts +0 -3
- package/dist/utils/getTextCompletion.js +0 -12
- package/dist/utils/getTextCompletion.js.map +0 -1
- package/dist/utils/usedBinFlag.d.ts +0 -6
- package/dist/utils/usedBinFlag.js +0 -15
- package/dist/utils/usedBinFlag.js.map +0 -1
- package/dist/utils/withLock.d.ts +0 -1
- package/dist/utils/withLock.js +0 -19
- package/dist/utils/withLock.js.map +0 -1
- package/llama/usedBin.json +0 -3
- package/llamaBins/mac-arm64/llama-addon.node +0 -0
- package/llamaBins/mac-x64/ggml-metal.metal +0 -6119
- /package/dist/{utils → bindings/utils}/binariesGithubRelease.d.ts +0 -0
- /package/llamaBins/{mac-arm64 → mac-arm64-metal}/ggml-metal.metal +0 -0
|
@@ -0,0 +1,705 @@
|
|
|
1
|
+
import { DisposeAggregator, DisposedError, EventRelay } from "lifecycle-utils";
|
|
2
|
+
import { resolveChatWrapper } from "../../utils/resolveChatWrapper.js";
|
|
3
|
+
import { removeNullFields } from "../../utils/removeNullFields.js";
|
|
4
|
+
import { LlamaGrammarEvaluationState } from "../LlamaGrammarEvaluationState.js";
|
|
5
|
+
import { AbortError } from "../../AbortError.js";
|
|
6
|
+
import { StopGenerationDetector } from "../../utils/StopGenerationDetector.js";
|
|
7
|
+
import { TokenStreamRegulator } from "../../utils/TokenStreamRegulator.js";
|
|
8
|
+
import { eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy } from "./utils/contextShiftStrategies/eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy.js";
|
|
9
|
+
import { FunctionCallGrammar, LlamaFunctionCallValidationError } from "./utils/FunctionCallGrammar.js";
|
|
10
|
+
const defaultContextShiftOptions = {
|
|
11
|
+
size: (sequence) => Math.max(1, Math.floor(sequence.context.contextSize / 10)),
|
|
12
|
+
strategy: "eraseFirstResponseAndKeepFirstSystem",
|
|
13
|
+
lastEvaluationMetadata: null
|
|
14
|
+
};
|
|
15
|
+
const UNKNOWN_UNICODE_CHAR = "\ufffd";
|
|
16
|
+
export class LlamaChat {
|
|
17
|
+
/** @internal */ _chatWrapper;
|
|
18
|
+
/** @internal */ _disposeAggregator = new DisposeAggregator();
|
|
19
|
+
/** @internal */ _autoDisposeSequence;
|
|
20
|
+
/** @internal */ _sequence;
|
|
21
|
+
onDispose = new EventRelay();
|
|
22
|
+
constructor({ contextSequence, chatWrapper = "auto", autoDisposeSequence = true }) {
|
|
23
|
+
if (contextSequence == null)
|
|
24
|
+
throw new Error("contextSequence cannot be null");
|
|
25
|
+
if (contextSequence.disposed)
|
|
26
|
+
throw new DisposedError();
|
|
27
|
+
this._sequence = contextSequence;
|
|
28
|
+
this._autoDisposeSequence = autoDisposeSequence;
|
|
29
|
+
this._disposeAggregator.add(this._sequence.onDispose.createListener(() => {
|
|
30
|
+
this.dispose();
|
|
31
|
+
}));
|
|
32
|
+
this._disposeAggregator.add(this.onDispose.dispatchEvent);
|
|
33
|
+
this._chatWrapper = resolveChatWrapper(chatWrapper, contextSequence.model);
|
|
34
|
+
}
|
|
35
|
+
dispose({ disposeSequence = this._autoDisposeSequence } = {}) {
|
|
36
|
+
if (this._sequence == null)
|
|
37
|
+
return;
|
|
38
|
+
if (disposeSequence)
|
|
39
|
+
this._sequence.dispose();
|
|
40
|
+
this._sequence = null;
|
|
41
|
+
this._disposeAggregator.dispose();
|
|
42
|
+
}
|
|
43
|
+
/** @hidden */
|
|
44
|
+
[Symbol.dispose]() {
|
|
45
|
+
return this.dispose();
|
|
46
|
+
}
|
|
47
|
+
get disposed() {
|
|
48
|
+
return this._sequence == null;
|
|
49
|
+
}
|
|
50
|
+
get chatWrapper() {
|
|
51
|
+
if (this._sequence == null)
|
|
52
|
+
throw new DisposedError();
|
|
53
|
+
return this._chatWrapper;
|
|
54
|
+
}
|
|
55
|
+
get sequence() {
|
|
56
|
+
if (this._sequence == null)
|
|
57
|
+
throw new DisposedError();
|
|
58
|
+
return this._sequence;
|
|
59
|
+
}
|
|
60
|
+
get context() {
|
|
61
|
+
return this.sequence.context;
|
|
62
|
+
}
|
|
63
|
+
get model() {
|
|
64
|
+
return this.sequence.model;
|
|
65
|
+
}
|
|
66
|
+
async generateResponse(history, { onToken, signal, maxTokens, temperature, minP, topK, topP, grammar, trimWhitespaceSuffix = false, repeatPenalty = {}, evaluationPriority = 5, functions, documentFunctionParams, contextShift = defaultContextShiftOptions, lastEvaluationContextWindow: { history: lastEvaluationContextWindowHistory, minimumOverlapPercentageToPreventContextShift = 0.5 } = {} } = {}) {
|
|
67
|
+
const functionsEnabled = (functions != null && Object.keys(functions).length > 0);
|
|
68
|
+
if (grammar != null && functionsEnabled)
|
|
69
|
+
throw new Error("Using both grammar and functions is not supported yet");
|
|
70
|
+
if (signal?.aborted)
|
|
71
|
+
throw new AbortError();
|
|
72
|
+
if (this._sequence == null)
|
|
73
|
+
throw new DisposedError();
|
|
74
|
+
let resolvedHistory = this._sequence.isLoadedToMemory
|
|
75
|
+
? history.slice()
|
|
76
|
+
: history.map(removeRawFromHistoryItem);
|
|
77
|
+
if (resolvedHistory.length === 0 || resolvedHistory[resolvedHistory.length - 1].type !== "model")
|
|
78
|
+
resolvedHistory.push({
|
|
79
|
+
type: "model",
|
|
80
|
+
response: []
|
|
81
|
+
});
|
|
82
|
+
const model = this._sequence.model;
|
|
83
|
+
const context = this._sequence.context;
|
|
84
|
+
const eosToken = model.tokens.eos;
|
|
85
|
+
const resolvedContextShift = {
|
|
86
|
+
...defaultContextShiftOptions,
|
|
87
|
+
...removeNullFields(contextShift)
|
|
88
|
+
};
|
|
89
|
+
const { lastTokens: repeatPenaltyLastTokens = 64, punishTokensFilter, penalizeNewLine, penalty, frequencyPenalty, presencePenalty } = repeatPenalty === false
|
|
90
|
+
? { lastTokens: 0 }
|
|
91
|
+
: repeatPenalty;
|
|
92
|
+
const lastModelResponse = getLastTextModelResponseFromChatHistory(resolvedHistory);
|
|
93
|
+
const res = [];
|
|
94
|
+
const pendingTokens = [];
|
|
95
|
+
let ignoredStartTextTokens = [];
|
|
96
|
+
const functionCallTokens = [];
|
|
97
|
+
const repeatPenaltyEnabled = repeatPenaltyLastTokens > 0;
|
|
98
|
+
const grammarEvaluationState = grammar != null
|
|
99
|
+
? new LlamaGrammarEvaluationState({ grammar })
|
|
100
|
+
: undefined;
|
|
101
|
+
let functionsGrammar = functionsEnabled
|
|
102
|
+
? new FunctionCallGrammar(model._llama, functions, this._chatWrapper, false)
|
|
103
|
+
: undefined;
|
|
104
|
+
let functionsEvaluationState = (functionsEnabled && functionsGrammar != null)
|
|
105
|
+
? new LlamaGrammarEvaluationState({
|
|
106
|
+
grammar: functionsGrammar
|
|
107
|
+
})
|
|
108
|
+
: undefined;
|
|
109
|
+
const streamRegulator = new TokenStreamRegulator();
|
|
110
|
+
const stopGenerationDetector = new StopGenerationDetector();
|
|
111
|
+
const functionSyntaxStartDetector = new StopGenerationDetector();
|
|
112
|
+
const functionSyntaxEndDetector = new StopGenerationDetector();
|
|
113
|
+
const disengageInitiallyEngagedFunctionMode = new StopGenerationDetector();
|
|
114
|
+
const ignoreStartTextDetector = new StopGenerationDetector();
|
|
115
|
+
const locksToReleaseOnValidGeneration = [];
|
|
116
|
+
const functionCallTokenSyntaxLocks = [];
|
|
117
|
+
let generatedTokens = 0;
|
|
118
|
+
let isFirstEvaluation = true;
|
|
119
|
+
let inFunctionEvaluationMode = false;
|
|
120
|
+
let initiallyEngagedFunctionMode = false;
|
|
121
|
+
let lastContextWindowHistory = resolvedHistory;
|
|
122
|
+
let lastHistoryCompressionMetadata = resolvedContextShift.lastEvaluationMetadata;
|
|
123
|
+
const ensureNotAborted = () => {
|
|
124
|
+
if (signal?.aborted)
|
|
125
|
+
throw new AbortError();
|
|
126
|
+
if (this._sequence == null)
|
|
127
|
+
throw new DisposedError();
|
|
128
|
+
};
|
|
129
|
+
const getPenaltyTokens = () => {
|
|
130
|
+
if (this._sequence == null)
|
|
131
|
+
throw new DisposedError();
|
|
132
|
+
let punishTokens = res.slice(-repeatPenaltyLastTokens);
|
|
133
|
+
if (punishTokensFilter != null)
|
|
134
|
+
punishTokens = punishTokensFilter(punishTokens);
|
|
135
|
+
if (!penalizeNewLine) {
|
|
136
|
+
const nlToken = model.tokens.nl;
|
|
137
|
+
if (nlToken != null)
|
|
138
|
+
punishTokens = punishTokens.filter(token => token !== nlToken);
|
|
139
|
+
}
|
|
140
|
+
return punishTokens;
|
|
141
|
+
};
|
|
142
|
+
const getResolvedHistoryWithCurrentModelResponse = () => {
|
|
143
|
+
if (res.length === 0)
|
|
144
|
+
return resolvedHistory;
|
|
145
|
+
let modelResponse = model.detokenize(res);
|
|
146
|
+
if (grammar?.trimWhitespaceSuffix || trimWhitespaceSuffix)
|
|
147
|
+
modelResponse = modelResponse.trimEnd();
|
|
148
|
+
if (modelResponse === "")
|
|
149
|
+
return resolvedHistory;
|
|
150
|
+
return setLastModelTextResponseInChatHistory(resolvedHistory, lastModelResponse + modelResponse);
|
|
151
|
+
};
|
|
152
|
+
const removeFoundStartIgnoreTextsFromPendingTokens = () => {
|
|
153
|
+
if (res.length === 0 && pendingTokens.length > 0) {
|
|
154
|
+
ignoreStartTextDetector.clearInProgressStops();
|
|
155
|
+
ignoreStartTextDetector.clearTriggeredStops();
|
|
156
|
+
let mostExhaustiveTriggeredStops = null;
|
|
157
|
+
for (let i = 0; i < pendingTokens.length; i++) {
|
|
158
|
+
ignoreStartTextDetector.recordGeneration({
|
|
159
|
+
text: model.detokenize([pendingTokens[i]]),
|
|
160
|
+
tokens: [pendingTokens[i]],
|
|
161
|
+
startNewChecks: i === 0
|
|
162
|
+
});
|
|
163
|
+
if (ignoreStartTextDetector.hasTriggeredStops) {
|
|
164
|
+
mostExhaustiveTriggeredStops = ignoreStartTextDetector.getTriggeredStops();
|
|
165
|
+
ignoreStartTextDetector.clearTriggeredStops();
|
|
166
|
+
}
|
|
167
|
+
else if (!ignoreStartTextDetector.hasInProgressStops)
|
|
168
|
+
break;
|
|
169
|
+
}
|
|
170
|
+
if (mostExhaustiveTriggeredStops != null) {
|
|
171
|
+
const [mostExhaustiveTriggeredStop] = mostExhaustiveTriggeredStops;
|
|
172
|
+
if (mostExhaustiveTriggeredStop != null) {
|
|
173
|
+
ignoredStartTextTokens = mostExhaustiveTriggeredStop.stopTrigger
|
|
174
|
+
.map((stopTrigger) => {
|
|
175
|
+
if (typeof stopTrigger === "string")
|
|
176
|
+
return model.tokenize(stopTrigger);
|
|
177
|
+
else
|
|
178
|
+
return [stopTrigger];
|
|
179
|
+
})
|
|
180
|
+
.flat(1);
|
|
181
|
+
const newPendingTokens = mostExhaustiveTriggeredStop.remainingGenerations
|
|
182
|
+
.map((generation) => {
|
|
183
|
+
if (typeof generation === "string")
|
|
184
|
+
return model.tokenize(generation);
|
|
185
|
+
else
|
|
186
|
+
return generation;
|
|
187
|
+
})
|
|
188
|
+
.flat(1);
|
|
189
|
+
pendingTokens.length = 0;
|
|
190
|
+
pendingTokens.push(...newPendingTokens);
|
|
191
|
+
}
|
|
192
|
+
}
|
|
193
|
+
}
|
|
194
|
+
};
|
|
195
|
+
if (grammar != null)
|
|
196
|
+
StopGenerationDetector.resolveStopTriggers(grammar.stopGenerationTriggers, model.tokenize)
|
|
197
|
+
.map((stopTrigger) => stopGenerationDetector.addStopTrigger(stopTrigger));
|
|
198
|
+
if (functions != null && Object.keys(functions).length > 0)
|
|
199
|
+
functionSyntaxStartDetector.addStopTrigger([this._chatWrapper.settings.functions.call.prefix]);
|
|
200
|
+
// eslint-disable-next-line no-constant-condition
|
|
201
|
+
while (true) {
|
|
202
|
+
ensureNotAborted();
|
|
203
|
+
let shouldContextShift = false;
|
|
204
|
+
const queuedChunkTokens = streamRegulator.getAllQueuedChunkTokens();
|
|
205
|
+
const { history: contextWindowHistory, stopGenerationTriggers, tokens: contextWindowTokens, newResolvedHistory, newHistoryCompressionMetadata, ignoreStartText, functionCallInitiallyEngaged, disengageInitiallyEngagedFunctionCall } = await getContextWindow({
|
|
206
|
+
resolvedHistory: getResolvedHistoryWithCurrentModelResponse(),
|
|
207
|
+
resolvedContextShift,
|
|
208
|
+
lastHistoryCompressionMetadata,
|
|
209
|
+
pendingTokensCount: pendingTokens.length + queuedChunkTokens.length,
|
|
210
|
+
isFirstEvaluation,
|
|
211
|
+
chatWrapper: this._chatWrapper,
|
|
212
|
+
lastEvaluationContextWindowHistory,
|
|
213
|
+
minimumOverlapPercentageToPreventContextShift,
|
|
214
|
+
sequence: this._sequence,
|
|
215
|
+
minFreeContextTokens: 1,
|
|
216
|
+
functions: functionsEnabled ? functions : undefined,
|
|
217
|
+
documentFunctionParams
|
|
218
|
+
});
|
|
219
|
+
ensureNotAborted();
|
|
220
|
+
if (generatedTokens === 0) {
|
|
221
|
+
StopGenerationDetector.resolveStopTriggers(ignoreStartText, model.tokenize)
|
|
222
|
+
.map((stopTrigger) => ignoreStartTextDetector.addStopTrigger(stopTrigger));
|
|
223
|
+
if (functionsEnabled) {
|
|
224
|
+
initiallyEngagedFunctionMode = functionCallInitiallyEngaged;
|
|
225
|
+
StopGenerationDetector.resolveStopTriggers(disengageInitiallyEngagedFunctionCall, model.tokenize)
|
|
226
|
+
.map((stopTrigger) => disengageInitiallyEngagedFunctionMode.addStopTrigger(stopTrigger));
|
|
227
|
+
if (initiallyEngagedFunctionMode) {
|
|
228
|
+
inFunctionEvaluationMode = true;
|
|
229
|
+
functionsGrammar = new FunctionCallGrammar(model._llama, functions, this._chatWrapper, true);
|
|
230
|
+
functionsEvaluationState = new LlamaGrammarEvaluationState({
|
|
231
|
+
grammar: functionsGrammar
|
|
232
|
+
});
|
|
233
|
+
}
|
|
234
|
+
}
|
|
235
|
+
}
|
|
236
|
+
const tokens = [...contextWindowTokens, ...ignoredStartTextTokens, ...pendingTokens, ...queuedChunkTokens];
|
|
237
|
+
resolvedHistory = newResolvedHistory;
|
|
238
|
+
lastHistoryCompressionMetadata = newHistoryCompressionMetadata;
|
|
239
|
+
lastContextWindowHistory = contextWindowHistory;
|
|
240
|
+
const contextWindowLastModelResponse = getLastTextModelResponseFromChatHistory(contextWindowHistory);
|
|
241
|
+
const contextWindowsRes = [];
|
|
242
|
+
StopGenerationDetector.resolveStopTriggers(stopGenerationTriggers, model.tokenize)
|
|
243
|
+
.map((stopTrigger) => stopGenerationDetector.addStopTrigger(stopTrigger));
|
|
244
|
+
if (functionsGrammar != null)
|
|
245
|
+
StopGenerationDetector.resolveStopTriggers(functionsGrammar.stopGenerationTriggers, model.tokenize)
|
|
246
|
+
.map((stopTrigger) => functionSyntaxEndDetector.addStopTrigger(stopTrigger));
|
|
247
|
+
let { firstDifferentIndex } = this._sequence.compareContextTokens(tokens);
|
|
248
|
+
// we need to decode at least one token to generate a response
|
|
249
|
+
if (firstDifferentIndex === tokens.length && firstDifferentIndex > 0)
|
|
250
|
+
firstDifferentIndex -= 1;
|
|
251
|
+
tokens.splice(0, firstDifferentIndex);
|
|
252
|
+
if (firstDifferentIndex < this._sequence.nextTokenIndex) {
|
|
253
|
+
await this._sequence.eraseContextTokenRanges([{
|
|
254
|
+
start: firstDifferentIndex,
|
|
255
|
+
end: this._sequence.nextTokenIndex
|
|
256
|
+
}]);
|
|
257
|
+
ensureNotAborted();
|
|
258
|
+
}
|
|
259
|
+
const evaluationIterator = this._sequence.evaluate(tokens, removeNullFields({
|
|
260
|
+
temperature, minP, topK, topP,
|
|
261
|
+
grammarEvaluationState: () => {
|
|
262
|
+
if (inFunctionEvaluationMode)
|
|
263
|
+
return functionsEvaluationState;
|
|
264
|
+
return grammarEvaluationState;
|
|
265
|
+
},
|
|
266
|
+
repeatPenalty: !repeatPenaltyEnabled ? undefined : {
|
|
267
|
+
punishTokens: getPenaltyTokens,
|
|
268
|
+
penalty,
|
|
269
|
+
frequencyPenalty,
|
|
270
|
+
presencePenalty
|
|
271
|
+
},
|
|
272
|
+
evaluationPriority,
|
|
273
|
+
yieldEosToken: true
|
|
274
|
+
}));
|
|
275
|
+
for await (const token of evaluationIterator) {
|
|
276
|
+
ensureNotAborted();
|
|
277
|
+
generatedTokens++;
|
|
278
|
+
const tokens = [token];
|
|
279
|
+
const text = model.detokenize([token]);
|
|
280
|
+
const queuedTokenRelease = streamRegulator.addChunk({ tokens, text });
|
|
281
|
+
if (initiallyEngagedFunctionMode)
|
|
282
|
+
disengageInitiallyEngagedFunctionMode.recordGeneration({ text, tokens, startNewChecks: generatedTokens === 1 });
|
|
283
|
+
if (text === UNKNOWN_UNICODE_CHAR || ((grammar?.trimWhitespaceSuffix || trimWhitespaceSuffix) && text.trim() === "")) {
|
|
284
|
+
locksToReleaseOnValidGeneration.push(queuedTokenRelease.createTextIndexLock(0));
|
|
285
|
+
}
|
|
286
|
+
else {
|
|
287
|
+
while (locksToReleaseOnValidGeneration.length > 0)
|
|
288
|
+
locksToReleaseOnValidGeneration.shift().dispose();
|
|
289
|
+
}
|
|
290
|
+
functionSyntaxStartDetector.recordGeneration({ text, tokens, queuedTokenRelease });
|
|
291
|
+
if (initiallyEngagedFunctionMode && disengageInitiallyEngagedFunctionMode.hasTriggeredStops) {
|
|
292
|
+
initiallyEngagedFunctionMode = false;
|
|
293
|
+
let shouldStopFunctionEvaluationMode = !functionSyntaxStartDetector.hasTriggeredStops;
|
|
294
|
+
if (!shouldStopFunctionEvaluationMode && functionsEnabled && functionsGrammar != null) {
|
|
295
|
+
const functionCallText = model.detokenize([...functionCallTokens, ...tokens]);
|
|
296
|
+
try {
|
|
297
|
+
const functionName = functionsGrammar.parseFunctionNameFromPartialCall(functionCallText, {
|
|
298
|
+
enableInternalBuiltinFunctions: true,
|
|
299
|
+
initialFunctionCallEngaged: true
|
|
300
|
+
});
|
|
301
|
+
const internalBuiltinFunctions = this._chatWrapper.getInternalBuiltinFunctions({ initialFunctionCallEngaged: true });
|
|
302
|
+
if (internalBuiltinFunctions[functionName] != null) {
|
|
303
|
+
shouldStopFunctionEvaluationMode = true;
|
|
304
|
+
}
|
|
305
|
+
}
|
|
306
|
+
catch (err) {
|
|
307
|
+
if (!(err instanceof LlamaFunctionCallValidationError))
|
|
308
|
+
throw err;
|
|
309
|
+
}
|
|
310
|
+
}
|
|
311
|
+
if (shouldStopFunctionEvaluationMode) {
|
|
312
|
+
inFunctionEvaluationMode = false;
|
|
313
|
+
functionsGrammar = new FunctionCallGrammar(model._llama, functions, this._chatWrapper, false);
|
|
314
|
+
functionsEvaluationState = new LlamaGrammarEvaluationState({
|
|
315
|
+
grammar: functionsGrammar
|
|
316
|
+
});
|
|
317
|
+
functionCallTokens.length = 0;
|
|
318
|
+
while (functionCallTokenSyntaxLocks.length > 0)
|
|
319
|
+
functionCallTokenSyntaxLocks.shift().dispose();
|
|
320
|
+
functionSyntaxStartDetector.clearInProgressStops();
|
|
321
|
+
functionSyntaxStartDetector.clearTriggeredStops();
|
|
322
|
+
functionSyntaxEndDetector.clearInProgressStops();
|
|
323
|
+
functionSyntaxEndDetector.clearTriggeredStops();
|
|
324
|
+
}
|
|
325
|
+
}
|
|
326
|
+
if (!inFunctionEvaluationMode && functionsEnabled && functionsGrammar != null &&
|
|
327
|
+
functionSyntaxStartDetector.hasTriggeredStops && functionsEvaluationState != null) {
|
|
328
|
+
inFunctionEvaluationMode = true;
|
|
329
|
+
functionCallTokenSyntaxLocks.push(queuedTokenRelease.createTextIndexLock(0));
|
|
330
|
+
stopGenerationDetector.clearTriggeredStops();
|
|
331
|
+
stopGenerationDetector.clearInProgressStops();
|
|
332
|
+
pendingTokens.push(...streamRegulator.popFreeChunkTokens());
|
|
333
|
+
const triggeredStops = functionSyntaxStartDetector.getTriggeredStops();
|
|
334
|
+
const partiallyFreeTokens = streamRegulator.getPartiallyFreeChunk();
|
|
335
|
+
const queuedTokensBeforeStopTrigger = getQueuedTokensBeforeStopTrigger(triggeredStops, partiallyFreeTokens, model.tokenize);
|
|
336
|
+
pendingTokens.push(...queuedTokensBeforeStopTrigger);
|
|
337
|
+
const [firstRemainingGenerationAfterStop] = triggeredStops
|
|
338
|
+
.map((stopTrigger) => stopTrigger.remainingGenerations)
|
|
339
|
+
.filter((remainingGenerations) => remainingGenerations.length > 0)
|
|
340
|
+
.flat(1);
|
|
341
|
+
const remainingTextAfterStop = (firstRemainingGenerationAfterStop == null || firstRemainingGenerationAfterStop.length === 0)
|
|
342
|
+
? ""
|
|
343
|
+
: typeof firstRemainingGenerationAfterStop === "string"
|
|
344
|
+
? firstRemainingGenerationAfterStop
|
|
345
|
+
: model.detokenize(firstRemainingGenerationAfterStop);
|
|
346
|
+
functionCallTokens.push(...model.tokenize(this._chatWrapper.settings.functions.call.prefix + remainingTextAfterStop));
|
|
347
|
+
for (const functionCallToken of functionCallTokens)
|
|
348
|
+
context._acceptTokenOnGrammarEvaluationState(functionsEvaluationState, functionCallToken);
|
|
349
|
+
}
|
|
350
|
+
else if (inFunctionEvaluationMode) {
|
|
351
|
+
functionCallTokens.push(...tokens);
|
|
352
|
+
functionCallTokenSyntaxLocks.push(queuedTokenRelease.createTextIndexLock(0));
|
|
353
|
+
functionSyntaxEndDetector.recordGeneration({ text, tokens, queuedTokenRelease });
|
|
354
|
+
}
|
|
355
|
+
if (inFunctionEvaluationMode && functionSyntaxEndDetector.hasTriggeredStops && functionsGrammar != null) {
|
|
356
|
+
const functionCallText = model.detokenize(functionCallTokens);
|
|
357
|
+
const functionCall = functionsGrammar.parseFunctionCall(functionCallText);
|
|
358
|
+
let modelResponse = model.detokenize(res);
|
|
359
|
+
let contextWindowModelResponse = model.detokenize(contextWindowsRes);
|
|
360
|
+
if (grammar?.trimWhitespaceSuffix || trimWhitespaceSuffix) {
|
|
361
|
+
modelResponse = modelResponse.trimEnd();
|
|
362
|
+
contextWindowModelResponse = contextWindowModelResponse.trimEnd();
|
|
363
|
+
}
|
|
364
|
+
return {
|
|
365
|
+
response: modelResponse,
|
|
366
|
+
lastEvaluation: {
|
|
367
|
+
contextWindow: setLastModelTextResponseInChatHistory(lastContextWindowHistory, contextWindowLastModelResponse + contextWindowModelResponse),
|
|
368
|
+
cleanHistory: setLastModelTextResponseInChatHistory(resolvedHistory, lastModelResponse + modelResponse),
|
|
369
|
+
contextShiftMetadata: lastHistoryCompressionMetadata
|
|
370
|
+
},
|
|
371
|
+
// prevent infinite TS type instantiation
|
|
372
|
+
functionCall: functionCall,
|
|
373
|
+
metadata: {
|
|
374
|
+
stopReason: "functionCall"
|
|
375
|
+
}
|
|
376
|
+
};
|
|
377
|
+
}
|
|
378
|
+
if (!inFunctionEvaluationMode)
|
|
379
|
+
stopGenerationDetector.recordGeneration({ text, tokens, queuedTokenRelease });
|
|
380
|
+
pendingTokens.push(...streamRegulator.popFreeChunkTokens());
|
|
381
|
+
removeFoundStartIgnoreTextsFromPendingTokens();
|
|
382
|
+
if (stopGenerationDetector.hasTriggeredStops || token === eosToken) {
|
|
383
|
+
const triggeredStops = stopGenerationDetector.getTriggeredStops();
|
|
384
|
+
const partiallyFreeTokens = streamRegulator.getPartiallyFreeChunk();
|
|
385
|
+
const queuedTokensBeforeStopTrigger = getQueuedTokensBeforeStopTrigger(triggeredStops, partiallyFreeTokens, model.tokenize);
|
|
386
|
+
pendingTokens.push(...queuedTokensBeforeStopTrigger);
|
|
387
|
+
const [firstRemainingGenerationAfterStop] = triggeredStops
|
|
388
|
+
.map((stopTrigger) => stopTrigger.remainingGenerations)
|
|
389
|
+
.filter((remainingGenerations) => remainingGenerations.length > 0)
|
|
390
|
+
.flat(1);
|
|
391
|
+
removeFoundStartIgnoreTextsFromPendingTokens();
|
|
392
|
+
if (pendingTokens.length > 0)
|
|
393
|
+
onToken?.(pendingTokens.slice());
|
|
394
|
+
res.push(...pendingTokens);
|
|
395
|
+
contextWindowsRes.push(...pendingTokens);
|
|
396
|
+
pendingTokens.length = 0;
|
|
397
|
+
let modelResponse = model.detokenize(res);
|
|
398
|
+
let contextWindowModelResponse = model.detokenize(contextWindowsRes);
|
|
399
|
+
if (grammar?.trimWhitespaceSuffix || trimWhitespaceSuffix) {
|
|
400
|
+
modelResponse = modelResponse.trimEnd();
|
|
401
|
+
contextWindowModelResponse = contextWindowModelResponse.trimEnd();
|
|
402
|
+
}
|
|
403
|
+
return {
|
|
404
|
+
response: modelResponse,
|
|
405
|
+
lastEvaluation: {
|
|
406
|
+
contextWindow: setLastModelTextResponseInChatHistory(lastContextWindowHistory, contextWindowLastModelResponse + contextWindowModelResponse),
|
|
407
|
+
cleanHistory: setLastModelTextResponseInChatHistory(resolvedHistory, lastModelResponse + modelResponse),
|
|
408
|
+
contextShiftMetadata: lastHistoryCompressionMetadata
|
|
409
|
+
},
|
|
410
|
+
metadata: {
|
|
411
|
+
remainingGenerationAfterStop: firstRemainingGenerationAfterStop,
|
|
412
|
+
stopReason: token === eosToken
|
|
413
|
+
? "eosToken"
|
|
414
|
+
: "stopGenerationTrigger"
|
|
415
|
+
}
|
|
416
|
+
};
|
|
417
|
+
}
|
|
418
|
+
const maxTokensTriggered = maxTokens != null && maxTokens > 0 && generatedTokens >= maxTokens;
|
|
419
|
+
if (res.length === 0) {
|
|
420
|
+
ignoreStartTextDetector.clearInProgressStops();
|
|
421
|
+
ignoreStartTextDetector.clearTriggeredStops();
|
|
422
|
+
ignoreStartTextDetector.recordGeneration({
|
|
423
|
+
text: model.detokenize(pendingTokens),
|
|
424
|
+
tokens: pendingTokens
|
|
425
|
+
});
|
|
426
|
+
}
|
|
427
|
+
if (pendingTokens.length > 0 && (maxTokensTriggered || !ignoreStartTextDetector.hasInProgressStops)) {
|
|
428
|
+
removeFoundStartIgnoreTextsFromPendingTokens();
|
|
429
|
+
if (pendingTokens.length > 0) {
|
|
430
|
+
onToken?.(pendingTokens.slice());
|
|
431
|
+
res.push(...pendingTokens);
|
|
432
|
+
contextWindowsRes.push(...pendingTokens);
|
|
433
|
+
pendingTokens.length = 0;
|
|
434
|
+
}
|
|
435
|
+
}
|
|
436
|
+
if (maxTokensTriggered) {
|
|
437
|
+
let modelResponse = model.detokenize(res);
|
|
438
|
+
let contextWindowModelResponse = model.detokenize(contextWindowsRes);
|
|
439
|
+
if (grammar?.trimWhitespaceSuffix || trimWhitespaceSuffix) {
|
|
440
|
+
modelResponse = modelResponse.trimEnd();
|
|
441
|
+
contextWindowModelResponse = contextWindowModelResponse.trimEnd();
|
|
442
|
+
}
|
|
443
|
+
return {
|
|
444
|
+
response: modelResponse,
|
|
445
|
+
lastEvaluation: {
|
|
446
|
+
contextWindow: setLastModelTextResponseInChatHistory(lastContextWindowHistory, contextWindowLastModelResponse + contextWindowModelResponse),
|
|
447
|
+
cleanHistory: setLastModelTextResponseInChatHistory(resolvedHistory, lastModelResponse + modelResponse),
|
|
448
|
+
contextShiftMetadata: lastHistoryCompressionMetadata
|
|
449
|
+
},
|
|
450
|
+
metadata: {
|
|
451
|
+
stopReason: "maxTokens"
|
|
452
|
+
}
|
|
453
|
+
};
|
|
454
|
+
}
|
|
455
|
+
if (this._sequence.nextTokenIndex >= context.contextSize) {
|
|
456
|
+
shouldContextShift = true;
|
|
457
|
+
break;
|
|
458
|
+
}
|
|
459
|
+
}
|
|
460
|
+
isFirstEvaluation = false;
|
|
461
|
+
if (shouldContextShift)
|
|
462
|
+
continue;
|
|
463
|
+
break;
|
|
464
|
+
}
|
|
465
|
+
throw new Error("The context size is too small to generate a response");
|
|
466
|
+
}
|
|
467
|
+
}
|
|
468
|
+
/**
 * Returns a copy of a chat history item with the `raw` field stripped from
 * every non-string entry of a model response (string segments pass through
 * untouched). Items that are not of type "model" are returned unchanged.
 * The input item is never mutated.
 */
function removeRawFromHistoryItem(historyItem) {
    if (historyItem.type !== "model")
        return historyItem;

    const strippedResponse = historyItem.response.map((entry) => (
        typeof entry === "string"
            ? entry
            : { ...entry, raw: undefined }
    ));
    return { ...historyItem, response: strippedResponse };
}
|
|
484
|
+
/**
 * Compresses a chat history until its rendered context text fits within
 * `contextSize - contextShiftSize` tokens.
 *
 * Order of attempts:
 *   1. If the history already fits, return it unchanged with `metadata: null`.
 *   2. If `contextShiftStrategy` is a function, run it; use its result only if
 *      it actually fits. A non-fitting result or a thrown error falls back to
 *      the default strategy (with a console warning/error — deliberately
 *      best-effort, not fatal).
 *   3. Run the default "eraseFirstResponseAndKeepFirstSystem" strategy; if even
 *      that does not fit, throw.
 *
 * @param {object} options
 * @param {Array} options.history - resolved chat history to compress
 * @param {number} options.contextShiftSize - tokens to keep free for generation
 * @param {Function|string} options.contextShiftStrategy - custom strategy function,
 *     or the name of a built-in strategy (only "eraseFirstResponseAndKeepFirstSystem"
 *     is recognized; any other string warns and uses the default)
 * @param {*} options.contextShiftLastEvaluationMetadata - opaque metadata returned
 *     by the previous shift, passed back to the strategy as `lastShiftMetadata`
 * @param {number} options.contextSize - total context size in tokens
 * @param {Function} options.tokenizer
 * @param {object} options.chatWrapper
 * @param {object} [options.functions]
 * @param {*} [options.documentFunctionParams]
 * @returns {Promise<{compressedHistory: Array, metadata: *}>}
 * @throws {Error} when `contextShiftSize >= contextSize`, or when the default
 *     strategy cannot produce a fitting history (e.g. an overlong system prompt)
 */
async function compressHistoryToFitContextSize({ history, contextShiftSize, contextShiftStrategy, contextShiftLastEvaluationMetadata, contextSize, tokenizer, chatWrapper, functions, documentFunctionParams }) {
    // Renders the candidate history through the chat wrapper and checks whether
    // its token count leaves at least `contextShiftSize` tokens free.
    function checkIfHistoryFitsContext(history) {
        const { contextText } = chatWrapper.generateContextText(history, {
            availableFunctions: functions,
            documentFunctionParams
        });
        const tokens = contextText.tokenize(tokenizer);
        return tokens.length <= contextSize - contextShiftSize;
    }
    if (contextSize - contextShiftSize <= 0)
        throw new Error(`The context size (${contextSize}) is too small to fit the context shift size (${contextShiftSize})`);
    // Fast path: nothing to compress.
    if (checkIfHistoryFitsContext(history))
        return {
            compressedHistory: history,
            metadata: null
        };
    if (contextShiftStrategy instanceof Function) {
        try {
            const { chatHistory, metadata } = await contextShiftStrategy({
                chatHistory: history,
                maxTokensCount: contextSize - contextShiftSize,
                tokenizer,
                chatWrapper,
                lastShiftMetadata: contextShiftLastEvaluationMetadata
            });
            // Trust the custom strategy only if its output actually fits.
            if (checkIfHistoryFitsContext(chatHistory))
                return {
                    compressedHistory: chatHistory,
                    metadata
                };
            console.warn("The provided context shift strategy did not return a history that fits the context size. " +
                "Using the default strategy instead.");
        }
        catch (err) {
            // Intentional best-effort: a failing custom strategy degrades to the
            // default strategy instead of aborting the evaluation.
            console.error("The provided context shift strategy threw an error. " +
                "Using the default strategy instead.", err);
        }
    }
    else if (contextShiftStrategy !== "eraseFirstResponseAndKeepFirstSystem")
        console.warn(`Unknown context shift strategy "${contextShiftStrategy}". ` +
            "Using the default strategy instead.");
    // Default strategy (defined elsewhere in this file).
    const { chatHistory, metadata } = await eraseFirstResponseAndKeepFirstSystemChatContextShiftStrategy({
        chatHistory: history,
        maxTokensCount: contextSize - contextShiftSize,
        tokenizer,
        chatWrapper,
        lastShiftMetadata: contextShiftLastEvaluationMetadata
    });
    if (!checkIfHistoryFitsContext(chatHistory))
        throw new Error("The default context shift strategy did not return a history that fits the context size. " +
            "This may happen due to the system prompt being too long");
    return {
        compressedHistory: chatHistory,
        metadata
    };
}
|
|
540
|
+
/**
 * Decides which representation of a partially-free chunk (raw tokens vs.
 * re-tokenized text) should be flushed to the pending-token queue when a stop
 * trigger fired in the middle of it.
 *
 * Preference rules:
 *   - If only one representation is non-empty, use it.
 *   - If all triggered stops start with a token (no string-started trigger),
 *     prefer the token representation, and vice versa.
 *   - If both kinds of trigger exist, prefer the text representation when it
 *     round-trips to the exact same tokens, or when a string-started trigger
 *     appears before any token-started one; otherwise fall back to the tokens.
 *
 * Fix: `Array.prototype.findIndex` returns -1 when no element matches, so
 * "trigger found" must be tested with `>= 0`. The previous `> 0` checks missed
 * a matching trigger at index 0 and could return the wrong representation.
 *
 * @param {Array<{stopTrigger: Array}>} triggeredStops - stops that fired; each
 *     trigger is a sequence of strings and/or token values
 * @param {{tokens: Array, text: string}} partiallyFreeTokens - the chunk split
 *     at the trigger position, in both representations
 * @param {Function} tokenizer - converts text to tokens
 * @returns {Array} the tokens to enqueue before the stop trigger
 */
function getQueuedTokensBeforeStopTrigger(triggeredStops, partiallyFreeTokens, tokenizer) {
    if (partiallyFreeTokens.tokens.length === 0 && partiallyFreeTokens.text.length === 0)
        return [];
    else if (partiallyFreeTokens.tokens.length !== 0 && partiallyFreeTokens.text.length === 0)
        return partiallyFreeTokens.tokens;
    else if (partiallyFreeTokens.tokens.length === 0 && partiallyFreeTokens.text.length !== 0)
        return tokenizer(partiallyFreeTokens.text);
    const triggerThatStartsWithStringIndex = triggeredStops.findIndex((trigger) => trigger.stopTrigger.length > 0 && typeof trigger.stopTrigger[0] === "string");
    const triggerThatStartsWithTokenIndex = triggeredStops.findIndex((trigger) => trigger.stopTrigger.length > 0 && typeof trigger.stopTrigger[0] !== "string");
    // findIndex yields -1 for "not found", so a found trigger is index >= 0
    // (a trigger at index 0 is valid and must count as found).
    if (triggerThatStartsWithTokenIndex >= 0 && triggerThatStartsWithStringIndex < 0)
        return partiallyFreeTokens.tokens;
    else if (triggerThatStartsWithStringIndex >= 0 && triggerThatStartsWithTokenIndex < 0)
        return tokenizer(partiallyFreeTokens.text);
    const stringTokens = tokenizer(partiallyFreeTokens.text);
    // When both representations agree token-for-token, either is safe to use.
    if (stringTokens.length === partiallyFreeTokens.tokens.length &&
        stringTokens.every((value, index) => value === partiallyFreeTokens.tokens[index]))
        return stringTokens;
    else if (triggerThatStartsWithStringIndex < triggerThatStartsWithTokenIndex)
        return stringTokens;
    return partiallyFreeTokens.tokens;
}
|
|
561
|
+
/**
 * Extracts the trailing text segment of the last model response in a chat
 * history. Returns an empty string when the history is empty, does not end
 * with a model item, or the model response does not end with a plain string.
 */
function getLastTextModelResponseFromChatHistory(chatHistory) {
    const lastItem = chatHistory[chatHistory.length - 1];
    if (lastItem == null || lastItem.type !== "model")
        return "";

    const response = lastItem.response;
    const lastSegment = response[response.length - 1];
    return typeof lastSegment === "string"
        ? lastSegment
        : "";
}
|
|
570
|
+
/**
 * Returns a copy of a chat history in which the trailing text segment of the
 * last model response is replaced with `textResponse`.
 * When the history does not end with a model item, a fresh one is appended.
 * An empty `textResponse` removes the trailing text segment rather than
 * storing an empty string. Neither the input array nor its last item is
 * mutated (copy-on-write on the touched item and its response array).
 */
function setLastModelTextResponseInChatHistory(chatHistory, textResponse) {
    const updatedHistory = [...chatHistory];
    const lastItem = updatedHistory[updatedHistory.length - 1];

    if (lastItem == null || lastItem.type !== "model")
        updatedHistory.push({
            type: "model",
            response: []
        });

    // Copy the item and its response array so callers' objects stay untouched.
    const modelItem = { ...updatedHistory[updatedHistory.length - 1] };
    const response = [...modelItem.response];
    modelItem.response = response;
    updatedHistory[updatedHistory.length - 1] = modelItem;

    const endsWithText = response.length > 0 && typeof response[response.length - 1] === "string";
    if (endsWithText && textResponse === "")
        response.pop();
    else if (endsWithText)
        response[response.length - 1] = textResponse;
    else if (textResponse !== "")
        response.push(textResponse);

    return updatedHistory;
}
|
|
592
|
+
/**
 * Builds the token window for the next evaluation step.
 *
 * Resolution order:
 *   1. On the first evaluation with a previous context window whose state is
 *      still loaded in the sequence, reuse that window if it fits and enough
 *      of it overlaps the sequence's existing tokens
 *      (`minimumOverlapPercentageToPreventContextShift`).
 *   2. If a previous context shift happened (`lastEvaluationMetadata` set),
 *      compress the history again, continuing from that shift's metadata.
 *   3. Otherwise, use the full history as-is if it fits.
 *   4. As a last resort, compress the history from scratch.
 *
 * All four paths return the same shape: the window history, its tokens, stop
 * triggers, the (possibly compressed) resolved history, the new compression
 * metadata, and the chat wrapper's initial-function-call settings.
 *
 * @throws {DisposedError} when `sequence` is null (its context was disposed)
 */
async function getContextWindow({ resolvedHistory, resolvedContextShift, lastHistoryCompressionMetadata, pendingTokensCount = 0, isFirstEvaluation, chatWrapper, lastEvaluationContextWindowHistory, minimumOverlapPercentageToPreventContextShift, sequence, minFreeContextTokens = 1, functions, documentFunctionParams }) {
    if (sequence == null)
        throw new DisposedError();
    const model = sequence.model;
    const context = sequence.context;
    if (isFirstEvaluation && lastEvaluationContextWindowHistory != null && sequence.isLoadedToMemory) {
        const newContextWindow = lastEvaluationContextWindowHistory.slice();
        // Ensure the window ends with a model item so generation has a target.
        if (newContextWindow.length === 0 || newContextWindow[newContextWindow.length - 1].type !== "model")
            newContextWindow.push({
                type: "model",
                response: []
            });
        const { contextText, stopGenerationTriggers, ignoreStartText, functionCall } = chatWrapper.generateContextText(newContextWindow, {
            availableFunctions: functions,
            documentFunctionParams
        });
        const tokens = contextText.tokenize(model.tokenize);
        // Reuse the previous window only if it leaves room for the pending
        // tokens plus the minimum free headroom.
        if (tokens.length + pendingTokensCount + minFreeContextTokens < context.contextSize) {
            const { firstDifferentIndex } = sequence.compareContextTokens(tokens);
            // Fraction of the window already evaluated in the sequence state;
            // a high overlap makes reuse cheaper than a context shift.
            const existingEvaluationPercentage = firstDifferentIndex / tokens.length;
            if (existingEvaluationPercentage >= minimumOverlapPercentageToPreventContextShift)
                return {
                    history: newContextWindow,
                    stopGenerationTriggers,
                    tokens,
                    newResolvedHistory: resolvedHistory,
                    newHistoryCompressionMetadata: lastHistoryCompressionMetadata,
                    ignoreStartText: ignoreStartText ?? [],
                    functionCallInitiallyEngaged: functionCall?.initiallyEngaged ?? false,
                    disengageInitiallyEngagedFunctionCall: functionCall?.disengageInitiallyEngaged ?? []
                };
        }
    }
    // When the sequence state was unloaded, drop `raw` data from the history
    // (it described tokens that no longer exist in memory); otherwise just
    // take a shallow copy. Rebinds the local parameter only — the caller's
    // array is not mutated.
    resolvedHistory = sequence.isLoadedToMemory
        ? resolvedHistory.slice()
        : resolvedHistory.map(removeRawFromHistoryItem);
    if (resolvedContextShift.lastEvaluationMetadata != null) {
        // A previous context shift already happened — continue compressing
        // from its metadata.
        const contextShiftSize = resolvedContextShift.size instanceof Function
            ? await resolvedContextShift.size(sequence)
            : resolvedContextShift.size;
        const { compressedHistory, metadata } = await compressHistoryToFitContextSize({
            history: resolvedHistory,
            contextShiftSize: Math.max(contextShiftSize, minFreeContextTokens) + pendingTokensCount,
            contextShiftStrategy: resolvedContextShift.strategy,
            contextShiftLastEvaluationMetadata: resolvedContextShift.lastEvaluationMetadata,
            contextSize: context.contextSize,
            tokenizer: model.tokenize,
            chatWrapper: chatWrapper,
            functions,
            documentFunctionParams
        });
        const { contextText, stopGenerationTriggers, ignoreStartText, functionCall } = chatWrapper.generateContextText(compressedHistory, {
            availableFunctions: functions,
            documentFunctionParams
        });
        return {
            history: compressedHistory,
            stopGenerationTriggers,
            tokens: contextText.tokenize(model.tokenize),
            newResolvedHistory: resolvedHistory,
            newHistoryCompressionMetadata: metadata,
            ignoreStartText: ignoreStartText ?? [],
            functionCallInitiallyEngaged: functionCall?.initiallyEngaged ?? false,
            disengageInitiallyEngagedFunctionCall: functionCall?.disengageInitiallyEngaged ?? []
        };
    }
    // No prior shift: try the full history unchanged before compressing.
    {
        const { contextText, stopGenerationTriggers, ignoreStartText, functionCall } = chatWrapper.generateContextText(resolvedHistory, {
            availableFunctions: functions,
            documentFunctionParams
        });
        const tokens = contextText.tokenize(model.tokenize);
        if (tokens.length + pendingTokensCount + minFreeContextTokens < context.contextSize)
            return {
                history: resolvedHistory,
                stopGenerationTriggers,
                tokens,
                newResolvedHistory: resolvedHistory,
                newHistoryCompressionMetadata: lastHistoryCompressionMetadata,
                ignoreStartText: ignoreStartText ?? [],
                functionCallInitiallyEngaged: functionCall?.initiallyEngaged ?? false,
                disengageInitiallyEngagedFunctionCall: functionCall?.disengageInitiallyEngaged ?? []
            };
    }
    // Full history does not fit — compress it from scratch (no prior metadata).
    const contextShiftSize = resolvedContextShift.size instanceof Function
        ? await resolvedContextShift.size(sequence)
        : resolvedContextShift.size;
    const { compressedHistory, metadata } = await compressHistoryToFitContextSize({
        history: resolvedHistory,
        contextShiftSize: Math.max(contextShiftSize, minFreeContextTokens) + pendingTokensCount,
        contextShiftStrategy: resolvedContextShift.strategy,
        contextShiftLastEvaluationMetadata: resolvedContextShift.lastEvaluationMetadata,
        contextSize: context.contextSize,
        tokenizer: model.tokenize,
        chatWrapper: chatWrapper,
        functions,
        documentFunctionParams
    });
    const { contextText, stopGenerationTriggers, ignoreStartText, functionCall } = chatWrapper.generateContextText(compressedHistory, {
        availableFunctions: functions,
        documentFunctionParams
    });
    return {
        history: compressedHistory,
        stopGenerationTriggers,
        tokens: contextText.tokenize(model.tokenize),
        newResolvedHistory: resolvedHistory,
        newHistoryCompressionMetadata: metadata,
        ignoreStartText: ignoreStartText ?? [],
        functionCallInitiallyEngaged: functionCall?.initiallyEngaged ?? false,
        disengageInitiallyEngagedFunctionCall: functionCall?.disengageInitiallyEngaged ?? []
    };
}
|
|
705
|
+
//# sourceMappingURL=LlamaChat.js.map
|