modelfusion 0.0.44
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.md +429 -0
- package/composed-function/index.cjs +22 -0
- package/composed-function/index.d.ts +6 -0
- package/composed-function/index.js +6 -0
- package/composed-function/summarize/SummarizationFunction.cjs +2 -0
- package/composed-function/summarize/SummarizationFunction.d.ts +4 -0
- package/composed-function/summarize/SummarizationFunction.js +1 -0
- package/composed-function/summarize/summarizeRecursively.cjs +19 -0
- package/composed-function/summarize/summarizeRecursively.d.ts +11 -0
- package/composed-function/summarize/summarizeRecursively.js +15 -0
- package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.cjs +29 -0
- package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.d.ts +24 -0
- package/composed-function/summarize/summarizeRecursivelyWithTextGenerationAndTokenSplitting.js +25 -0
- package/composed-function/use-tool/NoSuchToolError.cjs +17 -0
- package/composed-function/use-tool/NoSuchToolError.d.ts +4 -0
- package/composed-function/use-tool/NoSuchToolError.js +13 -0
- package/composed-function/use-tool/Tool.cjs +43 -0
- package/composed-function/use-tool/Tool.d.ts +15 -0
- package/composed-function/use-tool/Tool.js +39 -0
- package/composed-function/use-tool/useTool.cjs +59 -0
- package/composed-function/use-tool/useTool.d.ts +36 -0
- package/composed-function/use-tool/useTool.js +54 -0
- package/cost/Cost.cjs +38 -0
- package/cost/Cost.d.ts +16 -0
- package/cost/Cost.js +34 -0
- package/cost/CostCalculator.cjs +2 -0
- package/cost/CostCalculator.d.ts +8 -0
- package/cost/CostCalculator.js +1 -0
- package/cost/calculateCost.cjs +28 -0
- package/cost/calculateCost.d.ts +7 -0
- package/cost/calculateCost.js +24 -0
- package/cost/index.cjs +19 -0
- package/cost/index.d.ts +3 -0
- package/cost/index.js +3 -0
- package/index.cjs +25 -0
- package/index.d.ts +9 -0
- package/index.js +9 -0
- package/model-function/AbstractModel.cjs +22 -0
- package/model-function/AbstractModel.d.ts +12 -0
- package/model-function/AbstractModel.js +18 -0
- package/model-function/FunctionOptions.cjs +2 -0
- package/model-function/FunctionOptions.d.ts +6 -0
- package/model-function/FunctionOptions.js +1 -0
- package/model-function/Model.cjs +2 -0
- package/model-function/Model.d.ts +23 -0
- package/model-function/Model.js +1 -0
- package/model-function/ModelCallEvent.cjs +2 -0
- package/model-function/ModelCallEvent.d.ts +18 -0
- package/model-function/ModelCallEvent.js +1 -0
- package/model-function/ModelCallEventSource.cjs +42 -0
- package/model-function/ModelCallEventSource.d.ts +13 -0
- package/model-function/ModelCallEventSource.js +38 -0
- package/model-function/ModelCallObserver.cjs +2 -0
- package/model-function/ModelCallObserver.d.ts +5 -0
- package/model-function/ModelCallObserver.js +1 -0
- package/model-function/ModelInformation.cjs +2 -0
- package/model-function/ModelInformation.d.ts +4 -0
- package/model-function/ModelInformation.js +1 -0
- package/model-function/SuccessfulModelCall.cjs +22 -0
- package/model-function/SuccessfulModelCall.d.ts +9 -0
- package/model-function/SuccessfulModelCall.js +18 -0
- package/model-function/embed-text/TextEmbeddingEvent.cjs +2 -0
- package/model-function/embed-text/TextEmbeddingEvent.d.ts +23 -0
- package/model-function/embed-text/TextEmbeddingEvent.js +1 -0
- package/model-function/embed-text/TextEmbeddingModel.cjs +2 -0
- package/model-function/embed-text/TextEmbeddingModel.d.ts +18 -0
- package/model-function/embed-text/TextEmbeddingModel.js +1 -0
- package/model-function/embed-text/embedText.cjs +90 -0
- package/model-function/embed-text/embedText.d.ts +33 -0
- package/model-function/embed-text/embedText.js +85 -0
- package/model-function/executeCall.cjs +60 -0
- package/model-function/executeCall.d.ts +27 -0
- package/model-function/executeCall.js +56 -0
- package/model-function/generate-image/ImageGenerationEvent.cjs +2 -0
- package/model-function/generate-image/ImageGenerationEvent.d.ts +22 -0
- package/model-function/generate-image/ImageGenerationEvent.js +1 -0
- package/model-function/generate-image/ImageGenerationModel.cjs +2 -0
- package/model-function/generate-image/ImageGenerationModel.d.ts +8 -0
- package/model-function/generate-image/ImageGenerationModel.js +1 -0
- package/model-function/generate-image/generateImage.cjs +63 -0
- package/model-function/generate-image/generateImage.d.ts +23 -0
- package/model-function/generate-image/generateImage.js +59 -0
- package/model-function/generate-json/GenerateJsonModel.cjs +2 -0
- package/model-function/generate-json/GenerateJsonModel.d.ts +10 -0
- package/model-function/generate-json/GenerateJsonModel.js +1 -0
- package/model-function/generate-json/GenerateJsonOrTextModel.cjs +2 -0
- package/model-function/generate-json/GenerateJsonOrTextModel.d.ts +18 -0
- package/model-function/generate-json/GenerateJsonOrTextModel.js +1 -0
- package/model-function/generate-json/JsonGenerationEvent.cjs +2 -0
- package/model-function/generate-json/JsonGenerationEvent.d.ts +22 -0
- package/model-function/generate-json/JsonGenerationEvent.js +1 -0
- package/model-function/generate-json/NoSuchSchemaError.cjs +17 -0
- package/model-function/generate-json/NoSuchSchemaError.d.ts +4 -0
- package/model-function/generate-json/NoSuchSchemaError.js +13 -0
- package/model-function/generate-json/SchemaDefinition.cjs +2 -0
- package/model-function/generate-json/SchemaDefinition.d.ts +6 -0
- package/model-function/generate-json/SchemaDefinition.js +1 -0
- package/model-function/generate-json/SchemaValidationError.cjs +36 -0
- package/model-function/generate-json/SchemaValidationError.d.ts +11 -0
- package/model-function/generate-json/SchemaValidationError.js +32 -0
- package/model-function/generate-json/generateJson.cjs +61 -0
- package/model-function/generate-json/generateJson.d.ts +9 -0
- package/model-function/generate-json/generateJson.js +57 -0
- package/model-function/generate-json/generateJsonOrText.cjs +74 -0
- package/model-function/generate-json/generateJsonOrText.d.ts +25 -0
- package/model-function/generate-json/generateJsonOrText.js +70 -0
- package/model-function/generate-text/AsyncQueue.cjs +66 -0
- package/model-function/generate-text/AsyncQueue.d.ts +17 -0
- package/model-function/generate-text/AsyncQueue.js +62 -0
- package/model-function/generate-text/DeltaEvent.cjs +2 -0
- package/model-function/generate-text/DeltaEvent.d.ts +7 -0
- package/model-function/generate-text/DeltaEvent.js +1 -0
- package/model-function/generate-text/TextDeltaEventSource.cjs +54 -0
- package/model-function/generate-text/TextDeltaEventSource.d.ts +5 -0
- package/model-function/generate-text/TextDeltaEventSource.js +46 -0
- package/model-function/generate-text/TextGenerationEvent.cjs +2 -0
- package/model-function/generate-text/TextGenerationEvent.d.ts +22 -0
- package/model-function/generate-text/TextGenerationEvent.js +1 -0
- package/model-function/generate-text/TextGenerationModel.cjs +2 -0
- package/model-function/generate-text/TextGenerationModel.d.ts +42 -0
- package/model-function/generate-text/TextGenerationModel.js +1 -0
- package/model-function/generate-text/TextStreamingEvent.cjs +2 -0
- package/model-function/generate-text/TextStreamingEvent.d.ts +22 -0
- package/model-function/generate-text/TextStreamingEvent.js +1 -0
- package/model-function/generate-text/extractTextDeltas.cjs +23 -0
- package/model-function/generate-text/extractTextDeltas.d.ts +7 -0
- package/model-function/generate-text/extractTextDeltas.js +19 -0
- package/model-function/generate-text/generateText.cjs +67 -0
- package/model-function/generate-text/generateText.d.ts +20 -0
- package/model-function/generate-text/generateText.js +63 -0
- package/model-function/generate-text/parseEventSourceReadableStream.cjs +30 -0
- package/model-function/generate-text/parseEventSourceReadableStream.d.ts +8 -0
- package/model-function/generate-text/parseEventSourceReadableStream.js +26 -0
- package/model-function/generate-text/streamText.cjs +115 -0
- package/model-function/generate-text/streamText.d.ts +11 -0
- package/model-function/generate-text/streamText.js +111 -0
- package/model-function/index.cjs +47 -0
- package/model-function/index.d.ts +31 -0
- package/model-function/index.js +31 -0
- package/model-function/tokenize-text/Tokenizer.cjs +2 -0
- package/model-function/tokenize-text/Tokenizer.d.ts +19 -0
- package/model-function/tokenize-text/Tokenizer.js +1 -0
- package/model-function/tokenize-text/countTokens.cjs +10 -0
- package/model-function/tokenize-text/countTokens.d.ts +5 -0
- package/model-function/tokenize-text/countTokens.js +6 -0
- package/model-function/transcribe-audio/TranscriptionEvent.cjs +2 -0
- package/model-function/transcribe-audio/TranscriptionEvent.d.ts +22 -0
- package/model-function/transcribe-audio/TranscriptionEvent.js +1 -0
- package/model-function/transcribe-audio/TranscriptionModel.cjs +2 -0
- package/model-function/transcribe-audio/TranscriptionModel.d.ts +8 -0
- package/model-function/transcribe-audio/TranscriptionModel.js +1 -0
- package/model-function/transcribe-audio/transcribe.cjs +62 -0
- package/model-function/transcribe-audio/transcribe.d.ts +22 -0
- package/model-function/transcribe-audio/transcribe.js +58 -0
- package/model-provider/automatic1111/Automatic1111Error.cjs +39 -0
- package/model-provider/automatic1111/Automatic1111Error.d.ts +31 -0
- package/model-provider/automatic1111/Automatic1111Error.js +31 -0
- package/model-provider/automatic1111/Automatic1111ImageGenerationModel.cjs +76 -0
- package/model-provider/automatic1111/Automatic1111ImageGenerationModel.d.ts +54 -0
- package/model-provider/automatic1111/Automatic1111ImageGenerationModel.js +72 -0
- package/model-provider/automatic1111/index.cjs +20 -0
- package/model-provider/automatic1111/index.d.ts +2 -0
- package/model-provider/automatic1111/index.js +2 -0
- package/model-provider/cohere/CohereError.cjs +36 -0
- package/model-provider/cohere/CohereError.d.ts +22 -0
- package/model-provider/cohere/CohereError.js +28 -0
- package/model-provider/cohere/CohereTextEmbeddingModel.cjs +172 -0
- package/model-provider/cohere/CohereTextEmbeddingModel.d.ts +119 -0
- package/model-provider/cohere/CohereTextEmbeddingModel.js +165 -0
- package/model-provider/cohere/CohereTextGenerationModel.cjs +283 -0
- package/model-provider/cohere/CohereTextGenerationModel.d.ts +203 -0
- package/model-provider/cohere/CohereTextGenerationModel.js +276 -0
- package/model-provider/cohere/CohereTokenizer.cjs +136 -0
- package/model-provider/cohere/CohereTokenizer.d.ts +118 -0
- package/model-provider/cohere/CohereTokenizer.js +129 -0
- package/model-provider/cohere/index.cjs +22 -0
- package/model-provider/cohere/index.d.ts +4 -0
- package/model-provider/cohere/index.js +4 -0
- package/model-provider/huggingface/HuggingFaceError.cjs +52 -0
- package/model-provider/huggingface/HuggingFaceError.d.ts +22 -0
- package/model-provider/huggingface/HuggingFaceError.js +44 -0
- package/model-provider/huggingface/HuggingFaceTextGenerationModel.cjs +174 -0
- package/model-provider/huggingface/HuggingFaceTextGenerationModel.d.ts +75 -0
- package/model-provider/huggingface/HuggingFaceTextGenerationModel.js +167 -0
- package/model-provider/huggingface/index.cjs +20 -0
- package/model-provider/huggingface/index.d.ts +2 -0
- package/model-provider/huggingface/index.js +2 -0
- package/model-provider/index.cjs +22 -0
- package/model-provider/index.d.ts +6 -0
- package/model-provider/index.js +6 -0
- package/model-provider/llamacpp/LlamaCppError.cjs +52 -0
- package/model-provider/llamacpp/LlamaCppError.d.ts +22 -0
- package/model-provider/llamacpp/LlamaCppError.js +44 -0
- package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.cjs +96 -0
- package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.d.ts +40 -0
- package/model-provider/llamacpp/LlamaCppTextEmbeddingModel.js +89 -0
- package/model-provider/llamacpp/LlamaCppTextGenerationModel.cjs +245 -0
- package/model-provider/llamacpp/LlamaCppTextGenerationModel.d.ts +399 -0
- package/model-provider/llamacpp/LlamaCppTextGenerationModel.js +238 -0
- package/model-provider/llamacpp/LlamaCppTokenizer.cjs +64 -0
- package/model-provider/llamacpp/LlamaCppTokenizer.d.ts +38 -0
- package/model-provider/llamacpp/LlamaCppTokenizer.js +57 -0
- package/model-provider/llamacpp/index.cjs +22 -0
- package/model-provider/llamacpp/index.d.ts +4 -0
- package/model-provider/llamacpp/index.js +4 -0
- package/model-provider/openai/OpenAICostCalculator.cjs +71 -0
- package/model-provider/openai/OpenAICostCalculator.d.ts +6 -0
- package/model-provider/openai/OpenAICostCalculator.js +67 -0
- package/model-provider/openai/OpenAIError.cjs +50 -0
- package/model-provider/openai/OpenAIError.d.ts +47 -0
- package/model-provider/openai/OpenAIError.js +42 -0
- package/model-provider/openai/OpenAIImageGenerationModel.cjs +124 -0
- package/model-provider/openai/OpenAIImageGenerationModel.d.ts +113 -0
- package/model-provider/openai/OpenAIImageGenerationModel.js +119 -0
- package/model-provider/openai/OpenAIModelSettings.cjs +2 -0
- package/model-provider/openai/OpenAIModelSettings.d.ts +8 -0
- package/model-provider/openai/OpenAIModelSettings.js +1 -0
- package/model-provider/openai/OpenAITextEmbeddingModel.cjs +171 -0
- package/model-provider/openai/OpenAITextEmbeddingModel.d.ts +122 -0
- package/model-provider/openai/OpenAITextEmbeddingModel.js +162 -0
- package/model-provider/openai/OpenAITextGenerationModel.cjs +326 -0
- package/model-provider/openai/OpenAITextGenerationModel.d.ts +254 -0
- package/model-provider/openai/OpenAITextGenerationModel.js +317 -0
- package/model-provider/openai/OpenAITranscriptionModel.cjs +195 -0
- package/model-provider/openai/OpenAITranscriptionModel.d.ts +196 -0
- package/model-provider/openai/OpenAITranscriptionModel.js +187 -0
- package/model-provider/openai/TikTokenTokenizer.cjs +86 -0
- package/model-provider/openai/TikTokenTokenizer.d.ts +35 -0
- package/model-provider/openai/TikTokenTokenizer.js +82 -0
- package/model-provider/openai/chat/OpenAIChatMessage.cjs +24 -0
- package/model-provider/openai/chat/OpenAIChatMessage.d.ts +26 -0
- package/model-provider/openai/chat/OpenAIChatMessage.js +21 -0
- package/model-provider/openai/chat/OpenAIChatModel.cjs +288 -0
- package/model-provider/openai/chat/OpenAIChatModel.d.ts +344 -0
- package/model-provider/openai/chat/OpenAIChatModel.js +279 -0
- package/model-provider/openai/chat/OpenAIChatPrompt.cjs +143 -0
- package/model-provider/openai/chat/OpenAIChatPrompt.d.ts +108 -0
- package/model-provider/openai/chat/OpenAIChatPrompt.js +135 -0
- package/model-provider/openai/chat/OpenAIChatStreamIterable.cjs +112 -0
- package/model-provider/openai/chat/OpenAIChatStreamIterable.d.ts +19 -0
- package/model-provider/openai/chat/OpenAIChatStreamIterable.js +105 -0
- package/model-provider/openai/chat/countOpenAIChatMessageTokens.cjs +28 -0
- package/model-provider/openai/chat/countOpenAIChatMessageTokens.d.ts +20 -0
- package/model-provider/openai/chat/countOpenAIChatMessageTokens.js +23 -0
- package/model-provider/openai/index.cjs +31 -0
- package/model-provider/openai/index.d.ts +13 -0
- package/model-provider/openai/index.js +12 -0
- package/model-provider/stability/StabilityError.cjs +36 -0
- package/model-provider/stability/StabilityError.d.ts +22 -0
- package/model-provider/stability/StabilityError.js +28 -0
- package/model-provider/stability/StabilityImageGenerationModel.cjs +133 -0
- package/model-provider/stability/StabilityImageGenerationModel.d.ts +95 -0
- package/model-provider/stability/StabilityImageGenerationModel.js +129 -0
- package/model-provider/stability/index.cjs +20 -0
- package/model-provider/stability/index.d.ts +2 -0
- package/model-provider/stability/index.js +2 -0
- package/package.json +87 -0
- package/prompt/InstructionPrompt.cjs +2 -0
- package/prompt/InstructionPrompt.d.ts +7 -0
- package/prompt/InstructionPrompt.js +1 -0
- package/prompt/Llama2PromptMapping.cjs +56 -0
- package/prompt/Llama2PromptMapping.d.ts +10 -0
- package/prompt/Llama2PromptMapping.js +51 -0
- package/prompt/OpenAIChatPromptMapping.cjs +62 -0
- package/prompt/OpenAIChatPromptMapping.d.ts +6 -0
- package/prompt/OpenAIChatPromptMapping.js +57 -0
- package/prompt/PromptMapping.cjs +2 -0
- package/prompt/PromptMapping.d.ts +7 -0
- package/prompt/PromptMapping.js +1 -0
- package/prompt/PromptMappingTextGenerationModel.cjs +88 -0
- package/prompt/PromptMappingTextGenerationModel.d.ts +26 -0
- package/prompt/PromptMappingTextGenerationModel.js +84 -0
- package/prompt/TextPromptMapping.cjs +50 -0
- package/prompt/TextPromptMapping.d.ts +14 -0
- package/prompt/TextPromptMapping.js +45 -0
- package/prompt/chat/ChatPrompt.cjs +2 -0
- package/prompt/chat/ChatPrompt.d.ts +33 -0
- package/prompt/chat/ChatPrompt.js +1 -0
- package/prompt/chat/trimChatPrompt.cjs +50 -0
- package/prompt/chat/trimChatPrompt.d.ts +19 -0
- package/prompt/chat/trimChatPrompt.js +46 -0
- package/prompt/chat/validateChatPrompt.cjs +36 -0
- package/prompt/chat/validateChatPrompt.d.ts +8 -0
- package/prompt/chat/validateChatPrompt.js +31 -0
- package/prompt/index.cjs +25 -0
- package/prompt/index.d.ts +9 -0
- package/prompt/index.js +9 -0
- package/run/ConsoleLogger.cjs +12 -0
- package/run/ConsoleLogger.d.ts +6 -0
- package/run/ConsoleLogger.js +8 -0
- package/run/DefaultRun.cjs +78 -0
- package/run/DefaultRun.d.ts +24 -0
- package/run/DefaultRun.js +74 -0
- package/run/IdMetadata.cjs +2 -0
- package/run/IdMetadata.d.ts +7 -0
- package/run/IdMetadata.js +1 -0
- package/run/Run.cjs +2 -0
- package/run/Run.d.ts +27 -0
- package/run/Run.js +1 -0
- package/run/RunFunction.cjs +2 -0
- package/run/RunFunction.d.ts +13 -0
- package/run/RunFunction.js +1 -0
- package/run/Vector.cjs +2 -0
- package/run/Vector.d.ts +5 -0
- package/run/Vector.js +1 -0
- package/run/index.cjs +22 -0
- package/run/index.d.ts +6 -0
- package/run/index.js +6 -0
- package/text-chunk/TextChunk.cjs +2 -0
- package/text-chunk/TextChunk.d.ts +3 -0
- package/text-chunk/TextChunk.js +1 -0
- package/text-chunk/index.cjs +22 -0
- package/text-chunk/index.d.ts +6 -0
- package/text-chunk/index.js +6 -0
- package/text-chunk/retrieve-text-chunks/TextChunkRetriever.cjs +2 -0
- package/text-chunk/retrieve-text-chunks/TextChunkRetriever.d.ts +8 -0
- package/text-chunk/retrieve-text-chunks/TextChunkRetriever.js +1 -0
- package/text-chunk/retrieve-text-chunks/retrieveTextChunks.cjs +10 -0
- package/text-chunk/retrieve-text-chunks/retrieveTextChunks.d.ts +6 -0
- package/text-chunk/retrieve-text-chunks/retrieveTextChunks.js +6 -0
- package/text-chunk/split/SplitFunction.cjs +2 -0
- package/text-chunk/split/SplitFunction.d.ts +4 -0
- package/text-chunk/split/SplitFunction.js +1 -0
- package/text-chunk/split/splitOnSeparator.cjs +12 -0
- package/text-chunk/split/splitOnSeparator.d.ts +8 -0
- package/text-chunk/split/splitOnSeparator.js +7 -0
- package/text-chunk/split/splitRecursively.cjs +41 -0
- package/text-chunk/split/splitRecursively.d.ts +22 -0
- package/text-chunk/split/splitRecursively.js +33 -0
- package/util/DurationMeasurement.cjs +42 -0
- package/util/DurationMeasurement.d.ts +5 -0
- package/util/DurationMeasurement.js +38 -0
- package/util/ErrorHandler.cjs +2 -0
- package/util/ErrorHandler.d.ts +1 -0
- package/util/ErrorHandler.js +1 -0
- package/util/SafeResult.cjs +2 -0
- package/util/SafeResult.d.ts +8 -0
- package/util/SafeResult.js +1 -0
- package/util/api/AbortError.cjs +9 -0
- package/util/api/AbortError.d.ts +3 -0
- package/util/api/AbortError.js +5 -0
- package/util/api/ApiCallError.cjs +45 -0
- package/util/api/ApiCallError.d.ts +15 -0
- package/util/api/ApiCallError.js +41 -0
- package/util/api/RetryError.cjs +24 -0
- package/util/api/RetryError.d.ts +10 -0
- package/util/api/RetryError.js +20 -0
- package/util/api/RetryFunction.cjs +2 -0
- package/util/api/RetryFunction.d.ts +1 -0
- package/util/api/RetryFunction.js +1 -0
- package/util/api/ThrottleFunction.cjs +2 -0
- package/util/api/ThrottleFunction.d.ts +1 -0
- package/util/api/ThrottleFunction.js +1 -0
- package/util/api/callWithRetryAndThrottle.cjs +7 -0
- package/util/api/callWithRetryAndThrottle.d.ts +7 -0
- package/util/api/callWithRetryAndThrottle.js +3 -0
- package/util/api/postToApi.cjs +103 -0
- package/util/api/postToApi.d.ts +29 -0
- package/util/api/postToApi.js +96 -0
- package/util/api/retryNever.cjs +8 -0
- package/util/api/retryNever.d.ts +4 -0
- package/util/api/retryNever.js +4 -0
- package/util/api/retryWithExponentialBackoff.cjs +48 -0
- package/util/api/retryWithExponentialBackoff.d.ts +10 -0
- package/util/api/retryWithExponentialBackoff.js +44 -0
- package/util/api/throttleMaxConcurrency.cjs +65 -0
- package/util/api/throttleMaxConcurrency.d.ts +7 -0
- package/util/api/throttleMaxConcurrency.js +61 -0
- package/util/api/throttleUnlimitedConcurrency.cjs +8 -0
- package/util/api/throttleUnlimitedConcurrency.d.ts +5 -0
- package/util/api/throttleUnlimitedConcurrency.js +4 -0
- package/util/cosineSimilarity.cjs +26 -0
- package/util/cosineSimilarity.d.ts +11 -0
- package/util/cosineSimilarity.js +22 -0
- package/util/index.cjs +26 -0
- package/util/index.d.ts +10 -0
- package/util/index.js +10 -0
- package/util/never.cjs +6 -0
- package/util/never.d.ts +1 -0
- package/util/never.js +2 -0
- package/util/runSafe.cjs +15 -0
- package/util/runSafe.d.ts +2 -0
- package/util/runSafe.js +11 -0
- package/vector-index/VectorIndex.cjs +2 -0
- package/vector-index/VectorIndex.d.ts +18 -0
- package/vector-index/VectorIndex.js +1 -0
- package/vector-index/VectorIndexSimilarTextChunkRetriever.cjs +57 -0
- package/vector-index/VectorIndexSimilarTextChunkRetriever.d.ts +20 -0
- package/vector-index/VectorIndexSimilarTextChunkRetriever.js +53 -0
- package/vector-index/VectorIndexTextChunkStore.cjs +77 -0
- package/vector-index/VectorIndexTextChunkStore.d.ts +35 -0
- package/vector-index/VectorIndexTextChunkStore.js +73 -0
- package/vector-index/index.cjs +22 -0
- package/vector-index/index.d.ts +6 -0
- package/vector-index/index.js +6 -0
- package/vector-index/memory/MemoryVectorIndex.cjs +63 -0
- package/vector-index/memory/MemoryVectorIndex.d.ts +31 -0
- package/vector-index/memory/MemoryVectorIndex.js +56 -0
- package/vector-index/pinecone/PineconeVectorIndex.cjs +66 -0
- package/vector-index/pinecone/PineconeVectorIndex.d.ts +29 -0
- package/vector-index/pinecone/PineconeVectorIndex.js +62 -0
- package/vector-index/upsertTextChunks.cjs +15 -0
- package/vector-index/upsertTextChunks.d.ts +11 -0
- package/vector-index/upsertTextChunks.js +11 -0
@@ -0,0 +1,44 @@
|
|
1
|
+
import SecureJSON from "secure-json-parse";
|
2
|
+
import { z } from "zod";
|
3
|
+
import { ApiCallError } from "../../util/api/ApiCallError.js";
|
4
|
+
/**
 * Zod schema for the JSON error payload of a llama.cpp call: an object with
 * a string `error` field.
 */
export const llamaCppErrorDataSchema = z.object({ error: z.string() });
|
7
|
+
/**
 * `ApiCallError` subclass that additionally carries an error payload.
 *
 * The payload is stored on `data`. Unless an explicit `message` is passed,
 * the error message defaults to `data.error`.
 */
export class LlamaCppError extends ApiCallError {
    constructor({ data, statusCode, url, requestBodyValues, message = data.error, }) {
        super({ message, statusCode, requestBodyValues, url });
        // Expose the payload as an own, enumerable, writable, configurable property.
        Object.defineProperty(this, "data", {
            value: data,
            writable: true,
            enumerable: true,
            configurable: true,
        });
    }
}
|
19
|
+
/**
 * Turns a failed llama.cpp HTTP response into an error object.
 *
 * The body is read as text, parsed with `SecureJSON` and validated against
 * `llamaCppErrorDataSchema`. On success a `LlamaCppError` is *returned* (not
 * thrown). If parsing or validation fails, an `ApiCallError` whose message is
 * the raw body is thrown, with the failure attached as `cause`. Errors named
 * "AbortError" and existing `ApiCallError` instances are rethrown untouched.
 */
export const failedLlamaCppCallResponseHandler = async ({ response, url, requestBodyValues }) => {
    const rawBody = await response.text();
    try {
        const data = llamaCppErrorDataSchema.parse(SecureJSON.parse(rawBody));
        return new LlamaCppError({ url, requestBodyValues, statusCode: response.status, data });
    }
    catch (error) {
        // Aborts and already-classified API errors must reach the caller as-is.
        const mustPropagate = error instanceof Error &&
            (error.name === "AbortError" || error instanceof ApiCallError);
        if (mustPropagate) {
            throw error;
        }
        throw new ApiCallError({
            message: rawBody,
            cause: error,
            statusCode: response.status,
            url,
            requestBodyValues,
        });
    }
};
|
@@ -0,0 +1,96 @@
|
|
1
|
+
"use strict";
|
2
|
+
var __importDefault = (this && this.__importDefault) || function (mod) {
|
3
|
+
return (mod && mod.__esModule) ? mod : { "default": mod };
|
4
|
+
};
|
5
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
6
|
+
exports.LlamaCppTextEmbeddingModel = void 0;
|
7
|
+
const zod_1 = __importDefault(require("zod"));
|
8
|
+
const AbstractModel_js_1 = require("../../model-function/AbstractModel.cjs");
|
9
|
+
const callWithRetryAndThrottle_js_1 = require("../../util/api/callWithRetryAndThrottle.cjs");
|
10
|
+
const postToApi_js_1 = require("../../util/api/postToApi.cjs");
|
11
|
+
const LlamaCppError_js_1 = require("./LlamaCppError.cjs");
|
12
|
+
const LlamaCppTokenizer_js_1 = require("./LlamaCppTokenizer.cjs");
|
13
|
+
/**
 * Text embedding model that posts to a llama.cpp server's `/embedding`
 * endpoint (CommonJS build).
 *
 * At most one text is accepted per API call (`maxTextsPerCall` is 1).
 * `contextWindowSize` and `embeddingDimensions` are left undefined.
 */
class LlamaCppTextEmbeddingModel extends AbstractModel_js_1.AbstractModel {
    constructor(settings = {}) {
        super({ settings });
        // Instance fields, created in declaration order as own, enumerable,
        // writable, configurable properties.
        const initialFields = [
            ["provider", "llamacpp"],
            ["maxTextsPerCall", 1],
            ["contextWindowSize", undefined],
            ["embeddingDimensions", undefined],
            ["tokenizer", undefined],
        ];
        for (const [fieldName, value] of initialFields) {
            Object.defineProperty(this, fieldName, {
                enumerable: true,
                configurable: true,
                writable: true,
                value,
            });
        }
        // The tokenizer talks to the same server but has its own retry/throttle.
        const { baseUrl, tokenizerSettings } = this.settings;
        this.tokenizer = new LlamaCppTokenizer_js_1.LlamaCppTokenizer({
            baseUrl,
            retry: tokenizerSettings?.retry,
            throttle: tokenizerSettings?.throttle,
        });
    }
    /** Always `null` for this model. */
    get modelName() {
        return null;
    }
    /** Delegates tokenization of `text` to the model's `LlamaCppTokenizer`. */
    async tokenize(text) {
        return this.tokenizer.tokenize(text);
    }
    /**
     * Requests the embedding of a single text.
     *
     * Rejects with an `Error` when `texts` holds more than `maxTextsPerCall`
     * entries. Model settings are merged with `options.settings`; the retry
     * and throttle strategies are always taken from the model settings.
     */
    async callAPI(texts, options) {
        const limit = this.maxTextsPerCall;
        if (texts.length > limit) {
            throw new Error(`The Llama.cpp embedding API only supports ${limit} texts per API call.`);
        }
        const perCallValues = {
            abortSignal: options?.run?.abortSignal,
            content: texts[0],
        };
        const callSettings = Object.assign({}, this.settings, options?.settings, perCallValues);
        const { retry, throttle } = this.settings;
        return (0, callWithRetryAndThrottle_js_1.callWithRetryAndThrottle)({
            retry,
            throttle,
            call: async () => callLlamaCppEmbeddingAPI(callSettings),
        });
    }
    /** Same as `callAPI`. */
    generateEmbeddingResponse(texts, options) {
        return this.callAPI(texts, options);
    }
    /** Wraps the response's single `embedding` vector in an array. */
    extractEmbeddings(response) {
        const { embedding } = response;
        return [embedding];
    }
    /** Returns a new model whose settings are the current ones overlaid with `additionalSettings`. */
    withSettings(additionalSettings) {
        const mergedSettings = Object.assign({}, this.settings, additionalSettings);
        return new LlamaCppTextEmbeddingModel(mergedSettings);
    }
}
exports.LlamaCppTextEmbeddingModel = LlamaCppTextEmbeddingModel;
|
85
|
+
/** Zod schema for an embedding response: an object with a numeric `embedding` array. */
const llamaCppTextEmbeddingResponseSchema = zod_1.default.object({ embedding: zod_1.default.array(zod_1.default.number()) });
|
88
|
+
/**
 * Posts one text to the `/embedding` endpoint of a llama.cpp server.
 *
 * @param {object} params
 * @param {string} [params.baseUrl="http://127.0.0.1:8080"] Root URL of the
 *   server. Trailing slashes are ignored, so "http://host:8080/" and
 *   "http://host:8080" address the same endpoint.
 * @param {*} [params.abortSignal] Forwarded unchanged to `postJsonToApi`
 *   (presumably an `AbortSignal` - confirm against `postJsonToApi`).
 * @param {*} params.content Sent as the `content` field of the JSON body.
 * @returns {Promise<*>} Whatever `postJsonToApi` resolves with; the success
 *   handler is built from `llamaCppTextEmbeddingResponseSchema`.
 */
async function callLlamaCppEmbeddingAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, content, }) {
    // Without this, a base URL ending in "/" would produce ".../​/embedding"
    // (a double slash), which is a different path for most HTTP servers.
    let serverRoot = String(baseUrl);
    while (serverRoot.endsWith("/")) {
        serverRoot = serverRoot.slice(0, -1);
    }
    return (0, postToApi_js_1.postJsonToApi)({
        url: `${serverRoot}/embedding`,
        body: { content },
        failedResponseHandler: LlamaCppError_js_1.failedLlamaCppCallResponseHandler,
        successfulResponseHandler: (0, postToApi_js_1.createJsonResponseHandler)(llamaCppTextEmbeddingResponseSchema),
        abortSignal,
    });
}
|
@@ -0,0 +1,40 @@
|
|
1
|
+
import z from "zod";
|
2
|
+
import { AbstractModel } from "../../model-function/AbstractModel.js";
|
3
|
+
import { FunctionOptions } from "../../model-function/FunctionOptions.js";
|
4
|
+
import { TextEmbeddingModel, TextEmbeddingModelSettings } from "../../model-function/embed-text/TextEmbeddingModel.js";
|
5
|
+
import { RetryFunction } from "../../util/api/RetryFunction.js";
|
6
|
+
import { ThrottleFunction } from "../../util/api/ThrottleFunction.js";
|
7
|
+
/**
 * Settings accepted by `LlamaCppTextEmbeddingModel`.
 */
export interface LlamaCppEmbeddingModelSettings extends TextEmbeddingModelSettings {
    /** Root URL of the llama.cpp server; also handed to the model's tokenizer. */
    baseUrl?: string;
    /** Retry strategy applied to embedding API calls. */
    retry?: RetryFunction;
    /** Throttle strategy applied to embedding API calls. */
    throttle?: ThrottleFunction;
    /** Retry and throttle strategies handed to the model's tokenizer. */
    tokenizerSettings?: {
        retry?: RetryFunction;
        throttle?: ThrottleFunction;
    };
}
|
16
|
+
/**
 * Text embedding model backed by a llama.cpp server.
 *
 * Accepts at most one text per API call.
 */
export declare class LlamaCppTextEmbeddingModel extends AbstractModel<LlamaCppEmbeddingModelSettings> implements TextEmbeddingModel<LlamaCppTextEmbeddingResponse, LlamaCppEmbeddingModelSettings> {
    constructor(settings?: LlamaCppEmbeddingModelSettings);
    /** Provider identifier. */
    readonly provider: "llamacpp";
    /** Always `null` for this model. */
    get modelName(): null;
    /** Maximum number of texts accepted by a single `callAPI` invocation. */
    readonly maxTextsPerCall = 1;
    readonly contextWindowSize: undefined;
    readonly embeddingDimensions: undefined;
    private readonly tokenizer;
    /** Tokenizes `text` with the model's tokenizer. */
    tokenize(text: string): Promise<number[]>;
    /** Requests the embedding for the given texts; rejects when more than `maxTextsPerCall` texts are passed. */
    callAPI(texts: string[], options?: FunctionOptions<LlamaCppEmbeddingModelSettings>): Promise<LlamaCppTextEmbeddingResponse>;
    /** Same as `callAPI`. */
    generateEmbeddingResponse(texts: string[], options?: FunctionOptions<LlamaCppEmbeddingModelSettings>): Promise<LlamaCppTextEmbeddingResponse>;
    /** Returns the response's embedding vector wrapped in an array. */
    extractEmbeddings(response: LlamaCppTextEmbeddingResponse): number[][];
    /** Returns a model whose settings are the current ones overlaid with `additionalSettings`. */
    withSettings(additionalSettings: Partial<LlamaCppEmbeddingModelSettings>): this;
}
|
32
|
+
/** Zod schema describing an embedding response: `{ embedding: number[] }`. */
declare const llamaCppTextEmbeddingResponseSchema: z.ZodObject<{
    embedding: z.ZodArray<z.ZodNumber, "many">;
}, "strip", z.ZodTypeAny, {
    embedding: number[];
}, {
    embedding: number[];
}>;
/** Response shape inferred from `llamaCppTextEmbeddingResponseSchema`. */
export type LlamaCppTextEmbeddingResponse = z.infer<typeof llamaCppTextEmbeddingResponseSchema>;
|
40
|
+
export {};
|
@@ -0,0 +1,89 @@
|
|
1
|
+
import z from "zod";
|
2
|
+
import { AbstractModel } from "../../model-function/AbstractModel.js";
|
3
|
+
import { callWithRetryAndThrottle } from "../../util/api/callWithRetryAndThrottle.js";
|
4
|
+
import { createJsonResponseHandler, postJsonToApi, } from "../../util/api/postToApi.js";
|
5
|
+
import { failedLlamaCppCallResponseHandler } from "./LlamaCppError.js";
|
6
|
+
import { LlamaCppTokenizer } from "./LlamaCppTokenizer.js";
|
7
|
+
/**
 * Text embedding model that posts to a llama.cpp server's `/embedding`
 * endpoint.
 *
 * At most one text is accepted per API call (`maxTextsPerCall` is 1).
 * `contextWindowSize` and `embeddingDimensions` are left undefined.
 */
export class LlamaCppTextEmbeddingModel extends AbstractModel {
    constructor(settings = {}) {
        super({ settings });
        // Instance fields, created in declaration order as own, enumerable,
        // writable, configurable properties.
        const initialFields = [
            ["provider", "llamacpp"],
            ["maxTextsPerCall", 1],
            ["contextWindowSize", undefined],
            ["embeddingDimensions", undefined],
            ["tokenizer", undefined],
        ];
        for (const [fieldName, value] of initialFields) {
            Object.defineProperty(this, fieldName, {
                enumerable: true,
                configurable: true,
                writable: true,
                value,
            });
        }
        // The tokenizer talks to the same server but has its own retry/throttle.
        const { baseUrl, tokenizerSettings } = this.settings;
        this.tokenizer = new LlamaCppTokenizer({
            baseUrl,
            retry: tokenizerSettings?.retry,
            throttle: tokenizerSettings?.throttle,
        });
    }
    /** Always `null` for this model. */
    get modelName() {
        return null;
    }
    /** Delegates tokenization of `text` to the model's `LlamaCppTokenizer`. */
    async tokenize(text) {
        return this.tokenizer.tokenize(text);
    }
    /**
     * Requests the embedding of a single text.
     *
     * Rejects with an `Error` when `texts` holds more than `maxTextsPerCall`
     * entries. Model settings are merged with `options.settings`; the retry
     * and throttle strategies are always taken from the model settings.
     */
    async callAPI(texts, options) {
        const limit = this.maxTextsPerCall;
        if (texts.length > limit) {
            throw new Error(`The Llama.cpp embedding API only supports ${limit} texts per API call.`);
        }
        const perCallValues = {
            abortSignal: options?.run?.abortSignal,
            content: texts[0],
        };
        const callSettings = Object.assign({}, this.settings, options?.settings, perCallValues);
        const { retry, throttle } = this.settings;
        return callWithRetryAndThrottle({
            retry,
            throttle,
            call: async () => callLlamaCppEmbeddingAPI(callSettings),
        });
    }
    /** Same as `callAPI`. */
    generateEmbeddingResponse(texts, options) {
        return this.callAPI(texts, options);
    }
    /** Wraps the response's single `embedding` vector in an array. */
    extractEmbeddings(response) {
        const { embedding } = response;
        return [embedding];
    }
    /** Returns a new model whose settings are the current ones overlaid with `additionalSettings`. */
    withSettings(additionalSettings) {
        const mergedSettings = Object.assign({}, this.settings, additionalSettings);
        return new LlamaCppTextEmbeddingModel(mergedSettings);
    }
}
|
78
|
+
// Expected JSON body of a successful embedding response: an object with a
// single `embedding` property holding an array of numbers.
const llamaCppTextEmbeddingResponseSchema = z.object({ embedding: z.number().array() });
|
81
|
+
/**
 * Posts `content` as JSON to the `/embedding` route below `baseUrl` and
 * returns whatever `postJsonToApi` resolves to.
 *
 * @param baseUrl Server root; defaults to `http://127.0.0.1:8080`.
 * @param abortSignal Optional signal passed through to the request helper.
 * @param content The text sent in the request body.
 */
async function callLlamaCppEmbeddingAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, content, }) {
    const url = `${baseUrl}/embedding`;
    const body = { content };
    const successfulResponseHandler = createJsonResponseHandler(llamaCppTextEmbeddingResponseSchema);
    return postJsonToApi({
        url,
        body,
        failedResponseHandler: failedLlamaCppCallResponseHandler,
        successfulResponseHandler,
        abortSignal,
    });
}
|
@@ -0,0 +1,245 @@
|
|
1
|
+
"use strict";
|
2
|
+
var __importDefault = (this && this.__importDefault) || function (mod) {
|
3
|
+
return (mod && mod.__esModule) ? mod : { "default": mod };
|
4
|
+
};
|
5
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
6
|
+
exports.LlamaCppTextGenerationResponseFormat = exports.LlamaCppTextGenerationModel = void 0;
|
7
|
+
const secure_json_parse_1 = __importDefault(require("secure-json-parse"));
|
8
|
+
const zod_1 = __importDefault(require("zod"));
|
9
|
+
const AbstractModel_js_1 = require("../../model-function/AbstractModel.cjs");
|
10
|
+
const AsyncQueue_js_1 = require("../../model-function/generate-text/AsyncQueue.cjs");
|
11
|
+
const parseEventSourceReadableStream_js_1 = require("../../model-function/generate-text/parseEventSourceReadableStream.cjs");
|
12
|
+
const PromptMappingTextGenerationModel_js_1 = require("../../prompt/PromptMappingTextGenerationModel.cjs");
|
13
|
+
const callWithRetryAndThrottle_js_1 = require("../../util/api/callWithRetryAndThrottle.cjs");
|
14
|
+
const postToApi_js_1 = require("../../util/api/postToApi.cjs");
|
15
|
+
const LlamaCppError_js_1 = require("./LlamaCppError.cjs");
|
16
|
+
const LlamaCppTokenizer_js_1 = require("./LlamaCppTokenizer.cjs");
|
17
|
+
/**
 * Text generation model that sends its requests to a llama.cpp server.
 *
 * Supports a non-streaming JSON response (`generateTextResponse`) and a
 * streamed sequence of deltas (`generateDeltaStreamResponse`). The model owns
 * a `LlamaCppTokenizer` configured from the same `baseUrl` and from the
 * optional `tokenizerSettings` entry of the settings.
 */
class LlamaCppTextGenerationModel extends AbstractModel_js_1.AbstractModel {
    /**
     * @param settings Model settings. Besides the sampling parameters that are
     *   forwarded to the API call, this class reads `baseUrl`, `retry`,
     *   `throttle`, `tokenizerSettings`, `contextWindowSize`, `nPredict`.
     */
    constructor(settings = {}) {
        super({ settings });
        Object.defineProperty(this, "provider", {
            enumerable: true,
            configurable: true,
            writable: true,
            value: "llamacpp"
        });
        Object.defineProperty(this, "tokenizer", {
            enumerable: true,
            configurable: true,
            writable: true,
            value: void 0
        });
        this.tokenizer = new LlamaCppTokenizer_js_1.LlamaCppTokenizer({
            baseUrl: this.settings.baseUrl,
            retry: this.settings.tokenizerSettings?.retry,
            throttle: this.settings.tokenizerSettings?.throttle,
        });
    }
    /** This class does not report a model name; always `null`. */
    get modelName() {
        return null;
    }
    /** Context window size as configured in the settings (may be undefined). */
    get contextWindowSize() {
        return this.settings.contextWindowSize;
    }
    /**
     * Runs one completion request, wrapped in the configured retry and
     * throttle behavior.
     *
     * @param prompt Prompt sent to the server.
     * @param options Must contain `responseFormat`; may contain `run` (its
     *   `abortSignal` is forwarded) and per-call `settings` overrides.
     * @returns The value produced by the response format's handler.
     */
    async callAPI(prompt, options) {
        const { run, settings, responseFormat } = options;
        // Merge into a fresh object. Using `this.settings` as the assign target
        // would permanently write the per-call overrides, prompt, abort signal
        // and response format into the model's settings, leaking them into
        // later calls and `withSettings` copies and letting overlapping calls
        // overwrite each other's values.
        const callSettings = Object.assign({}, this.settings, settings, {
            abortSignal: run?.abortSignal,
            prompt,
            responseFormat,
        });
        return (0, callWithRetryAndThrottle_js_1.callWithRetryAndThrottle)({
            retry: this.settings.retry,
            throttle: this.settings.throttle,
            call: async () => callLlamaCppTextGenerationAPI(callSettings),
        });
    }
    /** Number of tokens the model's tokenizer produces for `prompt`. */
    async countPromptTokens(prompt) {
        const tokens = await this.tokenizer.tokenize(prompt);
        return tokens.length;
    }
    /** Requests a complete (non-streaming) JSON response for `prompt`. */
    generateTextResponse(prompt, options) {
        return this.callAPI(prompt, {
            ...options,
            responseFormat: exports.LlamaCppTextGenerationResponseFormat.json,
        });
    }
    /** Returns the generated text (`content`) of a JSON response. */
    extractText(response) {
        return response.content;
    }
    /** Requests a streamed response for `prompt`, delivered as full deltas. */
    generateDeltaStreamResponse(prompt, options) {
        return this.callAPI(prompt, {
            ...options,
            responseFormat: exports.LlamaCppTextGenerationResponseFormat.deltaIterable,
        });
    }
    /** Returns the newly added text (`delta`) of a full delta. */
    extractTextDelta(fullDelta) {
        return fullDelta.delta;
    }
    /**
     * Wraps a copy of this model, configured with the mapping's stop tokens,
     * in a `PromptMappingTextGenerationModel` that uses `promptMapping`.
     */
    mapPrompt(promptMapping) {
        return new PromptMappingTextGenerationModel_js_1.PromptMappingTextGenerationModel({
            model: this.withStopTokens(promptMapping.stopTokens),
            promptMapping,
        });
    }
    /** Creates a new model whose settings are the current ones plus `additionalSettings`. */
    withSettings(additionalSettings) {
        return new LlamaCppTextGenerationModel(Object.assign({}, this.settings, additionalSettings));
    }
    /** Completion token limit; stored in the `nPredict` setting. */
    get maxCompletionTokens() {
        return this.settings.nPredict;
    }
    /** Returns a copy of this model with `nPredict` set to `maxCompletionTokens`. */
    withMaxCompletionTokens(maxCompletionTokens) {
        return this.withSettings({ nPredict: maxCompletionTokens });
    }
    /** Returns a copy of this model with the `stop` setting set to `stopTokens`. */
    withStopTokens(stopTokens) {
        return this.withSettings({ stop: stopTokens });
    }
}
|
98
|
+
exports.LlamaCppTextGenerationModel = LlamaCppTextGenerationModel;
|
99
|
+
// Schema for a complete (final) completion response. `stop` is the literal
// `true`, which is what the streaming schema uses to tell the final message
// apart from intermediate chunks.
const llamaCppTextGenerationResponseSchema = (() => {
    const z = zod_1.default;
    // Sampling configuration echoed back in the response.
    const generationSettings = z.object({
        frequency_penalty: z.number(),
        ignore_eos: z.boolean(),
        logit_bias: z.array(z.number()),
        mirostat: z.number(),
        mirostat_eta: z.number(),
        mirostat_tau: z.number(),
        model: z.string(),
        n_ctx: z.number(),
        n_keep: z.number(),
        n_predict: z.number(),
        n_probs: z.number(),
        penalize_nl: z.boolean(),
        presence_penalty: z.number(),
        repeat_last_n: z.number(),
        repeat_penalty: z.number(),
        seed: z.number(),
        stop: z.array(z.string()),
        stream: z.boolean(),
        temp: z.number(),
        tfs_z: z.number(),
        top_k: z.number(),
        top_p: z.number(),
        typical_p: z.number(),
    });
    // Timing figures; the derived rate and per-token values may be null.
    const timings = z.object({
        predicted_ms: z.number(),
        predicted_n: z.number(),
        predicted_per_second: z.number().nullable(),
        predicted_per_token_ms: z.number().nullable(),
        prompt_ms: z.number().nullable(),
        prompt_n: z.number(),
        prompt_per_second: z.number().nullable(),
        prompt_per_token_ms: z.number().nullable(),
    });
    return z.object({
        content: z.string(),
        stop: z.literal(true),
        generation_settings: generationSettings,
        model: z.string(),
        prompt: z.string(),
        stopped_eos: z.boolean(),
        stopped_limit: z.boolean(),
        stopped_word: z.boolean(),
        stopping_word: z.string(),
        timings,
        tokens_cached: z.number(),
        tokens_evaluated: z.number(),
        tokens_predicted: z.number(),
        truncated: z.boolean(),
    });
})();
|
148
|
+
// Schema for one streamed message, discriminated on `stop`:
// `stop: false` is an intermediate chunk carrying only `content`;
// `stop: true` is the final message, which has the full response shape.
const llamaCppTextStreamingResponseSchema = (() => {
    const z = zod_1.default;
    const intermediateChunk = z.object({
        content: z.string(),
        stop: z.literal(false),
    });
    return z.discriminatedUnion("stop", [
        intermediateChunk,
        llamaCppTextGenerationResponseSchema,
    ]);
})();
|
155
|
+
/**
 * Posts a completion request as JSON to the `/completion` route below
 * `baseUrl` and returns whatever `postJsonToApi` resolves to.
 *
 * The camelCase settings are translated to the snake_case keys of the request
 * body. `responseFormat` supplies both the `stream` flag of the request and
 * the handler applied to a successful response.
 *
 * @param baseUrl Server root; defaults to `http://127.0.0.1:8080`.
 * @param abortSignal Optional signal passed through to the request helper.
 */
async function callLlamaCppTextGenerationAPI({ baseUrl = "http://127.0.0.1:8080", abortSignal, responseFormat, prompt, temperature, topK, topP, nPredict, nKeep, stop, tfsZ, typicalP, repeatPenalty, repeatLastN, penalizeNl, mirostat, mirostatTau, mirostatEta, seed, ignoreEos, logitBias, }) {
    const { stream, handler } = responseFormat;
    const requestBody = {
        stream,
        prompt,
        temperature,
        top_k: topK,
        top_p: topP,
        n_predict: nPredict,
        n_keep: nKeep,
        stop,
        tfs_z: tfsZ,
        typical_p: typicalP,
        repeat_penalty: repeatPenalty,
        repeat_last_n: repeatLastN,
        penalize_nl: penalizeNl,
        mirostat,
        mirostat_tau: mirostatTau,
        mirostat_eta: mirostatEta,
        seed,
        ignore_eos: ignoreEos,
        logit_bias: logitBias,
    };
    return (0, postToApi_js_1.postJsonToApi)({
        url: `${baseUrl}/completion`,
        body: requestBody,
        failedResponseHandler: LlamaCppError_js_1.failedLlamaCppCallResponseHandler,
        successfulResponseHandler: handler,
        abortSignal,
    });
}
|
184
|
+
/**
 * Creates a queue that is filled with the deltas parsed from an event-source
 * response stream.
 *
 * Each valid message is pushed as `{ type: "delta", fullDelta }`, where
 * `fullDelta.content` is the text accumulated so far, `fullDelta.delta` is the
 * text of this message and `fullDelta.isComplete` mirrors the message's `stop`
 * flag. The queue is closed after the message with `stop: true`.
 *
 * Any failure (unparseable JSON, a message that does not match the streaming
 * schema, or a failure of the stream processing itself) is pushed once as
 * `{ type: "error", error }` and closes the queue. Nothing is pushed after the
 * queue has been closed.
 *
 * @param stream Response body stream handed to `parseEventSourceReadableStream`.
 * @returns The queue; it is returned immediately, before the stream is consumed.
 */
async function createLlamaCppFullDeltaIterableQueue(stream) {
    const queue = new AsyncQueue_js_1.AsyncQueue();
    let content = "";
    // Set once the queue has been closed so that late events and late
    // failures do not touch it again.
    let finished = false;
    const fail = (error) => {
        if (finished) {
            return;
        }
        finished = true;
        queue.push({ type: "error", error });
        queue.close();
    };
    // Process the stream asynchronously (no 'await' on purpose). The result is
    // still observed: without a rejection handler a failing stream would never
    // be reported to the consumer of the queue. Promise.resolve keeps this
    // working even if the parser does not return a promise.
    Promise.resolve((0, parseEventSourceReadableStream_js_1.parseEventSourceReadableStream)({
        stream,
        callback: (event) => {
            if (finished || event.type !== "event") {
                return;
            }
            try {
                const json = secure_json_parse_1.default.parse(event.data);
                const parseResult = llamaCppTextStreamingResponseSchema.safeParse(json);
                if (!parseResult.success) {
                    fail(parseResult.error);
                    return;
                }
                const chunk = parseResult.data;
                content += chunk.content;
                queue.push({
                    type: "delta",
                    fullDelta: {
                        content,
                        isComplete: chunk.stop,
                        delta: chunk.content,
                    },
                });
                if (chunk.stop) {
                    finished = true;
                    queue.close();
                }
            }
            catch (error) {
                fail(error);
            }
        },
    })).catch(fail);
    return queue;
}
|
229
|
+
exports.LlamaCppTextGenerationResponseFormat = {
|
230
|
+
/**
|
231
|
+
* Returns the response as a JSON object.
|
232
|
+
*/
|
233
|
+
json: {
|
234
|
+
stream: false,
|
235
|
+
handler: (0, postToApi_js_1.createJsonResponseHandler)(llamaCppTextGenerationResponseSchema),
|
236
|
+
},
|
237
|
+
/**
|
238
|
+
* Returns an async iterable over the full deltas (all choices, including full current state at time of event)
|
239
|
+
* of the response stream.
|
240
|
+
*/
|
241
|
+
deltaIterable: {
|
242
|
+
stream: true,
|
243
|
+
handler: async ({ response }) => createLlamaCppFullDeltaIterableQueue(response.body),
|
244
|
+
},
|
245
|
+
};
|