npm - modelfusion - Versions diffs - 0.17.0 → 0.19.0 - Mend

modelfusion 0.17.0 → 0.19.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/README.md CHANGED Viewed

@@ -20,7 +20,7 @@ ModelFusion is a library for building AI apps, chatbots, and agents. It provides
 - **Type inference and validation**: ModelFusion uses TypeScript and [Zod](https://github.com/colinhacks/zod) to infer types wherever possible and to validate model responses.
 - **Flexibility and control**: AI application development can be complex and unique to each project. With ModelFusion, you have complete control over the prompts and model settings, and you can access the raw responses from the models quickly to build what you need.
 - **No chains and predefined prompts**: Use the concepts provided by JavaScript (variables, functions, etc.) and explicit prompts to build applications you can easily understand and control. Not black magic.
-- **More than LLMs**: ModelFusion supports other models, e.g., text-to-image and voice-to-text, to help you build rich AI applications that go beyond just text.
+- **Multimodal Support**: Beyond just LLMs, ModelFusion encompasses a diverse array of models including text generation, text-to-speech, speech-to-text, and image generation, allowing you to build multifaceted AI applications with ease.
 - **Integrated support features**: Essential features like logging, retries, throttling, tracing, and error handling are built-in, helping you focus more on building your application.
 ## Quick Install
@@ -274,7 +274,7 @@ const transcription = await transcribe(
 );
 ```
-### Synthesize Speech
+### [Synthesize Speech](https://modelfusion.dev/guide/function/synthesize-speech)
 Turn text into speech (audio).
@@ -371,6 +371,7 @@ const { chunks } = await retrieveTextChunks(
   - [Embed Text](https://modelfusion.dev/guide/function/embed-text)
   - [Tokenize Text](https://modelfusion.dev/guide/function/tokenize-text)
   - [Transcribe Speech](https://modelfusion.dev/guide/function/transcribe-speech)
+  - [Synthesize Speech](https://modelfusion.dev/guide/function/synthesize-speech)
   - [Generate images](https://modelfusion.dev/guide/function/generate-image)
 - Summarize text
 - [Tools](https://modelfusion.dev/guide/tools)
@@ -389,18 +390,30 @@ const { chunks } = await retrieveTextChunks(
 ### Model Providers
-|                                                                                       | [OpenAI](https://modelfusion.dev/integration/model-provider/openai) | [Cohere](https://modelfusion.dev/integration/model-provider/cohere) | [Llama.cpp](https://modelfusion.dev/integration/model-provider/llamacpp) | [Hugging Face](https://modelfusion.dev/integration/model-provider/huggingface) | [Stability AI](https://modelfusion.dev/integration/model-provider/stability) | [Automatic1111](https://modelfusion.dev/integration/model-provider/automatic1111) |
-| ------------------------------------------------------------------------------------- | ------------------------------------------------------------------- | ------------------------------------------------------------------- | ------------------------------------------------------------------------ | ------------------------------------------------------------------------------ | ---------------------------------------------------------------------------- | --------------------------------------------------------------------------------- |
-| Hosting                                                                               | cloud                                                               | cloud                                                               | server (local)                                                           | cloud                                                                          | cloud                                                                        | server (local)                                                                    |
-| [Generate text](https://modelfusion.dev/guide/function/generate-text)                 | ✅                                                                  | ✅                                                                  | ✅                                                                       | ✅                                                                             |                                                                              |                                                                                   |
-| [Stream text](https://modelfusion.dev/guide/function/generate-text)                   | ✅                                                                  | ✅                                                                  | ✅                                                                       |                                                                                |                                                                              |                                                                                   |
-| [Generate JSON](https://modelfusion.dev/guide/function/generate-json)                 | chat models                                                         |                                                                     |                                                                          |                                                                                |                                                                              |                                                                                   |
-| [Generate JSON or Text](https://modelfusion.dev/guide/function/generate-json-or-text) | chat models                                                         |                                                                     |                                                                          |                                                                                |                                                                              |                                                                                   |
-| [Embed text](https://modelfusion.dev/guide/function/embed-text)                       | ✅                                                                  | ✅                                                                  | ✅                                                                       | ✅                                                                             |                                                                              |                                                                                   |
-| [Tokenize text](https://modelfusion.dev/guide/function/tokenize-text)                 | full                                                                | full                                                                | basic                                                                    |                                                                                |                                                                              |                                                                                   |
-| [Generate image](https://modelfusion.dev/guide/function/generate-image)               | ✅                                                                  |                                                                     |                                                                          |                                                                                | ✅                                                                           | ✅                                                                                |
-| [Transcribe speech](https://modelfusion.dev/guide/function/transcribe-speech)         | ✅                                                                  |                                                                     |                                                                          |                                                                                |                                                                              |                                                                                   |
-| [Cost calculation](https://modelfusion.dev/guide/run/cost-calculation)                | ✅                                                                  |                                                                     |                                                                          |                                                                                |                                                                              |                                                                                   |
+#### Text and JSON Generation
+|                                                                                       | [OpenAI](https://modelfusion.dev/integration/model-provider/openai) | [Cohere](https://modelfusion.dev/integration/model-provider/cohere) | [Llama.cpp](https://modelfusion.dev/integration/model-provider/llamacpp) | [Hugging Face](https://modelfusion.dev/integration/model-provider/huggingface) |
+| ------------------------------------------------------------------------------------- | ------------------------------------------------------------------- | ------------------------------------------------------------------- | ------------------------------------------------------------------------ | ------------------------------------------------------------------------------ |
+| [Generate text](https://modelfusion.dev/guide/function/generate-text)                 | ✅                                                                  | ✅                                                                  | ✅                                                                       | ✅                                                                             |
+| [Stream text](https://modelfusion.dev/guide/function/generate-text)                   | ✅                                                                  | ✅                                                                  | ✅                                                                       |                                                                                |
+| [Generate JSON](https://modelfusion.dev/guide/function/generate-json)                 | chat models                                                         |                                                                     |                                                                          |                                                                                |
+| [Generate JSON or Text](https://modelfusion.dev/guide/function/generate-json-or-text) | chat models                                                         |                                                                     |                                                                          |                                                                                |
+| [Embed text](https://modelfusion.dev/guide/function/embed-text)                       | ✅                                                                  | ✅                                                                  | ✅                                                                       | ✅                                                                             |
+| [Tokenize text](https://modelfusion.dev/guide/function/tokenize-text)                 | full                                                                | full                                                                | basic                                                                    |                                                                                |
+#### Image Generation
+- [OpenAI (Dall·E)](https://modelfusion.dev/integration/model-provider/openai)
+- [Stability AI](https://modelfusion.dev/integration/model-provider/stability)
+- [Automatic1111](https://modelfusion.dev/integration/model-provider/automatic1111)
+#### Speech Transcription
+- [OpenAI (Whisper)](https://modelfusion.dev/integration/model-provider/openai)
+#### Speech Synthesis
+- [Eleven Labs](https://modelfusion.dev/integration/model-provider/elevenlabs)
 ### Vector Indices

package/model-function/synthesize-speech/synthesizeSpeech.d.ts CHANGED Viewed

@@ -2,6 +2,9 @@
 import { FunctionOptions } from "../FunctionOptions.js";
 import { CallMetadata } from "../executeCall.js";
 import { SpeechSynthesisModel, SpeechSynthesisModelSettings } from "./SpeechSynthesisModel.js";
+/**
+ * Synthesizes speech from text.
+ */
 export declare function synthesizeSpeech<SETTINGS extends SpeechSynthesisModelSettings>(model: SpeechSynthesisModel<SETTINGS>, text: string, options: FunctionOptions<SETTINGS> & {
     fullResponse: true;
 }): Promise<{

package/model-provider/elevenlabs/ElevenLabsSpeechSynthesisModel.cjs CHANGED Viewed

@@ -44,6 +44,8 @@ class ElevenLabsSpeechSynthesisModel extends AbstractModel_js_1.AbstractModel {
                 apiKey: this.apiKey,
                 text,
                 voiceId: combinedSettings.voice,
+                modelId: combinedSettings.model,
+                voiceSettings: combinedSettings.voiceSettings,
             }),
         });
     }
@@ -61,7 +63,7 @@ exports.ElevenLabsSpeechSynthesisModel = ElevenLabsSpeechSynthesisModel;
 /**
  * @see https://api.elevenlabs.io/docs#/text-to-speech/Text_to_speech_v1_text_to_speech__voice_id__post
  */
-async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs.io/v1", abortSignal, apiKey, text, voiceId, }) {
+async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs.io/v1", abortSignal, apiKey, text, voiceId, modelId, voiceSettings, }) {
     return (0, postToApi_js_1.postJsonToApi)({
         url: `${baseUrl}/text-to-speech/${voiceId}`,
         headers: {
@@ -69,6 +71,15 @@ async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs
         },
         body: {
             text,
+            model_id: modelId,
+            voice_settings: voiceSettings != null
+                ? {
+                    stability: voiceSettings.stability,
+                    similarity_boost: voiceSettings.similarityBoost,
+                    style: voiceSettings.style,
+                    use_speaker_boost: voiceSettings.useSpeakerBoost,
+                }
+                : undefined,
         },
         failedResponseHandler: ElevenLabsError_js_1.failedElevenLabsCallResponseHandler,
         successfulResponseHandler: (0, postToApi_js_1.createAudioMpegResponseHandler)(),

package/model-provider/elevenlabs/ElevenLabsSpeechSynthesisModel.d.ts CHANGED Viewed

@@ -8,6 +8,13 @@ export interface ElevenLabsSpeechSynthesisModelSettings extends SpeechSynthesisM
     voice: string;
     baseUrl?: string;
     apiKey?: string;
+    model?: string;
+    voiceSettings?: {
+        stability: number;
+        similarityBoost: number;
+        style?: number;
+        useSpeakerBoost?: boolean;
+    };
     retry?: RetryFunction;
     throttle?: ThrottleFunction;
 }

package/model-provider/elevenlabs/ElevenLabsSpeechSynthesisModel.js CHANGED Viewed

@@ -41,6 +41,8 @@ export class ElevenLabsSpeechSynthesisModel extends AbstractModel {
                 apiKey: this.apiKey,
                 text,
                 voiceId: combinedSettings.voice,
+                modelId: combinedSettings.model,
+                voiceSettings: combinedSettings.voiceSettings,
             }),
         });
     }
@@ -57,7 +59,7 @@ export class ElevenLabsSpeechSynthesisModel extends AbstractModel {
 /**
  * @see https://api.elevenlabs.io/docs#/text-to-speech/Text_to_speech_v1_text_to_speech__voice_id__post
  */
-async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs.io/v1", abortSignal, apiKey, text, voiceId, }) {
+async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs.io/v1", abortSignal, apiKey, text, voiceId, modelId, voiceSettings, }) {
     return postJsonToApi({
         url: `${baseUrl}/text-to-speech/${voiceId}`,
         headers: {
@@ -65,6 +67,15 @@ async function callElevenLabsTextToSpeechAPI({ baseUrl = "https://api.elevenlabs
         },
         body: {
             text,
+            model_id: modelId,
+            voice_settings: voiceSettings != null
+                ? {
+                    stability: voiceSettings.stability,
+                    similarity_boost: voiceSettings.similarityBoost,
+                    style: voiceSettings.style,
+                    use_speaker_boost: voiceSettings.useSpeakerBoost,
+                }
+                : undefined,
         },
         failedResponseHandler: failedElevenLabsCallResponseHandler,
         successfulResponseHandler: createAudioMpegResponseHandler(),

package/model-provider/openai/OpenAITextGenerationModel.cjs CHANGED Viewed

@@ -20,6 +20,14 @@ const TikTokenTokenizer_js_1 = require("./TikTokenTokenizer.cjs");
  * @see https://openai.com/pricing
  */
 exports.OPENAI_TEXT_GENERATION_MODELS = {
+    "davinci-002": {
+        contextWindowSize: 16384,
+        tokenCostInMillicents: 0.2,
+    },
+    "babbage-002": {
+        contextWindowSize: 16384,
+        tokenCostInMillicents: 0.04,
+    },
     "text-davinci-003": {
         contextWindowSize: 4096,
         tokenCostInMillicents: 2,

package/model-provider/openai/OpenAITextGenerationModel.d.ts CHANGED Viewed

@@ -16,6 +16,14 @@ import { TikTokenTokenizer } from "./TikTokenTokenizer.js";
  * @see https://openai.com/pricing
  */
 export declare const OPENAI_TEXT_GENERATION_MODELS: {
+    "davinci-002": {
+        contextWindowSize: number;
+        tokenCostInMillicents: number;
+    };
+    "babbage-002": {
+        contextWindowSize: number;
+        tokenCostInMillicents: number;
+    };
     "text-davinci-003": {
         contextWindowSize: number;
         tokenCostInMillicents: number;
@@ -58,7 +66,7 @@ export declare const OPENAI_TEXT_GENERATION_MODELS: {
     };
 };
 export type OpenAITextGenerationModelType = keyof typeof OPENAI_TEXT_GENERATION_MODELS;
-export declare const isOpenAITextGenerationModel: (model: string) => model is "text-davinci-003" | "text-davinci-002" | "code-davinci-002" | "davinci" | "text-curie-001" | "curie" | "text-babbage-001" | "babbage" | "text-ada-001" | "ada";
+export declare const isOpenAITextGenerationModel: (model: string) => model is "davinci-002" | "babbage-002" | "text-davinci-003" | "text-davinci-002" | "code-davinci-002" | "davinci" | "text-curie-001" | "curie" | "text-babbage-001" | "babbage" | "text-ada-001" | "ada";
 export declare const calculateOpenAITextGenerationCostInMillicents: ({ model, response, }: {
     model: OpenAITextGenerationModelType;
     response: OpenAITextGenerationResponse;
@@ -102,7 +110,7 @@ export interface OpenAITextGenerationModelSettings extends TextGenerationModelSe
 export declare class OpenAITextGenerationModel extends AbstractModel<OpenAITextGenerationModelSettings> implements TextGenerationModel<string, OpenAITextGenerationResponse, OpenAITextGenerationDelta, OpenAITextGenerationModelSettings> {
     constructor(settings: OpenAITextGenerationModelSettings);
     readonly provider: "openai";
-    get modelName(): "text-davinci-003" | "text-davinci-002" | "code-davinci-002" | "davinci" | "text-curie-001" | "curie" | "text-babbage-001" | "babbage" | "text-ada-001" | "ada";
+    get modelName(): "davinci-002" | "babbage-002" | "text-davinci-003" | "text-davinci-002" | "code-davinci-002" | "davinci" | "text-curie-001" | "curie" | "text-babbage-001" | "babbage" | "text-ada-001" | "ada";
     readonly contextWindowSize: number;
     readonly tokenizer: TikTokenTokenizer;
     private get apiKey();

package/model-provider/openai/OpenAITextGenerationModel.js CHANGED Viewed

@@ -14,6 +14,14 @@ import { TikTokenTokenizer } from "./TikTokenTokenizer.js";
  * @see https://openai.com/pricing
  */
 export const OPENAI_TEXT_GENERATION_MODELS = {
+    "davinci-002": {
+        contextWindowSize: 16384,
+        tokenCostInMillicents: 0.2,
+    },
+    "babbage-002": {
+        contextWindowSize: 16384,
+        tokenCostInMillicents: 0.04,
+    },
     "text-davinci-003": {
         contextWindowSize: 4096,
         tokenCostInMillicents: 2,

package/model-provider/openai/TikTokenTokenizer.cjs CHANGED Viewed

@@ -57,13 +57,17 @@ function getEncodingNameForModel(model) {
         case "text-davinci-003": {
             return "p50k_base";
         }
+        case "babbage-002":
+        case "davinci-002":
         case "ada":
         case "babbage":
         case "curie":
         case "davinci":
         case "text-ada-001":
         case "text-babbage-001":
-        case "text-curie-001":
+        case "text-curie-001": {
+            return "r50k_base";
+        }
         case "gpt-3.5-turbo":
         case "gpt-3.5-turbo-0301":
         case "gpt-3.5-turbo-0613":

package/model-provider/openai/TikTokenTokenizer.js CHANGED Viewed

@@ -53,13 +53,17 @@ function getEncodingNameForModel(model) {
         case "text-davinci-003": {
             return "p50k_base";
         }
+        case "babbage-002":
+        case "davinci-002":
         case "ada":
         case "babbage":
         case "curie":
         case "davinci":
         case "text-ada-001":
         case "text-babbage-001":
-        case "text-curie-001":
+        case "text-curie-001": {
+            return "r50k_base";
+        }
         case "gpt-3.5-turbo":
         case "gpt-3.5-turbo-0301":
         case "gpt-3.5-turbo-0613":

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "modelfusion",
   "description": "Build AI applications, chatbots, and agents with JavaScript and TypeScript.",
-  "version": "0.17.0",
+  "version": "0.19.0",
   "author": "Lars Grammel",
   "license": "MIT",
   "keywords": [