langchain 0.0.176 → 0.0.178

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (84)
  1. package/chat_models/iflytek_xinghuo/web.cjs +1 -0
  2. package/chat_models/iflytek_xinghuo/web.d.ts +1 -0
  3. package/chat_models/iflytek_xinghuo/web.js +1 -0
  4. package/chat_models/iflytek_xinghuo.cjs +1 -0
  5. package/chat_models/iflytek_xinghuo.d.ts +1 -0
  6. package/chat_models/iflytek_xinghuo.js +1 -0
  7. package/dist/chat_models/bedrock.cjs +25 -4
  8. package/dist/chat_models/bedrock.d.ts +2 -1
  9. package/dist/chat_models/bedrock.js +25 -4
  10. package/dist/chat_models/cloudflare_workersai.cjs +70 -24
  11. package/dist/chat_models/cloudflare_workersai.d.ts +6 -2
  12. package/dist/chat_models/cloudflare_workersai.js +71 -25
  13. package/dist/chat_models/iflytek_xinghuo/common.cjs +335 -0
  14. package/dist/chat_models/iflytek_xinghuo/common.d.ts +165 -0
  15. package/dist/chat_models/iflytek_xinghuo/common.js +331 -0
  16. package/dist/chat_models/iflytek_xinghuo/index.cjs +35 -0
  17. package/dist/chat_models/iflytek_xinghuo/index.d.ts +5 -0
  18. package/dist/chat_models/iflytek_xinghuo/index.js +28 -0
  19. package/dist/chat_models/iflytek_xinghuo/web.cjs +30 -0
  20. package/dist/chat_models/iflytek_xinghuo/web.d.ts +5 -0
  21. package/dist/chat_models/iflytek_xinghuo/web.js +26 -0
  22. package/dist/chat_models/llama_cpp.cjs +31 -79
  23. package/dist/chat_models/llama_cpp.d.ts +15 -58
  24. package/dist/chat_models/llama_cpp.js +32 -80
  25. package/dist/chat_models/openai.cjs +91 -6
  26. package/dist/chat_models/openai.d.ts +10 -0
  27. package/dist/chat_models/openai.js +91 -6
  28. package/dist/embeddings/hf.cjs +10 -1
  29. package/dist/embeddings/hf.d.ts +4 -2
  30. package/dist/embeddings/hf.js +10 -1
  31. package/dist/embeddings/llama_cpp.cjs +67 -0
  32. package/dist/embeddings/llama_cpp.d.ts +26 -0
  33. package/dist/embeddings/llama_cpp.js +63 -0
  34. package/dist/embeddings/ollama.cjs +7 -1
  35. package/dist/embeddings/ollama.js +7 -1
  36. package/dist/graphs/neo4j_graph.cjs +36 -5
  37. package/dist/graphs/neo4j_graph.js +14 -3
  38. package/dist/llms/bedrock.cjs +25 -3
  39. package/dist/llms/bedrock.d.ts +2 -1
  40. package/dist/llms/bedrock.js +25 -3
  41. package/dist/llms/cloudflare_workersai.cjs +59 -13
  42. package/dist/llms/cloudflare_workersai.d.ts +9 -3
  43. package/dist/llms/cloudflare_workersai.js +59 -13
  44. package/dist/llms/hf.cjs +10 -1
  45. package/dist/llms/hf.d.ts +3 -0
  46. package/dist/llms/hf.js +10 -1
  47. package/dist/llms/llama_cpp.cjs +25 -65
  48. package/dist/llms/llama_cpp.d.ts +7 -43
  49. package/dist/llms/llama_cpp.js +25 -65
  50. package/dist/load/import_constants.cjs +3 -0
  51. package/dist/load/import_constants.js +3 -0
  52. package/dist/prompts/chat.cjs +8 -0
  53. package/dist/prompts/chat.d.ts +5 -0
  54. package/dist/prompts/chat.js +8 -0
  55. package/dist/prompts/few_shot.cjs +162 -1
  56. package/dist/prompts/few_shot.d.ts +90 -2
  57. package/dist/prompts/few_shot.js +160 -0
  58. package/dist/prompts/index.cjs +2 -1
  59. package/dist/prompts/index.d.ts +1 -1
  60. package/dist/prompts/index.js +1 -1
  61. package/dist/retrievers/zep.cjs +26 -3
  62. package/dist/retrievers/zep.d.ts +11 -2
  63. package/dist/retrievers/zep.js +26 -3
  64. package/dist/util/bedrock.d.ts +2 -0
  65. package/dist/util/event-source-parse.cjs +20 -1
  66. package/dist/util/event-source-parse.d.ts +2 -0
  67. package/dist/util/event-source-parse.js +18 -0
  68. package/dist/util/iflytek_websocket_stream.cjs +81 -0
  69. package/dist/util/iflytek_websocket_stream.d.ts +27 -0
  70. package/dist/util/iflytek_websocket_stream.js +77 -0
  71. package/dist/util/llama_cpp.cjs +34 -0
  72. package/dist/util/llama_cpp.d.ts +46 -0
  73. package/dist/util/llama_cpp.js +28 -0
  74. package/dist/util/openai-format-fndef.cjs +81 -0
  75. package/dist/util/openai-format-fndef.d.ts +44 -0
  76. package/dist/util/openai-format-fndef.js +77 -0
  77. package/dist/util/openapi.d.ts +2 -2
  78. package/dist/vectorstores/pinecone.cjs +5 -5
  79. package/dist/vectorstores/pinecone.d.ts +2 -2
  80. package/dist/vectorstores/pinecone.js +5 -5
  81. package/embeddings/llama_cpp.cjs +1 -0
  82. package/embeddings/llama_cpp.d.ts +1 -0
  83. package/embeddings/llama_cpp.js +1 -0
  84. package/package.json +34 -5
package/dist/embeddings/hf.js
@@ -21,6 +21,12 @@ export class HuggingFaceInferenceEmbeddings extends Embeddings {
             writable: true,
             value: void 0
         });
+        Object.defineProperty(this, "endpointUrl", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: void 0
+        });
         Object.defineProperty(this, "client", {
             enumerable: true,
             configurable: true,
@@ -31,7 +37,10 @@ export class HuggingFaceInferenceEmbeddings extends Embeddings {
             fields?.model ?? "sentence-transformers/distilbert-base-nli-mean-tokens";
         this.apiKey =
             fields?.apiKey ?? getEnvironmentVariable("HUGGINGFACEHUB_API_KEY");
-        this.client = new HfInference(this.apiKey);
+        this.endpointUrl = fields?.endpointUrl;
+        this.client = this.endpointUrl
+            ? new HfInference(this.apiKey).endpoint(this.endpointUrl)
+            : new HfInference(this.apiKey);
     }
     async _embed(texts) {
         // replace newlines, which can negatively affect performance.
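The new endpointUrl option routes embedding requests to a dedicated Hugging Face Inference Endpoint instead of the hosted Inference API. A minimal usage sketch, assuming the standard "langchain/embeddings/hf" entrypoint; the endpoint URL below is a placeholder, not a value from this diff:

import { HuggingFaceInferenceEmbeddings } from "langchain/embeddings/hf";

// Hosted Inference API (unchanged behavior), keyed by HUGGINGFACEHUB_API_KEY.
const hosted = new HuggingFaceInferenceEmbeddings({
  model: "sentence-transformers/distilbert-base-nli-mean-tokens",
});

// New in this release: target a dedicated Inference Endpoint.
const dedicated = new HuggingFaceInferenceEmbeddings({
  apiKey: process.env.HUGGINGFACEHUB_API_KEY,
  endpointUrl: "https://example.endpoints.huggingface.cloud", // placeholder URL
});

const vectors = await dedicated.embedDocuments(["hello world"]);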
package/dist/embeddings/llama_cpp.cjs
@@ -0,0 +1,67 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.LlamaCppEmbeddings = void 0;
+const llama_cpp_js_1 = require("../util/llama_cpp.cjs");
+const base_js_1 = require("./base.cjs");
+class LlamaCppEmbeddings extends base_js_1.Embeddings {
+    constructor(inputs) {
+        super(inputs);
+        Object.defineProperty(this, "_model", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: void 0
+        });
+        Object.defineProperty(this, "_context", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: void 0
+        });
+        const _inputs = inputs;
+        _inputs.embedding = true;
+        this._model = (0, llama_cpp_js_1.createLlamaModel)(_inputs);
+        this._context = (0, llama_cpp_js_1.createLlamaContext)(this._model, _inputs);
+    }
+    /**
+     * Generates embeddings for an array of texts.
+     * @param texts - An array of strings to generate embeddings for.
+     * @returns A Promise that resolves to an array of embeddings.
+     */
+    async embedDocuments(texts) {
+        const tokensArray = [];
+        for (const text of texts) {
+            const encodings = await this.caller.call(() => new Promise((resolve) => {
+                resolve(this._context.encode(text));
+            }));
+            tokensArray.push(encodings);
+        }
+        const embeddings = [];
+        for (const tokens of tokensArray) {
+            const embedArray = [];
+            for (let i = 0; i < tokens.length; i += 1) {
+                const nToken = +tokens[i];
+                embedArray.push(nToken);
+            }
+            embeddings.push(embedArray);
+        }
+        return embeddings;
+    }
+    /**
+     * Generates an embedding for a single text.
+     * @param text - A string to generate an embedding for.
+     * @returns A Promise that resolves to an array of numbers representing the embedding.
+     */
+    async embedQuery(text) {
+        const tokens = [];
+        const encodings = await this.caller.call(() => new Promise((resolve) => {
+            resolve(this._context.encode(text));
+        }));
+        for (let i = 0; i < encodings.length; i += 1) {
+            const token = +encodings[i];
+            tokens.push(token);
+        }
+        return tokens;
+    }
+}
+exports.LlamaCppEmbeddings = LlamaCppEmbeddings;
package/dist/embeddings/llama_cpp.d.ts
@@ -0,0 +1,26 @@
+import { LlamaModel, LlamaContext } from "node-llama-cpp";
+import { LlamaBaseCppInputs } from "../util/llama_cpp.js";
+import { Embeddings, EmbeddingsParams } from "./base.js";
+/**
+ * Note that the modelPath is the only required parameter. For testing you
+ * can set this in the environment variable `LLAMA_PATH`.
+ */
+export interface LlamaCppEmbeddingsParams extends LlamaBaseCppInputs, EmbeddingsParams {
+}
+export declare class LlamaCppEmbeddings extends Embeddings {
+    _model: LlamaModel;
+    _context: LlamaContext;
+    constructor(inputs: LlamaCppEmbeddingsParams);
+    /**
+     * Generates embeddings for an array of texts.
+     * @param texts - An array of strings to generate embeddings for.
+     * @returns A Promise that resolves to an array of embeddings.
+     */
+    embedDocuments(texts: string[]): Promise<number[][]>;
+    /**
+     * Generates an embedding for a single text.
+     * @param text - A string to generate an embedding for.
+     * @returns A Promise that resolves to an array of numbers representing the embedding.
+     */
+    embedQuery(text: string): Promise<number[]>;
+}
package/dist/embeddings/llama_cpp.js
@@ -0,0 +1,63 @@
+import { createLlamaModel, createLlamaContext, } from "../util/llama_cpp.js";
+import { Embeddings } from "./base.js";
+export class LlamaCppEmbeddings extends Embeddings {
+    constructor(inputs) {
+        super(inputs);
+        Object.defineProperty(this, "_model", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: void 0
+        });
+        Object.defineProperty(this, "_context", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: void 0
+        });
+        const _inputs = inputs;
+        _inputs.embedding = true;
+        this._model = createLlamaModel(_inputs);
+        this._context = createLlamaContext(this._model, _inputs);
+    }
+    /**
+     * Generates embeddings for an array of texts.
+     * @param texts - An array of strings to generate embeddings for.
+     * @returns A Promise that resolves to an array of embeddings.
+     */
+    async embedDocuments(texts) {
+        const tokensArray = [];
+        for (const text of texts) {
+            const encodings = await this.caller.call(() => new Promise((resolve) => {
+                resolve(this._context.encode(text));
+            }));
+            tokensArray.push(encodings);
+        }
+        const embeddings = [];
+        for (const tokens of tokensArray) {
+            const embedArray = [];
+            for (let i = 0; i < tokens.length; i += 1) {
+                const nToken = +tokens[i];
+                embedArray.push(nToken);
+            }
+            embeddings.push(embedArray);
+        }
+        return embeddings;
+    }
+    /**
+     * Generates an embedding for a single text.
+     * @param text - A string to generate an embedding for.
+     * @returns A Promise that resolves to an array of numbers representing the embedding.
+     */
+    async embedQuery(text) {
+        const tokens = [];
+        const encodings = await this.caller.call(() => new Promise((resolve) => {
+            resolve(this._context.encode(text));
+        }));
+        for (let i = 0; i < encodings.length; i += 1) {
+            const token = +encodings[i];
+            tokens.push(token);
+        }
+        return tokens;
+    }
+}
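Together these three files add a LlamaCppEmbeddings class (CJS build, type declarations, and ESM build) exposed through the new langchain/embeddings/llama_cpp entrypoint listed above. Note that in this initial version embedDocuments and embedQuery return the token encodings produced by the node-llama-cpp context rather than dense hidden-state vectors. A usage sketch, assuming that entrypoint; the model path is a placeholder:

import { LlamaCppEmbeddings } from "langchain/embeddings/llama_cpp";

// modelPath is the only required field; the d.ts comment suggests LLAMA_PATH for testing.
const embeddings = new LlamaCppEmbeddings({
  modelPath: process.env.LLAMA_PATH ?? "/path/to/local-model.bin", // placeholder path
});

const queryVector = await embeddings.embedQuery("Where is Paris?");
const docVectors = await embeddings.embedDocuments(["Paris is in France."]);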
package/dist/embeddings/ollama.cjs
@@ -81,7 +81,13 @@ class OllamaEmbeddings extends base_js_1.Embeddings {
     }
     async _request(prompt) {
         const { model, baseUrl, requestOptions } = this;
-        const response = await fetch(`${baseUrl}/api/embeddings`, {
+        let formattedBaseUrl = baseUrl;
+        if (formattedBaseUrl.startsWith("http://localhost:")) {
+            // Node 18 has issues with resolving "localhost"
+            // See https://github.com/node-fetch/node-fetch/issues/1624
+            formattedBaseUrl = formattedBaseUrl.replace("http://localhost:", "http://127.0.0.1:");
+        }
+        const response = await fetch(`${formattedBaseUrl}/api/embeddings`, {
             method: "POST",
             headers: { "Content-Type": "application/json" },
             body: JSON.stringify({
package/dist/embeddings/ollama.js
@@ -78,7 +78,13 @@ export class OllamaEmbeddings extends Embeddings {
     }
     async _request(prompt) {
         const { model, baseUrl, requestOptions } = this;
-        const response = await fetch(`${baseUrl}/api/embeddings`, {
+        let formattedBaseUrl = baseUrl;
+        if (formattedBaseUrl.startsWith("http://localhost:")) {
+            // Node 18 has issues with resolving "localhost"
+            // See https://github.com/node-fetch/node-fetch/issues/1624
+            formattedBaseUrl = formattedBaseUrl.replace("http://localhost:", "http://127.0.0.1:");
+        }
+        const response = await fetch(`${formattedBaseUrl}/api/embeddings`, {
             method: "POST",
             headers: { "Content-Type": "application/json" },
             body: JSON.stringify({
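Both Ollama embeddings builds now rewrite http://localhost: to http://127.0.0.1: before issuing the fetch, working around the Node 18 localhost resolution issue referenced above. Existing configurations keep working; a sketch assuming the langchain/embeddings/ollama entrypoint, with a placeholder model name:

import { OllamaEmbeddings } from "langchain/embeddings/ollama";

// A baseUrl of http://localhost:11434 is now requested as http://127.0.0.1:11434 under the hood.
const embeddings = new OllamaEmbeddings({
  model: "llama2", // placeholder model name
  baseUrl: "http://localhost:11434",
});

const vector = await embeddings.embedQuery("hello");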
package/dist/graphs/neo4j_graph.cjs
@@ -1,10 +1,30 @@
 "use strict";
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+var __importStar = (this && this.__importStar) || function (mod) {
+    if (mod && mod.__esModule) return mod;
+    var result = {};
+    if (mod != null) for (var k in mod) if (k !== "default" && Object.prototype.hasOwnProperty.call(mod, k)) __createBinding(result, mod, k);
+    __setModuleDefault(result, mod);
+    return result;
 };
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.Neo4jGraph = void 0;
-const neo4j_driver_1 = __importDefault(require("neo4j-driver"));
+const neo4j_driver_1 = __importStar(require("neo4j-driver"));
 /**
  * @security *Security note*: Make sure that the database connection uses credentials
  * that are narrowly-scoped to only include necessary permissions.
@@ -61,7 +81,12 @@ class Neo4jGraph {
         // eslint-disable-next-line @typescript-eslint/no-explicit-any
         }
         catch (error) {
-            throw new Error(`Error: ${error.message}`);
+            const message = [
+                "Could not use APOC procedures.",
+                "Please ensure the APOC plugin is installed in Neo4j and that",
+                "'apoc.meta.data()' is allowed in Neo4j configuration",
+            ].join("\n");
+            throw new Error(message);
         }
         finally {
             console.log("Schema refreshed successfully.");
@@ -78,9 +103,15 @@ class Neo4jGraph {
                 database: this.database,
             });
             return toObjects(result.records);
+            // eslint-disable-next-line @typescript-eslint/no-explicit-any
         }
         catch (error) {
-            // ignore errors
+            if (
+            // eslint-disable-next-line
+            error instanceof neo4j_driver_1.Neo4jError &&
+                error.code === "Neo.ClientError.Procedure.ProcedureNotFound") {
+                throw new Error("Procedure not found in Neo4j.");
+            }
         }
         return undefined;
     }
package/dist/graphs/neo4j_graph.js
@@ -1,4 +1,4 @@
-import neo4j from "neo4j-driver";
+import neo4j, { Neo4jError } from "neo4j-driver";
 /**
  * @security *Security note*: Make sure that the database connection uses credentials
  * that are narrowly-scoped to only include necessary permissions.
@@ -55,7 +55,12 @@ export class Neo4jGraph {
         // eslint-disable-next-line @typescript-eslint/no-explicit-any
         }
         catch (error) {
-            throw new Error(`Error: ${error.message}`);
+            const message = [
+                "Could not use APOC procedures.",
+                "Please ensure the APOC plugin is installed in Neo4j and that",
+                "'apoc.meta.data()' is allowed in Neo4j configuration",
+            ].join("\n");
+            throw new Error(message);
         }
         finally {
             console.log("Schema refreshed successfully.");
@@ -72,9 +77,15 @@ export class Neo4jGraph {
                 database: this.database,
             });
             return toObjects(result.records);
+            // eslint-disable-next-line @typescript-eslint/no-explicit-any
         }
         catch (error) {
-            // ignore errors
+            if (
+            // eslint-disable-next-line
+            error instanceof Neo4jError &&
+                error.code === "Neo.ClientError.Procedure.ProcedureNotFound") {
+                throw new Error("Procedure not found in Neo4j.");
+            }
         }
         return undefined;
     }
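The Neo4jGraph changes replace silent or generic failures with actionable errors: a failed apoc.meta.data() call during schema refresh now explains that APOC must be installed and allowed, and a Neo.ClientError.Procedure.ProcedureNotFound error from query() is rethrown as "Procedure not found in Neo4j." instead of being swallowed. Roughly how this surfaces to callers, as a sketch assuming the class's existing initialize/refreshSchema/query methods; the connection details are placeholders:

import { Neo4jGraph } from "langchain/graphs/neo4j_graph";

const graph = await Neo4jGraph.initialize({
  url: "bolt://localhost:7687", // placeholder connection details
  username: "neo4j",
  password: "password",
});

try {
  // refreshSchema() runs apoc.meta.data(); without APOC it now throws the
  // descriptive "Could not use APOC procedures." message instead of a generic error.
  await graph.refreshSchema();
} catch (e) {
  console.error(e);
}

// query() now rethrows ProcedureNotFound instead of silently returning undefined.
const rows = await graph.query("CALL db.labels()");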
package/dist/llms/bedrock.cjs
@@ -92,6 +92,12 @@ class Bedrock extends base_js_1.LLM {
             writable: true,
             value: new eventstream_codec_1.EventStreamCodec(util_utf8_1.toUtf8, util_utf8_1.fromUtf8)
         });
+        Object.defineProperty(this, "streaming", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: false
+        });
         this.model = fields?.model ?? this.model;
         const allowedModels = ["ai21", "anthropic", "amazon"];
         if (!allowedModels.includes(this.model.split(".")[0])) {
@@ -109,6 +115,7 @@ class Bedrock extends base_js_1.LLM {
         this.endpointHost = fields?.endpointHost ?? fields?.endpointUrl;
         this.stopSequences = fields?.stopSequences;
         this.modelKwargs = fields?.modelKwargs;
+        this.streaming = fields?.streaming ?? this.streaming;
     }
     /** Call out to Bedrock service model.
       Arguments:
@@ -120,10 +127,23 @@ class Bedrock extends base_js_1.LLM {
       Example:
        response = model.call("Tell me a joke.")
     */
-    async _call(prompt, options) {
+    async _call(prompt, options, runManager) {
         const service = "bedrock-runtime";
         const endpointHost = this.endpointHost ?? `${service}.${this.region}.amazonaws.com`;
         const provider = this.model.split(".")[0];
+        if (this.streaming) {
+            const stream = this._streamResponseChunks(prompt, options, runManager);
+            let finalResult;
+            for await (const chunk of stream) {
+                if (finalResult === undefined) {
+                    finalResult = chunk;
+                }
+                else {
+                    finalResult = finalResult.concat(chunk);
+                }
+            }
+            return finalResult?.text ?? "";
+        }
         const response = await this._signedFetch(prompt, options, {
             bedrockMethod: "invoke",
             endpointHost,
@@ -204,7 +224,8 @@ class Bedrock extends base_js_1.LLM {
                 text,
                 generationInfo: {},
             });
-            await runManager?.handleLLMNewToken(text);
+            // eslint-disable-next-line no-void
+            void runManager?.handleLLMNewToken(text);
         }
     }
 }
@@ -215,7 +236,8 @@ class Bedrock extends base_js_1.LLM {
                 text,
                 generationInfo: {},
             });
-            await runManager?.handleLLMNewToken(text);
+            // eslint-disable-next-line no-void
+            void runManager?.handleLLMNewToken(text);
         }
     }
     // eslint-disable-next-line @typescript-eslint/no-explicit-any
package/dist/llms/bedrock.d.ts
@@ -23,6 +23,7 @@ export declare class Bedrock extends LLM implements BaseBedrockInput {
     stopSequences?: string[];
     modelKwargs?: Record<string, unknown>;
     codec: EventStreamCodec;
+    streaming: boolean;
     get lc_secrets(): {
         [key: string]: string;
     } | undefined;
@@ -39,7 +40,7 @@ export declare class Bedrock extends LLM implements BaseBedrockInput {
       Example:
        response = model.call("Tell me a joke.")
     */
-    _call(prompt: string, options: this["ParsedCallOptions"]): Promise<string>;
+    _call(prompt: string, options: this["ParsedCallOptions"], runManager?: CallbackManagerForLLMRun): Promise<string>;
     _signedFetch(prompt: string, options: this["ParsedCallOptions"], fields: {
         bedrockMethod: "invoke" | "invoke-with-response-stream";
         endpointHost: string;
package/dist/llms/bedrock.js
@@ -89,6 +89,12 @@ export class Bedrock extends LLM {
             writable: true,
             value: new EventStreamCodec(toUtf8, fromUtf8)
         });
+        Object.defineProperty(this, "streaming", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: false
+        });
         this.model = fields?.model ?? this.model;
         const allowedModels = ["ai21", "anthropic", "amazon"];
         if (!allowedModels.includes(this.model.split(".")[0])) {
@@ -106,6 +112,7 @@ export class Bedrock extends LLM {
         this.endpointHost = fields?.endpointHost ?? fields?.endpointUrl;
         this.stopSequences = fields?.stopSequences;
         this.modelKwargs = fields?.modelKwargs;
+        this.streaming = fields?.streaming ?? this.streaming;
     }
     /** Call out to Bedrock service model.
       Arguments:
@@ -117,10 +124,23 @@ export class Bedrock extends LLM {
       Example:
        response = model.call("Tell me a joke.")
     */
-    async _call(prompt, options) {
+    async _call(prompt, options, runManager) {
         const service = "bedrock-runtime";
         const endpointHost = this.endpointHost ?? `${service}.${this.region}.amazonaws.com`;
         const provider = this.model.split(".")[0];
+        if (this.streaming) {
+            const stream = this._streamResponseChunks(prompt, options, runManager);
+            let finalResult;
+            for await (const chunk of stream) {
+                if (finalResult === undefined) {
+                    finalResult = chunk;
+                }
+                else {
+                    finalResult = finalResult.concat(chunk);
+                }
+            }
+            return finalResult?.text ?? "";
+        }
         const response = await this._signedFetch(prompt, options, {
             bedrockMethod: "invoke",
             endpointHost,
@@ -201,7 +221,8 @@ export class Bedrock extends LLM {
                 text,
                 generationInfo: {},
             });
-            await runManager?.handleLLMNewToken(text);
+            // eslint-disable-next-line no-void
+            void runManager?.handleLLMNewToken(text);
         }
     }
 }
@@ -212,7 +233,8 @@ export class Bedrock extends LLM {
                 text,
                 generationInfo: {},
            });
-            await runManager?.handleLLMNewToken(text);
+            // eslint-disable-next-line no-void
+            void runManager?.handleLLMNewToken(text);
         }
     }
     // eslint-disable-next-line @typescript-eslint/no-explicit-any
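The Bedrock LLM now accepts a streaming flag; when set, _call drains _streamResponseChunks and still resolves to the full concatenated text, while tokens are pushed to handleLLMNewToken as they arrive. A hedged usage sketch; the model id and region are placeholders, credential setup is omitted, and passing callbacks in the call options is an assumption about the surrounding API, not something this diff adds:

import { Bedrock } from "langchain/llms/bedrock";

const model = new Bedrock({
  model: "anthropic.claude-v2", // provider prefix must be ai21, anthropic, or amazon
  region: "us-east-1",
  streaming: true,
});

// Tokens stream through the callback; the awaited result is still the whole completion.
const text = await model.call("Tell me a joke.", {
  callbacks: [{ handleLLMNewToken: (token: string) => process.stdout.write(token) }],
});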
package/dist/llms/cloudflare_workersai.cjs
@@ -3,6 +3,8 @@ Object.defineProperty(exports, "__esModule", { value: true });
 exports.CloudflareWorkersAI = void 0;
 const base_js_1 = require("./base.cjs");
 const env_js_1 = require("../util/env.cjs");
+const index_js_1 = require("../schema/index.cjs");
+const event_source_parse_js_1 = require("../util/event-source-parse.cjs");
 /**
  * Class representing the CloudflareWorkersAI language model. It extends the LLM (Large
  * Language Model) class, providing a standard interface for interacting
@@ -38,6 +40,12 @@ class CloudflareWorkersAI extends base_js_1.LLM {
             writable: true,
             value: void 0
         });
+        Object.defineProperty(this, "streaming", {
+            enumerable: true,
+            configurable: true,
+            writable: true,
+            value: false
+        });
         Object.defineProperty(this, "lc_serializable", {
             enumerable: true,
             configurable: true,
@@ -45,6 +53,7 @@ class CloudflareWorkersAI extends base_js_1.LLM {
             value: true
         });
         this.model = fields?.model ?? this.model;
+        this.streaming = fields?.streaming ?? this.streaming;
         this.cloudflareAccountId =
             fields?.cloudflareAccountId ??
                 (0, env_js_1.getEnvironmentVariable)("CLOUDFLARE_ACCOUNT_ID");
@@ -87,23 +96,15 @@ class CloudflareWorkersAI extends base_js_1.LLM {
     _llmType() {
         return "cloudflare";
     }
-    /** Call out to CloudflareWorkersAI's complete endpoint.
-      Args:
-        prompt: The prompt to pass into the model.
-      Returns:
-        The string generated by the model.
-      Example:
-        let response = CloudflareWorkersAI.call("Tell me a joke.");
-    */
-    async _call(prompt, options) {
+    async _request(prompt, options, stream) {
         this.validateEnvironment();
         const url = `${this.baseUrl}/${this.model}`;
         const headers = {
             Authorization: `Bearer ${this.cloudflareApiToken}`,
             "Content-Type": "application/json",
         };
-        const data = { prompt };
-        const responseData = await this.caller.call(async () => {
+        const data = { prompt, stream };
+        return this.caller.call(async () => {
            const response = await fetch(url, {
                method: "POST",
                headers,
@@ -116,9 +117,54 @@
                error.response = response;
                throw error;
            }
-            return response.json();
+            return response;
        });
-        return responseData.result.response;
+    }
+    async *_streamResponseChunks(prompt, options, runManager) {
+        const response = await this._request(prompt, options, true);
+        if (!response.body) {
+            throw new Error("Empty response from Cloudflare. Please try again.");
+        }
+        const stream = (0, event_source_parse_js_1.convertEventStreamToIterableReadableDataStream)(response.body);
+        for await (const chunk of stream) {
+            if (chunk !== "[DONE]") {
+                const parsedChunk = JSON.parse(chunk);
+                const generationChunk = new index_js_1.GenerationChunk({
+                    text: parsedChunk.response,
+                });
+                yield generationChunk;
+                // eslint-disable-next-line no-void
+                void runManager?.handleLLMNewToken(generationChunk.text ?? "");
+            }
+        }
+    }
+    /** Call out to CloudflareWorkersAI's complete endpoint.
+      Args:
+        prompt: The prompt to pass into the model.
+      Returns:
+        The string generated by the model.
+      Example:
+        let response = CloudflareWorkersAI.call("Tell me a joke.");
+    */
+    async _call(prompt, options, runManager) {
+        if (!this.streaming) {
+            const response = await this._request(prompt, options);
+            const responseData = await response.json();
+            return responseData.result.response;
+        }
+        else {
+            const stream = this._streamResponseChunks(prompt, options, runManager);
+            let finalResult;
+            for await (const chunk of stream) {
+                if (finalResult === undefined) {
+                    finalResult = chunk;
+                }
+                else {
+                    finalResult = finalResult.concat(chunk);
+                }
+            }
+            return finalResult?.text ?? "";
+        }
     }
 }
 exports.CloudflareWorkersAI = CloudflareWorkersAI;
package/dist/llms/cloudflare_workersai.d.ts
@@ -1,4 +1,6 @@
 import { LLM, BaseLLMParams } from "./base.js";
+import { CallbackManagerForLLMRun } from "../callbacks/manager.js";
+import { GenerationChunk } from "../schema/index.js";
 /**
  * Interface for CloudflareWorkersAI input parameters.
  */
@@ -7,6 +9,7 @@ export interface CloudflareWorkersAIInput {
     cloudflareApiToken?: string;
     model?: string;
     baseUrl?: string;
+    streaming?: boolean;
 }
 /**
  * Class representing the CloudflareWorkersAI language model. It extends the LLM (Large
@@ -18,6 +21,7 @@ export declare class CloudflareWorkersAI extends LLM implements CloudflareWorker
     cloudflareAccountId?: string;
     cloudflareApiToken?: string;
     baseUrl: string;
+    streaming: boolean;
     static lc_name(): string;
     lc_serializable: boolean;
     constructor(fields?: CloudflareWorkersAIInput & BaseLLMParams);
@@ -37,13 +41,15 @@ export declare class CloudflareWorkersAI extends LLM implements CloudflareWorker
     };
     /** Get the type of LLM. */
     _llmType(): string;
+    _request(prompt: string, options: this["ParsedCallOptions"], stream?: boolean): Promise<Response>;
+    _streamResponseChunks(prompt: string, options: this["ParsedCallOptions"], runManager?: CallbackManagerForLLMRun): AsyncGenerator<GenerationChunk>;
     /** Call out to CloudflareWorkersAI's complete endpoint.
       Args:
        prompt: The prompt to pass into the model.
-      Returns:
-        The string generated by the model.
+      Returns:
+        The string generated by the model.
       Example:
        let response = CloudflareWorkersAI.call("Tell me a joke.");
     */
-    _call(prompt: string, options: this["ParsedCallOptions"]): Promise<string>;
+    _call(prompt: string, options: this["ParsedCallOptions"], runManager?: CallbackManagerForLLMRun): Promise<string>;
 }
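CloudflareWorkersAI gains the same pattern: a streaming constructor flag, an SSE-parsing _streamResponseChunks generator, and a _call that either reads the JSON result or folds the streamed chunks back into one string. A hedged usage sketch; the account id, API token, model name, and the callbacks-in-call-options form are placeholders or assumptions, not values from this diff:

import { CloudflareWorkersAI } from "langchain/llms/cloudflare_workersai";

const model = new CloudflareWorkersAI({
  model: "@cf/meta/llama-2-7b-chat-int8", // placeholder model name
  cloudflareAccountId: process.env.CLOUDFLARE_ACCOUNT_ID,
  cloudflareApiToken: process.env.CLOUDFLARE_API_TOKEN,
  streaming: true, // request server-sent events and emit handleLLMNewToken per chunk
});

const answer = await model.call("Tell me a joke.", {
  callbacks: [{ handleLLMNewToken: (token: string) => process.stdout.write(token) }],
});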