npm - @aigne/gemini - Versions diffs - 0.14.11-beta → 0.14.12-beta - Mend

@aigne/gemini 0.14.11-beta → 0.14.12-beta

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (7)

package/CHANGELOG.md +35 -0
package/lib/cjs/gemini-chat-model.d.ts +1 -0
package/lib/cjs/gemini-chat-model.js +42 -4
package/lib/dts/gemini-chat-model.d.ts +1 -0
package/lib/esm/gemini-chat-model.d.ts +1 -0
package/lib/esm/gemini-chat-model.js +43 -5
package/package.json +4 -4

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,40 @@
 # Changelog
+## [0.14.12-beta](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.11...gemini-v0.14.12-beta) (2025-11-28)
+### Bug Fixes
+* bump version ([ba7ad18](https://github.com/AIGNE-io/aigne-framework/commit/ba7ad184fcf32b49bf0507a3cb638d20fb00690d))
+### Dependencies
+* The following workspace dependencies were updated
+  * dependencies
+    * @aigne/core bumped to 1.69.2-beta
+    * @aigne/platform-helpers bumped to 0.6.5-beta
+  * devDependencies
+    * @aigne/test-utils bumped to 0.5.65-beta
+## [0.14.11](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.11-beta.1...gemini-v0.14.11) (2025-11-28)
+### Dependencies
+* The following workspace dependencies were updated
+  * dependencies
+    * @aigne/core bumped to 1.69.1
+  * devDependencies
+    * @aigne/test-utils bumped to 0.5.64
+## [0.14.11-beta.1](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.11-beta...gemini-v0.14.11-beta.1) (2025-11-26)
+### Bug Fixes
+* **model:** handle large video files by uploading to Files API ([#769](https://github.com/AIGNE-io/aigne-framework/issues/769)) ([5fd7661](https://github.com/AIGNE-io/aigne-framework/commit/5fd76613bd7301cc76bde933de2095a6d86f8c7e))
 ## [0.14.11-beta](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.10...gemini-v0.14.11-beta) (2025-11-24)

package/lib/cjs/gemini-chat-model.d.ts CHANGED Viewed

@@ -104,6 +104,7 @@ export declare class GeminiChatModel extends ChatModel {
     private processInput;
     private buildConfig;
     private buildTools;
+    private buildVideoContentParts;
     private buildContents;
     private ensureMessagesHasUserMessage;
 }

package/lib/cjs/gemini-chat-model.js CHANGED Viewed

@@ -5,12 +5,14 @@ const core_1 = require("@aigne/core");
 const logger_js_1 = require("@aigne/core/utils/logger.js");
 const model_utils_js_1 = require("@aigne/core/utils/model-utils.js");
 const type_utils_js_1 = require("@aigne/core/utils/type-utils.js");
+const index_js_1 = require("@aigne/platform-helpers/nodejs/index.js");
 const uuid_1 = require("@aigne/uuid");
 const genai_1 = require("@google/genai");
 const zod_1 = require("zod");
 const zod_to_json_schema_1 = require("zod-to-json-schema");
 const GEMINI_DEFAULT_CHAT_MODEL = "gemini-2.0-flash";
 const OUTPUT_FUNCTION_NAME = "output";
+const NEED_UPLOAD_MAX_FILE_SIZE_MB = 20;
 /**
  * Implementation of the ChatModel interface for Google's Gemini API
  *
@@ -64,7 +66,7 @@ class GeminiChatModel extends core_1.ChatModel {
     // References: https://ai.google.dev/gemini-api/docs/thinking#set-budget
     thinkingBudgetModelMap = [
         {
-            pattern: /gemini-3/,
+            pattern: /gemini-3(?!.*-image-)/,
             support: true,
             type: "level",
         },
@@ -130,7 +132,7 @@ class GeminiChatModel extends core_1.ChatModel {
     async *processInput(input, options) {
         const modelOptions = await this.getModelOptions(input, options);
         const model = modelOptions.model || this.credential.model;
-        const { contents, config } = await this.buildContents(input);
+        const { contents, config } = await this.buildContents(input, options);
         const thinkingBudget = this.getThinkingBudget(model, modelOptions.reasoningEffort);
         const parameters = {
             model,
@@ -348,7 +350,39 @@ class GeminiChatModel extends core_1.ChatModel {
                         };
         return { tools, toolConfig: { functionCallingConfig } };
     }
-    async buildContents(input) {
+    async buildVideoContentParts(media, options) {
+        const { path: filePath, mimeType: fileMimeType } = await this.transformFileType("local", media, options);
+        if (filePath) {
+            const stats = await index_js_1.nodejs.fs.stat(filePath);
+            const fileSizeInBytes = stats.size;
+            const fileSizeMB = fileSizeInBytes / (1024 * 1024);
+            if (fileSizeMB > NEED_UPLOAD_MAX_FILE_SIZE_MB) {
+                const uploadedFile = await this.googleClient.files.upload({
+                    file: filePath,
+                    config: { mimeType: fileMimeType },
+                });
+                let file = uploadedFile;
+                while (file.state === "PROCESSING") {
+                    await new Promise((resolve) => setTimeout(resolve, 1000));
+                    if (file.name) {
+                        file = await this.googleClient.files.get({ name: file.name });
+                    }
+                }
+                if (file.state !== "ACTIVE") {
+                    throw new Error(`File ${file.name} failed to process: ${file.state}`);
+                }
+                if (file.uri && file.mimeType) {
+                    const result = (0, genai_1.createUserContent)([(0, genai_1.createPartFromUri)(file.uri, file.mimeType), ""]);
+                    const part = result.parts?.find((x) => x.fileData);
+                    if (part) {
+                        await index_js_1.nodejs.fs.rm(filePath);
+                        return part;
+                    }
+                }
+            }
+        }
+    }
+    async buildContents(input, options) {
         const result = {
             contents: [],
         };
@@ -431,8 +465,12 @@ class GeminiChatModel extends core_1.ChatModel {
                             return { text: item.text };
                         case "url":
                             return { fileData: { fileUri: item.url, mimeType: item.mimeType } };
-                        case "file":
+                        case "file": {
+                            const part = await this.buildVideoContentParts(item, options);
+                            if (part)
+                                return part;
                             return { inlineData: { data: item.data, mimeType: item.mimeType } };
+                        }
                         case "local":
                             throw new Error(`Unsupported local file: ${item.path}, it should be converted to base64 at ChatModel`);
                     }

package/lib/dts/gemini-chat-model.d.ts CHANGED Viewed

@@ -104,6 +104,7 @@ export declare class GeminiChatModel extends ChatModel {
     private processInput;
     private buildConfig;
     private buildTools;
+    private buildVideoContentParts;
     private buildContents;
     private ensureMessagesHasUserMessage;
 }

package/lib/esm/gemini-chat-model.d.ts CHANGED Viewed

@@ -104,6 +104,7 @@ export declare class GeminiChatModel extends ChatModel {
     private processInput;
     private buildConfig;
     private buildTools;
+    private buildVideoContentParts;
     private buildContents;
     private ensureMessagesHasUserMessage;
 }

package/lib/esm/gemini-chat-model.js CHANGED Viewed

@@ -2,12 +2,14 @@ import { agentProcessResultToObject, ChatModel, StructuredOutputError, safeParse
 import { logger } from "@aigne/core/utils/logger.js";
 import { mergeUsage } from "@aigne/core/utils/model-utils.js";
 import { isNonNullable } from "@aigne/core/utils/type-utils.js";
+import { nodejs } from "@aigne/platform-helpers/nodejs/index.js";
 import { v7 } from "@aigne/uuid";
-import { FunctionCallingConfigMode, GoogleGenAI, ThinkingLevel, } from "@google/genai";
+import { createPartFromUri, createUserContent, FunctionCallingConfigMode, GoogleGenAI, ThinkingLevel, } from "@google/genai";
 import { z } from "zod";
 import { zodToJsonSchema } from "zod-to-json-schema";
 const GEMINI_DEFAULT_CHAT_MODEL = "gemini-2.0-flash";
 const OUTPUT_FUNCTION_NAME = "output";
+const NEED_UPLOAD_MAX_FILE_SIZE_MB = 20;
 /**
  * Implementation of the ChatModel interface for Google's Gemini API
  *
@@ -61,7 +63,7 @@ export class GeminiChatModel extends ChatModel {
     // References: https://ai.google.dev/gemini-api/docs/thinking#set-budget
     thinkingBudgetModelMap = [
         {
-            pattern: /gemini-3/,
+            pattern: /gemini-3(?!.*-image-)/,
             support: true,
             type: "level",
         },
@@ -127,7 +129,7 @@ export class GeminiChatModel extends ChatModel {
     async *processInput(input, options) {
         const modelOptions = await this.getModelOptions(input, options);
         const model = modelOptions.model || this.credential.model;
-        const { contents, config } = await this.buildContents(input);
+        const { contents, config } = await this.buildContents(input, options);
         const thinkingBudget = this.getThinkingBudget(model, modelOptions.reasoningEffort);
         const parameters = {
             model,
@@ -345,7 +347,39 @@ export class GeminiChatModel extends ChatModel {
                         };
         return { tools, toolConfig: { functionCallingConfig } };
     }
-    async buildContents(input) {
+    async buildVideoContentParts(media, options) {
+        const { path: filePath, mimeType: fileMimeType } = await this.transformFileType("local", media, options);
+        if (filePath) {
+            const stats = await nodejs.fs.stat(filePath);
+            const fileSizeInBytes = stats.size;
+            const fileSizeMB = fileSizeInBytes / (1024 * 1024);
+            if (fileSizeMB > NEED_UPLOAD_MAX_FILE_SIZE_MB) {
+                const uploadedFile = await this.googleClient.files.upload({
+                    file: filePath,
+                    config: { mimeType: fileMimeType },
+                });
+                let file = uploadedFile;
+                while (file.state === "PROCESSING") {
+                    await new Promise((resolve) => setTimeout(resolve, 1000));
+                    if (file.name) {
+                        file = await this.googleClient.files.get({ name: file.name });
+                    }
+                }
+                if (file.state !== "ACTIVE") {
+                    throw new Error(`File ${file.name} failed to process: ${file.state}`);
+                }
+                if (file.uri && file.mimeType) {
+                    const result = createUserContent([createPartFromUri(file.uri, file.mimeType), ""]);
+                    const part = result.parts?.find((x) => x.fileData);
+                    if (part) {
+                        await nodejs.fs.rm(filePath);
+                        return part;
+                    }
+                }
+            }
+        }
+    }
+    async buildContents(input, options) {
         const result = {
             contents: [],
         };
@@ -428,8 +462,12 @@ export class GeminiChatModel extends ChatModel {
                             return { text: item.text };
                         case "url":
                             return { fileData: { fileUri: item.url, mimeType: item.mimeType } };
-                        case "file":
+                        case "file": {
+                            const part = await this.buildVideoContentParts(item, options);
+                            if (part)
+                                return part;
                             return { inlineData: { data: item.data, mimeType: item.mimeType } };
+                        }
                         case "local":
                             throw new Error(`Unsupported local file: ${item.path}, it should be converted to base64 at ChatModel`);
                     }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@aigne/gemini",
-  "version": "0.14.11-beta",
+  "version": "0.14.12-beta",
   "description": "AIGNE Gemini SDK for integrating with Google's Gemini AI models",
   "publishConfig": {
     "access": "public"
@@ -39,8 +39,8 @@
     "@google/genai": "^1.30.0",
     "zod": "^3.25.67",
     "zod-to-json-schema": "^3.24.6",
-    "@aigne/core": "^1.69.1-beta",
-    "@aigne/platform-helpers": "^0.6.4"
+    "@aigne/core": "^1.69.2-beta",
+    "@aigne/platform-helpers": "^0.6.5-beta"
   },
   "devDependencies": {
     "@types/bun": "^1.2.22",
@@ -48,7 +48,7 @@
     "npm-run-all": "^4.1.5",
     "rimraf": "^6.0.1",
     "typescript": "^5.9.2",
-    "@aigne/test-utils": "^0.5.64-beta"
+    "@aigne/test-utils": "^0.5.65-beta"
   },
   "scripts": {
     "lint": "tsc --noEmit",