@aigne/gemini 0.14.2-beta.9 → 0.14.2

This diff shows the contents of package versions that have been published to a supported public registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in that registry.
package/CHANGELOG.md CHANGED
@@ -1,5 +1,59 @@
  # Changelog
 
+ ## [0.14.2](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.2-beta.12...gemini-v0.14.2) (2025-10-19)
+
+
+ ### Dependencies
+
+ * The following workspace dependencies were updated
+   * dependencies
+     * @aigne/core bumped to 1.63.0
+   * devDependencies
+     * @aigne/test-utils bumped to 0.5.55
+
+ ## [0.14.2-beta.12](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.2-beta.11...gemini-v0.14.2-beta.12) (2025-10-17)
+
+
+ ### Dependencies
+
+ * The following workspace dependencies were updated
+   * dependencies
+     * @aigne/core bumped to 1.63.0-beta.12
+   * devDependencies
+     * @aigne/test-utils bumped to 0.5.55-beta.12
+
+ ## [0.14.2-beta.11](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.2-beta.10...gemini-v0.14.2-beta.11) (2025-10-17)
+
+
+ ### Bug Fixes
+
+ * **gemini:** implement retry mechanism for empty responses with structured output fallback ([#638](https://github.com/AIGNE-io/aigne-framework/issues/638)) ([d33c8bb](https://github.com/AIGNE-io/aigne-framework/commit/d33c8bb9711aadddef9687d6cf472a179cd8ed9c))
+
+
+ ### Dependencies
+
+ * The following workspace dependencies were updated
+   * dependencies
+     * @aigne/core bumped to 1.63.0-beta.11
+   * devDependencies
+     * @aigne/test-utils bumped to 0.5.55-beta.11
+
+ ## [0.14.2-beta.10](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.2-beta.9...gemini-v0.14.2-beta.10) (2025-10-16)
+
+
+ ### Bug Fixes
+
+ * correct calculate token usage for gemini model ([7fd1328](https://github.com/AIGNE-io/aigne-framework/commit/7fd13289d3d0f8e062211f7c6dd5cb56e5318c1b))
+
+
+ ### Dependencies
+
+ * The following workspace dependencies were updated
+   * dependencies
+     * @aigne/core bumped to 1.63.0-beta.10
+   * devDependencies
+     * @aigne/test-utils bumped to 0.5.55-beta.10
+
  ## [0.14.2-beta.9](https://github.com/AIGNE-io/aigne-framework/compare/gemini-v0.14.2-beta.8...gemini-v0.14.2-beta.9) (2025-10-16)
 
 
@@ -3,11 +3,14 @@ Object.defineProperty(exports, "__esModule", { value: true });
  exports.GeminiChatModel = void 0;
  const core_1 = require("@aigne/core");
  const logger_js_1 = require("@aigne/core/utils/logger.js");
+ const model_utils_js_1 = require("@aigne/core/utils/model-utils.js");
  const type_utils_js_1 = require("@aigne/core/utils/type-utils.js");
  const uuid_1 = require("@aigne/uuid");
  const genai_1 = require("@google/genai");
+ const zod_1 = require("zod");
+ const zod_to_json_schema_1 = require("zod-to-json-schema");
  const GEMINI_DEFAULT_CHAT_MODEL = "gemini-2.0-flash";
- const OUTPUT_JSON_FUNCTION_NAME = "output_json";
+ const OUTPUT_FUNCTION_NAME = "output";
  /**
   * Implementation of the ChatModel interface for Google's Gemini API
   *
@@ -75,7 +78,7 @@ class GeminiChatModel extends core_1.ChatModel {
  },
  };
  const response = await this.googleClient.models.generateContentStream(parameters);
- const usage = {
+ let usage = {
  inputTokens: 0,
  outputTokens: 0,
  };
@@ -107,7 +110,7 @@ class GeminiChatModel extends core_1.ChatModel {
  });
  }
  if (part.functionCall?.name) {
- if (part.functionCall.name === OUTPUT_JSON_FUNCTION_NAME) {
+ if (part.functionCall.name === OUTPUT_FUNCTION_NAME) {
  json = part.functionCall.args;
  }
  else {
@@ -126,8 +129,10 @@ class GeminiChatModel extends core_1.ChatModel {
  }
  }
  if (chunk.usageMetadata) {
- usage.inputTokens += chunk.usageMetadata.promptTokenCount || 0;
- usage.outputTokens += chunk.usageMetadata.candidatesTokenCount || 0;
+ if (chunk.usageMetadata.promptTokenCount)
+ usage.inputTokens = chunk.usageMetadata.promptTokenCount;
+ if (chunk.usageMetadata.candidatesTokenCount)
+ usage.outputTokens = chunk.usageMetadata.candidatesTokenCount;
  }
  }
  if (input.responseFormat?.type === "json_schema") {
@@ -137,16 +142,53 @@ class GeminiChatModel extends core_1.ChatModel {
  else if (text) {
  yield { delta: { json: { json: (0, core_1.safeParseJSON)(text) } } };
  }
- else {
- // NOTE: Trigger retry of chat model
- throw new core_1.StructuredOutputError("No JSON response from the model");
+ else if (!toolCalls.length) {
+ throw new Error("No JSON response from the model");
  }
  }
  else if (!toolCalls.length) {
+ // NOTE: gemini-2.5-pro sometimes returns an empty response,
+ // so we check here and retry with structured output mode (empty responses occur less frequently with tool calls)
  if (!text) {
- logger_js_1.logger.error("No text response from the model", parameters);
- // NOTE: Trigger retry of chat model
- throw new core_1.StructuredOutputError("No text response from the model");
+ logger_js_1.logger.warn("Empty response from Gemini, retrying with structured output mode");
+ try {
+ const outputSchema = zod_1.z.object({
+ output: zod_1.z.string().describe("The final answer from the model"),
+ });
+ const response = await this.process({
+ ...input,
+ responseFormat: {
+ type: "json_schema",
+ jsonSchema: {
+ name: "output",
+ schema: (0, zod_to_json_schema_1.zodToJsonSchema)(outputSchema),
+ },
+ },
+ });
+ const result = await (0, core_1.agentProcessResultToObject)(response);
+ // Merge retry usage with the original usage
+ usage = (0, model_utils_js_1.mergeUsage)(usage, result.usage);
+ // Return the tool calls if retry has tool calls
+ if (result.toolCalls?.length) {
+ toolCalls.push(...result.toolCalls);
+ yield { delta: { json: { toolCalls } } };
+ }
+ // Return the text from structured output of retry
+ else {
+ if (!result.json)
+ throw new Error("Retrying with structured output mode got no json response");
+ const parsed = outputSchema.safeParse(result.json);
+ if (!parsed.success)
+ throw new Error("Retrying with structured output mode got invalid json response");
+ text = parsed.data.output;
+ yield { delta: { text: { text } } };
+ logger_js_1.logger.warn("Empty response from Gemini, retried with structured output mode successfully");
+ }
+ }
+ catch (error) {
+ logger_js_1.logger.error("Empty response from Gemini, retrying with structured output mode failed", error);
+ throw new core_1.StructuredOutputError("No response from the model");
+ }
  }
  }
  yield { delta: { json: { usage, files: files.length ? files : undefined } } };
@@ -161,8 +203,8 @@ class GeminiChatModel extends core_1.ChatModel {
  config.tools.push({
  functionDeclarations: [
  {
- name: OUTPUT_JSON_FUNCTION_NAME,
- description: "Output the final response in JSON format",
+ name: OUTPUT_FUNCTION_NAME,
+ description: "Output the final response",
  parametersJsonSchema: input.responseFormat.jsonSchema.schema,
  },
  ],
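The `usageMetadata` change above (from `+=` accumulation to conditional assignment) matches the beta.10 changelog entry about token usage. A minimal TypeScript sketch of the idea, assuming, as the change implies, that Gemini's streaming chunks report running totals rather than per-chunk deltas; `applyUsageChunk` is an illustrative helper, not part of the package:

```ts
// Sketch only: if usageMetadata carries cumulative totals, the latest reported
// value should win; summing across chunks would double-count.
interface UsageMetadata {
  promptTokenCount?: number;
  candidatesTokenCount?: number;
}

interface Usage {
  inputTokens: number;
  outputTokens: number;
}

function applyUsageChunk(usage: Usage, metadata?: UsageMetadata): Usage {
  if (!metadata) return usage;
  return {
    inputTokens: metadata.promptTokenCount ?? usage.inputTokens,
    outputTokens: metadata.candidatesTokenCount ?? usage.outputTokens,
  };
}
```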
@@ -1,10 +1,13 @@
- import { ChatModel, StructuredOutputError, safeParseJSON, } from "@aigne/core";
+ import { agentProcessResultToObject, ChatModel, StructuredOutputError, safeParseJSON, } from "@aigne/core";
  import { logger } from "@aigne/core/utils/logger.js";
+ import { mergeUsage } from "@aigne/core/utils/model-utils.js";
  import { isNonNullable } from "@aigne/core/utils/type-utils.js";
  import { v7 } from "@aigne/uuid";
  import { FunctionCallingConfigMode, GoogleGenAI, } from "@google/genai";
+ import { z } from "zod";
+ import { zodToJsonSchema } from "zod-to-json-schema";
  const GEMINI_DEFAULT_CHAT_MODEL = "gemini-2.0-flash";
- const OUTPUT_JSON_FUNCTION_NAME = "output_json";
+ const OUTPUT_FUNCTION_NAME = "output";
  /**
   * Implementation of the ChatModel interface for Google's Gemini API
   *
@@ -72,7 +75,7 @@ export class GeminiChatModel extends ChatModel {
  },
  };
  const response = await this.googleClient.models.generateContentStream(parameters);
- const usage = {
+ let usage = {
  inputTokens: 0,
  outputTokens: 0,
  };
@@ -104,7 +107,7 @@ export class GeminiChatModel extends ChatModel {
  });
  }
  if (part.functionCall?.name) {
- if (part.functionCall.name === OUTPUT_JSON_FUNCTION_NAME) {
+ if (part.functionCall.name === OUTPUT_FUNCTION_NAME) {
  json = part.functionCall.args;
  }
  else {
@@ -123,8 +126,10 @@ export class GeminiChatModel extends ChatModel {
  }
  }
  if (chunk.usageMetadata) {
- usage.inputTokens += chunk.usageMetadata.promptTokenCount || 0;
- usage.outputTokens += chunk.usageMetadata.candidatesTokenCount || 0;
+ if (chunk.usageMetadata.promptTokenCount)
+ usage.inputTokens = chunk.usageMetadata.promptTokenCount;
+ if (chunk.usageMetadata.candidatesTokenCount)
+ usage.outputTokens = chunk.usageMetadata.candidatesTokenCount;
  }
  }
  if (input.responseFormat?.type === "json_schema") {
@@ -134,16 +139,53 @@ export class GeminiChatModel extends ChatModel {
  else if (text) {
  yield { delta: { json: { json: safeParseJSON(text) } } };
  }
- else {
- // NOTE: Trigger retry of chat model
- throw new StructuredOutputError("No JSON response from the model");
+ else if (!toolCalls.length) {
+ throw new Error("No JSON response from the model");
  }
  }
  else if (!toolCalls.length) {
+ // NOTE: gemini-2.5-pro sometimes returns an empty response,
+ // so we check here and retry with structured output mode (empty responses occur less frequently with tool calls)
  if (!text) {
- logger.error("No text response from the model", parameters);
- // NOTE: Trigger retry of chat model
- throw new StructuredOutputError("No text response from the model");
+ logger.warn("Empty response from Gemini, retrying with structured output mode");
+ try {
+ const outputSchema = z.object({
+ output: z.string().describe("The final answer from the model"),
+ });
+ const response = await this.process({
+ ...input,
+ responseFormat: {
+ type: "json_schema",
+ jsonSchema: {
+ name: "output",
+ schema: zodToJsonSchema(outputSchema),
+ },
+ },
+ });
+ const result = await agentProcessResultToObject(response);
+ // Merge retry usage with the original usage
+ usage = mergeUsage(usage, result.usage);
+ // Return the tool calls if retry has tool calls
+ if (result.toolCalls?.length) {
+ toolCalls.push(...result.toolCalls);
+ yield { delta: { json: { toolCalls } } };
+ }
+ // Return the text from structured output of retry
+ else {
+ if (!result.json)
+ throw new Error("Retrying with structured output mode got no json response");
+ const parsed = outputSchema.safeParse(result.json);
+ if (!parsed.success)
+ throw new Error("Retrying with structured output mode got invalid json response");
+ text = parsed.data.output;
+ yield { delta: { text: { text } } };
+ logger.warn("Empty response from Gemini, retried with structured output mode successfully");
+ }
+ }
+ catch (error) {
+ logger.error("Empty response from Gemini, retrying with structured output mode failed", error);
+ throw new StructuredOutputError("No response from the model");
+ }
  }
  }
  yield { delta: { json: { usage, files: files.length ? files : undefined } } };
@@ -158,8 +200,8 @@ export class GeminiChatModel extends ChatModel {
  config.tools.push({
  functionDeclarations: [
  {
- name: OUTPUT_JSON_FUNCTION_NAME,
- description: "Output the final response in JSON format",
+ name: OUTPUT_FUNCTION_NAME,
+ description: "Output the final response",
  parametersJsonSchema: input.responseFormat.jsonSchema.schema,
  },
  ],
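The ESM build mirrors the CJS changes above: when a non-structured request streams back with neither text nor tool calls, the model now retries once in structured output mode, asking for a single `output` string and unwrapping it into plain text (the structured output function was also renamed from `output_json` to `output`). A simplified, self-contained sketch of that fallback, where `retryStructured` is a hypothetical stand-in for the real re-invocation via `this.process(...)`:

```ts
import { z } from "zod";
import { zodToJsonSchema } from "zod-to-json-schema";

// Single-field schema used for the fallback request, as in the diff above.
const outputSchema = z.object({
  output: z.string().describe("The final answer from the model"),
});

// `retryStructured` is a hypothetical callback standing in for re-invoking the
// model with responseFormat: { type: "json_schema", jsonSchema: { name: "output",
// schema: zodToJsonSchema(outputSchema) } }.
async function recoverEmptyResponse(
  retryStructured: (jsonSchema: object) => Promise<{ json?: unknown }>,
): Promise<string> {
  const result = await retryStructured(zodToJsonSchema(outputSchema));
  if (!result.json) throw new Error("Retry with structured output returned no JSON");
  const parsed = outputSchema.safeParse(result.json);
  if (!parsed.success) throw new Error("Retry with structured output returned invalid JSON");
  // Unwrap the { output } wrapper back into plain text for the caller.
  return parsed.data.output;
}
```

Per the diff, tool calls returned by the retry are forwarded unchanged; only the no-tool-call case is unwrapped, and the retry's token usage is merged into the original usage via `mergeUsage`.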
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
  "name": "@aigne/gemini",
- "version": "0.14.2-beta.9",
+ "version": "0.14.2",
  "description": "AIGNE Gemini SDK for integrating with Google's Gemini AI models",
  "publishConfig": {
  "access": "public"
@@ -38,8 +38,9 @@
  "@aigne/uuid": "^13.0.1",
  "@google/genai": "^1.24.0",
  "zod": "^3.25.67",
- "@aigne/platform-helpers": "^0.6.3",
- "@aigne/core": "^1.63.0-beta.9"
+ "zod-to-json-schema": "^3.24.6",
+ "@aigne/core": "^1.63.0",
+ "@aigne/platform-helpers": "^0.6.3"
  },
  "devDependencies": {
  "@types/bun": "^1.2.22",
@@ -47,7 +48,7 @@
  "npm-run-all": "^4.1.5",
  "rimraf": "^6.0.1",
  "typescript": "^5.9.2",
- "@aigne/test-utils": "^0.5.55-beta.9"
+ "@aigne/test-utils": "^0.5.55"
  },
  "scripts": {
  "lint": "tsc --noEmit",