npm - @ai-sdk/google - Versions diffs - 3.0.24 → 3.0.26 - Mend

@ai-sdk/google 3.0.24 → 3.0.26

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

package/CHANGELOG.md +12 -0
package/dist/index.d.mts +9 -9
package/dist/index.d.ts +9 -9
package/dist/index.js +132 -15
package/dist/index.js.map +1 -1
package/dist/index.mjs +134 -15
package/dist/index.mjs.map +1 -1
package/dist/internal/index.js +3 -3
package/dist/internal/index.js.map +1 -1
package/dist/internal/index.mjs +3 -3
package/dist/internal/index.mjs.map +1 -1
package/docs/15-google-generative-ai.mdx +111 -20
package/package.json +3 -3
package/src/google-generative-ai-embedding-model.ts +2 -2
package/src/google-generative-ai-embedding-options.ts +3 -3
package/src/google-generative-ai-image-model.ts +176 -11
package/src/google-generative-ai-image-settings.ts +4 -0
package/src/google-generative-ai-language-model.ts +3 -3
package/src/google-generative-ai-options.ts +3 -3
package/src/google-generative-ai-video-model.ts +5 -5
package/src/index.ts +20 -4

package/dist/index.mjs CHANGED Viewed

@@ -7,7 +7,7 @@ import {
 } from "@ai-sdk/provider-utils";
 // src/version.ts
-var VERSION = true ? "3.0.24" : "0.0.0-test";
+var VERSION = true ? "3.0.26" : "0.0.0-test";
 // src/google-generative-ai-embedding-model.ts
 import {
@@ -53,7 +53,7 @@ import {
   zodSchema as zodSchema2
 } from "@ai-sdk/provider-utils";
 import { z as z2 } from "zod/v4";
-var googleGenerativeAIEmbeddingProviderOptions = lazySchema2(
+var googleEmbeddingModelOptions = lazySchema2(
   () => zodSchema2(
     z2.object({
       /**
@@ -108,7 +108,7 @@ var GoogleGenerativeAIEmbeddingModel = class {
     const googleOptions = await parseProviderOptions({
       provider: "google",
       providerOptions,
-      schema: googleGenerativeAIEmbeddingProviderOptions
+      schema: googleEmbeddingModelOptions
     });
     if (values.length > this.maxEmbeddingsPerCall) {
       throw new TooManyEmbeddingValuesForCallError({
@@ -548,7 +548,7 @@ function getModelPath(modelId) {
 // src/google-generative-ai-options.ts
 import { lazySchema as lazySchema4, zodSchema as zodSchema4 } from "@ai-sdk/provider-utils";
 import { z as z4 } from "zod/v4";
-var googleGenerativeAIProviderOptions = lazySchema4(
+var googleLanguageModelOptions = lazySchema4(
   () => zodSchema4(
     z4.object({
       responseModalities: z4.array(z4.enum(["TEXT", "IMAGE"])).optional(),
@@ -932,13 +932,13 @@ var GoogleGenerativeAILanguageModel = class {
     let googleOptions = await parseProviderOptions2({
       provider: providerOptionsName,
       providerOptions,
-      schema: googleGenerativeAIProviderOptions
+      schema: googleLanguageModelOptions
     });
     if (googleOptions == null && providerOptionsName !== "google") {
       googleOptions = await parseProviderOptions2({
         provider: "google",
         providerOptions,
-        schema: googleGenerativeAIProviderOptions
+        schema: googleLanguageModelOptions
       });
     }
     if ((tools == null ? void 0 : tools.some(
@@ -1806,7 +1806,9 @@ var googleTools = {
 // src/google-generative-ai-image-model.ts
 import {
   combineHeaders as combineHeaders3,
+  convertToBase64 as convertToBase642,
   createJsonResponseHandler as createJsonResponseHandler3,
+  generateId as defaultGenerateId,
   lazySchema as lazySchema11,
   parseProviderOptions as parseProviderOptions3,
   postJsonToApi as postJsonToApi3,
@@ -1822,13 +1824,24 @@ var GoogleGenerativeAIImageModel = class {
     this.specificationVersion = "v3";
   }
   get maxImagesPerCall() {
-    var _a;
-    return (_a = this.settings.maxImagesPerCall) != null ? _a : 4;
+    if (this.settings.maxImagesPerCall != null) {
+      return this.settings.maxImagesPerCall;
+    }
+    if (isGeminiModel(this.modelId)) {
+      return 10;
+    }
+    return 4;
   }
   get provider() {
     return this.config.provider;
   }
   async doGenerate(options) {
+    if (isGeminiModel(this.modelId)) {
+      return this.doGenerateGemini(options);
+    }
+    return this.doGenerateImagen(options);
+  }
+  async doGenerateImagen(options) {
     var _a, _b, _c;
     const {
       prompt,
@@ -1845,7 +1858,7 @@ var GoogleGenerativeAIImageModel = class {
     const warnings = [];
     if (files != null && files.length > 0) {
       throw new Error(
-        "Google Generative AI does not support image editing. Use Google Vertex AI (@ai-sdk/google-vertex) for image editing capabilities."
+        "Google Generative AI does not support image editing with Imagen models. Use Google Vertex AI (@ai-sdk/google-vertex) for image editing capabilities."
       );
     }
     if (mask != null) {
@@ -1870,7 +1883,7 @@ var GoogleGenerativeAIImageModel = class {
     const googleOptions = await parseProviderOptions3({
       provider: "google",
       providerOptions,
-      schema: googleImageProviderOptionsSchema
+      schema: googleImageModelOptionsSchema
     });
     const currentDate = (_c = (_b = (_a = this.config._internal) == null ? void 0 : _a.currentDate) == null ? void 0 : _b.call(_a)) != null ? _c : /* @__PURE__ */ new Date();
     const parameters = {
@@ -1901,10 +1914,10 @@ var GoogleGenerativeAIImageModel = class {
       images: response.predictions.map(
         (p) => p.bytesBase64Encoded
       ),
-      warnings: warnings != null ? warnings : [],
+      warnings,
       providerMetadata: {
         google: {
-          images: response.predictions.map((prediction) => ({
+          images: response.predictions.map(() => ({
             // Add any prediction-specific metadata here
           }))
         }
@@ -1916,7 +1929,113 @@ var GoogleGenerativeAIImageModel = class {
       }
     };
   }
+  async doGenerateGemini(options) {
+    var _a, _b, _c, _d, _e, _f, _g, _h, _i;
+    const {
+      prompt,
+      n,
+      size,
+      aspectRatio,
+      seed,
+      providerOptions,
+      headers,
+      abortSignal,
+      files,
+      mask
+    } = options;
+    const warnings = [];
+    if (mask != null) {
+      throw new Error(
+        "Gemini image models do not support mask-based image editing."
+      );
+    }
+    if (n != null && n > 1) {
+      throw new Error(
+        "Gemini image models do not support generating a set number of images per call. Use n=1 or omit the n parameter."
+      );
+    }
+    if (size != null) {
+      warnings.push({
+        type: "unsupported",
+        feature: "size",
+        details: "This model does not support the `size` option. Use `aspectRatio` instead."
+      });
+    }
+    const userContent = [];
+    if (prompt != null) {
+      userContent.push({ type: "text", text: prompt });
+    }
+    if (files != null && files.length > 0) {
+      for (const file of files) {
+        if (file.type === "url") {
+          userContent.push({
+            type: "file",
+            data: new URL(file.url),
+            mediaType: "image/*"
+          });
+        } else {
+          userContent.push({
+            type: "file",
+            data: typeof file.data === "string" ? file.data : new Uint8Array(file.data),
+            mediaType: file.mediaType
+          });
+        }
+      }
+    }
+    const languageModelPrompt = [
+      { role: "user", content: userContent }
+    ];
+    const languageModel = new GoogleGenerativeAILanguageModel(this.modelId, {
+      provider: this.config.provider,
+      baseURL: this.config.baseURL,
+      headers: (_a = this.config.headers) != null ? _a : {},
+      fetch: this.config.fetch,
+      generateId: (_b = this.config.generateId) != null ? _b : defaultGenerateId
+    });
+    const result = await languageModel.doGenerate({
+      prompt: languageModelPrompt,
+      seed,
+      providerOptions: {
+        google: {
+          responseModalities: ["IMAGE"],
+          imageConfig: aspectRatio ? { aspectRatio } : void 0,
+          ...(_c = providerOptions == null ? void 0 : providerOptions.google) != null ? _c : {}
+        }
+      },
+      headers,
+      abortSignal
+    });
+    const currentDate = (_f = (_e = (_d = this.config._internal) == null ? void 0 : _d.currentDate) == null ? void 0 : _e.call(_d)) != null ? _f : /* @__PURE__ */ new Date();
+    const images = [];
+    for (const part of result.content) {
+      if (part.type === "file" && part.mediaType.startsWith("image/")) {
+        images.push(convertToBase642(part.data));
+      }
+    }
+    return {
+      images,
+      warnings,
+      providerMetadata: {
+        google: {
+          images: images.map(() => ({}))
+        }
+      },
+      response: {
+        timestamp: currentDate,
+        modelId: this.modelId,
+        headers: (_g = result.response) == null ? void 0 : _g.headers
+      },
+      usage: result.usage ? {
+        inputTokens: result.usage.inputTokens.total,
+        outputTokens: result.usage.outputTokens.total,
+        totalTokens: ((_h = result.usage.inputTokens.total) != null ? _h : 0) + ((_i = result.usage.outputTokens.total) != null ? _i : 0)
+      } : void 0
+    };
+  }
 };
+function isGeminiModel(modelId) {
+  return modelId.startsWith("gemini-");
+}
 var googleImageResponseSchema = lazySchema11(
   () => zodSchema11(
     z13.object({
@@ -1924,7 +2043,7 @@ var googleImageResponseSchema = lazySchema11(
     })
   )
 );
-var googleImageProviderOptionsSchema = lazySchema11(
+var googleImageModelOptionsSchema = lazySchema11(
   () => zodSchema11(
     z13.object({
       personGeneration: z13.enum(["dont_allow", "allow_adult", "allow_all"]).nullish(),
@@ -1969,7 +2088,7 @@ var GoogleGenerativeAIVideoModel = class {
     const googleOptions = await parseProviderOptions4({
       provider: "google",
       providerOptions: options.providerOptions,
-      schema: googleVideoProviderOptionsSchema
+      schema: googleVideoModelOptionsSchema
     });
     const instances = [{}];
     const instance = instances[0];
@@ -2181,7 +2300,7 @@ var googleOperationSchema = z14.object({
     }).nullish()
   }).nullish()
 });
-var googleVideoProviderOptionsSchema = lazySchema12(
+var googleVideoModelOptionsSchema = lazySchema12(
   () => zodSchema12(
     z14.object({
       pollIntervalMs: z14.number().positive().nullish(),