npm - @ai-sdk/google - Versions diffs - 3.0.25 → 3.0.27 - Mend

@ai-sdk/google 3.0.25 → 3.0.27

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

package/CHANGELOG.md +12 -0
package/dist/index.d.mts +1 -1
package/dist/index.d.ts +1 -1
package/dist/index.js +125 -8
package/dist/index.js.map +1 -1
package/dist/index.mjs +127 -8
package/dist/index.mjs.map +1 -1
package/dist/internal/index.js +2 -2
package/dist/internal/index.js.map +1 -1
package/dist/internal/index.mjs +2 -2
package/dist/internal/index.mjs.map +1 -1
package/docs/15-google-generative-ai.mdx +93 -4
package/package.json +1 -1
package/src/convert-to-google-generative-ai-messages.ts +5 -1
package/src/google-generative-ai-image-model.ts +172 -7
package/src/google-generative-ai-image-settings.ts +4 -0

package/dist/index.mjs (changed)

@@ -7,7 +7,7 @@ import {
 } from "@ai-sdk/provider-utils";
 // src/version.ts
-var VERSION = true ? "3.0.25" : "0.0.0-test";
+var VERSION = true ? "3.0.27" : "0.0.0-test";
 // src/google-generative-ai-embedding-model.ts
 import {
@@ -425,8 +425,8 @@ function convertToGoogleGenerativeAIMessages(prompt, options) {
         contents.push({
           role: "model",
           parts: content.map((part) => {
-            var _a2;
-            const providerOpts = (_a2 = part.providerOptions) == null ? void 0 : _a2[providerOptionsName];
+            var _a2, _b2, _c2;
+            const providerOpts = (_c2 = (_a2 = part.providerOptions) == null ? void 0 : _a2[providerOptionsName]) != null ? _c2 : providerOptionsName !== "google" ? (_b2 = part.providerOptions) == null ? void 0 : _b2.google : void 0;
             const thoughtSignature = (providerOpts == null ? void 0 : providerOpts.thoughtSignature) != null ? String(providerOpts.thoughtSignature) : void 0;
             switch (part.type) {
               case "text": {
@@ -1806,7 +1806,9 @@ var googleTools = {
 // src/google-generative-ai-image-model.ts
 import {
   combineHeaders as combineHeaders3,
+  convertToBase64 as convertToBase642,
   createJsonResponseHandler as createJsonResponseHandler3,
+  generateId as defaultGenerateId,
   lazySchema as lazySchema11,
   parseProviderOptions as parseProviderOptions3,
   postJsonToApi as postJsonToApi3,
@@ -1822,13 +1824,24 @@ var GoogleGenerativeAIImageModel = class {
     this.specificationVersion = "v3";
   }
   get maxImagesPerCall() {
-    var _a;
-    return (_a = this.settings.maxImagesPerCall) != null ? _a : 4;
+    if (this.settings.maxImagesPerCall != null) {
+      return this.settings.maxImagesPerCall;
+    }
+    if (isGeminiModel(this.modelId)) {
+      return 10;
+    }
+    return 4;
   }
   get provider() {
     return this.config.provider;
   }
   async doGenerate(options) {
+    if (isGeminiModel(this.modelId)) {
+      return this.doGenerateGemini(options);
+    }
+    return this.doGenerateImagen(options);
+  }
+  async doGenerateImagen(options) {
     var _a, _b, _c;
     const {
       prompt,
@@ -1845,7 +1858,7 @@ var GoogleGenerativeAIImageModel = class {
     const warnings = [];
     if (files != null && files.length > 0) {
       throw new Error(
-        "Google Generative AI does not support image editing. Use Google Vertex AI (@ai-sdk/google-vertex) for image editing capabilities."
+        "Google Generative AI does not support image editing with Imagen models. Use Google Vertex AI (@ai-sdk/google-vertex) for image editing capabilities."
       );
     }
     if (mask != null) {
@@ -1901,10 +1914,10 @@ var GoogleGenerativeAIImageModel = class {
       images: response.predictions.map(
         (p) => p.bytesBase64Encoded
       ),
-      warnings: warnings != null ? warnings : [],
+      warnings,
       providerMetadata: {
         google: {
-          images: response.predictions.map((prediction) => ({
+          images: response.predictions.map(() => ({
             // Add any prediction-specific metadata here
           }))
         }
@@ -1916,7 +1929,113 @@ var GoogleGenerativeAIImageModel = class {
       }
     };
   }
+  async doGenerateGemini(options) {
+    var _a, _b, _c, _d, _e, _f, _g, _h, _i;
+    const {
+      prompt,
+      n,
+      size,
+      aspectRatio,
+      seed,
+      providerOptions,
+      headers,
+      abortSignal,
+      files,
+      mask
+    } = options;
+    const warnings = [];
+    if (mask != null) {
+      throw new Error(
+        "Gemini image models do not support mask-based image editing."
+      );
+    }
+    if (n != null && n > 1) {
+      throw new Error(
+        "Gemini image models do not support generating a set number of images per call. Use n=1 or omit the n parameter."
+      );
+    }
+    if (size != null) {
+      warnings.push({
+        type: "unsupported",
+        feature: "size",
+        details: "This model does not support the `size` option. Use `aspectRatio` instead."
+      });
+    }
+    const userContent = [];
+    if (prompt != null) {
+      userContent.push({ type: "text", text: prompt });
+    }
+    if (files != null && files.length > 0) {
+      for (const file of files) {
+        if (file.type === "url") {
+          userContent.push({
+            type: "file",
+            data: new URL(file.url),
+            mediaType: "image/*"
+          });
+        } else {
+          userContent.push({
+            type: "file",
+            data: typeof file.data === "string" ? file.data : new Uint8Array(file.data),
+            mediaType: file.mediaType
+          });
+        }
+      }
+    }
+    const languageModelPrompt = [
+      { role: "user", content: userContent }
+    ];
+    const languageModel = new GoogleGenerativeAILanguageModel(this.modelId, {
+      provider: this.config.provider,
+      baseURL: this.config.baseURL,
+      headers: (_a = this.config.headers) != null ? _a : {},
+      fetch: this.config.fetch,
+      generateId: (_b = this.config.generateId) != null ? _b : defaultGenerateId
+    });
+    const result = await languageModel.doGenerate({
+      prompt: languageModelPrompt,
+      seed,
+      providerOptions: {
+        google: {
+          responseModalities: ["IMAGE"],
+          imageConfig: aspectRatio ? { aspectRatio } : void 0,
+          ...(_c = providerOptions == null ? void 0 : providerOptions.google) != null ? _c : {}
+        }
+      },
+      headers,
+      abortSignal
+    });
+    const currentDate = (_f = (_e = (_d = this.config._internal) == null ? void 0 : _d.currentDate) == null ? void 0 : _e.call(_d)) != null ? _f : /* @__PURE__ */ new Date();
+    const images = [];
+    for (const part of result.content) {
+      if (part.type === "file" && part.mediaType.startsWith("image/")) {
+        images.push(convertToBase642(part.data));
+      }
+    }
+    return {
+      images,
+      warnings,
+      providerMetadata: {
+        google: {
+          images: images.map(() => ({}))
+        }
+      },
+      response: {
+        timestamp: currentDate,
+        modelId: this.modelId,
+        headers: (_g = result.response) == null ? void 0 : _g.headers
+      },
+      usage: result.usage ? {
+        inputTokens: result.usage.inputTokens.total,
+        outputTokens: result.usage.outputTokens.total,
+        totalTokens: ((_h = result.usage.inputTokens.total) != null ? _h : 0) + ((_i = result.usage.outputTokens.total) != null ? _i : 0)
+      } : void 0
+    };
+  }
 };
+function isGeminiModel(modelId) {
+  return modelId.startsWith("gemini-");
+}
 var googleImageResponseSchema = lazySchema11(
   () => zodSchema11(
     z13.object({