npm - climage - Versions diffs - 0.5.0 → 0.5.2 - Mend

climage 0.5.0 → 0.5.2

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (6)

package/README.md CHANGED Viewed

@@ -23,13 +23,14 @@ Set one of:
 **Models:**
-| Model                           | Alias             | Description                                                                           |
-| ------------------------------- | ----------------- | ------------------------------------------------------------------------------------- |
-| `gemini-3-pro-image-preview`    | `nano-banana-pro` | **Default.** State-of-the-art, professional asset production, up to 4K, thinking mode |
-| `gemini-2.5-flash-image`        | `nano-banana`     | Fast & efficient, optimized for high-volume tasks                                     |
-| `imagen-4.0-generate-001`       | -                 | Imagen 4 Standard                                                                     |
-| `imagen-4.0-ultra-generate-001` | -                 | Imagen 4 Ultra (best quality)                                                         |
-| `imagen-4.0-fast-generate-001`  | -                 | Imagen 4 Fast                                                                         |
+| Model                            | Alias             | Description                                                                           |
+| -------------------------------- | ----------------- | ------------------------------------------------------------------------------------- |
+| `gemini-3-pro-image-preview`     | `nano-banana-pro` | **Default.** State-of-the-art, professional asset production, up to 4K, thinking mode |
+| `gemini-3.1-flash-image-preview` | `nano-banana-2`   | Nano Banana 2 — fast native image generation                                          |
+| `gemini-2.5-flash-image`         | `nano-banana`     | Fast & efficient, optimized for high-volume tasks                                     |
+| `imagen-4.0-generate-001`        | -                 | Imagen 4 Standard                                                                     |
+| `imagen-4.0-ultra-generate-001`  | -                 | Imagen 4 Ultra (best quality)                                                         |
+| `imagen-4.0-fast-generate-001`   | -                 | Imagen 4 Fast                                                                         |
 Example:

package/dist/cli.js CHANGED Viewed

@@ -653,6 +653,9 @@ var falProvider = {
 // src/providers/google.ts
 import { GoogleGenAI } from "@google/genai";
+import { mkdtemp, readFile, rm } from "fs/promises";
+import { tmpdir } from "os";
+import { join } from "path";
 function getGeminiApiKey(env) {
   return env.GEMINI_API_KEY || env.GOOGLE_API_KEY || env.GOOGLE_GENAI_API_KEY;
 }
@@ -674,6 +677,7 @@ function log3(...args) {
 var MODEL_ALIASES = {
   "nano-banana": "gemini-2.5-flash-image",
   "nano-banana-pro": "gemini-3-pro-image-preview",
+  "nano-banana-2": "gemini-3.1-flash-image-preview",
   // Veo (video)
   veo2: "veo-2.0-generate-001",
   "veo-2": "veo-2.0-generate-001",
@@ -700,7 +704,26 @@ function imageToGoogleFormat(imageInput) {
   }
   return { fileUri: imageInput };
 }
-var GEMINI_IMAGE_MODELS = ["gemini-2.5-flash-image", "gemini-3-pro-image-preview"];
+function imageToVeoFormat(imageInput) {
+  if (imageInput.startsWith("data:")) {
+    const parsed = parseDataUri(imageInput);
+    if (!parsed?.data) {
+      throw new Error("Failed to parse data URI for Veo image input");
+    }
+    return { imageBytes: parsed.data, mimeType: parsed.mimeType };
+  }
+  if (imageInput.startsWith("gs://")) {
+    return { gcsUri: imageInput };
+  }
+  throw new Error(
+    `Veo image inputs must be data: URIs or gs:// URIs (got ${imageInput.slice(0, 24)}...)`
+  );
+}
+var GEMINI_IMAGE_MODELS = [
+  "gemini-2.5-flash-image",
+  "gemini-3-pro-image-preview",
+  "gemini-3.1-flash-image-preview"
+];
 function resolveModel(model) {
   if (!model) return "gemini-2.5-flash-image";
   return MODEL_ALIASES[model] ?? model;
@@ -718,6 +741,31 @@ async function downloadBytes3(url) {
   log3(`Downloaded ${ab.byteLength} bytes in ${Date.now() - start}ms, type: ${ct}`);
   return { bytes: new Uint8Array(ab), mimeType: ct };
 }
+async function downloadGeneratedVideo(ai, generatedVideo) {
+  const video = generatedVideo?.video;
+  if (video?.videoBytes) {
+    return {
+      bytes: new Uint8Array(Buffer.from(video.videoBytes, "base64")),
+      mimeType: video.mimeType
+    };
+  }
+  if (video?.uri && !video.uri.startsWith("gs://")) {
+    try {
+      return await downloadBytes3(video.uri);
+    } catch (err) {
+      log3("Direct video download failed, falling back to ai.files.download:", String(err));
+    }
+  }
+  const tempDir = await mkdtemp(join(tmpdir(), "climage-veo-"));
+  const downloadPath = join(tempDir, "video.mp4");
+  try {
+    await ai.files.download({ file: generatedVideo, downloadPath });
+    const buf = await readFile(downloadPath);
+    return { bytes: new Uint8Array(buf), mimeType: video?.mimeType ?? "video/mp4" };
+  } finally {
+    await rm(tempDir, { recursive: true, force: true });
+  }
+}
 async function sleep2(ms) {
   await new Promise((r) => setTimeout(r, ms));
 }
@@ -783,15 +831,15 @@ async function generateWithVeo(ai, model, req) {
   const config = {
     numberOfVideos: req.n,
     ...req.aspectRatio ? { aspectRatio: req.aspectRatio } : {},
-    // Add duration if specified (Veo 3.1 supports 4, 6, 8)
-    ...req.duration !== void 0 ? { durationSeconds: String(req.duration) } : {}
+    // Add duration if specified (Veo supports 4-8 seconds depending on model)
+    ...req.duration !== void 0 ? { durationSeconds: req.duration } : {}
   };
   if (req.inputImages?.length && isVeo31Model(model)) {
     const referenceImages = req.inputImages.slice(0, 3).map((img) => {
-      const imageData = imageToGoogleFormat(img);
+      const imageData = imageToVeoFormat(img);
       return {
         image: imageData,
-        referenceType: "asset"
+        referenceType: "ASSET"
       };
     });
     config.referenceImages = referenceImages;
@@ -804,12 +852,12 @@ async function generateWithVeo(ai, model, req) {
   };
   const firstFrameImage = req.startFrame ?? (req.inputImages?.length === 1 ? req.inputImages[0] : void 0);
   if (firstFrameImage && isVeo31Model(model)) {
-    const imageData = imageToGoogleFormat(firstFrameImage);
+    const imageData = imageToVeoFormat(firstFrameImage);
     generateParams.image = imageData;
     log3("Added first frame image");
   }
   if (req.endFrame && isVeo31Model(model)) {
-    const lastFrameData = imageToGoogleFormat(req.endFrame);
+    const lastFrameData = imageToVeoFormat(req.endFrame);
     config.lastFrame = lastFrameData;
     log3("Added last frame for interpolation");
   }
@@ -839,26 +887,22 @@ async function generateWithVeo(ai, model, req) {
   for (let i = 0; i < Math.min(videos.length, req.n); i++) {
     const v = videos[i];
     log3(`Processing video ${i}:`, JSON.stringify(v).slice(0, 300));
-    const uri = v?.video?.uri;
-    if (!uri) {
-      log3(`Video ${i} has no URI, skipping`);
+    if (!v?.video) {
+      log3(`Video ${i} has no video payload, skipping`);
       continue;
     }
-    if (uri.startsWith("gs://")) {
-      throw new Error(
-        `Google Veo returned a gs:// URI (${uri}). Configure outputGcsUri / Vertex flow to fetch from GCS.`
-      );
-    }
-    const { bytes, mimeType } = await downloadBytes3(uri);
-    out.push({
+    const uri = v?.video?.uri;
+    const { bytes, mimeType } = await downloadGeneratedVideo(ai, v);
+    const item = {
       kind: "video",
       provider: "google",
       model,
       index: i,
-      url: uri,
       bytes,
       ...mimeType !== void 0 ? { mimeType } : {}
-    });
+    };
+    if (uri) item.url = uri;
+    out.push(item);
   }
   if (!out.length) throw new Error("Google Veo returned videos but none were downloadable");
   log3(`Successfully generated ${out.length} video(s)`);