npm - @mixio-pro/kalaasetu-mcp - Versions diffs - 1.0.3 → 1.0.5-beta - Mend

@mixio-pro/kalaasetu-mcp 1.0.3 → 1.0.5-beta

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It reflects the package contents as they appear in their respective public registries and is provided for informational purposes only.

Files changed (3)

package/package.json +1 -1
package/src/tools/image-to-video.sdk-backup.ts +161 -0
package/src/tools/image-to-video.ts +192 -121

package/package.json — CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@mixio-pro/kalaasetu-mcp",
-  "version": "1.0.3",
+  "version": "1.0.5-beta",
   "description": "A powerful Model Context Protocol server providing AI tools for content generation and analysis",
   "type": "module",
   "module": "src/index.ts",

package/src/tools/image-to-video.sdk-backup.ts — ADDED

@@ -0,0 +1,161 @@
+import { z } from "zod";
+import * as fs from "fs";
+import * as path from "path";
+import { GoogleGenAI } from "@google/genai";
+async function wait(ms: number): Promise<void> {
+  return new Promise((resolve) => setTimeout(resolve, ms));
+}
+function fileToBase64(filePath: string): { data: string; mimeType: string } {
+  if (!fs.existsSync(filePath)) {
+    throw new Error(`File not found: ${filePath}`);
+  }
+  const buf = fs.readFileSync(filePath);
+  const data = Buffer.from(buf).toString("base64");
+  // Detect mime type from extension
+  const ext = path.extname(filePath).toLowerCase();
+  const mimeType = ext === '.jpg' || ext === '.jpeg' ? 'image/jpeg' :
+                   ext === '.png' ? 'image/png' :
+                   ext === '.webp' ? 'image/webp' : 'image/png';
+  return { data, mimeType };
+}
+export const imageToVideo = {
+  name: "imageToVideo",
+  description: "Generate videos from an image as starting first frame using Vertex Veo models (predictLongRunning + fetchPredictOperation).",
+  parameters: z.object({
+    prompt: z.string().describe("Text description for the video"),
+    image_path: z.string().optional().describe("Path to source image for image-to-video generation"),
+    aspect_ratio: z.string().optional().describe("Video aspect ratio: '16:9' or '9:16' (default: '9:16')"),
+    duration_seconds: z.number().optional().describe("Video duration in seconds: 4, 6, or 8 (default: 6)"),
+    resolution: z.string().optional().describe("Video resolution: '720p' or '1080p' (default: '720p')"),
+    negative_prompt: z.string().optional().describe("Text describing what not to include in the video"),
+    person_generation: z.string().optional().describe("Controls generation of people: 'allow_adult' (default for image-to-video) or 'allow_all'"),
+    reference_images: z.array(z.string()).optional().describe("Additional image paths for reference (max 3)"),
+    output_path: z.string().optional().describe("Output MP4 file path (if multiple predictions, index suffix is added)"),
+    gemini_api_key: z.string().optional().describe("Gemini API key (uses GEMINI_API_KEY env var if not provided)"),
+    model_id: z.string().optional().describe("Model ID (default: veo-2.0-generate-001)"),
+  }),
+  execute: async (args: {
+    prompt: string;
+    image_path?: string;
+    aspect_ratio?: string;
+    duration_seconds?: number;
+    resolution?: string;
+    negative_prompt?: string;
+    person_generation?: string;
+    reference_images?: string[];
+    output_path?: string;
+    gemini_api_key?: string;
+    model_id?: string;
+  }) => {
+    const apiKey = args.gemini_api_key || process.env.GEMINI_API_KEY;
+    if (!apiKey) {
+      throw new Error("Gemini API key is required. Set GEMINI_API_KEY environment variable or pass gemini_api_key parameter. Get one at https://aistudio.google.com/app/apikey");
+    }
+    const model = args.model_id || "veo-2.0-generate-001";
+    // Initialize Google GenAI client
+    const genai = new GoogleGenAI({ apiKey });
+    // Build config for video generation
+    const config: any = {};
+    if (args.duration_seconds !== undefined) {
+      config.duration_seconds = args.duration_seconds;
+    } else {
+      config.duration_seconds = 6; // default
+    }
+    if (args.aspect_ratio) {
+      config.aspect_ratio = args.aspect_ratio;
+    }
+    try {
+      // Start video generation operation
+      console.log(`Starting video generation with model: ${model}`);
+      let operation = await genai.models.generateVideos({
+        model,
+        prompt: args.prompt,
+        config,
+      });
+      console.log("Operation started, waiting for completion...");
+      // Poll until operation is complete (max 10 minutes)
+      let tries = 0;
+      const maxTries = 60; // 10 minutes with 10s intervals
+      while (!operation.done && tries < maxTries) {
+        await wait(10000); // Wait 10 seconds
+        tries++;
+        console.log(`Polling attempt ${tries}/${maxTries}...`);
+        operation = await genai.operations.getVideosOperation({
+          operation: operation,
+        });
+      }
+      if (!operation.done) {
+        throw new Error("Video generation timed out after 10 minutes");
+      }
+      console.log("Operation completed!");
+      console.log("Full Response:", JSON.stringify(operation.response, null, 2));
+      // Extract generated videos from response
+      const generatedVideos = operation.response?.generatedVideos || [];
+      if (!generatedVideos || generatedVideos.length === 0) {
+        const respStr = JSON.stringify(operation.response, null, 2);
+        return `Video generation completed but no videos found in response.\n\nFull Response:\n${respStr.slice(0, 2000)}${respStr.length > 2000 ? '\n...(truncated)' : ''}`;
+      }
+      // Download and save videos
+      const outputs: string[] = [];
+      for (let i = 0; i < generatedVideos.length; i++) {
+        const generatedVideo = generatedVideos[i];
+        const videoUri = generatedVideo?.video?.uri;
+        if (!videoUri) {
+          console.warn(`Video ${i} has no URI`);
+          continue;
+        }
+        console.log(`Downloading video ${i + 1}/${generatedVideos.length}...`);
+        // Download video from URI
+        const videoUrl = `${videoUri}&key=${apiKey}`;
+        const response = await fetch(videoUrl);
+        if (!response.ok) {
+          throw new Error(`Failed to download video: ${response.status} ${response.statusText}`);
+        }
+        const buffer = await response.arrayBuffer();
+        // Save video to file
+        const filePath = args.output_path
+          ? (i === 0 ? args.output_path : args.output_path.replace(/\.mp4$/i, `_${i}.mp4`))
+          : `video_output_${Date.now()}${i === 0 ? '' : '_' + i}.mp4`;
+        const absPath = path.resolve(filePath);
+        fs.writeFileSync(absPath, Buffer.from(buffer));
+        outputs.push(absPath);
+        console.log(`Saved video to: ${absPath}`);
+      }
+      if (outputs.length > 0) {
+        return `Video(s) saved successfully:\n${outputs.map((p, i) => `${i + 1}. ${p}`).join('\n')}`;
+      }
+      return "Video generation completed but no videos were saved.";
+    } catch (error: any) {
+      throw new Error(`Video generation failed: ${error.message || JSON.stringify(error)}`);
+    }
+  },
+};

package/src/tools/image-to-video.ts — CHANGED

@@ -1,161 +1,232 @@
-import { z } from "zod";
+// @ts-nocheck
 import * as fs from "fs";
+import { GoogleAuth } from "google-auth-library";
+import { exec } from "child_process";
 import * as path from "path";
-import { GoogleGenAI } from "@google/genai";
+import { z } from "zod";
 async function wait(ms: number): Promise<void> {
   return new Promise((resolve) => setTimeout(resolve, ms));
 }
-function fileToBase64(filePath: string): { data: string; mimeType: string } {
-  if (!fs.existsSync(filePath)) {
-    throw new Error(`File not found: ${filePath}`);
+async function fetchAccessToken(): Promise<string> {
+  try {
+    const auth = new GoogleAuth({ scopes: ["https://www.googleapis.com/auth/cloud-platform"] });
+    const client = await auth.getClient();
+    const token = await client.getAccessToken();
+    if (!token || typeof token !== "string") {
+      throw new Error("No token from GoogleAuth");
+    }
+    return token;
+  } catch (e) {
+    // Fallback to gcloud
+    return await new Promise((resolve, reject) => {
+      exec("gcloud auth print-access-token", (err, stdout, stderr) => {
+        if (err) {
+          reject(new Error(`Failed to fetch an access token (ADC and gcloud): ${stderr || err.message}`));
+          return;
+        }
+        const t = (stdout || "").trim();
+        if (!t) {
+          reject(new Error("Failed to fetch an access token: empty token from gcloud"));
+          return;
+        }
+        resolve(t);
+      });
+    });
+  }
+}
+function fileToBase64(path: string): { data: string; mimeType: string } {
+  if (!fs.existsSync(path)) {
+    throw new Error(`File not found: ${path}`);
   }
-  const buf = fs.readFileSync(filePath);
+  const buf = fs.readFileSync(path);
   const data = Buffer.from(buf).toString("base64");
-  // Detect mime type from extension
-  const ext = path.extname(filePath).toLowerCase();
-  const mimeType = ext === '.jpg' || ext === '.jpeg' ? 'image/jpeg' :
-                   ext === '.png' ? 'image/png' :
-                   ext === '.webp' ? 'image/webp' : 'image/png';
+  // Default to PNG if not sure, similar to existing code
+  const mimeType = "image/png";
   return { data, mimeType };
 }
-export const imageToVideo = {
-  name: "imageToVideo",
+export const imageToVideo = ({
+  name: "image_to_video",
   description: "Generate videos from an image as starting first frame using Vertex Veo models (predictLongRunning + fetchPredictOperation).",
   parameters: z.object({
     prompt: z.string().describe("Text description for the video"),
     image_path: z.string().optional().describe("Path to source image for image-to-video generation"),
+    last_frame_path: z.string().optional().describe("Path to last frame image to guide ending frame (optional)"),
     aspect_ratio: z.string().optional().describe("Video aspect ratio: '16:9' or '9:16' (default: '9:16')"),
-    duration_seconds: z.number().optional().describe("Video duration in seconds: 4, 6, or 8 (default: 6)"),
+    duration_seconds: z.string().optional().describe("Video duration in seconds: '4', '6', or '8' (default: '6')"),
     resolution: z.string().optional().describe("Video resolution: '720p' or '1080p' (default: '720p')"),
     negative_prompt: z.string().optional().describe("Text describing what not to include in the video"),
     person_generation: z.string().optional().describe("Controls generation of people: 'allow_adult' (default for image-to-video) or 'allow_all'"),
     reference_images: z.array(z.string()).optional().describe("Additional image paths for reference (max 3)"),
     output_path: z.string().optional().describe("Output MP4 file path (if multiple predictions, index suffix is added)"),
-    gemini_api_key: z.string().optional().describe("Gemini API key (uses GEMINI_API_KEY env var if not provided)"),
-    model_id: z.string().optional().describe("Model ID (default: veo-2.0-generate-001)"),
+    project_id: z.string().optional().describe("GCP Project ID (default: mixio-pro)"),
+    location_id: z.string().optional().describe("Vertex region (default: us-central1)"),
+    model_id: z.string().optional().describe("Model ID (default: veo-3.1-fast-generate-preview)"),
+    generate_audio: z.boolean().optional().describe("Boolean flag to enable generation of audio along with the video").default(false)
   }),
-  execute: async (args: {
-    prompt: string;
-    image_path?: string;
-    aspect_ratio?: string;
-    duration_seconds?: number;
-    resolution?: string;
-    negative_prompt?: string;
-    person_generation?: string;
-    reference_images?: string[];
-    output_path?: string;
-    gemini_api_key?: string;
-    model_id?: string;
-  }) => {
-    const apiKey = args.gemini_api_key || process.env.GEMINI_API_KEY;
-    if (!apiKey) {
-      throw new Error("Gemini API key is required. Set GEMINI_API_KEY environment variable or pass gemini_api_key parameter. Get one at https://aistudio.google.com/app/apikey");
-    }
+  async execute(args) {
+    const projectId = args.project_id || "mixio-pro";
+    const location = args.location_id || "us-central1";
+    const modelId = args.model_id || "veo-3.1-fast-generate-preview";
+    const token = await fetchAccessToken();
+    const url = `https://${location}-aiplatform.googleapis.com/v1/projects/${projectId}/locations/${location}/publishers/google/models/${modelId}:predictLongRunning`;
-    const model = args.model_id || "veo-2.0-generate-001";
-    // Initialize Google GenAI client
-    const genai = new GoogleGenAI({ apiKey });
-    // Build config for video generation
-    const config: any = {};
-    if (args.duration_seconds !== undefined) {
-      config.duration_seconds = args.duration_seconds;
-    } else {
-      config.duration_seconds = 6; // default
+    let imagePart: any = undefined;
+    if (args.image_path) {
+      const { data, mimeType } = fileToBase64(args.image_path);
+      imagePart = {
+        image: {
+          bytesBase64Encoded: data,
+          mimeType,
+        },
+      };
     }
-    if (args.aspect_ratio) {
-      config.aspect_ratio = args.aspect_ratio;
+    let lastFramePart: any = undefined;
+    if (args.last_frame_path) {
+      const { data, mimeType } = fileToBase64(args.last_frame_path);
+      lastFramePart = {
+        lastFrame: {
+          bytesBase64Encoded: data,
+          mimeType,
+        },
+      };
     }
-    try {
-      // Start video generation operation
-      console.log(`Starting video generation with model: ${model}`);
-      let operation = await genai.models.generateVideos({
-        model,
-        prompt: args.prompt,
-        config,
-      });
+    let referenceImages: any[] | undefined = undefined;
+    if (args.reference_images) {
+      let refImages: string[];
+      if (typeof args.reference_images === "string") {
+        if (args.reference_images.startsWith("[") && args.reference_images.endsWith("]")) {
+          try {
+            refImages = JSON.parse(args.reference_images);
+          } catch {
+            throw new Error("Invalid reference_images format");
+          }
+        } else {
+          refImages = [args.reference_images];
+        }
+      } else if (Array.isArray(args.reference_images)) {
+        refImages = args.reference_images;
+      } else {
+        throw new Error("Invalid reference_images: must be array or string");
+      }
-      console.log("Operation started, waiting for completion...");
-      // Poll until operation is complete (max 10 minutes)
-      let tries = 0;
-      const maxTries = 60; // 10 minutes with 10s intervals
-      while (!operation.done && tries < maxTries) {
-        await wait(10000); // Wait 10 seconds
-        tries++;
-        console.log(`Polling attempt ${tries}/${maxTries}...`);
-        operation = await genai.operations.getVideosOperation({
-          operation: operation,
+      if (refImages.length > 0) {
+        referenceImages = refImages.slice(0, 3).map((p) => {
+          const { data, mimeType } = fileToBase64(p);
+          return {
+            image: {
+              bytesBase64Encoded: data,
+              mimeType,
+            },
+            referenceType: "asset",
+          };
         });
       }
+    }
-      if (!operation.done) {
-        throw new Error("Video generation timed out after 10 minutes");
-      }
+    const personGeneration = args.person_generation || (args.image_path ? "allow_adult" : "allow_all");
-      console.log("Operation completed!");
-      console.log("Full Response:", JSON.stringify(operation.response, null, 2));
+    const instances: any[] = [
+      {
+        prompt: args.prompt,
+        ...(imagePart || {}),
+        ...(lastFramePart || {}),
+        ...(referenceImages ? { referenceImages } : {}),
+      },
+    ];
-      // Extract generated videos from response
-      const generatedVideos = operation.response?.generatedVideos || [];
-      if (!generatedVideos || generatedVideos.length === 0) {
-        const respStr = JSON.stringify(operation.response, null, 2);
-        return `Video generation completed but no videos found in response.\n\nFull Response:\n${respStr.slice(0, 2000)}${respStr.length > 2000 ? '\n...(truncated)' : ''}`;
-      }
+    const parameters: any = {
+      aspectRatio: args.aspect_ratio || "9:16",
+      durationSeconds: parseInt(args.duration_seconds) || 6,
+      resolution: args.resolution || "720p",
+      negativePrompt: args.negative_prompt,
+      generateAudio: args.generate_audio || false,
+      personGeneration,
+    };
-      // Download and save videos
-      const outputs: string[] = [];
-      for (let i = 0; i < generatedVideos.length; i++) {
-        const generatedVideo = generatedVideos[i];
-        const videoUri = generatedVideo?.video?.uri;
-        if (!videoUri) {
-          console.warn(`Video ${i} has no URI`);
-          continue;
-        }
+    const res = await fetch(url, {
+      method: "POST",
+      headers: {
+        Authorization: `Bearer ${token}`,
+        "Content-Type": "application/json",
+      },
+      body: JSON.stringify({ instances, parameters }),
+    });
-        console.log(`Downloading video ${i + 1}/${generatedVideos.length}...`);
-        // Download video from URI
-        const videoUrl = `${videoUri}&key=${apiKey}`;
-        const response = await fetch(videoUrl);
-        if (!response.ok) {
-          throw new Error(`Failed to download video: ${response.status} ${response.statusText}`);
-        }
-        const buffer = await response.arrayBuffer();
-        // Save video to file
-        const filePath = args.output_path
-          ? (i === 0 ? args.output_path : args.output_path.replace(/\.mp4$/i, `_${i}.mp4`))
-          : `video_output_${Date.now()}${i === 0 ? '' : '_' + i}.mp4`;
-        const absPath = path.resolve(filePath);
-        fs.writeFileSync(absPath, Buffer.from(buffer));
-        outputs.push(absPath);
-        console.log(`Saved video to: ${absPath}`);
-      }
+    if (!res.ok) {
+      const text = await res.text();
+      throw new Error(`Vertex request failed: ${res.status} ${text}`);
+    }
+    const op = await res.json();
+    const name: string = op.name || op.operation || "";
+    if (!name) {
+      throw new Error("Vertex did not return an operation name for long-running request");
+    }
-      if (outputs.length > 0) {
-        return `Video(s) saved successfully:\n${outputs.map((p, i) => `${i + 1}. ${p}`).join('\n')}`;
+    let current = op;
+    let done = !!op.done;
+    let tries = 0;
+    // Poll using fetchPredictOperation as per Vertex recommendation
+    const fetchUrl = `https://${location}-aiplatform.googleapis.com/v1/projects/${projectId}/locations/${location}/publishers/google/models/${modelId}:fetchPredictOperation`;
+    while (!done && tries < 60) {
+      await wait(10000);
+      const poll = await fetch(fetchUrl, {
+        method: "POST",
+        headers: {
+          Authorization: `Bearer ${token}`,
+          "Content-Type": "application/json",
+        },
+        body: JSON.stringify({ operationName: name }),
+      });
+      if (!poll.ok) {
+        const text = await poll.text();
+        throw new Error(`Vertex operation poll failed: ${poll.status} ${text}`);
       }
+      current = await poll.json();
+      done = !!current.done || !!current.response;
+      tries++;
+    }
+    const resp = current.response || current;
+    // Decode from response.videos[].bytesBase64Encoded only
+    const outputs: string[] = [];
+    const saveVideo = (base64: string, index: number) => {
+      if (!base64) return;
+      const filePath = args.output_path
+        ? (index === 0 ? args.output_path : args.output_path.replace(/\.mp4$/i, `_${index}.mp4`))
+        : `video_output_${Date.now()}${index === 0 ? '' : '_' + index}.mp4`;
+      const absPath = path.resolve(filePath);
+      const buf = Buffer.from(base64, 'base64');
+      fs.writeFileSync(absPath, buf);
+      outputs.push(absPath);
+    };
-      return "Video generation completed but no videos were saved.";
-    } catch (error: any) {
-      throw new Error(`Video generation failed: ${error.message || JSON.stringify(error)}`);
+    if (Array.isArray(resp?.videos) && resp.videos.length > 0) {
+      for (let i = 0; i < resp.videos.length; i++) {
+        const v = resp.videos[i] || {};
+        if (typeof v.bytesBase64Encoded === 'string') {
+          saveVideo(v.bytesBase64Encoded, i);
+        }
+      }
     }
+    if (outputs.length > 0) {
+      return `Video(s) saved: ${outputs.join(', ')}`;
+    }
+    // If nothing saved, return a concise summary plus head/tail snippets of JSON
+    let jsonStr = "";
+    try { jsonStr = JSON.stringify(resp); } catch {}
+    const head150 = jsonStr ? jsonStr.slice(0, 150) : "";
+    const tail50 = jsonStr ? jsonStr.slice(Math.max(0, jsonStr.length - 50)) : "";
+    return `Vertex operation done but no videos array present. operationName=${name}. json_head150=${head150} json_tail50=${tail50}`;
   },
-};
+});