npm - @r16t/multimodal-mcp - Versions diffs - 1.2.2 → 1.2.3 - Mend

@r16t/multimodal-mcp 1.2.2 → 1.2.3

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.

Files changed (3) hide show

package/build/providers/google.js +25 -19
package/build/providers/openai.js +1 -1
package/package.json +1 -1

package/build/providers/google.js CHANGED Viewed

@@ -18,12 +18,13 @@ export class GoogleProvider {
         this.apiKey = apiKey;
     }
     async generateImage(params) {
-        const response = await fetch(`${GEMINI_BASE_URL}/models/imagen-4:generateImages?key=${this.apiKey}`, {
+        const response = await fetch(`${GEMINI_BASE_URL}/models/imagen-4.0-generate-001:predict?key=${this.apiKey}`, {
             method: "POST",
             headers: { "Content-Type": "application/json" },
             body: JSON.stringify({
-                prompt: params.prompt,
-                config: {
+                instances: [{ prompt: params.prompt }],
+                parameters: {
+                    sampleCount: 1,
                     aspectRatio: params.aspectRatio,
                     ...params.providerOptions,
                 },
@@ -37,7 +38,7 @@ export class GoogleProvider {
         return {
             data: Buffer.from(base64, "base64"),
             mimeType: "image/png",
-            metadata: { model: "imagen-4", provider: "google" },
+            metadata: { model: "imagen-4.0-generate-001", provider: "google" },
         };
     }
     async editImage(params) {
@@ -50,8 +51,8 @@ export class GoogleProvider {
                         parts: [
                             { text: params.prompt },
                             {
-                                inline_data: {
-                                    mime_type: params.imageMimeType,
+                                inlineData: {
+                                    mimeType: params.imageMimeType,
                                     data: base64Image,
                                 },
                             },
@@ -82,22 +83,27 @@ export class GoogleProvider {
         };
     }
     async generateVideo(params) {
-        const requestBody = {
+        const instance = {
             prompt: params.prompt,
-            config: {
-                aspectRatio: params.aspectRatio,
-                durationSeconds: params.duration,
-                ...params.providerOptions,
-            },
         };
         if (params.imageData) {
             const base64Image = params.imageData.toString("base64");
-            requestBody.image = {
-                bytesBase64Encoded: base64Image,
-                mimeType: params.imageMimeType ?? "image/png",
+            instance.image = {
+                inlineData: {
+                    mimeType: params.imageMimeType ?? "image/png",
+                    data: base64Image,
+                },
             };
         }
-        const submitResponse = await fetch(`${GEMINI_BASE_URL}/models/veo-3.1:predictLongRunning?key=${this.apiKey}`, {
+        const requestBody = {
+            instances: [instance],
+            parameters: {
+                aspectRatio: params.aspectRatio,
+                durationSeconds: params.duration,
+                ...params.providerOptions,
+            },
+        };
+        const submitResponse = await fetch(`${GEMINI_BASE_URL}/models/veo-3.1-generate-preview:predictLongRunning?key=${this.apiKey}`, {
             method: "POST",
             headers: { "Content-Type": "application/json" },
             body: JSON.stringify(requestBody),
@@ -116,7 +122,7 @@ export class GoogleProvider {
         return {
             data,
             mimeType: "video/mp4",
-            metadata: { model: "veo-3.1", provider: "google", operationName: operation.name },
+            metadata: { model: "veo-3.1-generate-preview", provider: "google", operationName: operation.name },
         };
     }
     async generateAudio(params) {
@@ -128,8 +134,8 @@ export class GoogleProvider {
             body: JSON.stringify({
                 contents: [{ parts: [{ text: params.text }] }],
                 generationConfig: {
-                    response_modalities: ["AUDIO"],
-                    speech_config: {
+                    responseModalities: ["AUDIO"],
+                    speechConfig: {
                         voiceConfig: {
                             prebuiltVoiceConfig: { voiceName: voice },
                         },

package/build/providers/openai.js CHANGED Viewed

@@ -60,7 +60,7 @@ export class OpenAIProvider {
         const createParams = {
             model: "sora-2",
             prompt: params.prompt,
-            duration: params.duration,
+            seconds: String(params.duration),
             ...params.providerOptions,
         };
         if (params.imageData) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@r16t/multimodal-mcp",
-  "version": "1.2.2",
+  "version": "1.2.3",
   "description": "Multi-provider media generation MCP server",
   "type": "module",
   "main": "build/index.js",