npm - @felores/kie-ai-mcp-server - Versions diffs - 3.0.1 → 3.2.0 - Mend

@felores/kie-ai-mcp-server 3.0.1 → 3.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/dist/index.js CHANGED

@@ -5,7 +5,7 @@ import { CallToolRequestSchema, ErrorCode, ListToolsRequestSchema, ListResources
 import { KieAiClient } from "./kie-ai-client.js";
 import { TaskDatabase } from "./database.js";
 import { z } from "zod";
-import { NanoBananaImageSchema, Veo3GenerateSchema, SunoGenerateSchema, ElevenLabsTTSSchema, ElevenLabsSoundEffectsSchema, ByteDanceSeedanceVideoSchema, ByteDanceSeedreamImageSchema, QwenImageSchema, RunwayAlephVideoSchema, WanVideoSchema, MidjourneyGenerateSchema, OpenAI4oImageSchema, FluxKontextImageSchema, RecraftRemoveBackgroundSchema, IdeogramReframeSchema, KlingVideoSchema, HailuoVideoSchema, SoraVideoSchema, Flux2ImageSchema, WanAnimateSchema, ZImageSchema, GrokImagineSchema, InfiniTalkSchema, KlingAvatarSchema, TopazUpscaleImageSchema, } from "./types.js";
+import { NanoBananaImageSchema, Veo3GenerateSchema, SunoGenerateSchema, ElevenLabsTTSSchema, ElevenLabsSoundEffectsSchema, ByteDanceSeedanceVideoSchema, ByteDanceSeedreamImageSchema, QwenImageSchema, RunwayAlephVideoSchema, Wan27VideoSchema, MidjourneyGenerateSchema, GptImage2Schema, FluxKontextImageSchema, RecraftRemoveBackgroundSchema, IdeogramReframeSchema, KlingVideoSchema, HailuoVideoSchema, SoraVideoSchema, Flux2ImageSchema, WanAnimateSchema, ZImageSchema, GrokImagineSchema, InfiniTalkSchema, KlingAvatarSchema, TopazUpscaleImageSchema, HappyHorseVideoSchema, } from "./types.js";
 class KieAiMcpServer {
     server;
     client;
@@ -17,7 +17,7 @@ class KieAiMcpServer {
             "nano_banana_image",
             "bytedance_seedream_image",
             "qwen_image",
-            "openai_4o_image",
+            "gpt_image_2",
             "flux_kontext_image",
             "flux2_image",
             "z_image",
@@ -33,6 +33,7 @@ class KieAiMcpServer {
             "bytedance_seedance_video",
             "wan_video",
             "wan_animate",
+            "happyhorse_video",
             "hailuo_video",
             "kling_video",
             "runway_aleph_video",
@@ -53,7 +54,7 @@ class KieAiMcpServer {
     constructor() {
         this.server = new Server({
             name: "kie-ai-mcp-server",
-            version: "3.0.1",
+            version: "3.2.0",
         });
         // Initialize client with config from environment
         this.config = {
@@ -614,66 +615,92 @@ class KieAiMcpServer {
                 },
                 {
                     name: "bytedance_seedance_video",
-                    description: "Generate videos using ByteDance Seedance models (unified tool for both text-to-video and image-to-video)",
+                    description: "Generate videos with ByteDance Seedance 2.0 — multimodal inputs (image/video/audio references), native audio generation, standard and fast modes",
                     inputSchema: {
                         type: "object",
                         properties: {
                             prompt: {
                                 type: "string",
-                                description: "Text prompt for video generation (max 10000 characters)",
-                                minLength: 1,
-                                maxLength: 10000,
+                                description: "Text prompt for video generation (3-20000 characters)",
+                                minLength: 3,
+                                maxLength: 20000,
                             },
-                            image_url: {
+                            mode: {
+                                type: "string",
+                                description: "Generation mode — standard (seedance-2, higher quality) or fast (seedance-2-fast, iterative workflows)",
+                                enum: ["standard", "fast"],
+                                default: "standard",
+                            },
+                            first_frame_url: {
                                 type: "string",
-                                description: "URL of input image for image-to-video generation (optional - if not provided, uses text-to-video)",
+                                description: "URL of image to use as the first frame (optional)",
                                 format: "uri",
                             },
-                            quality: {
+                            last_frame_url: {
                                 type: "string",
-                                description: "Model quality level - lite for faster generation, pro for higher quality",
-                                enum: ["lite", "pro"],
-                                default: "lite",
+                                description: "URL of image to use as the last frame (optional)",
+                                format: "uri",
+                            },
+                            reference_image_urls: {
+                                type: "array",
+                                description: "Reference images for style/subject guidance (up to 9)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 9,
+                            },
+                            reference_video_urls: {
+                                type: "array",
+                                description: "Reference videos for motion/style guidance (up to 3)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 3,
+                            },
+                            reference_audio_urls: {
+                                type: "array",
+                                description: "Reference audio for sound-guided generation (up to 3)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 3,
                             },
                             aspect_ratio: {
                                 type: "string",
                                 description: "Aspect ratio of the generated video",
-                                enum: ["1:1", "9:16", "16:9", "4:3", "3:4", "21:9", "9:21"],
+                                enum: [
+                                    "1:1",
+                                    "9:16",
+                                    "16:9",
+                                    "4:3",
+                                    "3:4",
+                                    "21:9",
+                                    "9:21",
+                                    "adaptive",
+                                ],
                                 default: "16:9",
                             },
                             resolution: {
                                 type: "string",
-                                description: "Video resolution - 480p for faster generation, 720p for balance, 1080p for higher quality",
-                                enum: ["480p", "720p", "1080p"],
+                                description: "Video resolution — 480p for faster, 720p for balance",
+                                enum: ["480p", "720p"],
                                 default: "720p",
                             },
                             duration: {
-                                type: "string",
-                                description: "Duration of video in seconds (2-12)",
-                                pattern: "^[2-9]|1[0-2]$",
-                                default: "5",
-                            },
-                            camera_fixed: {
-                                type: "boolean",
-                                description: "Whether to fix the camera position",
-                                default: false,
-                            },
-                            seed: {
                                 type: "integer",
-                                description: "Random seed to control video generation. Use -1 for random",
-                                minimum: -1,
-                                maximum: 2147483647,
-                                default: -1,
+                                description: "Duration of video in seconds (4-15)",
+                                minimum: 4,
+                                maximum: 15,
+                                default: 5,
                             },
-                            enable_safety_checker: {
+                            generate_audio: {
                                 type: "boolean",
-                                description: "Enable content safety checking",
+                                description: "Generate native audio for the video",
                                 default: true,
                             },
-                            end_image_url: {
-                                type: "string",
-                                description: "URL of image the video should end with (image-to-video only)",
-                                format: "uri",
+                            web_search: {
+                                type: "boolean",
+                                description: "Enable web search to enhance prompt understanding",
+                                default: false,
+                            },
+                            nsfw_checker: {
+                                type: "boolean",
+                                description: "Enable NSFW content filtering",
+                                default: false,
                             },
                             callBackUrl: {
                                 type: "string",
@@ -1211,70 +1238,41 @@ class KieAiMcpServer {
                     },
                 },
                 {
-                    name: "openai_4o_image",
-                    description: "Generate images using OpenAI GPT-4o models (unified tool for text-to-image, image editing, and image variants)",
+                    name: "gpt_image_2",
+                    description: "Generate images using GPT Image 2 (text-to-image and image-to-image with up to 16 reference images)",
                     inputSchema: {
                         type: "object",
                         properties: {
                             prompt: {
                                 type: "string",
-                                description: "Text prompt describing the desired image (max 5000 characters)",
-                                maxLength: 5000,
+                                description: "Text prompt describing the desired image (max 20000 characters)",
+                                maxLength: 20000,
                             },
-                            filesUrl: {
+                            input_urls: {
                                 type: "array",
-                                description: "Array of up to 5 image URLs for editing or variants",
-                                items: {
-                                    type: "string",
-                                    format: "uri",
-                                },
-                                maxItems: 5,
+                                description: "Array of up to 16 image URLs for image-to-image mode. Omit for text-to-image.",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 16,
                             },
-                            size: {
+                            aspect_ratio: {
                                 type: "string",
                                 description: "Image aspect ratio",
-                                enum: ["1:1", "3:2", "2:3"],
-                                default: "1:1",
-                            },
-                            nVariants: {
-                                type: "string",
-                                description: "Number of image variations to generate",
-                                enum: ["1", "2", "4"],
-                                default: "4",
+                                enum: ["auto", "1:1", "9:16", "16:9", "4:3", "3:4"],
+                                default: "auto",
                             },
-                            maskUrl: {
+                            resolution: {
                                 type: "string",
-                                description: "Mask image URL for precise editing (black areas will be modified, white areas preserved)",
-                                format: "uri",
+                                description: "Output resolution",
+                                enum: ["1K", "2K", "4K"],
+                                default: "1K",
                             },
                             callBackUrl: {
                                 type: "string",
                                 description: "Optional: URL for task completion notifications (uses KIE_AI_CALLBACK_URL env var if not provided)",
                                 format: "uri",
                             },
-                            isEnhance: {
-                                type: "boolean",
-                                description: "Enable prompt enhancement for specialized scenarios like 3D renders",
-                                default: false,
-                            },
-                            uploadCn: {
-                                type: "boolean",
-                                description: "Route uploads via China servers",
-                                default: false,
-                            },
-                            enableFallback: {
-                                type: "boolean",
-                                description: "Enable automatic fallback to backup models if GPT-4o is unavailable",
-                                default: true,
-                            },
-                            fallbackModel: {
-                                type: "string",
-                                description: "Backup model to use when fallback is enabled",
-                                enum: ["GPT_IMAGE_1", "FLUX_MAX"],
-                                default: "FLUX_MAX",
-                            },
                         },
-                        required: [],
+                        required: ["prompt"],
                     },
                 },
                 {
@@ -1349,57 +1347,135 @@ class KieAiMcpServer {
                 },
                 {
                     name: "wan_video",
-                    description: "Generate videos using Alibaba Wan 2.5 models (unified tool for both text-to-video and image-to-video)",
+                    description: "Generate videos using Alibaba Wan 2.7 (text-to-video, image-to-video, reference-to-video, video-edit with native audio support)",
                     inputSchema: {
                         type: "object",
                         properties: {
+                            mode: {
+                                type: "string",
+                                description: "Generation mode: text-to-video (default), image-to-video, reference-to-video, or video-edit. Auto-detected from parameters if omitted.",
+                                enum: [
+                                    "text-to-video",
+                                    "image-to-video",
+                                    "reference-to-video",
+                                    "video-edit",
+                                ],
+                            },
                             prompt: {
                                 type: "string",
-                                description: "Text prompt for video generation (max 800 characters)",
+                                description: "Text prompt for video generation (max 5000 characters)",
                                 minLength: 1,
-                                maxLength: 800,
+                                maxLength: 5000,
                             },
-                            image_url: {
+                            negative_prompt: {
+                                type: "string",
+                                description: "Negative prompt to describe content to avoid (max 500 characters)",
+                                maxLength: 500,
+                            },
+                            audio_url: {
                                 type: "string",
-                                description: "URL of input image for image-to-video generation (optional - if not provided, uses text-to-video)",
+                                description: "Audio URL for text-to-video with audio (T2V mode only)",
                                 format: "uri",
                             },
-                            aspect_ratio: {
+                            first_frame_url: {
                                 type: "string",
-                                description: "Aspect ratio of the generated video (text-to-video only)",
-                                enum: ["16:9", "9:16", "1:1"],
-                                default: "16:9",
+                                description: "URL of first frame image for image-to-video mode",
+                                format: "uri",
+                            },
+                            last_frame_url: {
+                                type: "string",
+                                description: "URL of last frame image for image-to-video mode",
+                                format: "uri",
+                            },
+                            first_clip_url: {
+                                type: "string",
+                                description: "URL of first video clip for image-to-video mode",
+                                format: "uri",
+                            },
+                            driving_audio_url: {
+                                type: "string",
+                                description: "Audio URL to drive facial expressions (I2V mode)",
+                                format: "uri",
+                            },
+                            reference_image: {
+                                type: "array",
+                                description: "Reference images for reference-to-video mode (up to 5)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 5,
+                            },
+                            reference_video: {
+                                type: "array",
+                                description: "Reference videos for reference-to-video mode (up to 5)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 5,
+                            },
+                            reference_voice: {
+                                type: "string",
+                                description: "Voice reference URL for R2V mode",
+                                format: "uri",
+                            },
+                            first_frame: {
+                                type: "string",
+                                description: "First frame image URL for R2V mode",
+                                format: "uri",
+                            },
+                            video_url_edit: {
+                                type: "string",
+                                description: "Video URL to edit (video-edit mode)",
+                                format: "uri",
+                            },
+                            reference_image_edit: {
+                                type: "string",
+                                description: "Reference image URL for video-edit mode",
+                                format: "uri",
+                            },
+                            audio_setting: {
+                                type: "string",
+                                description: "Audio handling for video-edit: auto or origin",
+                                enum: ["auto", "origin"],
                             },
                             resolution: {
                                 type: "string",
-                                description: "Video resolution - 720p for faster generation, 1080p for higher quality",
+                                description: "Video resolution",
                                 enum: ["720p", "1080p"],
                                 default: "1080p",
                             },
-                            duration: {
+                            ratio: {
                                 type: "string",
-                                description: "Duration of video in seconds (image-to-video only)",
-                                enum: ["5", "10"],
-                                default: "5",
+                                description: "Aspect ratio of the generated video",
+                                enum: ["16:9", "9:16", "1:1", "4:3", "3:4"],
+                                default: "16:9",
                             },
-                            negative_prompt: {
-                                type: "string",
-                                description: "Negative prompt to describe content to avoid (max 500 characters)",
-                                maxLength: 500,
-                                default: "",
+                            duration: {
+                                type: "integer",
+                                description: "Duration in seconds (2-15)",
+                                minimum: 2,
+                                maximum: 15,
+                                default: 5,
                             },
-                            enable_prompt_expansion: {
+                            prompt_extend: {
                                 type: "boolean",
-                                description: "Whether to enable prompt rewriting using LLM (improves short prompts but increases processing time)",
+                                description: "Enable prompt rewriting using LLM for better results",
                                 default: true,
                             },
+                            watermark: {
+                                type: "boolean",
+                                description: "Add watermark to generated video",
+                                default: false,
+                            },
                             seed: {
                                 type: "integer",
-                                description: "Random seed for reproducible results",
+                                description: "Random seed for reproducible results (0-2147483647)",
+                                minimum: 0,
+                            },
+                            nsfw_checker: {
+                                type: "boolean",
+                                description: "Enable NSFW content filter",
+                                default: false,
                             },
                             callBackUrl: {
                                 type: "string",
-                                description: "Optional: URL for task completion notifications (uses KIE_AI_CALLBACK_URL env var if not provided)",
+                                description: "Optional: URL for task completion notifications",
                                 format: "uri",
                             },
                         },
@@ -1762,6 +1838,89 @@ class KieAiMcpServer {
                         required: ["video_url", "image_url"],
                     },
                 },
+                {
+                    name: "happyhorse_video",
+                    description: "Generate videos using Alibaba HappyHorse 1.0 (text-to-video, image-to-video, reference-to-video with up to 9 images, video-edit with native audio)",
+                    inputSchema: {
+                        type: "object",
+                        properties: {
+                            mode: {
+                                type: "string",
+                                description: "Generation mode: text-to-video (default), image-to-video, reference-to-video, or video-edit. Auto-detected from parameters if omitted.",
+                                enum: [
+                                    "text-to-video",
+                                    "image-to-video",
+                                    "reference-to-video",
+                                    "video-edit",
+                                ],
+                            },
+                            prompt: {
+                                type: "string",
+                                description: "Text prompt for video generation (max 5000 characters)",
+                                minLength: 1,
+                                maxLength: 5000,
+                            },
+                            image_urls: {
+                                type: "array",
+                                description: "Input image URL for image-to-video mode (max 1)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 1,
+                            },
+                            reference_image: {
+                                type: "array",
+                                description: "Reference images for reference-to-video mode (up to 9)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 9,
+                            },
+                            video_url: {
+                                type: "string",
+                                description: "Video URL to edit (video-edit mode)",
+                                format: "uri",
+                            },
+                            reference_image_edit: {
+                                type: "array",
+                                description: "Reference images for video-edit mode (up to 5)",
+                                items: { type: "string", format: "uri" },
+                                maxItems: 5,
+                            },
+                            audio_setting: {
+                                type: "string",
+                                description: "Audio handling for video-edit: auto or origin",
+                                enum: ["auto", "origin"],
+                            },
+                            resolution: {
+                                type: "string",
+                                description: "Video resolution",
+                                enum: ["720p", "1080p"],
+                                default: "1080p",
+                            },
+                            aspect_ratio: {
+                                type: "string",
+                                description: "Aspect ratio of the generated video",
+                                enum: ["16:9", "9:16", "1:1", "4:3", "3:4"],
+                                default: "16:9",
+                            },
+                            duration: {
+                                type: "integer",
+                                description: "Duration in seconds (3-15)",
+                                minimum: 3,
+                                maximum: 15,
+                                default: 5,
+                            },
+                            seed: {
+                                type: "integer",
+                                description: "Random seed for reproducible results (0-2147483647)",
+                                minimum: 0,
+                            },
+                            callBackUrl: {
+                                type: "string",
+                                description: "Optional: URL for task completion notifications",
+                                format: "uri",
+                            },
+                        },
+                        required: ["prompt"],
+                    },
+                },
                 {
                     name: "sora_video",
                     description: "Generate videos using OpenAI's Sora 2 models (unified tool for text-to-video, image-to-video, and storyboard generation with standard/high quality)",
@@ -1856,14 +2015,16 @@ class KieAiMcpServer {
                         return await this.handleKlingAvatar(args);
                     case "midjourney_generate":
                         return await this.handleMidjourneyGenerate(args);
-                    case "openai_4o_image":
-                        return await this.handleOpenAI4oImage(args);
+                    case "gpt_image_2":
+                        return await this.handleGptImage2(args);
                     case "flux_kontext_image":
                         return await this.handleFluxKontextImage(args);
                     case "runway_aleph_video":
                         return await this.handleRunwayAlephVideo(args);
                     case "wan_video":
                         return await this.handleWanVideo(args);
+                    case "happyhorse_video":
+                        return await this.handleHappyHorseVideo(args);
                     case "topaz_upscale_image":
                         return await this.handleTopazUpscaleImage(args);
                     case "recraft_remove_background":
@@ -1928,9 +2089,9 @@ class KieAiMcpServer {
                         },
                     },
                     {
-                        uri: "kie://models/openai-4o-image",
-                        name: "OpenAI GPT-4o Image",
-                        description: "Creative variants (up to 4), mask editing, limited aspect ratios",
+                        uri: "kie://models/gpt-image-2",
+                        name: "GPT Image 2",
+                        description: "Text-to-image and image-to-image with up to 16 reference images",
                         mimeType: "text/markdown",
                         annotations: {
                             audience: ["assistant"],
@@ -1960,8 +2121,8 @@ class KieAiMcpServer {
                     },
                     {
                         uri: "kie://models/bytedance-seedance",
-                        name: "ByteDance Seedance",
-                        description: "Professional video generation with lite/pro quality modes",
+                        name: "ByteDance Seedance 2.0",
+                        description: "Multimodal video generation with native audio, image/video/audio references, standard and fast modes",
                         mimeType: "text/markdown",
                         annotations: {
                             audience: ["assistant"],
@@ -1970,8 +2131,18 @@ class KieAiMcpServer {
                     },
                     {
                         uri: "kie://models/wan-video",
-                        name: "Wan Video 2.5",
-                        description: "Fast video generation for social media content",
+                        name: "Wan 2.7 Video",
+                        description: "Multi-mode video generation: T2V, I2V, R2V, video-edit with audio",
+                        mimeType: "text/markdown",
+                        annotations: {
+                            audience: ["assistant"],
+                            priority: 0.6,
+                        },
+                    },
+                    {
+                        uri: "kie://models/happyhorse-video",
+                        name: "HappyHorse 1.0 Video",
+                        description: "Multi-mode video: T2V, I2V, R2V (up to 9 refs), video-edit with audio",
                         mimeType: "text/markdown",
                         annotations: {
                             audience: ["assistant"],
@@ -2431,25 +2602,6 @@ class KieAiMcpServer {
                             errorMessage = apiData.failMsg;
                         }
                     }
-                    else if (localTask?.api_type === "openai-4o-image") {
-                        // OpenAI 4o Image-specific status mapping
-                        const successFlag = apiData.successFlag;
-                        if (successFlag === 1)
-                            status = "completed";
-                        else if (successFlag === 2)
-                            status = "failed";
-                        else if (successFlag === 0)
-                            status = "processing";
-                        // Extract result URLs from OpenAI 4o response
-                        if (apiData.response?.result_urls &&
-                            apiData.response.result_urls.length > 0) {
-                            resultUrl = apiData.response.result_urls[0]; // Use first image URL
-                        }
-                        // Extract error message for OpenAI 4o
-                        if (apiData.errorMessage) {
-                            errorMessage = apiData.errorMessage;
-                        }
-                    }
                     else if (localTask?.api_type === "flux-kontext-image") {
                         // Flux Kontext Image-specific status mapping
                         const successFlag = apiData.successFlag;
@@ -2594,7 +2746,7 @@ class KieAiMcpServer {
                     "nano-banana-image",
                     "bytedance-seedream-image",
                     "qwen-image",
-                    "openai-4o-image",
+                    "gpt-image-2",
                     "flux-kontext-image",
                     "topaz-upscale",
                     "recraft-remove-background",
@@ -2612,6 +2764,7 @@ class KieAiMcpServer {
                     "kling-3.0-video",
                     "bytedance-seedance-video",
                     "wan-video",
+                    "happyhorse-video",
                     "hailuo",
                     "runway-aleph-video",
                 ];
@@ -3029,10 +3182,8 @@ class KieAiMcpServer {
             request.callBackUrl = this.getCallbackUrl(request.callBackUrl);
             const response = await this.client.generateByteDanceSeedanceVideo(request);
             if (response.code === 200 && response.data?.taskId) {
-                // Determine mode for user feedback
-                const isImageToVideo = !!request.image_url;
-                const mode = isImageToVideo ? "Image-to-Video" : "Text-to-Video";
-                const quality = request.quality || "lite";
+                const mode = request.mode || "standard";
+                const hasFrameInput = !!request.first_frame_url;
                 // Store task in database
                 await this.db.createTask({
                     task_id: response.data.taskId,
@@ -3046,24 +3197,35 @@ class KieAiMcpServer {
                             text: JSON.stringify({
                                 success: true,
                                 task_id: response.data.taskId,
-                                message: `ByteDance Seedance ${mode} generation task created successfully`,
+                                message: `ByteDance Seedance 2.0 ${mode} generation task created successfully`,
                                 parameters: {
-                                    mode: mode,
-                                    quality: quality,
+                                    mode,
                                     prompt: request.prompt.substring(0, 100) +
                                         (request.prompt.length > 100 ? "..." : ""),
                                     aspect_ratio: request.aspect_ratio || "16:9",
                                     resolution: request.resolution || "720p",
-                                    duration: request.duration || "5",
-                                    ...(isImageToVideo && { image_url: request.image_url }),
-                                    ...(request.end_image_url && {
-                                        end_image_url: request.end_image_url,
+                                    duration: request.duration || 5,
+                                    generate_audio: request.generate_audio !== false,
+                                    ...(hasFrameInput && {
+                                        first_frame_url: request.first_frame_url,
+                                    }),
+                                    ...(request.last_frame_url && {
+                                        last_frame_url: request.last_frame_url,
+                                    }),
+                                    ...(request.reference_image_urls?.length && {
+                                        reference_images: request.reference_image_urls.length,
+                                    }),
+                                    ...(request.reference_video_urls?.length && {
+                                        reference_videos: request.reference_video_urls.length,
+                                    }),
+                                    ...(request.reference_audio_urls?.length && {
+                                        reference_audios: request.reference_audio_urls.length,
                                     }),
                                 },
                                 next_steps: [
                                     "Use get_task_status to check generation progress",
                                     "Task completion will be sent to the provided callback URL",
-                                    `${mode} generation typically takes 2-5 minutes depending on quality and complexity`,
+                                    `${mode} mode generation typically takes 2-5 minutes depending on duration and complexity`,
                                 ],
                             }, null, 2),
                         },
@@ -3078,26 +3240,28 @@ class KieAiMcpServer {
         catch (error) {
             if (error instanceof z.ZodError) {
                 return this.formatError("bytedance_seedance_video", error, {
-                    prompt: "Required: Text prompt for video generation (max 10000 characters)",
-                    image_url: "Optional: URL of input image for image-to-video mode",
-                    quality: "Optional: Model quality - lite (faster) or pro (higher quality, default: lite)",
+                    prompt: "Required: Text prompt for video generation (3-20000 characters)",
+                    mode: 'Optional: Generation mode — "standard" or "fast" (default: standard)',
+                    first_frame_url: "Optional: URL of image to use as first frame",
+                    last_frame_url: "Optional: URL of image to use as last frame",
+                    reference_image_urls: "Optional: Reference images for style guidance (up to 9)",
+                    reference_video_urls: "Optional: Reference videos for motion guidance (up to 3)",
+                    reference_audio_urls: "Optional: Reference audio for sound-guided generation (up to 3)",
                     aspect_ratio: "Optional: Video aspect ratio (default: 16:9)",
-                    resolution: "Optional: Video resolution - 480p/720p/1080p (default: 720p)",
-                    duration: "Optional: Video duration in seconds 2-12 (default: 5)",
-                    camera_fixed: "Optional: Fix camera position (default: false)",
-                    seed: "Optional: Random seed for reproducible results (default: -1 for random)",
-                    enable_safety_checker: "Optional: Enable content safety checking (default: true)",
-                    end_image_url: "Optional: URL of ending image (image-to-video only)",
-                    callBackUrl: "Optional: URL for task completion notifications (uses KIE_AI_CALLBACK_URL env var if not provided)",
+                    resolution: 'Optional: Video resolution — "480p" or "720p" (default: 720p)',
+                    duration: "Optional: Video duration in seconds 4-15 (default: 5)",
+                    generate_audio: "Optional: Generate native audio (default: true)",
+                    web_search: "Optional: Enable web search for prompt enhancement (default: false)",
+                    nsfw_checker: "Optional: Enable NSFW content filtering (default: false)",
+                    callBackUrl: "Optional: URL for task completion notifications",
                 });
             }
             return this.formatError("bytedance_seedance_video", error, {
-                prompt: "Required: Text prompt for video generation (max 10000 characters)",
-                image_url: "Optional: URL of input image for image-to-video mode",
-                quality: "Optional: Model quality - lite or pro",
+                prompt: "Required: Text prompt for video generation",
+                mode: 'Optional: "standard" or "fast"',
                 aspect_ratio: "Optional: Video aspect ratio",
-                resolution: "Optional: Video resolution",
-                duration: "Optional: Video duration in seconds 2-12",
+                resolution: 'Optional: "480p" or "720p"',
+                duration: "Optional: Duration in seconds 4-15",
                 callBackUrl: "Optional: URL for task completion notifications",
             });
         }
@@ -3653,28 +3817,18 @@ class KieAiMcpServer {
             });
         }
     }
-    async handleOpenAI4oImage(args) {
+    async handleGptImage2(args) {
         try {
-            const request = OpenAI4oImageSchema.parse(args);
-            // Use intelligent callback URL fallback
+            const request = GptImage2Schema.parse(args);
             request.callBackUrl = this.getCallbackUrl(request.callBackUrl);
-            const response = await this.client.generateOpenAI4oImage(request);
+            const response = await this.client.generateGptImage2(request);
             if (response.code === 200 && response.data?.taskId) {
-                // Determine mode for user feedback
-                const hasPrompt = !!request.prompt;
-                const hasImages = request.filesUrl && request.filesUrl.length > 0;
-                const hasMask = !!request.maskUrl;
-                let modeDisplay = "Text-to-Image";
-                if (hasMask && hasImages) {
-                    modeDisplay = "Image Editing";
-                }
-                else if (hasImages && !hasMask) {
-                    modeDisplay = "Image Variants";
-                }
-                // Store task in database
+                const mode = request.input_urls?.length
+                    ? "Image-to-Image"
+                    : "Text-to-Image";
                 await this.db.createTask({
                     task_id: response.data.taskId,
-                    api_type: "openai-4o-image",
+                    api_type: "gpt-image-2",
                     status: "pending",
                 });
                 return {
@@ -3684,32 +3838,85 @@ class KieAiMcpServer {
                             text: JSON.stringify({
                                 success: true,
                                 task_id: response.data.taskId,
-                                message: `OpenAI 4o Image ${modeDisplay} task created successfully`,
+                                message: `GPT Image 2 ${mode} task created successfully`,
                                 parameters: {
-                                    mode: modeDisplay,
-                                    prompt: request.prompt
-                                        ? request.prompt.substring(0, 100) +
-                                            (request.prompt.length > 100 ? "..." : "")
-                                        : undefined,
-                                    size: request.size || "1:1",
-                                    n_variants: request.nVariants || "4",
-                                    is_enhance: request.isEnhance || false,
-                                    enable_fallback: request.enableFallback !== false,
-                                    fallback_model: request.fallbackModel || "FLUX_MAX",
-                                    ...(hasImages && {
-                                        files_url: request.filesUrl,
-                                    }),
-                                    ...(hasMask && {
-                                        mask_url: request.maskUrl,
+                                    mode,
+                                    prompt: request.prompt.substring(0, 100) +
+                                        (request.prompt.length > 100 ? "..." : ""),
+                                    aspect_ratio: request.aspect_ratio || "auto",
+                                    resolution: request.resolution || "1K",
+                                    ...(request.input_urls && {
+                                        input_urls: request.input_urls,
                                     }),
                                 },
                                 next_steps: [
                                     `Use get_task_status with task_id: ${response.data.taskId} to check progress`,
                                     'Generated images will be available when status is "completed"',
                                 ],
-                                usage_examples: [
-                                    `get_task_status: {"task_id": "${response.data.taskId}"}`,
-                                    `list_tasks: {"limit": 10}`,
+                            }, null, 2),
+                        },
+                    ],
+                };
+            }
+            else {
+                throw new Error(response.msg || "Failed to create GPT Image 2 task");
+            }
+        }
+        catch (error) {
+            if (error instanceof z.ZodError) {
+                return this.formatError("gpt_image_2", error, {
+                    prompt: "Required: Text prompt describing the desired image (max 20000 chars)",
+                    input_urls: "Optional: Array of up to 16 image URLs for image-to-image mode",
+                    aspect_ratio: "Optional: auto, 1:1, 9:16, 16:9, 4:3, 3:4 (default: auto)",
+                    resolution: "Optional: 1K, 2K, 4K (default: 1K)",
+                });
+            }
+            return this.formatError("gpt_image_2", error, {
+                prompt: "Required: Text prompt describing the desired image (max 20000 chars)",
+                input_urls: "Optional: Array of up to 16 image URLs for image-to-image mode",
+                aspect_ratio: "Optional: auto, 1:1, 9:16, 16:9, 4:3, 3:4 (default: auto)",
+                resolution: "Optional: 1K, 2K, 4K (default: 1K)",
+            });
+        }
+    }
+    async handleHappyHorseVideo(args) {
+        try {
+            const request = HappyHorseVideoSchema.parse(args);
+            request.callBackUrl = this.getCallbackUrl(request.callBackUrl);
+            const response = await this.client.generateHappyHorseVideo(request);
+            if (response.code === 200 && response.data?.taskId) {
+                const mode = request.mode ||
+                    (request.video_url
+                        ? "video-edit"
+                        : request.reference_image?.length
+                            ? "reference-to-video"
+                            : request.image_urls?.length
+                                ? "image-to-video"
+                                : "text-to-video");
+                await this.db.createTask({
+                    task_id: response.data.taskId,
+                    api_type: "happyhorse-video",
+                    status: "pending",
+                });
+                return {
+                    content: [
+                        {
+                            type: "text",
+                            text: JSON.stringify({
+                                success: true,
+                                task_id: response.data.taskId,
+                                message: `HappyHorse 1.0 ${mode} task created successfully`,
+                                parameters: {
+                                    mode,
+                                    prompt: request.prompt.substring(0, 100) +
+                                        (request.prompt.length > 100 ? "..." : ""),
+                                    resolution: request.resolution || "1080p",
+                                    aspect_ratio: request.aspect_ratio || "16:9",
+                                    duration: request.duration || 5,
+                                },
+                                next_steps: [
+                                    `Use get_task_status with task_id: ${response.data.taskId} to check progress`,
+                                    'Video will be available when status is "completed"',
                                 ],
                             }, null, 2),
                         },
@@ -3717,35 +3924,22 @@ class KieAiMcpServer {
                 };
             }
             else {
-                throw new Error(response.msg || "Failed to create OpenAI 4o Image task");
+                throw new Error(response.msg || "Failed to create HappyHorse task");
             }
         }
         catch (error) {
             if (error instanceof z.ZodError) {
-                return this.formatError("openai_4o_image", error, {
-                    prompt: "Optional: Text prompt describing the desired image (max 5000 chars)",
-                    filesUrl: "Optional: Array of up to 5 image URLs for editing or variants",
-                    size: "Required: Image aspect ratio (1:1, 3:2, 2:3, default: 1:1)",
-                    nVariants: "Optional: Number of image variations (1, 2, 4, default: 4)",
-                    maskUrl: "Optional: Mask image URL for precise editing (black=edit, white=preserve)",
-                    callBackUrl: "Optional: Webhook URL for completion notifications",
-                    isEnhance: "Optional: Enable prompt enhancement for specialized scenarios (default: false)",
-                    uploadCn: "Optional: Route uploads via China servers (default: false)",
-                    enableFallback: "Optional: Enable automatic fallback to backup models (default: true)",
-                    fallbackModel: "Optional: Backup model choice (GPT_IMAGE_1, FLUX_MAX, default: FLUX_MAX)",
+                return this.formatError("happyhorse_video", error, {
+                    prompt: "Required: Text prompt for video generation (max 5000 chars)",
+                    mode: "Optional: text-to-video, image-to-video, reference-to-video, video-edit",
+                    image_urls: "I2V: Single image URL",
+                    reference_image: "R2V: Up to 9 reference image URLs",
+                    video_url: "Video Edit: Video URL to edit",
                 });
             }
-            return this.formatError("openai_4o_image", error, {
-                prompt: "Optional: Text prompt describing the desired image (max 5000 chars)",
-                filesUrl: "Optional: Array of up to 5 image URLs for editing or variants",
-                size: "Required: Image aspect ratio (1:1, 3:2, 2:3, default: 1:1)",
-                nVariants: "Optional: Number of image variations (1, 2, 4, default: 4)",
-                maskUrl: "Optional: Mask image URL for precise editing (black=edit, white=preserve)",
-                callBackUrl: "Optional: Webhook URL for completion notifications",
-                isEnhance: "Optional: Enable prompt enhancement for specialized scenarios (default: false)",
-                uploadCn: "Optional: Route uploads via China servers (default: false)",
-                enableFallback: "Optional: Enable automatic fallback to backup models (default: true)",
-                fallbackModel: "Optional: Backup model choice (GPT_IMAGE_1, FLUX_MAX, default: FLUX_MAX)",
+            return this.formatError("happyhorse_video", error, {
+                prompt: "Required: Text prompt for video generation (max 5000 chars)",
+                mode: "Optional: text-to-video, image-to-video, reference-to-video, video-edit",
             });
         }
     }
@@ -3915,16 +4109,20 @@ class KieAiMcpServer {
     }
     async handleWanVideo(args) {
         try {
-            const request = WanVideoSchema.parse(args);
-            // Use intelligent callback URL fallback
+            const request = Wan27VideoSchema.parse(args);
             request.callBackUrl = this.getCallbackUrl(request.callBackUrl);
             const response = await this.client.generateWanVideo(request);
             if (response.code === 200 && response.data?.taskId) {
-                // Determine mode for user feedback
-                const isImageToVideo = !!request.image_url;
-                const mode = isImageToVideo ? "Image-to-Video" : "Text-to-Video";
-                const resolution = request.resolution || "1080p";
-                // Store task in database
+                const mode = request.mode ||
+                    (request.video_url_edit
+                        ? "video-edit"
+                        : request.reference_image?.length || request.reference_video?.length
+                            ? "reference-to-video"
+                            : request.first_frame_url ||
+                                request.last_frame_url ||
+                                request.first_clip_url
+                                ? "image-to-video"
+                                : "text-to-video");
                 await this.db.createTask({
                     task_id: response.data.taskId,
                     api_type: "wan-video",
@@ -3937,27 +4135,18 @@ class KieAiMcpServer {
                             text: JSON.stringify({
                                 success: true,
                                 task_id: response.data.taskId,
-                                message: `Alibaba Wan 2.5 ${mode} generation task created successfully`,
+                                message: `Wan 2.7 ${mode} task created successfully`,
                                 parameters: {
-                                    mode: mode,
+                                    mode,
                                     prompt: request.prompt.substring(0, 100) +
                                         (request.prompt.length > 100 ? "..." : ""),
-                                    resolution: resolution,
-                                    negative_prompt: request.negative_prompt || "",
-                                    enable_prompt_expansion: request.enable_prompt_expansion !== false,
-                                    ...(request.seed !== undefined && { seed: request.seed }),
-                                    ...(isImageToVideo && {
-                                        image_url: request.image_url,
-                                        duration: request.duration || "5",
-                                    }),
-                                    ...(!isImageToVideo && {
-                                        aspect_ratio: request.aspect_ratio || "16:9",
-                                    }),
+                                    resolution: request.resolution || "1080p",
+                                    ratio: request.ratio || "16:9",
+                                    duration: request.duration || 5,
                                 },
                                 next_steps: [
-                                    "Use get_task_status to check generation progress",
-                                    "Task completion will be sent to the provided callback URL",
-                                    `${mode} generation typically takes 2-6 minutes depending on resolution and complexity`,
+                                    `Use get_task_status with task_id: ${response.data.taskId} to check progress`,
+                                    'Video will be available when status is "completed"',
                                 ],
                             }, null, 2),
                         },
@@ -3965,29 +4154,23 @@ class KieAiMcpServer {
                 };
             }
             else {
-                throw new Error(response.msg || "Failed to create Wan 2.5 video generation task");
+                throw new Error(response.msg || "Failed to create Wan 2.7 video task");
             }
         }
         catch (error) {
             if (error instanceof z.ZodError) {
                 return this.formatError("wan_video", error, {
-                    prompt: "Required: Text prompt for video generation (max 800 characters)",
-                    image_url: "Optional: URL of input image for image-to-video mode",
-                    aspect_ratio: "Optional: Video aspect ratio for text-to-video (16:9, 9:16, 1:1, default: 16:9)",
-                    resolution: "Optional: Video resolution - 720p or 1080p (default: 1080p)",
-                    duration: "Optional: Video duration for image-to-video - 5 or 10 seconds (default: 5)",
-                    negative_prompt: "Optional: Negative prompt to describe content to avoid (max 500 characters)",
-                    enable_prompt_expansion: "Optional: Enable prompt rewriting using LLM (default: true)",
-                    seed: "Optional: Random seed for reproducible results",
-                    callBackUrl: "Optional: URL for task completion notifications (uses KIE_AI_CALLBACK_URL env var if not provided)",
+                    prompt: "Required: Text prompt for video generation (max 5000 chars)",
+                    mode: "Optional: text-to-video, image-to-video, reference-to-video, video-edit",
+                    first_frame_url: "I2V: First frame image URL",
+                    last_frame_url: "I2V: Last frame image URL",
+                    reference_image: "R2V: Up to 5 reference image URLs",
+                    video_url_edit: "Video Edit: Video URL to edit",
                 });
             }
             return this.formatError("wan_video", error, {
                 prompt: "Required: Text prompt for video generation",
-                image_url: "Optional: URL of input image",
-                aspect_ratio: "Optional: Video aspect ratio",
-                resolution: "Optional: Video resolution",
-                callBackUrl: "Optional: URL for task completion notifications",
+                mode: "Optional: text-to-video, image-to-video, reference-to-video, video-edit",
             });
         }
     }
@@ -4617,6 +4800,12 @@ class KieAiMcpServer {
                 category: "video",
                 quality: "standard",
             },
+            {
+                name: "happyhorse_video",
+                status: "available",
+                category: "video",
+                quality: "standard",
+            },
             {
                 name: "runway_aleph",
                 status: "available",
@@ -4636,7 +4825,7 @@ class KieAiMcpServer {
                 quality: "professional",
             },
             {
-                name: "openai_4o_image",
+                name: "gpt_image_2",
                 status: "available",
                 category: "image",
                 quality: "professional",
@@ -4850,10 +5039,10 @@ The system automatically detects user intent:
 ## 🔧 Intelligent Parameter Selection
 ### **Video Parameters**
-- **ByteDance Seedance**:
-  - Default: \`quality: "lite"\`, \`resolution: "720p"\`
-  - High Quality: \`quality: "pro"\`, \`resolution: "1080p"\`
-  - Professional 720p: \`quality: "pro"\`, \`resolution: "720p"\`
+- **ByteDance Seedance 2.0**:
+  - Default: \`mode: "standard"\`, \`resolution: "720p"\`, \`generate_audio: true\`
+  - Fast/Iterative: \`mode: "fast"\`, \`resolution: "480p"\`
+  - Higher Quality: \`mode: "standard"\`, \`resolution: "720p"\`
 - **Veo3**:
   - Default: \`model: "veo3_fast"\`
@@ -5001,7 +5190,7 @@ These guidelines ensure optimal balance between quality requirements and cost ma
 | Model | Max Resolution | Quality Modes | Duration | Speed | Key Strengths |
 |-------|---------------|---------------|----------|-------|---------------|
 | **Google Veo3** | 1080p | veo3/veo3_fast | Default | Medium | Premium cinematic quality, 1080p support |
-| **ByteDance Seedance** | 1080p | lite/pro | 2-12s | Medium | Professional standard, quality modes |
+| **ByteDance Seedance 2.0** | 720p | standard/fast | 4-15s | Medium | Multimodal refs, native audio, adaptive aspect |
 | **Wan Video 2.5** | 1080p | Single | 5-10s | Fast | Quick generation, social media |
 | **Runway Aleph** | 1080p | Single | Source | Medium | Video-to-video editing, style transfer |
@@ -5009,32 +5198,33 @@ These guidelines ensure optimal balance between quality requirements and cost ma
 ### Default Settings (Cost-Effective)
 - **Resolution**: 720p (unless user requests high quality)
-- **Quality Mode**: lite/fast (unless user requests high quality)
-- **Model**: ByteDance Seedance lite as default
+- **Quality Mode**: standard (switch to fast only when the user explicitly asks for "fast")
+- **Model**: ByteDance Seedance 2.0 standard as default
 ### High Quality Upgrades
-- **User says "high quality"**: Pro models + 1080p
-- **User says "high quality in 720p"**: Pro models + 720p
+- **User says "high quality"**: Standard mode + 720p (already default)
 - **User says "cinematic"**: Veo3 model
-- **User says "fast/quick"**: Lite models + 720p (already default)
+- **User says "fast/quick"**: Seedance fast mode + 480p
 ## Use Case Recommendations
 - **Cinematic/Premium Content**: Veo3 (model: "veo3")
-- **Professional/Commercial**: ByteDance Seedance (quality: "pro")
-- **Social Media/Fast**: Wan Video 2.5 or ByteDance lite
+- **Professional/Commercial**: ByteDance Seedance 2.0 (mode: "standard")
+- **Social Media/Fast**: ByteDance Seedance 2.0 fast or Wan 2.7 Video
+- **Multimodal (refs + audio)**: ByteDance Seedance 2.0 with reference URLs
 - **Video Editing**: Runway Aleph (existing video transformation)
 ## Parameter Mapping
 ### Input Methods
 - **Text-to-Video**: All models (prompt only)
-- **Image-to-Video**: Veo3 (imageUrls), ByteDance (image_url), Wan (image_url)
+- **Image-to-Video**: Veo3 (imageUrls), Seedance (first_frame_url), Wan (first_frame_url)
 - **Video-to-Video**: Runway Aleph (videoUrl)
+- **Multimodal Refs**: Seedance 2.0 (reference_image_urls, reference_video_urls, reference_audio_urls)
 ### Quality Control
 - **Veo3**: model selection (veo3 vs veo3_fast)
-- **ByteDance**: quality parameter (lite vs pro) + resolution
+- **Seedance 2.0**: mode (standard vs fast) + resolution
 - **Wan**: resolution parameter only
 - **Runway**: implicit (no quality settings)
@@ -5053,7 +5243,7 @@ These guidelines ensure optimal balance between quality requirements and cost ma
 ### **CRITICAL COST CONTROL RULES**
 - **Resolution**: ALWAYS use \`"720p"\` unless user explicitly requests high quality
 - **Quality Level**: ALWAYS use **lite/fast** versions unless user requests "high quality"
-- **Model Selection**: bytedance_seedance_video with \`quality: "lite"\` as default
+- **Model Selection**: bytedance_seedance_video with \`mode: "standard"\` as default
 ### **Quality Upgrade Logic**
@@ -5151,15 +5341,16 @@ These guidelines ensure optimal balance between quality requirements and cost ma
             "bytedance-seedream": "bytedance_seedream-v4-text-to-image.md",
             "qwen-image": "qwen_text-to-image.md",
             "flux-kontext": "flux_kontext_image.md",
-            "openai-4o-image": "openai_4o-image.md",
+            "gpt-image-2": "gpt_image-2.md",
             "nano-banana": "google_nano-banana.md",
             "topaz-upscale": "topaz_image-upscale.md",
             "recraft-bg-removal": "recraft_remove_background.md",
             "ideogram-reframe": "ideogram_reframe_image.md",
             // Video models
             veo3: "google_veo3-text-to-image.md",
-            "bytedance-seedance": "bytedance_seedance-v1-lite-text-to-video.md",
-            "wan-video": "wan_2-5-text-to-video.md",
+            "bytedance-seedance": "bytedance_seedance-2.md",
+            "wan-video": "wan_2-7-text-to-video.md",
+            "happyhorse-video": "happyhorse_text-to-video.md",
             "runway-aleph": "runway_aleph_video.md",
             "kling-v2-1": "kling_v2-1-pro.md",
             "kling-v2-5": "kling_v2-5-turbo-text-to-video-pro.md",