npm - mulmocast - Versions diffs - 2.0.2 → 2.0.4 - Mend

mulmocast 2.0.2 → 2.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36)

package/README.md +22 -0
package/assets/templates/ghibli_comic_strips.json +1 -1
package/lib/actions/audio.js +2 -1
package/lib/actions/bundle.js +5 -2
package/lib/agents/image_genai_agent.js +1 -1
package/lib/agents/image_openai_agent.js +2 -2
package/lib/agents/index.d.ts +2 -1
package/lib/agents/index.js +2 -1
package/lib/agents/movie_genai_agent.js +1 -1
package/lib/agents/tts_gemini_agent.d.ts +5 -0
package/lib/agents/tts_gemini_agent.js +64 -0
package/lib/cli/commands/tool/scripting/builder.d.ts +1 -1
package/lib/cli/commands/tool/story_to_script/builder.d.ts +1 -1
package/lib/data/promptTemplates.d.ts +40 -10
package/lib/data/promptTemplates.js +55 -1
package/lib/data/templateDataSet.js +1 -1
package/lib/methods/mulmo_presentation_style.js +1 -1
package/lib/types/schema.d.ts +30 -30
package/lib/types/schema.js +4 -2
package/lib/types/type.d.ts +2 -0
package/lib/utils/context.d.ts +33 -33
package/lib/utils/ffmpeg_utils.d.ts +1 -0
package/lib/utils/ffmpeg_utils.js +23 -0
package/lib/utils/provider2agent.d.ts +10 -1
package/lib/utils/provider2agent.js +17 -8
package/lib/utils/utils.js +3 -0
package/package.json +7 -7
package/scripts/test/gpt.json +6 -0
package/scripts/test/image-2.png +0 -0
package/scripts/test/test_audio_gemini.json +67 -0
package/scripts/test/test_audio_gemini.json~ +67 -0
package/scripts/test/test_genai.json +17 -9
package/scripts/test/test_image_refs.json +1 -1
package/scripts/test/test_lipsync2.json +66 -0
package/scripts/test/test_lipsync2.json~ +24 -0
package/scripts/test/test_replicate.json +6 -6

package/README.md CHANGED Viewed

@@ -440,6 +440,28 @@ Options:
       --image_width        Image width (e.g., 400px, 50%, auto)         [string]
 ```
+```
+mulmo bundle <file>
+Generate bundle files
+Positionals:
+  file  Mulmo Script File                                    [string] [required]
+Options:
+      --version            Show version number                         [boolean]
+  -v, --verbose            verbose log     [boolean] [required] [default: false]
+  -h, --help               Show help                                   [boolean]
+  -o, --outdir             output dir                                   [string]
+  -b, --basedir            base dir                                     [string]
+  -l, --lang               target language
+  [string] [choices: "en", "ja", "fr", "es", "de", "zh-CN", "zh-TW", "ko", "it",
+                                                               "pt", "ar", "hi"]
+  -f, --force              Force regenerate           [boolean] [default: false]
+      --backup             create backup media file   [boolean] [default: false]
+  -p, --presentationStyle  Presentation Style                           [string]
+```
 ```
 mulmo tool <command>

package/assets/templates/ghibli_comic_strips.json CHANGED Viewed

@@ -13,7 +13,7 @@
     },
     "imageParams": {
       "provider": "google",
-      "model": "gemini-2.5-flash-image-preview",
+      "model": "gemini-2.5-flash-image",
       "style": "<style>Ghibli style multi-panel comic strips in landscape mode. Use speech bubbles with short, natural dialogue (1–6 words). Keep text minimal, like real comics. Let the art convey the story and emotions. Use the input image as the presenter.</style>",
       "images": {
         "presenter": {

package/lib/actions/audio.js CHANGED Viewed

@@ -2,7 +2,7 @@ import dotenv from "dotenv";
 import { GraphAI, TaskManager, GraphAILogger } from "graphai";
 import * as agents from "@graphai/vanilla";
 import { fileWriteAgent } from "@graphai/vanilla_node_agents";
-import { ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, ttsElevenlabsAgent, addBGMAgent, combineAudioFilesAgent, mediaMockAgent } from "../agents/index.js";
+import { ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, ttsGeminiAgent, ttsElevenlabsAgent, addBGMAgent, combineAudioFilesAgent, mediaMockAgent, } from "../agents/index.js";
 import { text2SpeechProviderSchema } from "../types/index.js";
 import { fileCacheAgentFilter, nijovoiceTextAgentFilter } from "../utils/filters.js";
 import { getAudioArtifactFilePath, getAudioFilePath, getOutputStudioFilePath, resolveDirPath, defaultBGMPath, mkdir, writingMessage } from "../utils/file.js";
@@ -221,6 +221,7 @@ const audioAgents = {
     ttsOpenaiAgent,
     ttsNijivoiceAgent,
     ttsGoogleAgent,
+    ttsGeminiAgent,
     ttsElevenlabsAgent,
     mediaMockAgent,
     addBGMAgent,

package/lib/actions/bundle.js CHANGED Viewed

@@ -58,8 +58,11 @@ export const mulmoViewerBundle = async (context) => {
     const zipper = new ZipBuilder(path.resolve(dir, zipFileName));
     // text
     const resultJson = [];
-    context.studio.script.beats.forEach((beat) => {
-        resultJson.push({ text: beat.text, duration: beat.duration, audioSources: {}, multiLinguals: {} });
+    context.studio.script.beats.forEach((beat, index) => {
+        const sudioBeats = context.studio.beats[index];
+        const { duration, startAt } = sudioBeats;
+        // console.log(context.studio.beats[index]);
+        resultJson.push({ text: beat.text, duration, startTime: startAt, endTime: (startAt ?? 0) + (duration ?? 0), audioSources: {}, multiLinguals: {} });
     });
     // audio
     for (const lang of bundleTargetLang) {

package/lib/agents/image_genai_agent.js CHANGED Viewed

@@ -71,7 +71,7 @@ export const imageGenAIAgent = async ({ namedInputs, params, config, }) => {
     }
     try {
         const ai = new GoogleGenAI({ apiKey });
-        if (model === "gemini-2.5-flash-image-preview") {
+        if (model === "gemini-2.5-flash-image" || model === "gemini-3-pro-image-preview") {
             const contents = getGeminiContents(prompt, aspectRatio, referenceImages);
             const response = await ai.models.generateContent({ model, contents });
             return geminiFlashResult(response);

package/lib/agents/image_openai_agent.js CHANGED Viewed

@@ -17,7 +17,7 @@ export const imageOpenaiAgent = async ({ namedInputs, params, config, }) => {
     const model = params.model ?? provider2ImageAgent["openai"].defaultModel;
     const openai = new OpenAI({ apiKey, baseURL });
     const size = (() => {
-        if (model === "gpt-image-1") {
+        if (model === "gpt-image-1" || model === "gpt-image-1-mini") {
             if (canvasSize.width > canvasSize.height) {
                 return "1536x1024";
             }
@@ -46,7 +46,7 @@ export const imageOpenaiAgent = async ({ namedInputs, params, config, }) => {
         n: 1,
         size,
     };
-    if (model === "gpt-image-1") {
+    if (model === "gpt-image-1" || model === "gpt-image-1-mini") {
         imageOptions.moderation = moderation || "auto";
         imageOptions.background = "opaque";
         if (quality) {

package/lib/agents/index.d.ts CHANGED Viewed

@@ -11,6 +11,7 @@ import ttsElevenlabsAgent from "./tts_elevenlabs_agent.js";
 import ttsNijivoiceAgent from "./tts_nijivoice_agent.js";
 import ttsOpenaiAgent from "./tts_openai_agent.js";
 import ttsGoogleAgent from "./tts_google_agent.js";
+import ttsGeminiAgent from "./tts_gemini_agent.js";
 import validateSchemaAgent from "./validate_schema_agent.js";
 import soundEffectReplicateAgent from "./sound_effect_replicate_agent.js";
 import lipSyncReplicateAgent from "./lipsync_replicate_agent.js";
@@ -19,4 +20,4 @@ import { browserlessAgent } from "@graphai/browserless_agent";
 import { textInputAgent } from "@graphai/input_agents";
 import { openAIAgent } from "@graphai/openai_agent";
 import { fileWriteAgent } from "@graphai/vanilla_node_agents";
-export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGenAIAgent, imageOpenaiAgent, imageReplicateAgent, tavilySearchAgent, movieGenAIAgent, movieReplicateAgent, mediaMockAgent, ttsElevenlabsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, validateSchemaAgent, soundEffectReplicateAgent, lipSyncReplicateAgent, puppeteerCrawlerAgent, };
+export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGenAIAgent, imageOpenaiAgent, imageReplicateAgent, tavilySearchAgent, movieGenAIAgent, movieReplicateAgent, mediaMockAgent, ttsElevenlabsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, ttsGeminiAgent, validateSchemaAgent, soundEffectReplicateAgent, lipSyncReplicateAgent, puppeteerCrawlerAgent, };

package/lib/agents/index.js CHANGED Viewed

@@ -11,6 +11,7 @@ import ttsElevenlabsAgent from "./tts_elevenlabs_agent.js";
 import ttsNijivoiceAgent from "./tts_nijivoice_agent.js";
 import ttsOpenaiAgent from "./tts_openai_agent.js";
 import ttsGoogleAgent from "./tts_google_agent.js";
+import ttsGeminiAgent from "./tts_gemini_agent.js";
 import validateSchemaAgent from "./validate_schema_agent.js";
 import soundEffectReplicateAgent from "./sound_effect_replicate_agent.js";
 import lipSyncReplicateAgent from "./lipsync_replicate_agent.js";
@@ -20,4 +21,4 @@ import { textInputAgent } from "@graphai/input_agents";
 import { openAIAgent } from "@graphai/openai_agent";
 // import * as vanilla from "@graphai/vanilla";
 import { fileWriteAgent } from "@graphai/vanilla_node_agents";
-export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGenAIAgent, imageOpenaiAgent, imageReplicateAgent, tavilySearchAgent, movieGenAIAgent, movieReplicateAgent, mediaMockAgent, ttsElevenlabsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, validateSchemaAgent, soundEffectReplicateAgent, lipSyncReplicateAgent, puppeteerCrawlerAgent, };
+export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGenAIAgent, imageOpenaiAgent, imageReplicateAgent, tavilySearchAgent, movieGenAIAgent, movieReplicateAgent, mediaMockAgent, ttsElevenlabsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, ttsGoogleAgent, ttsGeminiAgent, validateSchemaAgent, soundEffectReplicateAgent, lipSyncReplicateAgent, puppeteerCrawlerAgent, };

package/lib/agents/movie_genai_agent.js CHANGED Viewed

@@ -43,7 +43,7 @@ export const movieGenAIAgent = async ({ namedInputs, params, config, }) => {
             },
             image: undefined,
         };
-        if (model === "veo-3.0-generate-preview") {
+        if (model === "veo-3.0-generate-001" || model === "veo-3.1-generate-preview") {
             payload.config.durationSeconds = undefined;
         }
         if (imagePath) {

package/lib/agents/tts_gemini_agent.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+import type { AgentFunction, AgentFunctionInfo } from "graphai";
+import type { GoogleTTSAgentParams, AgentBufferResult, AgentTextInputs, AgentErrorResult } from "../types/agent.js";
+export declare const ttsGeminiAgent: AgentFunction<GoogleTTSAgentParams, AgentBufferResult | AgentErrorResult, AgentTextInputs>;
+declare const ttsGeminiAgentInfo: AgentFunctionInfo;
+export default ttsGeminiAgentInfo;

package/lib/agents/tts_gemini_agent.js ADDED Viewed

@@ -0,0 +1,64 @@
+import { GraphAILogger } from "graphai";
+import { GoogleGenAI } from "@google/genai";
+import { provider2TTSAgent } from "../utils/provider2agent.js";
+import { apiKeyMissingError, agentGenerationError, audioAction, audioFileTarget } from "../utils/error_cause.js";
+import { pcmToMp3 } from "../utils/ffmpeg_utils.js";
+export const ttsGeminiAgent = async ({ namedInputs, params, config, }) => {
+    const { text } = namedInputs;
+    const { voice, suppressError } = params;
+    const apiKey = config?.apiKey;
+    if (!apiKey) {
+        throw new Error("Google GenAI API key is required (GEMINI_API_KEY)", {
+            cause: apiKeyMissingError("ttsGeminiAgent", audioAction, "GEMINI_API_KEY"),
+        });
+    }
+    try {
+        const ai = new GoogleGenAI({ apiKey });
+        const response = await ai.models.generateContent({
+            model: "gemini-2.5-flash-preview-tts",
+            contents: [{ parts: [{ text }] }],
+            config: {
+                responseModalities: ["AUDIO"],
+                speechConfig: {
+                    voiceConfig: {
+                        prebuiltVoiceConfig: { voiceName: voice ?? provider2TTSAgent.gemini.defaultVoice },
+                    },
+                },
+            },
+        });
+        const inlineData = response.candidates?.[0]?.content?.parts?.[0]?.inlineData;
+        const pcmBase64 = inlineData?.data;
+        const mimeType = inlineData?.mimeType;
+        if (!pcmBase64)
+            throw new Error("No audio data returned");
+        // Extract sample rate from mimeType (e.g., "audio/L16;codec=pcm;rate=24000")
+        const rateMatch = mimeType?.match(/rate=(\d+)/);
+        const sampleRate = rateMatch ? parseInt(rateMatch[1]) : 24000;
+        const rawPcm = Buffer.from(pcmBase64, "base64");
+        return { buffer: await pcmToMp3(rawPcm, sampleRate) };
+    }
+    catch (e) {
+        if (suppressError) {
+            return {
+                error: e,
+            };
+        }
+        GraphAILogger.info(e);
+        throw new Error("TTS Gemini Error", {
+            cause: agentGenerationError("ttsGeminiAgent", audioAction, audioFileTarget),
+        });
+    }
+};
+const ttsGeminiAgentInfo = {
+    name: "ttsGeminiAgent",
+    agent: ttsGeminiAgent,
+    mock: ttsGeminiAgent,
+    samples: [],
+    description: "Google Gemini TTS agent",
+    category: ["tts"],
+    author: "Receptron Team",
+    repository: "https://github.com/receptron/mulmocast-cli/",
+    license: "MIT",
+    environmentVariables: ["GEMINI_API_KEY"],
+};
+export default ttsGeminiAgentInfo;

package/lib/cli/commands/tool/scripting/builder.d.ts CHANGED Viewed

@@ -16,7 +16,7 @@ export declare const builder: (yargs: Argv) => Argv<{
 } & {
     s: string;
 } & {
-    llm: "mock" | "openai" | "anthropic" | "gemini" | "groq" | undefined;
+    llm: "mock" | "openai" | "gemini" | "anthropic" | "groq" | undefined;
 } & {
     llm_model: string | undefined;
 }>;

package/lib/cli/commands/tool/story_to_script/builder.d.ts CHANGED Viewed

@@ -10,7 +10,7 @@ export declare const builder: (yargs: Argv) => Argv<{
 } & {
     beats_per_scene: number;
 } & {
-    llm: "mock" | "openai" | "anthropic" | "gemini" | "groq" | undefined;
+    llm: "mock" | "openai" | "gemini" | "anthropic" | "groq" | undefined;
 } & {
     llm_model: string | undefined;
 } & {

package/lib/data/promptTemplates.d.ts CHANGED Viewed

@@ -39,6 +39,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -58,7 +62,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -181,6 +184,10 @@ export declare const promptTemplates: ({
             style?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -200,7 +207,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -233,6 +239,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -252,7 +262,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -298,6 +307,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -317,7 +330,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -363,6 +375,10 @@ export declare const promptTemplates: ({
             provider: string;
             style: string;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -382,7 +398,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -434,6 +449,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -453,7 +472,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -486,6 +504,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -515,7 +537,6 @@ export declare const promptTemplates: ({
                 Presenter?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -548,6 +569,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -567,7 +592,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -613,6 +637,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -632,7 +660,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;
@@ -668,6 +695,10 @@ export declare const promptTemplates: ({
             provider?: undefined;
             model?: undefined;
         };
+        movieParams: {
+            provider: string;
+            model?: undefined;
+        };
         soundEffectParams: {
             provider: string;
         };
@@ -687,7 +718,6 @@ export declare const promptTemplates: ({
                 Teacher?: undefined;
             };
         };
-        movieParams?: undefined;
     };
     scriptName: string;
     systemPrompt: string;

package/lib/data/promptTemplates.js CHANGED Viewed

@@ -32,6 +32,9 @@ export const promptTemplates = [
                 },
                 style: "<style>AKIRA aesthetic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -149,6 +152,9 @@ export const promptTemplates = [
                 images: {},
                 provider: "openai",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -192,6 +198,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "A hand-drawn style illustration with a warm, nostalgic atmosphere. The background is rich with natural scenery—lush forests, cloudy skies, and traditional Japanese architecture. Characters have expressive eyes, soft facial features, and are portrayed with gentle lighting and subtle shading. The color palette is muted yet vivid, using earthy tones and watercolor-like textures. The overall scene feels magical and peaceful, with a sense of quiet wonder and emotional depth, reminiscent of classic 1980s and 1990s Japanese animation.",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -242,6 +251,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "<style>A multi panel comic strips. 1990s American workplace humor. Clean, minimalist line art with muted colors. One character is a nerdy office worker with glasses</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -285,6 +297,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "<style>Photo realistic and cinematic. Let the art convey the story and emotions without text. Use the image for the aspect ratio</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -337,6 +352,9 @@ export const promptTemplates = [
                 },
                 style: "<style>Dragon Ball/Dr. Slump aesthetic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -389,6 +407,9 @@ export const promptTemplates = [
                 },
                 style: "<style>Ghibli style</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -439,10 +460,13 @@ export const promptTemplates = [
                         type: "image",
                     },
                 },
-                model: "gemini-2.5-flash-image-preview",
+                model: "gemini-2.5-flash-image",
                 provider: "google",
                 style: "<style>Ghibli style multi-panel comic strips in landscape mode. Use speech bubbles with short, natural dialogue (1–6 words). Keep text minimal, like real comics. Let the art convey the story and emotions. Use the input image as the presenter.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -502,6 +526,9 @@ export const promptTemplates = [
                 },
                 style: "<style>Ghost in the shell aesthetic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -546,6 +573,9 @@ export const promptTemplates = [
                 images: {},
                 provider: "openai",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -590,6 +620,9 @@ export const promptTemplates = [
                 images: {},
                 provider: "openai",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -642,6 +675,9 @@ export const promptTemplates = [
                 },
                 style: "<style>One Piece aesthetic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -694,6 +730,9 @@ export const promptTemplates = [
                 },
                 style: "<style>Photo realistic, cinematic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -746,6 +785,9 @@ export const promptTemplates = [
                 },
                 style: "<style>Photo realistic, cinematic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -789,6 +831,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "<style>Ghibli style. Student (Taro) is a young teenager with a dark short hair with glasses. Teacher is a middle-aged man with grey hair and moustache.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -845,6 +890,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "<style>Photo realistic, cinematic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -898,6 +946,9 @@ export const promptTemplates = [
                 },
                 style: "<style>A dreamy, hyper-detailed anime style that blends photorealistic backgrounds with vibrant, saturated colors. The skies are often filled with luminous clouds, dazzling sunsets, or star-filled nights, rendered with a glowing, almost ethereal quality. Urban landscapes and rural scenery are meticulously illustrated, with attention to tiny details like reflections in puddles, neon lights, or the texture of grass swaying in the wind. Characters are drawn with soft, expressive features, standing out against the breathtaking environments, creating a sense of emotional depth and lyrical atmosphere. The overall mood is cinematic, romantic, and filled with a sense of fleeting beauty and longing.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },
@@ -944,6 +995,9 @@ export const promptTemplates = [
             imageParams: {
                 style: "<style>Photo realistic, cinematic.</style>",
             },
+            movieParams: {
+                provider: "replicate",
+            },
             soundEffectParams: {
                 provider: "replicate",
             },

package/lib/data/templateDataSet.js CHANGED Viewed

@@ -41,7 +41,7 @@ export const templateDataSet = {
         "```",
     ghibli_comic_strips: "Another AI will generate comic strips for each beat based on the text description of that beat. Mention the reference in one of beats, if it exists. Use the JSON below as a template.\n" +
         "```JSON\n" +
-        `{"$mulmocast":{"version":"1.1","credit":"closing"},"title":"[TITLE: Brief, engaging title for the topic]","lang":"en","references":[{"url":"[SOURCE_URL: URL of the source material]","title":"[SOURCE_TITLE: Title of the referenced article, or paper]","type":"[SOURCE_TYPE: article, paper]"}],"beats":[{"text":"[OPENING_BEAT: Introduce the topic with a hook. Reference the source material and set up why this topic matters. Usually 2-3 sentences that grab attention and provide context.]"},{"text":"[MAIN_CONCEPT: Define or explain the core concept/idea. This should be the central focus of your narrative. Keep it clear and accessible.]"},{"text":"[SUPPORTING_DETAIL_1: Additional context, examples, or elaboration that helps illustrate the main concept. This could include how it works, why it's important, or real-world applications.]"},{"text":"[SUPPORTING_DETAIL_2: Continue with more examples, deeper explanation, or different aspects of the topic if needed.]"},{"text":"[ADDITIONAL_BEATS: Add more beats as necessary to fully explore the topic. Complex topics may require 6-10+ beats to cover adequately. Each beat should advance the narrative or provide valuable information.]"},{"text":"[CONCLUSION/IMPACT: Wrap up with the significance, implications, or key takeaway. Help the audience understand why this matters to them.]"}],"canvasSize":{"width":1536,"height":1024},"imageParams":{"provider":"google","model":"gemini-2.5-flash-image-preview","style":"<style>Ghibli style multi-panel comic strips in landscape mode. Use speech bubbles with short, natural dialogue (1–6 words). Keep text minimal, like real comics. Let the art convey the story and emotions. Use the input image as the presenter.</style>","images":{"presenter":{"type":"image","source":{"kind":"url","url":"https://raw.githubusercontent.com/receptron/mulmocast-media/refs/heads/main/characters/ghibli_presenter.png"}}}}}\n` +
+        `{"$mulmocast":{"version":"1.1","credit":"closing"},"title":"[TITLE: Brief, engaging title for the topic]","lang":"en","references":[{"url":"[SOURCE_URL: URL of the source material]","title":"[SOURCE_TITLE: Title of the referenced article, or paper]","type":"[SOURCE_TYPE: article, paper]"}],"beats":[{"text":"[OPENING_BEAT: Introduce the topic with a hook. Reference the source material and set up why this topic matters. Usually 2-3 sentences that grab attention and provide context.]"},{"text":"[MAIN_CONCEPT: Define or explain the core concept/idea. This should be the central focus of your narrative. Keep it clear and accessible.]"},{"text":"[SUPPORTING_DETAIL_1: Additional context, examples, or elaboration that helps illustrate the main concept. This could include how it works, why it's important, or real-world applications.]"},{"text":"[SUPPORTING_DETAIL_2: Continue with more examples, deeper explanation, or different aspects of the topic if needed.]"},{"text":"[ADDITIONAL_BEATS: Add more beats as necessary to fully explore the topic. Complex topics may require 6-10+ beats to cover adequately. Each beat should advance the narrative or provide valuable information.]"},{"text":"[CONCLUSION/IMPACT: Wrap up with the significance, implications, or key takeaway. Help the audience understand why this matters to them.]"}],"canvasSize":{"width":1536,"height":1024},"imageParams":{"provider":"google","model":"gemini-2.5-flash-image","style":"<style>Ghibli style multi-panel comic strips in landscape mode. Use speech bubbles with short, natural dialogue (1–6 words). Keep text minimal, like real comics. Let the art convey the story and emotions. Use the input image as the presenter.</style>","images":{"presenter":{"type":"image","source":{"kind":"url","url":"https://raw.githubusercontent.com/receptron/mulmocast-media/refs/heads/main/characters/ghibli_presenter.png"}}}}}\n` +
         "```",
     ghost_comic: "Another AI will generate images for each beat based on the image prompt of that beat. Mention the reference in one of beats, if it exists. Use the JSON below as a template.\n" +
         "```JSON\n" +

package/lib/methods/mulmo_presentation_style.js CHANGED Viewed

@@ -91,7 +91,7 @@ export const MulmoPresentationStyleMethods = {
     },
     getMovieAgentInfo(presentationStyle, beat) {
         const movieParams = { ...presentationStyle.movieParams, ...beat?.movieParams };
-        const movieProvider = text2MovieProviderSchema.parse(movieParams?.provider);
+        const movieProvider = text2MovieProviderSchema.parse(movieParams?.provider ?? defaultProviders.text2movie);
         const agentInfo = provider2MovieAgent[movieProvider];
         return {
             agent: agentInfo.agentName,