npm - mulmocast - Versions diffs - 1.1.4 → 1.1.6 - Mend

mulmocast 1.1.4 → 1.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (77)

package/lib/actions/audio.d.ts +0 -1
package/lib/actions/audio.js +18 -13
package/lib/actions/image_agents.d.ts +3 -12
package/lib/actions/image_agents.js +12 -8
package/lib/actions/images.js +3 -1
package/lib/actions/movie.js +1 -3
package/lib/actions/translate.js +13 -31
package/lib/agents/image_openai_agent.js +4 -1
package/lib/agents/lipsync_replicate_agent.js +10 -3
package/lib/cli/commands/audio/handler.js +1 -1
package/lib/cli/commands/image/handler.js +1 -1
package/lib/cli/commands/movie/handler.js +1 -1
package/lib/cli/commands/pdf/handler.js +1 -1
package/lib/cli/helpers.d.ts +1 -4
package/lib/cli/helpers.js +3 -2
package/lib/mcp/server.js +1 -1
package/lib/methods/mulmo_presentation_style.d.ts +5 -5
package/lib/methods/mulmo_presentation_style.js +14 -8
package/lib/methods/mulmo_script.js +4 -1
package/lib/methods/mulmo_studio_context.d.ts +1 -0
package/lib/methods/mulmo_studio_context.js +8 -0
package/lib/types/agent.d.ts +4 -0
package/lib/types/schema.d.ts +712 -8
package/lib/types/schema.js +6 -2
package/lib/types/type.d.ts +1 -1
package/lib/utils/const.js +1 -1
package/lib/utils/context.d.ts +401 -34
package/lib/utils/context.js +95 -56
package/lib/utils/file.d.ts +1 -1
package/lib/utils/file.js +5 -2
package/lib/utils/filters.d.ts +1 -0
package/lib/utils/filters.js +8 -0
package/lib/utils/preprocess.d.ts +15 -2
package/lib/utils/preprocess.js +3 -3
package/lib/utils/provider2agent.d.ts +3 -2
package/lib/utils/provider2agent.js +20 -2
package/lib/utils/string.d.ts +1 -1
package/lib/utils/string.js +11 -8
package/package.json +2 -1
package/scripts/templates/image_refs.json +1 -0
package/scripts/templates/voice_over.json +1 -0
package/scripts/test/gpt.json +33 -0
package/scripts/test/mulmo_story.json +11 -0
package/scripts/test/test.json +64 -0
package/scripts/test/test1.json +41 -0
package/scripts/test/test2.json +66 -0
package/scripts/test/test_audio.json +152 -0
package/scripts/test/test_audio_instructions.json +70 -0
package/scripts/test/test_beats.json +59 -0
package/scripts/test/test_captions.json +53 -0
package/scripts/test/test_elevenlabs_models.json +194 -0
package/scripts/test/test_en.json +29 -0
package/scripts/test/test_hello.json +18 -0
package/scripts/test/test_hello_google.json +26 -0
package/scripts/test/test_html.json +67 -0
package/scripts/test/test_image_refs.json +50 -0
package/scripts/test/test_images.json +49 -0
package/scripts/test/test_lang.json +87 -0
package/scripts/test/test_layout.json +153 -0
package/scripts/test/test_lipsync.json +62 -0
package/scripts/test/test_loop.json +35 -0
package/scripts/test/test_media.json +245 -0
package/scripts/test/test_mixed_providers.json +92 -0
package/scripts/test/test_movie.json +40 -0
package/scripts/test/test_no_audio.json +253 -0
package/scripts/test/test_no_audio_with_credit.json +254 -0
package/scripts/test/test_order.json +69 -0
package/scripts/test/test_order_portrait.json +73 -0
package/scripts/test/test_replicate.json +145 -0
package/scripts/test/test_slideout_left_no_audio.json +46 -0
package/scripts/test/test_sound_effect.json +41 -0
package/scripts/test/test_spillover.json +117 -0
package/scripts/test/test_transition.json +56 -0
package/scripts/test/test_transition_no_audio.json +46 -0
package/scripts/test/test_video_speed.json +81 -0
package/scripts/test/test_voice_over.json +105 -0
package/scripts/test/test_voices.json +55 -0

package/lib/utils/context.js CHANGED Viewed

@@ -1,44 +1,28 @@
 import { GraphAILogger } from "graphai";
 import fs from "fs";
 import { readMulmoScriptFile, fetchMulmoScriptFile } from "./file.js";
-import { createOrUpdateStudioData } from "./preprocess.js";
+import { mulmoStudioSchema, mulmoCaptionParamsSchema } from "../types/index.js";
+import { MulmoPresentationStyleMethods, MulmoScriptMethods } from "../methods/index.js";
 import { mulmoPresentationStyleSchema, mulmoStudioMultiLingualSchema } from "../types/index.js";
-export const fetchScript = async (isHttpPath, mulmoFilePath, fileOrUrl) => {
-    if (isHttpPath) {
-        const res = await fetchMulmoScriptFile(fileOrUrl);
-        if (!res.result || !res.script) {
-            GraphAILogger.info(`ERROR: HTTP error! ${res.status} ${fileOrUrl}`);
-            return null;
-        }
-        return res.script;
-    }
-    if (!fs.existsSync(mulmoFilePath)) {
-        GraphAILogger.info(`ERROR: File not exists ${mulmoFilePath}`);
-        return null;
-    }
-    return readMulmoScriptFile(mulmoFilePath, "ERROR: File does not exist " + mulmoFilePath)?.mulmoData ?? null;
-};
-export const getMultiLingual = (multilingualFilePath, studioBeatsLength) => {
-    if (fs.existsSync(multilingualFilePath)) {
-        const jsonData = readMulmoScriptFile(multilingualFilePath, "ERROR: File does not exist " + multilingualFilePath)?.mulmoData ?? null;
-        const dataSet = mulmoStudioMultiLingualSchema.parse(jsonData);
-        while (dataSet.length < studioBeatsLength) {
-            dataSet.push({ multiLingualTexts: {} });
-        }
-        dataSet.length = studioBeatsLength;
-        return dataSet;
-    }
-    return [...Array(studioBeatsLength)].map(() => ({ multiLingualTexts: {} }));
-};
-export const getPresentationStyle = (presentationStylePath) => {
-    if (presentationStylePath) {
-        if (!fs.existsSync(presentationStylePath)) {
-            throw new Error(`ERROR: File not exists ${presentationStylePath}`);
-        }
-        const jsonData = readMulmoScriptFile(presentationStylePath, "ERROR: File does not exist " + presentationStylePath)?.mulmoData ?? null;
-        return mulmoPresentationStyleSchema.parse(jsonData);
-    }
-    return null;
+const mulmoCredit = (speaker) => {
+    return {
+        speaker,
+        text: "",
+        image: {
+            type: "image",
+            source: {
+                kind: "url",
+                url: "https://github.com/receptron/mulmocast-cli/raw/refs/heads/main/assets/images/mulmocast_credit.png",
+            },
+        },
+        audio: {
+            type: "audio",
+            source: {
+                kind: "url",
+                url: "https://github.com/receptron/mulmocast-cli/raw/refs/heads/main/assets/audio/silent300.mp3",
+            },
+        },
+    };
 };
 const initSessionState = () => {
     return {
@@ -63,32 +47,87 @@ const initSessionState = () => {
         },
     };
 };
-const buildContext = (studio, files, presentationStyle, multiLingual, force, lang) => {
-    return {
-        studio,
-        fileDirs: files,
-        force: Boolean(force),
-        lang,
-        sessionState: initSessionState(),
-        presentationStyle: presentationStyle ?? studio.script,
-        multiLingual,
-    };
+export const createStudioData = (_mulmoScript, fileName, videoCaptionLang, presentationStyle) => {
+    // validate and insert default value
+    const mulmoScript = _mulmoScript.__test_invalid__ ? _mulmoScript : MulmoScriptMethods.validate(_mulmoScript);
+    // We need to parse it to fill default values
+    const studio = mulmoStudioSchema.parse({
+        script: mulmoScript,
+        filename: fileName,
+        beats: [...Array(mulmoScript.beats.length)].map(() => ({})),
+    });
+    // TODO: Move this code out of this function later
+    // Add the closing credit
+    if (mulmoScript.$mulmocast.credit === "closing") {
+        const defaultSpeaker = MulmoPresentationStyleMethods.getDefaultSpeaker(presentationStyle ?? studio.script);
+        mulmoScript.beats.push(mulmoCredit(mulmoScript.beats[0].speaker ?? defaultSpeaker)); // First speaker
+    }
+    studio.script = MulmoScriptMethods.validate(mulmoScript); // update the script
+    studio.beats = studio.script.beats.map((_, index) => studio.beats[index] ?? {});
+    if (videoCaptionLang) {
+        studio.script.captionParams = mulmoCaptionParamsSchema.parse({
+            ...(studio.script.captionParams ?? {}),
+            lang: videoCaptionLang,
+        });
+    }
+    return studio;
+};
+export const fetchScript = async (isHttpPath, mulmoFilePath, fileOrUrl) => {
+    if (isHttpPath) {
+        const res = await fetchMulmoScriptFile(fileOrUrl);
+        if (!res.result || !res.script) {
+            GraphAILogger.info(`ERROR: HTTP error! ${res.status} ${fileOrUrl}`);
+            return null;
+        }
+        return res.script;
+    }
+    if (!fs.existsSync(mulmoFilePath)) {
+        GraphAILogger.info(`ERROR: File not exists ${mulmoFilePath}`);
+        return null;
+    }
+    return readMulmoScriptFile(mulmoFilePath, "ERROR: File does not exist " + mulmoFilePath)?.mulmoData ?? null;
+};
+export const getMultiLingual = (multilingualFilePath, studioBeatsLength) => {
+    if (!fs.existsSync(multilingualFilePath)) {
+        return [...Array(studioBeatsLength)].map(() => ({ multiLingualTexts: {} }));
+    }
+    const jsonData = readMulmoScriptFile(multilingualFilePath, "ERROR: File does not exist " + multilingualFilePath)?.mulmoData ?? null;
+    const dataSet = mulmoStudioMultiLingualSchema.parse(jsonData);
+    while (dataSet.length < studioBeatsLength) {
+        dataSet.push({ multiLingualTexts: {} });
+    }
+    dataSet.length = studioBeatsLength;
+    return dataSet;
+};
+export const getPresentationStyle = (presentationStylePath) => {
+    if (!presentationStylePath) {
+        return null;
+    }
+    if (!fs.existsSync(presentationStylePath)) {
+        throw new Error(`ERROR: File not exists ${presentationStylePath}`);
+    }
+    const jsonData = readMulmoScriptFile(presentationStylePath, "ERROR: File does not exist " + presentationStylePath)?.mulmoData ?? null;
+    return mulmoPresentationStyleSchema.parse(jsonData);
 };
-export const initializeContextFromFiles = async (files, raiseError, force, caption, lang) => {
-    const { fileName, isHttpPath, fileOrUrl, mulmoFilePath, outputStudioFilePath, presentationStylePath, outputMultilingualFilePath } = files;
-    // read mulmoScript, presentationStyle, currentStudio from files
+export const initializeContextFromFiles = async (files, raiseError, force, captionLang, targetLang) => {
+    const { fileName, isHttpPath, fileOrUrl, mulmoFilePath, presentationStylePath, outputMultilingualFilePath } = files;
     const mulmoScript = await fetchScript(isHttpPath, mulmoFilePath, fileOrUrl);
     if (!mulmoScript) {
         return null;
     }
-    const presentationStyle = getPresentationStyle(presentationStylePath);
-    // Create or update MulmoStudio file with MulmoScript
-    const currentStudio = readMulmoScriptFile(outputStudioFilePath);
     try {
-        // validate mulmoStudioSchema. skip if __test_invalid__ is true
-        const studio = createOrUpdateStudioData(mulmoScript, currentStudio?.mulmoData, fileName, caption, presentationStyle);
+        const presentationStyle = getPresentationStyle(presentationStylePath);
+        const studio = createStudioData(mulmoScript, fileName, captionLang, presentationStyle);
         const multiLingual = getMultiLingual(outputMultilingualFilePath, studio.beats.length);
-        return buildContext(studio, files, presentationStyle, multiLingual, force, lang);
+        return {
+            studio,
+            multiLingual,
+            fileDirs: files,
+            presentationStyle: presentationStyle ?? studio.script,
+            sessionState: initSessionState(),
+            force: Boolean(force),
+            lang: targetLang ?? studio.script.lang, // This lang is target Language. studio.lang is default Language
+        };
     }
     catch (error) {
         GraphAILogger.info(`Error: invalid MulmoScript Schema: ${isHttpPath ? fileOrUrl : mulmoFilePath} \n ${error}`);

package/lib/utils/file.d.ts CHANGED Viewed

@@ -21,7 +21,7 @@ export declare const getOutputStudioFilePath: (outDirPath: string, fileName: str
 export declare const getOutputMultilingualFilePath: (outDirPath: string, fileName: string) => string;
 export declare const resolveDirPath: (dirPath: string, studioFileName: string) => string;
 export declare const getAudioFilePath: (audioDirPath: string, dirName: string, fileName: string, lang?: string) => string;
-export declare const getAudioArtifactFilePath: (outDirPath: string, fileName: string) => string;
+export declare const getAudioArtifactFilePath: (context: MulmoStudioContext) => string;
 export declare const getOutputVideoFilePath: (outDirPath: string, fileName: string, lang?: string, caption?: string) => string;
 export declare const imageSuffix = "p";
 export declare const getBeatPngImagePath: (context: MulmoStudioContext, index: number) => string;

package/lib/utils/file.js CHANGED Viewed

@@ -72,8 +72,11 @@ export const getAudioFilePath = (audioDirPath, dirName, fileName, lang) => {
     }
     return path.resolve(audioDirPath, dirName, fileName + ".mp3");
 };
-export const getAudioArtifactFilePath = (outDirPath, fileName) => {
-    return path.resolve(outDirPath, fileName + ".mp3");
+export const getAudioArtifactFilePath = (context) => {
+    const suffix = context.lang ? `_${context.lang}` : "";
+    const fileName = MulmoStudioContextMethods.getFileName(context);
+    const outDirPath = MulmoStudioContextMethods.getOutDirPath(context);
+    return path.resolve(outDirPath, fileName + suffix + ".mp3");
 };
 export const getOutputVideoFilePath = (outDirPath, fileName, lang, caption) => {
     const suffix = lang ? `_${lang}` : "";

package/lib/utils/filters.d.ts CHANGED Viewed

@@ -1,4 +1,5 @@
 import "dotenv/config";
 import type { AgentFilterFunction } from "graphai";
+export declare const nijovoiceTextAgentFilter: AgentFilterFunction;
 export declare const fileCacheAgentFilter: AgentFilterFunction;
 export declare const browserlessCacheGenerator: (cacheDir: string) => AgentFilterFunction;

package/lib/utils/filters.js CHANGED Viewed

@@ -6,6 +6,14 @@ import { GraphAILogger } from "graphai";
 import { writingMessage } from "./file.js";
 import { text2hash } from "./utils.js";
 import { MulmoStudioContextMethods } from "../methods/mulmo_studio_context.js";
+import { replacementsJa, replacePairsJa } from "../utils/string.js";
+export const nijovoiceTextAgentFilter = async (context, next) => {
+    const { text, provider, lang } = context.namedInputs;
+    if (provider === "nijivoice" && lang === "ja") {
+        context.namedInputs.text = replacePairsJa(replacementsJa)(text);
+    }
+    return next(context);
+};
 export const fileCacheAgentFilter = async (context, next) => {
     const { force, file, index, mulmoContext, sessionType } = context.namedInputs.cache;
     const shouldUseCache = async () => {

package/lib/utils/preprocess.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import { MulmoStudio, MulmoScript, MulmoPresentationStyle } from "../types/index.js";
-export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, currentStudio: MulmoStudio | undefined, fileName: string, videoCaption?: string, presentationStyle?: MulmoPresentationStyle | null) => {
+export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, currentStudio: MulmoStudio | undefined, fileName: string, videoCaptionLang?: string, presentationStyle?: MulmoPresentationStyle | null) => {
     beats: {
         duration?: number | undefined;
         startAt?: number | undefined;
@@ -16,10 +16,12 @@ export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, curre
         captionFile?: string | undefined;
     }[];
     script: {
+        lang: string;
         imageParams: {
             provider: string;
             model?: string | undefined;
             style?: string | undefined;
+            quality?: string | undefined;
             moderation?: string | undefined;
             images?: Record<string, {
                 type: "image";
@@ -89,6 +91,17 @@ export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, curre
         speechParams: {
             speakers: Record<string, {
                 voiceId: string;
+                lang?: Record<string, {
+                    voiceId: string;
+                    displayName?: Record<string, string> | undefined;
+                    isDefault?: boolean | undefined;
+                    speechOptions?: {
+                        speed?: number | undefined;
+                        instruction?: string | undefined;
+                    } | undefined;
+                    provider?: string | undefined;
+                    model?: string | undefined;
+                }> | undefined;
                 displayName?: Record<string, string> | undefined;
                 isDefault?: boolean | undefined;
                 speechOptions?: {
@@ -237,6 +250,7 @@ export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, curre
                 provider: string;
                 model?: string | undefined;
                 style?: string | undefined;
+                quality?: string | undefined;
                 moderation?: string | undefined;
                 images?: Record<string, {
                     type: "image";
@@ -299,7 +313,6 @@ export declare const createOrUpdateStudioData: (_mulmoScript: MulmoScript, curre
             } | undefined;
             enableLipSync?: boolean | undefined;
         }[];
-        lang?: string | undefined;
         title?: string | undefined;
         description?: string | undefined;
         lipSyncParams?: {

package/lib/utils/preprocess.js CHANGED Viewed

@@ -37,7 +37,7 @@ const mulmoCredit = (speaker) => {
         },
     };
 };
-export const createOrUpdateStudioData = (_mulmoScript, currentStudio, fileName, videoCaption, presentationStyle) => {
+export const createOrUpdateStudioData = (_mulmoScript, currentStudio, fileName, videoCaptionLang, presentationStyle) => {
     const mulmoScript = _mulmoScript.__test_invalid__ ? _mulmoScript : MulmoScriptMethods.validate(_mulmoScript); // validate and insert default value
     const studio = rebuildStudio(currentStudio, mulmoScript, fileName);
     // TODO: Move this code out of this function later
@@ -48,10 +48,10 @@ export const createOrUpdateStudioData = (_mulmoScript, currentStudio, fileName,
     }
     studio.script = MulmoScriptMethods.validate(mulmoScript); // update the script
     studio.beats = studio.script.beats.map((_, index) => studio.beats[index] ?? {});
-    if (videoCaption) {
+    if (videoCaptionLang) {
         studio.script.captionParams = mulmoCaptionParamsSchema.parse({
             ...(studio.script.captionParams ?? {}),
-            lang: videoCaption,
+            lang: videoCaptionLang,
         });
     }
     return studio;

package/lib/utils/provider2agent.d.ts CHANGED Viewed

@@ -67,9 +67,10 @@ export declare const provider2LipSyncAgent: {
         defaultModel: ReplicateModel;
         models: ReplicateModel[];
         modelParams: Record<ReplicateModel, {
-            identifier?: `${string}/${string}:${string}`;
-            video: string;
+            identifier?: `${string}/${string}:${string}` | `${string}/${string}`;
+            video?: string;
             audio: string;
+            image?: string;
         }>;
     };
 };

package/lib/utils/provider2agent.js CHANGED Viewed

@@ -50,6 +50,8 @@ export const provider2MovieAgent = {
             "minimax/video-01",
             "minimax/hailuo-02",
             "pixverse/pixverse-v4.5",
+            "wan-video/wan-2.2-i2v-480p-fast",
+            "wan-video/wan-2.2-t2v-480p-fast",
         ],
         modelParams: {
             "bytedance/seedance-1-lite": {
@@ -110,6 +112,16 @@ export const provider2MovieAgent = {
                 last_image: "last_frame_image",
                 price_per_sec: 0.12,
             },
+            "wan-video/wan-2.2-i2v-480p-fast": {
+                durations: [5],
+                start_image: "image",
+                price_per_sec: 0.012,
+            },
+            "wan-video/wan-2.2-t2v-480p-fast": {
+                durations: [5],
+                start_image: undefined,
+                price_per_sec: 0.012,
+            },
         },
     },
     google: {
@@ -133,8 +145,8 @@ export const provider2SoundEffectAgent = {
 export const provider2LipSyncAgent = {
     replicate: {
         agentName: "lipSyncReplicateAgent",
-        defaultModel: "bytedance/latentsync",
-        models: ["bytedance/latentsync", "tmappdev/lipsync"],
+        defaultModel: "bytedance/omni-human",
+        models: ["bytedance/latentsync", "tmappdev/lipsync", "bytedance/omni-human"],
         modelParams: {
             "bytedance/latentsync": {
                 identifier: "bytedance/latentsync:637ce1919f807ca20da3a448ddc2743535d2853649574cd52a933120e9b9e293",
@@ -146,6 +158,12 @@ export const provider2LipSyncAgent = {
                 video: "video_input",
                 audio: "audio_input",
             },
+            "bytedance/omni-human": {
+                identifier: "bytedance/omni-human",
+                image: "image",
+                audio: "audio",
+                price_per_sec: 0.14,
+            },
             /* NOTE: This model does not work with large base64 urls.
             "sync/lipsync-2": {
               video: "video",

package/lib/utils/string.d.ts CHANGED Viewed

@@ -4,6 +4,6 @@ interface Replacement {
     from: string;
     to: string;
 }
-export declare function replacePairsJa(str: string, replacements: Replacement[]): string;
+export declare function replacePairsJa(replacements: Replacement[]): (str: string) => string;
 export declare const replacementsJa: Replacement[];
 export {};

package/lib/utils/string.js CHANGED Viewed

@@ -24,14 +24,16 @@ export const recursiveSplitJa = (text) => {
     }, [text])
         .flat(1);
 };
-export function replacePairsJa(str, replacements) {
-    return replacements.reduce((tmp, current) => {
-        const { from, to } = current;
-        // Escape any special regex characters in the 'from' string.
-        const escapedFrom = from.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
-        const regex = new RegExp(escapedFrom, "g");
-        return tmp.replace(regex, to);
-    }, str);
+export function replacePairsJa(replacements) {
+    return (str) => {
+        return replacements.reduce((tmp, current) => {
+            const { from, to } = current;
+            // Escape any special regex characters in the 'from' string.
+            const escapedFrom = from.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
+            const regex = new RegExp(escapedFrom, "g");
+            return tmp.replace(regex, to);
+        }, str);
+    };
 }
 export const replacementsJa = [
     { from: "Anthropic", to: "アンスロピック" },
@@ -51,4 +53,5 @@ export const replacementsJa = [
     { from: "5つ", to: "いつつ" },
     { from: "危険な面", to: "危険なめん" },
     { from: "その通り！", to: "その通り。" },
+    { from: "%", to: "パーセント" },
 ];

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "mulmocast",
-  "version": "1.1.4",
+  "version": "1.1.6",
   "description": "",
   "type": "module",
   "main": "lib/index.node.js",
@@ -23,6 +23,7 @@
   "files": [
     "./lib",
     "./scripts/templates",
+    "./scripts/test",
     "./assets/audio/silent60sec.mp3",
     "./assets/html/",
     "./assets/templates/"

package/scripts/templates/image_refs.json CHANGED Viewed

@@ -2,6 +2,7 @@
   "$mulmocast": {
     "version": "1.1"
   },
+  "lang": "en",
   "title": "[TITLE OF THE PRESENTAITON OR STORY]",
   "imageParams": {
     "images": {

package/scripts/templates/voice_over.json CHANGED Viewed

@@ -2,6 +2,7 @@
   "$mulmocast": {
     "version": "1.1"
   },
+  "lang": "en",
   "title": "Voice Over Test",
   "captionParams": {
     "lang": "en"

package/scripts/test/gpt.json ADDED Viewed

@@ -0,0 +1,33 @@
+{
+  "$mulmocast": {
+    "version": "1.1",
+    "credit": "closing"
+  },
+  "lang": "en",
+  "title": "Testing OpenAI's new Image Generation",
+  "description": "Hello",
+  "imageParams": {
+    "model": "gpt-image-1",
+    "style": "<style>Japanese animation with soft watercolor backgrounds, characters with simple rounded faces, large expressive eyes, small nose and mouth, soft jawlines, minimalist facial features, pastel color palette, detailed natural environments, whimsical magical elements, hand-drawn aesthetic, gentle lighting, flowing movement in hair and clothing, nostalgic countryside scenery with fantasy elements."
+  },
+  "speechParams": {
+    "speakers": {
+      "Host": {
+        "voiceId": "shimmer",
+        "displayName": {
+          "en": "Host"
+        }
+      }
+    }
+  },
+  "beats": [
+    {
+      "speaker": "Host",
+      "text": "How are you?",
+      "imagePrompt": "A witch in Harajuku",
+      "imageParams": {
+        "style": "Ukiyoe-style"
+      }
+    }
+  ]
+}

package/scripts/test/mulmo_story.json ADDED Viewed

@@ -0,0 +1,11 @@
+{
+  "title": "MulmoScript",
+  "scenes": [
+    {
+      "description": "MulmoCast is a multi-modal presentation platform built for the generative AI era. Traditional tools like PowerPoint and Keynote were designed decades ago for human authors. Today, however, large language models (LLMs) are generating content—and they need a native environment optimized for their capabilities.　MulmoCast is that environment.　It empowers AI to automatically create and deliver rich, multi-modal presentations—including slides, videos, podcasts, documents, and comics—using our open presentation language: MulmoScript."
+    },
+    {
+      "description": "　MulmoScript is a JSON-based language that enables LLMs to describe structured, machine-readable presentations. It supports a wide range of elements: bullet points, charts, graphs, images, voiceovers, and videos. Just as HTML unlocked the web, MulmoScript enables interoperability, customization, and ecosystem growth for AI-generated content.　MulmoCast renders this content into any format, giving end users complete flexibility in how they consume it—whether as a slideshow, podcast, video, or document. It also supports multilingual output for both reading and listening."
+    }
+  ]
+}

package/scripts/test/test.json ADDED Viewed

@@ -0,0 +1,64 @@
+{
+  "$mulmocast": {
+    "version": "1.1",
+    "credit": "closing"
+  },
+  "title": "MASAI: A Modular Future for Software Engineering AI",
+  "description": "Exploring MASAI, a modular approach for AI agents in software engineering that revolutionizes how complex coding issues are tackled.",
+  "references": [
+    {
+      "url": "https://arxiv.org/abs/2406.11638",
+      "title": "MASAI: A Modular Future for Software Engineering AI",
+      "description": "An article on MASAI, a modular approach for AI agents in software engineering."
+    }
+  ],
+  "lang": "ja",
+  "imageParams": {
+    "style": "<style>monochrome"
+  },
+  "speechParams": {
+    "speakers": {
+      "Announcer": {
+        "provider": "nijivoice",
+        "displayName": {
+          "ja": "アナウンサー"
+        },
+        "voiceId": "3708ad43-cace-486c-a4ca-8fe41186e20c",
+        "speechOptions": {
+          "speed": 1.666
+        }
+      },
+      "Student": {
+        "provider": "nijivoice",
+        "displayName": {
+          "ja": "生徒"
+        },
+        "voiceId": "a7619e48-bf6a-4f9f-843f-40485651257f"
+      },
+      "Teacher": {
+        "provider": "nijivoice",
+        "displayName": {
+          "ja": "先生"
+        },
+        "voiceId": "bc06c63f-fef6-43b6-92f7-67f919bd5dae"
+      }
+    }
+  },
+  "beats": [
+    {
+      "speaker": "Announcer",
+      "text": "こんにちは。米国で活躍するエンジニアが新しい技術やビジネスを分かりやすく解説する、中島聡のLife is beautiful。"
+    },
+    {
+      "speaker": "Announcer",
+      "text": "今日は、アメリカで発表された「スターゲート・プロジェクト」に、ついて解説します。",
+      "imagePrompt": "Blue sky, a flock of birds",
+      "imageParams": {
+        "style": "<style>sumie-style"
+      },
+      "speechOptions": {
+        "speed": 0.8
+      }
+    }
+  ]
+}

package/scripts/test/test1.json ADDED Viewed

@@ -0,0 +1,41 @@
+{
+  "$mulmocast": {
+    "version": "1.1",
+    "credit": "closing"
+  },
+  "lang": "en",
+  "title": "The Honey Trap vs. The Frontier: Engineering at Tesla and SpaceX",
+  "description": "We dive into Elon Musk's philosophy on building environments where engineers can truly flourish, contrasting the comfort-focused 'honey trap' with the high-expectation culture at Tesla and SpaceX.",
+  "speechParams": {
+    "speakers": {
+      "Host": {
+        "displayName": {
+          "ja": "司会"
+        },
+        "voiceId": "sage"
+      },
+      "Guest": {
+        "displayName": {
+          "ja": "ゲスト"
+        },
+        "voiceId": "shimmer"
+      }
+    }
+  },
+  "beats": [
+    {
+      "speaker": "Host",
+      "text": "Hello and welcome to another episode of 'life is artificial', where we explore the cutting edge of technology, innovation, and what the future could look like.",
+      "speechOptions": {
+        "instruction": "Voice: Deep and rugged, with a hearty, boisterous quality, like a seasoned sea captain who's seen many voyages.\nTone: Friendly and spirited, with a sense of adventure and enthusiasm, making every detail feel like part of a grand journey.\nDialect: Classic pirate speech with old-timey nautical phrases, dropped 'g's, and exaggerated 'Arrrs' to stay in character."
+      }
+    },
+    {
+      "speaker": "Guest",
+      "text": "こんにちは、ポッドキャスト版、ライフ・イズ・ビューティフルへようこそ。新しいテクノロジーについて分かりやすく語ります",
+      "speechOptions": {
+        "instruction": "voice: 赤ちゃん\nVoice: 高い声で、舌ったらず。甘えっぽく。語尾に’んちゃ’と付ける"
+      }
+    }
+  ]
+}

package/scripts/test/test2.json ADDED Viewed

@@ -0,0 +1,66 @@
+{
+  "$mulmocast": {
+    "version": "1.1",
+    "credit": "closing"
+  },
+  "title": "AIの進化と私たちの未来 - サム・アルトマン氏の3つの観察",
+  "description": "OpenAIのサム・アルトマン氏による、AIの進化と社会への影響に関する洞察を、高校生向けに分かりやすく解説する対話形式のスクリプト。",
+  "references": [
+    {
+      "url": "https://blog.samaltman.com/three-observations",
+      "title": "Three Observations",
+      "description": "An article on AI's evolution and its impact on society by Sam Altman."
+    }
+  ],
+  "lang": "ja",
+  "imageParams": {
+    "style": "<style>monochrome"
+  },
+  "speechParams": {
+    "provider": "nijivoice",
+    "speakers": {
+      "Announcer": {
+        "displayName": {
+          "ja": "千草朋香"
+        },
+        "voiceId": "3708ad43-cace-486c-a4ca-8fe41186e20c"
+      },
+      "Student": {
+        "displayName": {
+          "ja": "太郎"
+        },
+        "voiceId": "a7619e48-bf6a-4f9f-843f-40485651257f"
+      },
+      "Teacher": {
+        "displayName": {
+          "ja": "山田先生"
+        },
+        "voiceId": "bc06c63f-fef6-43b6-92f7-67f919bd5dae"
+      }
+    }
+  },
+  "beats": [
+    {
+      "speaker": "Announcer",
+      "text": "私たちの目の前で、人工知能の革命が静かに、",
+      "speechOptions": {
+        "speed": 1.5
+      },
+      "imagePrompt": "A futuristic scene depicting the quiet but certain advancement of AI, with digital interfaces and abstract representations of AI technology shaping the future."
+    },
+    {
+      "speaker": "Announcer",
+      "text": "しかし確実に進んでいます。",
+      "speechOptions": {
+        "speed": 1.5
+      }
+    },
+    {
+      "speaker": "Announcer",
+      "text": "オープンエーアイのサム・アルトマン氏が語る「3つの重要な観察」とは何か？",
+      "speechOptions": {
+        "speed": 1.5
+      }
+    }
+  ]
+}