mulmocast 1.1.5 → 1.1.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/lib/actions/audio.js +10 -1
- package/lib/actions/image_agents.d.ts +3 -12
- package/lib/actions/image_agents.js +12 -8
- package/lib/actions/images.js +2 -1
- package/lib/actions/translate.js +13 -31
- package/lib/agents/lipsync_replicate_agent.js +10 -3
- package/lib/cli/commands/audio/handler.js +1 -1
- package/lib/cli/commands/image/handler.js +1 -1
- package/lib/cli/commands/movie/handler.js +1 -1
- package/lib/cli/commands/pdf/handler.js +1 -1
- package/lib/cli/helpers.d.ts +1 -4
- package/lib/cli/helpers.js +3 -2
- package/lib/mcp/server.js +1 -1
- package/lib/methods/mulmo_presentation_style.d.ts +3 -2
- package/lib/methods/mulmo_script.js +4 -1
- package/lib/methods/mulmo_studio_context.d.ts +1 -0
- package/lib/methods/mulmo_studio_context.js +8 -0
- package/lib/types/agent.d.ts +1 -0
- package/lib/types/schema.d.ts +8 -8
- package/lib/types/schema.js +1 -1
- package/lib/types/type.d.ts +1 -1
- package/lib/utils/const.js +1 -1
- package/lib/utils/context.d.ts +376 -34
- package/lib/utils/context.js +95 -56
- package/lib/utils/filters.d.ts +1 -0
- package/lib/utils/filters.js +8 -0
- package/lib/utils/preprocess.d.ts +2 -2
- package/lib/utils/preprocess.js +3 -3
- package/lib/utils/provider2agent.d.ts +3 -2
- package/lib/utils/provider2agent.js +20 -2
- package/lib/utils/string.d.ts +1 -1
- package/lib/utils/string.js +11 -8
- package/package.json +1 -1
- package/scripts/templates/image_refs.json +1 -0
- package/scripts/templates/voice_over.json +1 -0
- package/scripts/test/gpt.json +1 -0
- package/scripts/test/test1.json +1 -0
- package/scripts/test/test_audio.json +1 -0
- package/scripts/test/test_audio_instructions.json +1 -0
- package/scripts/test/test_beats.json +1 -0
- package/scripts/test/test_captions.json +1 -0
- package/scripts/test/test_elevenlabs_models.json +1 -0
- package/scripts/test/test_hello.json +1 -0
- package/scripts/test/test_hello_google.json +1 -0
- package/scripts/test/test_html.json +1 -0
- package/scripts/test/test_image_refs.json +1 -0
- package/scripts/test/test_images.json +1 -0
- package/scripts/test/test_lang.json +58 -2
- package/scripts/test/test_layout.json +1 -0
- package/scripts/test/test_lipsync.json +9 -0
- package/scripts/test/test_loop.json +1 -0
- package/scripts/test/test_media.json +1 -0
- package/scripts/test/test_mixed_providers.json +1 -0
- package/scripts/test/test_movie.json +1 -0
- package/scripts/test/test_no_audio.json +1 -0
- package/scripts/test/test_no_audio_with_credit.json +1 -0
- package/scripts/test/test_order.json +1 -0
- package/scripts/test/test_order_portrait.json +1 -0
- package/scripts/test/test_replicate.json +19 -0
- package/scripts/test/test_slideout_left_no_audio.json +1 -0
- package/scripts/test/test_spillover.json +1 -0
- package/scripts/test/test_transition.json +1 -0
- package/scripts/test/test_transition_no_audio.json +1 -0
- package/scripts/test/test_video_speed.json +1 -0
- package/scripts/test/test_voice_over.json +1 -0
- package/scripts/test/test_voices.json +1 -0
- package/scripts/templates/image_prompt_only_template.ts +0 -95
package/lib/utils/provider2agent.d.ts
CHANGED

@@ -67,9 +67,10 @@ export declare const provider2LipSyncAgent: {
         defaultModel: ReplicateModel;
         models: ReplicateModel[];
         modelParams: Record<ReplicateModel, {
-            identifier?: `${string}/${string}:${string}`;
-            video: string;
+            identifier?: `${string}/${string}:${string}` | `${string}/${string}`;
+            video?: string;
             audio: string;
+            image?: string;
         }>;
     };
 };
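The widened identifier type above accepts an unpinned owner/model string in addition to the version-pinned form. A minimal sketch of what now type-checks; the standalone ReplicateIdentifier alias is inlined here for illustration and is not an export of the package:

// Illustrative alias inlining the widened template-literal type from the declaration above.
type ReplicateIdentifier = `${string}/${string}:${string}` | `${string}/${string}`;

const pinned: ReplicateIdentifier =
    "bytedance/latentsync:637ce1919f807ca20da3a448ddc2743535d2853649574cd52a933120e9b9e293";
const unpinned: ReplicateIdentifier = "bytedance/omni-human"; // no version hash required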
package/lib/utils/provider2agent.js
CHANGED

@@ -50,6 +50,8 @@ export const provider2MovieAgent = {
             "minimax/video-01",
             "minimax/hailuo-02",
             "pixverse/pixverse-v4.5",
+            "wan-video/wan-2.2-i2v-480p-fast",
+            "wan-video/wan-2.2-t2v-480p-fast",
         ],
         modelParams: {
             "bytedance/seedance-1-lite": {

@@ -110,6 +112,16 @@ export const provider2MovieAgent = {
                 last_image: "last_frame_image",
                 price_per_sec: 0.12,
             },
+            "wan-video/wan-2.2-i2v-480p-fast": {
+                durations: [5],
+                start_image: "image",
+                price_per_sec: 0.012,
+            },
+            "wan-video/wan-2.2-t2v-480p-fast": {
+                durations: [5],
+                start_image: undefined,
+                price_per_sec: 0.012,
+            },
         },
     },
     google: {

@@ -133,8 +145,8 @@ export const provider2SoundEffectAgent = {
 export const provider2LipSyncAgent = {
     replicate: {
         agentName: "lipSyncReplicateAgent",
-        defaultModel: "bytedance/latentsync",
-        models: ["bytedance/latentsync", "tmappdev/lipsync"],
+        defaultModel: "bytedance/omni-human",
+        models: ["bytedance/latentsync", "tmappdev/lipsync", "bytedance/omni-human"],
         modelParams: {
             "bytedance/latentsync": {
                 identifier: "bytedance/latentsync:637ce1919f807ca20da3a448ddc2743535d2853649574cd52a933120e9b9e293",

@@ -146,6 +158,12 @@ export const provider2LipSyncAgent = {
                 video: "video_input",
                 audio: "audio_input",
             },
+            "bytedance/omni-human": {
+                identifier: "bytedance/omni-human",
+                image: "image",
+                audio: "audio",
+                price_per_sec: 0.14,
+            },
             /* NOTE: This model does not work with large base64 urls.
             "sync/lipsync-2": {
                 video: "video",
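For orientation, a hedged sketch of how a caller might use the new modelParams entries: each entry names the Replicate input fields for its model, and "bytedance/omni-human" takes an image plus audio where the other lip-sync models take a video plus audio. The buildLipSyncInput helper and its argument shape below are hypothetical, not part of mulmocast's API; only the field names come from the entries above.

// Hypothetical helper: maps local assets onto the Replicate input keys
// declared in provider2LipSyncAgent.replicate.modelParams.
type LipSyncModelParams = { identifier?: string; video?: string; audio: string; image?: string };

const buildLipSyncInput = (
    params: LipSyncModelParams,
    assets: { videoUrl?: string; imageUrl?: string; audioUrl: string },
): Record<string, string> => {
    const input: Record<string, string> = { [params.audio]: assets.audioUrl };
    if (params.image && assets.imageUrl) input[params.image] = assets.imageUrl; // e.g. "bytedance/omni-human"
    if (params.video && assets.videoUrl) input[params.video] = assets.videoUrl; // e.g. "bytedance/latentsync"
    return input;
};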
package/lib/utils/string.d.ts
CHANGED
@@ -4,6 +4,6 @@ interface Replacement {
     from: string;
     to: string;
 }
-export declare function replacePairsJa(
+export declare function replacePairsJa(replacements: Replacement[]): (str: string) => string;
 export declare const replacementsJa: Replacement[];
 export {};
package/lib/utils/string.js
CHANGED
@@ -24,14 +24,16 @@ export const recursiveSplitJa = (text) => {
     }, [text])
         .flat(1);
 };
-export function replacePairsJa(
-    return
-
-
-
-
-
-
+export function replacePairsJa(replacements) {
+    return (str) => {
+        return replacements.reduce((tmp, current) => {
+            const { from, to } = current;
+            // Escape any special regex characters in the 'from' string.
+            const escapedFrom = from.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
+            const regex = new RegExp(escapedFrom, "g");
+            return tmp.replace(regex, to);
+        }, str);
+    };
 }
 export const replacementsJa = [
     { from: "Anthropic", to: "アンスロピック" },

@@ -51,4 +53,5 @@ export const replacementsJa = [
     { from: "5つ", to: "いつつ" },
     { from: "危険な面", to: "危険なめん" },
     { from: "その通り!", to: "その通り。" },
+    { from: "%", to: "パーセント" },
 ];
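A small usage sketch of the curried replacePairsJa, grounded in the implementation above; the sample sentence is illustrative:

// replacePairsJa(replacements) returns a string -> string function that applies
// every from/to pair globally, escaping regex metacharacters in `from`.
const normalizeJa = replacePairsJa([{ from: "%", to: "パーセント" }]);
normalizeJa("歩留まりは70%です。"); // => "歩留まりは70パーセントです。"

This appears to pair with the new "Text replacement test for nijivoice" beat added in test_lang.json below, so that percent signs are spelled out before speech synthesis.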
package/package.json
CHANGED
package/scripts/test/gpt.json
CHANGED
package/scripts/test/test1.json
CHANGED
@@ -3,6 +3,7 @@
     "version": "1.1",
     "credit": "closing"
   },
+  "lang": "en",
   "title": "The Honey Trap vs. The Frontier: Engineering at Tesla and SpaceX",
   "description": "We dive into Elon Musk's philosophy on building environments where engineers can truly flourish, contrasting the comfort-focused 'honey trap' with the high-expectation culture at Tesla and SpaceX.",
   "speechParams": {
package/scripts/test/test_lang.json
CHANGED

@@ -2,7 +2,7 @@
   "$mulmocast": {
     "version": "1.1"
   },
-  "lang": "
+  "lang": "en",
   "speechParams": {
     "speakers": {
       "Presenter": {

@@ -19,13 +19,69 @@
   },
   "beats": [
     {
-      "text": "
+      "text": "Hello World",
       "image": {
         "type": "textSlide",
         "slide": {
           "title": "Hello World"
         }
       }
+    },
+    {
+      "text": "Switching Language and Switching Screen should match.",
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "Switching Language"
+        }
+      }
+    },
+    {
+      "text": "May the force be with you.",
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "May the force be with you"
+        }
+      }
+    },
+    {
+      "text": "Switching Language and Switching Screen should match even with a short duration.",
+      "duration": 1,
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "Switching Language (short duration)"
+        }
+      }
+    },
+    {
+      "text": "Switching Language and Switching Screen should match even with a long duration.",
+      "duration": 8,
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "Switching Language (long duration)"
+        }
+      }
+    },
+    {
+      "text": "The yield of TSMC's 3nm process exceeeds 70%.",
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "Text replacement test for nijivoice"
+        }
+      }
+    },
+    {
+      "text": "Goodbye",
+      "image": {
+        "type": "textSlide",
+        "slide": {
+          "title": "Goodbye"
+        }
+      }
     }
   ]
 }
package/scripts/test/test_lipsync.json
CHANGED

@@ -33,6 +33,15 @@
         "model": "tmappdev/lipsync"
       }
     },
+    {
+      "id": "future_omni_human_photo_realistic",
+      "text": "In the future, advancements in AI could revolutionize industries like healthcare, education, and transportation.",
+      "imagePrompt": "A female presenter is standing in front of a futuristic cityscape with AI-powered hospital and an autonomous vehicle. Photo realistic.",
+      "enableLipSync": true,
+      "lipSyncParams": {
+        "model": "bytedance/omni-human"
+      }
+    },
     {
       "id": "future_possibilities",
       "text": "In the future, advancements in AI could revolutionize industries like healthcare, education, and transportation.",
@@ -1,5 +1,6 @@
 {
   "$mulmocast": { "version": "1.1" },
+  "lang": "en",
   "beats": [
     {
       "text": "The number 1 stands alone—independent, bold, and often lonely. In stories, the lone hero begins their journey without companions, carving their path through courage. Think of Neo in The Matrix, 'The One', chosen to awaken humanity. Or the number 1 in binary—on or off, light or dark. It reminds us that every great movement starts with a single step, a single decision. Just one person can spark a revolution or change history. As Lao Tzu said, 'The journey of a thousand miles begins with one step.'",
package/scripts/test/test_replicate.json
CHANGED

@@ -121,6 +121,25 @@
       "movieParams": {
         "model": "minimax/hailuo-02"
       }
+    },
+    {
+      "id": "wan-2.2-i2v-480p-fast",
+      "text": "wan-video/wan-2.2-i2v-480p-fast",
+      "duration": 5,
+      "imagePrompt": "a woman is walking through a busy Tokyo street at night, she is wearing dark sunglasses",
+      "moviePrompt": "a woman is walking through a busy Tokyo street at night, she is wearing dark sunglasses",
+      "movieParams": {
+        "model": "wan-video/wan-2.2-i2v-480p-fast"
+      }
+    },
+    {
+      "id": "wan-2.2-t2v-480p-fast",
+      "text": "wan-video/wan-2.2-t2v-480p-fast",
+      "duration": 5,
+      "moviePrompt": "a woman is walking through a busy Tokyo street at night, she is wearing dark sunglasses",
+      "movieParams": {
+        "model": "wan-video/wan-2.2-t2v-480p-fast"
+      }
     }
   ]
 }
package/scripts/templates/image_prompt_only_template.ts
REMOVED

@@ -1,95 +0,0 @@
-import {
-    mulmoCastCreditSchema,
-    langSchema,
-}
-export const mulmoPresentationStyleSchema = z.object({
-    $mulmocast: mulmoCastCreditSchema,
-    "lang": "en",
-    title: z.string().default("[TITLE: Brief, engaging title for the topic]")
-    lang: z.string().default("en"),
-    "references": z.array(z.object({
-        "url": "[SOURCE_URL: URL of the source material]",
-        "title": "[SOURCE_TITLE: Title of the referenced article, or paper]",
-        "type": "[SOURCE_TYPE: article, paper]"
-    }
-    ],
-
-
-    description: z.string().optional(),
-    references: z.array(mulmoReferenceSchema).optional(),
-    beats: z.array(mulmoBeatSchema).min(1),
-
-    // TODO: Delete it later
-    imagePath: z.string().optional(), // for keynote images movie ??
-    canvasSize: mulmoCanvasDimensionSchema, // has default value
-    speechParams: z
-        .object({
-            speakers: speakerDictionarySchema,
-        })
-        .default({
-            speakers: {
-                [defaultSpeaker]: {
-                    voiceId: "shimmer",
-                    displayName: {
-                        en: defaultSpeaker,
-                    },
-                },
-            },
-        }),
-    imageParams: mulmoImageParamsSchema.optional().default({
-        provider: defaultProviders.text2image,
-        images: {},
-    }),
-    movieParams: mulmoMovieParamsSchema.optional().default({
-        provider: defaultProviders.text2movie,
-    }),
-    soundEffectParams: mulmoSoundEffectParamsSchema.optional().default({
-        provider: defaultProviders.soundEffect,
-    }),
-    lipSyncParams: mulmoLipSyncParamsSchema.optional(),
-    htmlImageParams: mulmoHtmlImageParamsSchema
-        .extend({
-            provider: text2HtmlImageProviderSchema,
-        })
-        .optional(),
-    // for textSlides
-    textSlideParams: textSlideParamsSchema.optional(),
-    captionParams: mulmoCaptionParamsSchema.optional(),
-    audioParams: audioParamsSchema.default({
-        introPadding: 1.0,
-        padding: 0.3,
-        closingPadding: 0.8,
-        outroPadding: 1.0,
-        bgmVolume: 0.2,
-        audioVolume: 1.0,
-    }),
-});
-
-{
-    "beats": [
-        {
-            "text": "[OPENING_BEAT: Introduce the topic with a hook. Reference the source material and set up why this topic matters. Usually 2-3 sentences that grab attention and provide context.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        },
-        {
-            "text": "[MAIN_CONCEPT: Define or explain the core concept/idea. This should be the central focus of your narrative. Keep it clear and accessible.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        },
-        {
-            "text": "[SUPPORTING_DETAIL_1: Additional context, examples, or elaboration that helps illustrate the main concept. This could include how it works, why it's important, or real-world applications.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        },
-        {
-            "text": "[SUPPORTING_DETAIL_2: Continue with more examples, deeper explanation, or different aspects of the topic if needed.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        },
-        {
-            "text": "[ADDITIONAL_BEATS: Add more beats as necessary to fully explore the topic. Complex topics may require 6-10+ beats to cover adequately. Each beat should advance the narrative or provide valuable information.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        },
-        {
-            "text": "[CONCLUSION/IMPACT: Wrap up with the significance, implications, or key takeaway. Help the audience understand why this matters to them.]",
-            "imagePrompt": "[IMAGE_PROMPT: A prompt for the image to be generated for this beat.]"
-        }
-    ]
-}