npm - mulmocast - Versions diffs - 0.0.5 → 0.0.6 - Mend

mulmocast 0.0.5 → 0.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (132)

package/README.md +257 -39
package/assets/audio/silent60sec.mp3 +0 -0
package/assets/html/caption.html +45 -0
package/assets/html/chart.html +1 -1
package/assets/html/mermaid.html +6 -2
package/assets/html/tailwind.html +13 -0
package/assets/templates/business.json +57 -4
package/assets/templates/comic_strips.json +35 -0
package/assets/templates/ghibli_strips.json +35 -0
package/lib/actions/audio.js +24 -11
package/lib/actions/captions.d.ts +2 -0
package/lib/actions/captions.js +62 -0
package/lib/actions/images.js +3 -2
package/lib/actions/index.d.ts +1 -0
package/lib/actions/index.js +1 -0
package/lib/actions/movie.js +78 -86
package/lib/actions/pdf.js +15 -5
package/lib/actions/translate.js +32 -26
package/lib/agents/add_bgm_agent.js +15 -39
package/lib/agents/combine_audio_files_agent.js +43 -36
package/lib/agents/index.d.ts +2 -3
package/lib/agents/index.js +2 -3
package/lib/agents/tts_google_agent.d.ts +4 -0
package/lib/agents/tts_google_agent.js +51 -0
package/lib/agents/validate_schema_agent.d.ts +19 -0
package/lib/agents/validate_schema_agent.js +36 -0
package/lib/cli/args.d.ts +2 -0
package/lib/cli/args.js +9 -2
package/lib/cli/bin.d.ts +3 -0
package/lib/cli/bin.js +38 -0
package/lib/cli/cli.js +34 -7
package/lib/cli/commands/audio/builder.d.ts +14 -0
package/lib/cli/commands/audio/builder.js +6 -0
package/lib/cli/commands/audio/handler.d.ts +4 -0
package/lib/cli/commands/audio/handler.js +7 -0
package/lib/cli/commands/audio/index.d.ts +4 -0
package/lib/cli/commands/audio/index.js +4 -0
package/lib/cli/commands/image/builder.d.ts +14 -0
package/lib/cli/commands/image/builder.js +6 -0
package/lib/cli/commands/image/handler.d.ts +4 -0
package/lib/cli/commands/image/handler.js +7 -0
package/lib/cli/commands/image/index.d.ts +4 -0
package/lib/cli/commands/image/index.js +4 -0
package/lib/cli/commands/movie/builder.d.ts +18 -0
package/lib/cli/commands/movie/builder.js +19 -0
package/lib/cli/commands/movie/handler.d.ts +6 -0
package/lib/cli/commands/movie/handler.js +12 -0
package/lib/cli/commands/movie/index.d.ts +4 -0
package/lib/cli/commands/movie/index.js +4 -0
package/lib/cli/commands/pdf/builder.d.ts +18 -0
package/lib/cli/commands/pdf/builder.js +19 -0
package/lib/cli/commands/pdf/handler.d.ts +6 -0
package/lib/cli/commands/pdf/handler.js +8 -0
package/lib/cli/commands/pdf/index.d.ts +4 -0
package/lib/cli/commands/pdf/index.js +4 -0
package/lib/cli/commands/tool/index.d.ts +6 -0
package/lib/cli/commands/tool/index.js +8 -0
package/lib/cli/commands/tool/prompt/builder.d.ts +4 -0
package/lib/cli/commands/tool/prompt/builder.js +11 -0
package/lib/cli/commands/tool/prompt/handler.d.ts +4 -0
package/lib/cli/commands/tool/prompt/handler.js +14 -0
package/lib/cli/commands/tool/prompt/index.d.ts +4 -0
package/lib/cli/commands/tool/prompt/index.js +4 -0
package/lib/cli/commands/tool/schema/builder.d.ts +2 -0
package/lib/cli/commands/tool/schema/builder.js +3 -0
package/lib/cli/commands/tool/schema/handler.d.ts +2 -0
package/lib/cli/commands/tool/schema/handler.js +12 -0
package/lib/cli/commands/tool/schema/index.d.ts +4 -0
package/lib/cli/commands/tool/schema/index.js +4 -0
package/lib/cli/commands/tool/scripting/builder.d.ts +20 -0
package/lib/cli/commands/tool/scripting/builder.js +63 -0
package/lib/cli/commands/tool/scripting/handler.d.ts +12 -0
package/lib/cli/commands/tool/scripting/handler.js +36 -0
package/lib/cli/commands/tool/scripting/index.d.ts +4 -0
package/lib/cli/commands/tool/scripting/index.js +4 -0
package/lib/cli/commands/tool/story_to_script/builder.d.ts +18 -0
package/lib/cli/commands/tool/story_to_script/builder.js +53 -0
package/lib/cli/commands/tool/story_to_script/handler.d.ts +11 -0
package/lib/cli/commands/tool/story_to_script/handler.js +35 -0
package/lib/cli/commands/tool/story_to_script/index.d.ts +4 -0
package/lib/cli/commands/tool/story_to_script/index.js +4 -0
package/lib/cli/commands/translate/builder.d.ts +14 -0
package/lib/cli/commands/translate/builder.js +5 -0
package/lib/cli/commands/translate/handler.d.ts +4 -0
package/lib/cli/commands/translate/handler.js +6 -0
package/lib/cli/commands/translate/index.d.ts +4 -0
package/lib/cli/commands/translate/index.js +4 -0
package/lib/cli/common.d.ts +6 -2
package/lib/cli/common.js +18 -7
package/lib/cli/helpers.d.ts +38 -0
package/lib/cli/helpers.js +115 -0
package/lib/cli/tool-args.d.ts +1 -0
package/lib/cli/tool-args.js +1 -1
package/lib/cli/tool-cli.js +8 -0
package/lib/methods/mulmo_script.d.ts +0 -1
package/lib/methods/mulmo_script.js +4 -7
package/lib/methods/mulmo_script_template.js +2 -12
package/lib/tools/create_mulmo_script_from_url.d.ts +1 -1
package/lib/tools/create_mulmo_script_from_url.js +43 -14
package/lib/tools/create_mulmo_script_interactively.js +14 -13
package/lib/tools/dump_prompt.js +2 -0
package/lib/tools/story_to_script.d.ts +10 -0
package/lib/tools/story_to_script.js +201 -0
package/lib/types/cli_types.d.ts +14 -0
package/lib/types/cli_types.js +1 -0
package/lib/types/schema.d.ts +493 -176
package/lib/types/schema.js +37 -7
package/lib/types/type.d.ts +6 -1
package/lib/utils/const.d.ts +1 -0
package/lib/utils/const.js +1 -0
package/lib/utils/ffmpeg_utils.d.ts +12 -0
package/lib/utils/ffmpeg_utils.js +63 -0
package/lib/utils/file.d.ts +7 -3
package/lib/utils/file.js +24 -5
package/lib/utils/image_plugins/chart.js +6 -1
package/lib/utils/image_plugins/html_tailwind.d.ts +3 -0
package/lib/utils/image_plugins/html_tailwind.js +18 -0
package/lib/utils/image_plugins/index.d.ts +2 -1
package/lib/utils/image_plugins/index.js +2 -1
package/lib/utils/image_plugins/mermaid.js +1 -1
package/lib/utils/image_plugins/tailwind.d.ts +3 -0
package/lib/utils/image_plugins/tailwind.js +18 -0
package/lib/utils/image_plugins/text_slide.js +9 -2
package/lib/utils/markdown.d.ts +1 -1
package/lib/utils/markdown.js +8 -2
package/lib/utils/preprocess.d.ts +23 -12
package/lib/utils/preprocess.js +4 -0
package/lib/utils/prompt.d.ts +15 -0
package/lib/utils/prompt.js +57 -0
package/lib/utils/utils.d.ts +2 -0
package/lib/utils/utils.js +10 -0
package/package.json +27 -23

package/lib/agents/add_bgm_agent.js CHANGED Viewed

@@ -1,46 +1,22 @@
 import { GraphAILogger } from "graphai";
-import ffmpeg from "fluent-ffmpeg";
-import { MulmoScriptMethods } from "../methods/index.js";
+import { FfmpegContextAddInput, FfmpegContextInit, FfmpegContextGenerateOutput, ffmpegGetMediaDuration } from "../utils/ffmpeg_utils.js";
 const addBGMAgent = async ({ namedInputs, params, }) => {
     const { voiceFile, outputFile, script } = namedInputs;
     const { musicFile } = params;
-    const promise = new Promise((resolve, reject) => {
-        ffmpeg.ffprobe(voiceFile, (err, metadata) => {
-            if (err) {
-                GraphAILogger.info("Error getting metadata: " + err.message);
-                reject(err);
-            }
-            const speechDuration = metadata.format.duration;
-            const padding = MulmoScriptMethods.getPadding(script);
-            const totalDuration = (padding * 2) / 1000 + Math.round(speechDuration ?? 0);
-            GraphAILogger.log("totalDucation:", speechDuration, totalDuration);
-            const command = ffmpeg();
-            command
-                .input(musicFile)
-                .input(voiceFile)
-                .complexFilter([
-                // Add a 2-second delay to the speech
-                `[1:a]adelay=${padding}|${padding}, volume=4[a1]`, // 4000ms delay for both left and right channels
-                // Set the background music volume to 0.2
-                `[0:a]volume=0.2[a0]`,
-                // Mix the delayed speech and the background music
-                `[a0][a1]amix=inputs=2:duration=longest:dropout_transition=3[amixed]`,
-                // Trim the output to the length of speech + 8 seconds
-                `[amixed]atrim=start=0:end=${totalDuration}[trimmed]`,
-                // Add fade out effect for the last 4 seconds
-                `[trimmed]afade=t=out:st=${totalDuration - padding / 1000}:d=${padding}`,
-            ])
-                .on("error", (err) => {
-                GraphAILogger.info("Error: " + err.message);
-                reject(err);
-            })
-                .on("end", () => {
-                resolve(0);
-            })
-                .save(outputFile);
-        });
-    });
-    await promise;
+    const speechDuration = await ffmpegGetMediaDuration(voiceFile);
+    const introPadding = script.audioParams.introPadding;
+    const outroPadding = script.audioParams.outroPadding;
+    const totalDuration = speechDuration + introPadding + outroPadding;
+    GraphAILogger.log("totalDucation:", speechDuration, totalDuration);
+    const ffmpegContext = FfmpegContextInit();
+    const musicInputIndex = FfmpegContextAddInput(ffmpegContext, musicFile);
+    const voiceInputIndex = FfmpegContextAddInput(ffmpegContext, voiceFile);
+    ffmpegContext.filterComplex.push(`[${musicInputIndex}:a]aformat=sample_fmts=fltp:sample_rates=44100:channel_layouts=stereo, volume=0.2[music]`);
+    ffmpegContext.filterComplex.push(`[${voiceInputIndex}:a]aformat=sample_fmts=fltp:sample_rates=44100:channel_layouts=stereo, volume=2, adelay=${introPadding * 1000}|${introPadding * 1000}[voice]`);
+    ffmpegContext.filterComplex.push(`[music][voice]amix=inputs=2:duration=longest[mixed]`);
+    ffmpegContext.filterComplex.push(`[mixed]atrim=start=0:end=${totalDuration}[trimmed]`);
+    ffmpegContext.filterComplex.push(`[trimmed]afade=t=out:st=${totalDuration - outroPadding}:d=${outroPadding}[faded]`);
+    await FfmpegContextGenerateOutput(ffmpegContext, outputFile, ["-map", "[faded]"]);
     return outputFile;
 };
 const addBGMAgentInfo = {

package/lib/agents/combine_audio_files_agent.js CHANGED Viewed

@@ -1,45 +1,52 @@
 import { GraphAILogger } from "graphai";
-import ffmpeg from "fluent-ffmpeg";
-import { silentPath, silentLastPath } from "../utils/file.js";
-const combineAudioFilesAgent = async ({ namedInputs }) => {
-    const { context, combinedFileName, audioDirPath } = namedInputs;
-    const command = ffmpeg();
-    const getDuration = (filePath, isLastGap) => {
-        return new Promise((resolve, reject) => {
-            ffmpeg.ffprobe(filePath, (err, metadata) => {
-                if (err) {
-                    GraphAILogger.info("Error while getting metadata:", err);
-                    reject(err);
-                }
-                else {
-                    // TODO: Remove hard-coded 0.8 and 0.3
-                    resolve(metadata.format.duration + (isLastGap ? 0.8 : 0.3));
-                }
-            });
-        });
-    };
-    await Promise.all(context.studio.beats.map(async (studioBeat, index) => {
-        const isLastGap = index === context.studio.beats.length - 2;
+import { silent60secPath } from "../utils/file.js";
+import { FfmpegContextInit, FfmpegContextGenerateOutput, FfmpegContextInputFormattedAudio, ffmpegGetMediaDuration } from "../utils/ffmpeg_utils.js";
+const combineAudioFilesAgent = async ({ namedInputs, }) => {
+    const { context, combinedFileName } = namedInputs;
+    const ffmpegContext = FfmpegContextInit();
+    const longSilentId = FfmpegContextInputFormattedAudio(ffmpegContext, silent60secPath);
+    // We cannot reuse longSilentId. We need to explicitly split it for each beat.
+    const silentIds = context.studio.beats.map((_, index) => `[ls_${index}]`);
+    ffmpegContext.filterComplex.push(`${longSilentId}asplit=${silentIds.length}${silentIds.join("")}`);
+    const inputIds = (await Promise.all(context.studio.beats.map(async (studioBeat, index) => {
+        const isClosingGap = index === context.studio.beats.length - 2;
         if (studioBeat.audioFile) {
-            command.input(studioBeat.audioFile);
-            command.input(isLastGap ? silentLastPath : silentPath);
-            studioBeat.duration = await getDuration(studioBeat.audioFile, isLastGap);
+            const audioId = FfmpegContextInputFormattedAudio(ffmpegContext, studioBeat.audioFile);
+            const padding = (() => {
+                if (index === context.studio.beats.length - 1) {
+                    return 0;
+                }
+                return isClosingGap ? context.studio.script.audioParams.closingPadding : context.studio.script.audioParams.padding;
+            })();
+            studioBeat.duration = (await ffmpegGetMediaDuration(studioBeat.audioFile)) + padding;
+            if (padding > 0) {
+                const silentId = silentIds.pop();
+                ffmpegContext.filterComplex.push(`${silentId}atrim=start=0:end=${padding}[padding_${index}]`);
+                return [audioId, `[padding_${index}]`];
+            }
+            else {
+                return [audioId];
+            }
         }
         else {
-            GraphAILogger.error("Missing studioBeat.audioFile:", index);
+            // NOTE: We come here when the text is empty and no audio property is specified.
+            studioBeat.duration = context.studio.script.beats[index].duration ?? 1.0;
+            const silentId = silentIds.pop();
+            ffmpegContext.filterComplex.push(`${silentId}atrim=start=0:end=${studioBeat.duration}[silent_${index}]`);
+            return [`[silent_${index}]`];
         }
-    }));
-    await new Promise((resolve, reject) => {
-        command
-            .on("end", () => {
-            resolve(0);
-        })
-            .on("error", (err) => {
-            GraphAILogger.info("Error while combining MP3 files:", err);
-            reject(err);
-        })
-            .mergeToFile(combinedFileName, audioDirPath);
+    }))).flat();
+    // HACK: Because the last beat may not use an silent audio, we need to consume it to make ffmpeg happy.
+    if (silentIds.length > 1) {
+        throw new Error("UNEXPECTED: silentIds.length > 1");
+    }
+    silentIds.forEach((silentId) => {
+        GraphAILogger.log(`Using extra silentId: ${silentId}`);
+        ffmpegContext.filterComplex.push(`${silentId}atrim=start=0:end=${0.01}[silent_extra]`);
+        inputIds.push("[silent_extra]");
     });
+    ffmpegContext.filterComplex.push(`${inputIds.join("")}concat=n=${inputIds.length}:v=0:a=1[aout]`);
+    await FfmpegContextGenerateOutput(ffmpegContext, combinedFileName, ["-map", "[aout]"]);
     return {
         studio: context.studio,
     };

package/lib/agents/index.d.ts CHANGED Viewed

@@ -2,12 +2,11 @@ import addBGMAgent from "./add_bgm_agent.js";
 import combineAudioFilesAgent from "./combine_audio_files_agent.js";
 import imageGoogleAgent from "./image_google_agent.js";
 import imageOpenaiAgent from "./image_openai_agent.js";
-import mulmoPromptsAgent from "./mulmo_prompts_agent.js";
 import ttsNijivoiceAgent from "./tts_nijivoice_agent.js";
 import ttsOpenaiAgent from "./tts_openai_agent.js";
-import validateMulmoScriptAgent from "./validate_mulmo_script_agent.js";
+import validateSchemaAgent from "./validate_schema_agent.js";
 import { browserlessAgent } from "@graphai/browserless_agent";
 import { textInputAgent } from "@graphai/input_agents";
 import { openAIAgent } from "@graphai/openai_agent";
 import { fileWriteAgent } from "@graphai/vanilla_node_agents";
-export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGoogleAgent, imageOpenaiAgent, mulmoPromptsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, validateMulmoScriptAgent, };
+export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGoogleAgent, imageOpenaiAgent, ttsNijivoiceAgent, ttsOpenaiAgent, validateSchemaAgent, };

package/lib/agents/index.js CHANGED Viewed

@@ -2,13 +2,12 @@ import addBGMAgent from "./add_bgm_agent.js";
 import combineAudioFilesAgent from "./combine_audio_files_agent.js";
 import imageGoogleAgent from "./image_google_agent.js";
 import imageOpenaiAgent from "./image_openai_agent.js";
-import mulmoPromptsAgent from "./mulmo_prompts_agent.js";
 import ttsNijivoiceAgent from "./tts_nijivoice_agent.js";
 import ttsOpenaiAgent from "./tts_openai_agent.js";
-import validateMulmoScriptAgent from "./validate_mulmo_script_agent.js";
+import validateSchemaAgent from "./validate_schema_agent.js";
 import { browserlessAgent } from "@graphai/browserless_agent";
 import { textInputAgent } from "@graphai/input_agents";
 import { openAIAgent } from "@graphai/openai_agent";
 // import * as vanilla from "@graphai/vanilla";
 import { fileWriteAgent } from "@graphai/vanilla_node_agents";
-export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGoogleAgent, imageOpenaiAgent, mulmoPromptsAgent, ttsNijivoiceAgent, ttsOpenaiAgent, validateMulmoScriptAgent, };
+export { openAIAgent, fileWriteAgent, browserlessAgent, textInputAgent, addBGMAgent, combineAudioFilesAgent, imageGoogleAgent, imageOpenaiAgent, ttsNijivoiceAgent, ttsOpenaiAgent, validateSchemaAgent, };

package/lib/agents/tts_google_agent.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+import type { AgentFunction, AgentFunctionInfo } from "graphai";
+export declare const ttsGoogleAgent: AgentFunction;
+declare const ttsGoogleAgentInfo: AgentFunctionInfo;
+export default ttsGoogleAgentInfo;

package/lib/agents/tts_google_agent.js ADDED Viewed

@@ -0,0 +1,51 @@
+import { GraphAILogger } from "graphai";
+import * as textToSpeech from "@google-cloud/text-to-speech";
+const client = new textToSpeech.TextToSpeechClient();
+export const ttsGoogleAgent = async ({ namedInputs, params }) => {
+    const { text } = namedInputs;
+    const { voice, suppressError, speed } = params;
+    // Construct the voice request
+    const voiceParams = {
+        languageCode: "en-US", // TODO: Make this configurable
+        ssmlGender: "FEMALE", // TODO: Make this configurable
+    };
+    if (voice) {
+        voiceParams.name = voice;
+    }
+    // Construct the request
+    const request = {
+        input: { text: text },
+        voice: voiceParams,
+        audioConfig: {
+            audioEncoding: "MP3",
+            speakingRate: speed || 1.0,
+        },
+    };
+    try {
+        // Call the Text-to-Speech API
+        const [response] = await client.synthesizeSpeech(request);
+        return { buffer: response.audioContent };
+    }
+    catch (e) {
+        if (suppressError) {
+            return {
+                error: e,
+            };
+        }
+        GraphAILogger.info(e);
+        throw new Error("TTS Google Error");
+    }
+};
+const ttsGoogleAgentInfo = {
+    name: "ttsGoogleAgent",
+    agent: ttsGoogleAgent,
+    mock: ttsGoogleAgent,
+    samples: [],
+    description: "Google TTS agent",
+    category: ["tts"],
+    author: "Receptron Team",
+    repository: "https://github.com/receptron/graphai-agents/tree/main/tts/tts-openai-agent",
+    license: "MIT",
+    environmentVariables: ["OPENAI_API_KEY"],
+};
+export default ttsGoogleAgentInfo;

package/lib/agents/validate_schema_agent.d.ts ADDED Viewed

@@ -0,0 +1,19 @@
+import type { AgentFunction, AgentFunctionInfo, DefaultConfigData } from "graphai";
+import { MulmoScript } from "../types/index.js";
+import { ZodSchema } from "zod";
+interface ValidateMulmoScriptInputs {
+    text: string;
+    schema: ZodSchema;
+}
+interface ValidateMulmoScriptResponse {
+    isValid: boolean;
+    data?: MulmoScript;
+    error?: string;
+}
+/**
+ * Zod schema validation agent
+ * Validates if a JSON string conforms to the Zod schema
+ */
+export declare const validateSchemaAgent: AgentFunction<object, ValidateMulmoScriptResponse, ValidateMulmoScriptInputs, DefaultConfigData>;
+declare const validateMulmoScriptAgentInfo: AgentFunctionInfo;
+export default validateMulmoScriptAgentInfo;

package/lib/agents/validate_schema_agent.js ADDED Viewed

@@ -0,0 +1,36 @@
+import assert from "node:assert";
+/**
+ * Zod schema validation agent
+ * Validates if a JSON string conforms to the Zod schema
+ */
+export const validateSchemaAgent = async ({ namedInputs, }) => {
+    const { text, schema } = namedInputs;
+    try {
+        assert(schema, "schema is required");
+        assert(text, "text is required");
+        const jsonData = JSON.parse(text);
+        const parsed = schema.parse(jsonData);
+        return {
+            isValid: true,
+            data: parsed,
+        };
+    }
+    catch (error) {
+        return {
+            isValid: false,
+            error: error instanceof Error ? error.message : String(error),
+        };
+    }
+};
+const validateMulmoScriptAgentInfo = {
+    name: "validateSchemaAgent",
+    agent: validateSchemaAgent,
+    mock: validateSchemaAgent,
+    samples: [],
+    description: "Validates if a JSON string conforms to the Zod schema",
+    category: ["validation"],
+    author: "Receptron Team",
+    repository: "https://github.com/receptron/mulmocast-cli/tree/main/src/agents/validate_schema_agent.ts",
+    license: "MIT",
+};
+export default validateMulmoScriptAgentInfo;

package/lib/cli/args.d.ts CHANGED Viewed

@@ -3,9 +3,11 @@ export declare const getArgs: () => {
     v: boolean;
     o: string | undefined;
     b: string | undefined;
+    l: string | undefined;
     a: string | undefined;
     i: string | undefined;
     f: boolean;
+    c: string | undefined;
     pdf_mode: string;
     pdf_size: string;
     _: (string | number)[];

package/lib/cli/args.js CHANGED Viewed

@@ -1,7 +1,7 @@
 import yargs from "yargs";
 import { hideBin } from "yargs/helpers";
 import { commonOptions } from "./common.js";
-import { pdf_modes, pdf_sizes } from "../utils/const.js";
+import { pdf_modes, pdf_sizes, languages } from "../utils/const.js";
 export const getArgs = () => {
     return commonOptions(yargs(hideBin(process.argv)))
         .scriptName("mulmo")
@@ -23,6 +23,13 @@ export const getArgs = () => {
         demandOption: false,
         default: false,
         type: "boolean",
+    })
+        .option("c", {
+        alias: "caption",
+        description: "Video captions",
+        choices: languages,
+        demandOption: false,
+        type: "string",
     })
         .option("pdf_mode", {
         description: "pdf mode",
@@ -40,7 +47,7 @@ export const getArgs = () => {
         return yargs
             .positional("action", {
             describe: "action to perform",
-            choices: ["translate", "audio", "images", "movie", "pdf", "preprocess"],
+            choices: ["translate", "audio", "images", "movie", "pdf"],
             type: "string",
         })
             .positional("file", {

package/lib/cli/bin.d.ts ADDED Viewed

@@ -0,0 +1,3 @@
+#!/usr/bin/env node
+import "dotenv/config";
+export declare const main: () => Promise<void>;

package/lib/cli/bin.js ADDED Viewed

@@ -0,0 +1,38 @@
+#!/usr/bin/env node
+import "dotenv/config";
+import yargs from "yargs/yargs";
+import { hideBin } from "yargs/helpers";
+import * as translateCmd from "./commands/translate/index.js";
+import * as audioCmd from "./commands/audio/index.js";
+import * as imagesCmd from "./commands/image/index.js";
+import * as movieCmd from "./commands/movie/index.js";
+import * as pdfCmd from "./commands/pdf/index.js";
+import * as toolCmd from "./commands/tool/index.js";
+import { GraphAILogger } from "graphai";
+export const main = async () => {
+    const cli = yargs(hideBin(process.argv))
+        .scriptName("mulmo")
+        .usage("$0 <command> [options]")
+        .option("v", {
+        alias: "verbose",
+        describe: "verbose log",
+        demandOption: true,
+        default: false,
+        type: "boolean",
+    })
+        .command(translateCmd)
+        .command(audioCmd)
+        .command(imagesCmd)
+        .command(movieCmd)
+        .command(pdfCmd)
+        .command(toolCmd)
+        .demandCommand()
+        .strict()
+        .help()
+        .alias("help", "h");
+    await cli.parseAsync();
+};
+main().catch((error) => {
+    GraphAILogger.info("An unexpected error occurred:", error);
+    process.exit(1);
+});

package/lib/cli/cli.js CHANGED Viewed

@@ -6,18 +6,32 @@ import { GraphAILogger } from "graphai";
 import { getArgs } from "./args.js";
 import { createOrUpdateStudioData } from "../utils/preprocess.js";
 import { outDirName, imageDirName, audioDirName } from "../utils/const.js";
-import { translate, audio, images, movie, pdf } from "../actions/index.js";
-import { getBaseDirPath, getFullPath, readMulmoScriptFile, fetchMulmoScriptFile, getOutputStudioFilePath } from "../utils/file.js";
+import { translate, audio, images, movie, pdf, captions } from "../actions/index.js";
+import { getBaseDirPath, getFullPath, readMulmoScriptFile, fetchMulmoScriptFile, getOutputStudioFilePath, resolveDirPath } from "../utils/file.js";
 import { isHttp } from "../utils/utils.js";
+import clipboardy from "clipboardy";
 export const getFileObject = (_args) => {
     const { basedir, file, outdir, imagedir, audiodir } = _args;
     const baseDirPath = getBaseDirPath(basedir);
-    const fileOrUrl = file ?? "";
-    const fileName = path.parse(fileOrUrl).name;
+    const outDirPath = getFullPath(baseDirPath, outdir ?? outDirName);
+    const { fileOrUrl, fileName } = (() => {
+        if (file === "__clipboard") {
+            // We generate a new unique script file from clipboard text in the output directory
+            const now = new Date();
+            const pad = (n) => n.toString().padStart(2, "0");
+            const fileName = `script_${now.getFullYear()}${pad(now.getMonth() + 1)}${pad(now.getDate())}_${pad(now.getHours())}${pad(now.getMinutes())}${pad(now.getSeconds())}`;
+            const clipboardText = clipboardy.readSync();
+            const fileOrUrl = resolveDirPath(outDirPath, `${fileName}.json`);
+            fs.writeFileSync(fileOrUrl, clipboardText, "utf8");
+            return { fileOrUrl, fileName };
+        }
+        const fileOrUrl = file ?? "";
+        const fileName = path.parse(fileOrUrl).name;
+        return { fileOrUrl, fileName };
+    })();
     const isHttpPath = isHttp(fileOrUrl);
     const mulmoFilePath = isHttpPath ? "" : getFullPath(baseDirPath, fileOrUrl);
     const mulmoFileDirPath = path.dirname(isHttpPath ? baseDirPath : mulmoFilePath);
-    const outDirPath = getFullPath(baseDirPath, outdir ?? outDirName);
     const imageDirPath = getFullPath(outDirPath, imagedir ?? imageDirName);
     const audioDirPath = getFullPath(outDirPath, audiodir ?? audioDirName);
     const outputStudioFilePath = getOutputStudioFilePath(outDirPath, fileName);
@@ -50,7 +64,7 @@ export const main = async () => {
         GraphAILogger.setLevelEnabled("log", false);
         GraphAILogger.setLevelEnabled("warn", false);
     }
-    const { action, force, pdf_mode, pdf_size } = args;
+    const { action, f: force, pdf_mode, pdf_size, l: lang, c: caption } = args;
     const mulmoScript = await fetchScript(isHttpPath, mulmoFilePath, fileOrUrl);
     // Create or update MulmoStudio file with MulmoScript
     const currentStudio = readMulmoScriptFile(outputStudioFilePath);
@@ -68,8 +82,11 @@ export const main = async () => {
         studio,
         fileDirs: files,
         force: Boolean(force),
+        lang: lang,
+        caption: caption,
     };
-    if (action === "translate") {
+    if (action === "translate" || lang || caption) {
+        GraphAILogger.log("run translate");
         await translate(context);
     }
     if (action === "audio") {
@@ -79,6 +96,9 @@ export const main = async () => {
         await images(context);
     }
     if (action === "movie") {
+        if (caption) {
+            await captions(context);
+        }
         await audio(context);
         await images(context);
         await movie(context);
@@ -87,4 +107,11 @@ export const main = async () => {
         await images(context);
         await pdf(context, pdf_mode, pdf_size);
     }
+    if (context.studio.script.title) {
+        GraphAILogger.info(context.studio.script.title);
+    }
+    if (context.studio.script.references) {
+        const textOutput = context.studio.script.references.map((reference) => `${reference.title}\n${reference.url}`).join("\n");
+        GraphAILogger.info(textOutput);
+    }
 };

package/lib/cli/commands/audio/builder.d.ts ADDED Viewed

@@ -0,0 +1,14 @@
+import type { Argv } from "yargs";
+export declare const builder: (yargs: Argv) => Argv<{
+    o: string | undefined;
+} & {
+    b: string | undefined;
+} & {
+    l: string | undefined;
+} & {
+    f: boolean;
+} & {
+    file: string | undefined;
+} & {
+    a: string | undefined;
+}>;

package/lib/cli/commands/audio/builder.js ADDED Viewed

@@ -0,0 +1,6 @@
+import { commonOptions } from "../../common.js";
+export const builder = (yargs) => commonOptions(yargs).option("a", {
+    alias: "audiodir",
+    describe: "Audio output directory",
+    type: "string",
+});

package/lib/cli/commands/audio/handler.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+import { CliArgs } from "../../../types/cli_types.js";
+export declare const handler: (argv: CliArgs<{
+    a?: string;
+}>) => Promise<void>;

package/lib/cli/commands/audio/handler.js ADDED Viewed

@@ -0,0 +1,7 @@
+import { audio } from "../../../actions/index.js";
+import { initializeContext, runTranslateIfNeeded } from "../../../cli/helpers.js";
+export const handler = async (argv) => {
+    const context = await initializeContext(argv);
+    await runTranslateIfNeeded(context, argv);
+    await audio(context);
+};

package/lib/cli/commands/audio/index.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export declare const command = "audio <file>";
+export declare const desc = "Generate audio files";
+export { builder } from "./builder.js";
+export { handler } from "./handler.js";

package/lib/cli/commands/audio/index.js ADDED Viewed

@@ -0,0 +1,4 @@
+export const command = "audio <file>";
+export const desc = "Generate audio files";
+export { builder } from "./builder.js";
+export { handler } from "./handler.js";

package/lib/cli/commands/image/builder.d.ts ADDED Viewed

@@ -0,0 +1,14 @@
+import type { Argv } from "yargs";
+export declare const builder: (yargs: Argv) => Argv<{
+    o: string | undefined;
+} & {
+    b: string | undefined;
+} & {
+    l: string | undefined;
+} & {
+    f: boolean;
+} & {
+    file: string | undefined;
+} & {
+    i: string | undefined;
+}>;

package/lib/cli/commands/image/builder.js ADDED Viewed

@@ -0,0 +1,6 @@
+import { commonOptions } from "../../common.js";
+export const builder = (yargs) => commonOptions(yargs).option("i", {
+    alias: "imagedir",
+    describe: "Image output directory",
+    type: "string",
+});

package/lib/cli/commands/image/handler.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+import { CliArgs } from "../../../types/cli_types.js";
+export declare const handler: (argv: CliArgs<{
+    i?: string;
+}>) => Promise<void>;

package/lib/cli/commands/image/handler.js ADDED Viewed

@@ -0,0 +1,7 @@
+import { images } from "../../../actions/index.js";
+import { initializeContext, runTranslateIfNeeded } from "../../../cli/helpers.js";
+export const handler = async (argv) => {
+    const context = await initializeContext(argv);
+    await runTranslateIfNeeded(context, argv);
+    await images(context);
+};

package/lib/cli/commands/image/index.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export declare const command = "images <file>";
+export declare const desc = "Generate image files";
+export { builder } from "./builder.js";
+export { handler } from "./handler.js";

package/lib/cli/commands/image/index.js ADDED Viewed

@@ -0,0 +1,4 @@
+export const command = "images <file>";
+export const desc = "Generate image files";
+export { builder } from "./builder.js";
+export { handler } from "./handler.js";

package/lib/cli/commands/movie/builder.d.ts ADDED Viewed

@@ -0,0 +1,18 @@
+import type { Argv } from "yargs";
+export declare const builder: (yargs: Argv) => Argv<{
+    o: string | undefined;
+} & {
+    b: string | undefined;
+} & {
+    l: string | undefined;
+} & {
+    f: boolean;
+} & {
+    file: string | undefined;
+} & {
+    a: string | undefined;
+} & {
+    i: string | undefined;
+} & {
+    c: string | undefined;
+}>;

package/lib/cli/commands/movie/builder.js ADDED Viewed

@@ -0,0 +1,19 @@
+import { commonOptions } from "../../common.js";
+import { languages } from "../../../utils/const.js";
+export const builder = (yargs) => commonOptions(yargs)
+    .option("a", {
+    alias: "audiodir",
+    describe: "Audio output directory",
+    type: "string",
+})
+    .option("i", {
+    alias: "imagedir",
+    describe: "Image output directory",
+    type: "string",
+})
+    .option("c", {
+    alias: "caption",
+    describe: "Video captions",
+    choices: languages,
+    type: "string",
+});

package/lib/cli/commands/movie/handler.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+import { CliArgs } from "../../../types/cli_types.js";
+export declare const handler: (argv: CliArgs<{
+    a?: string;
+    i?: string;
+    c?: string;
+}>) => Promise<void>;

package/lib/cli/commands/movie/handler.js ADDED Viewed

@@ -0,0 +1,12 @@
+import { audio, images, movie, captions } from "../../../actions/index.js";
+import { initializeContext, runTranslateIfNeeded } from "../../../cli/helpers.js";
+export const handler = async (argv) => {
+    const context = await initializeContext(argv);
+    await runTranslateIfNeeded(context, argv);
+    await audio(context);
+    await images(context);
+    if (context.caption) {
+        await captions(context);
+    }
+    await movie(context);
+};

package/lib/cli/commands/movie/index.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export declare const command = "movie <file>";
+export declare const desc = "Generate movie file";
+export { builder } from "./builder.js";
+export { handler } from "./handler.js";