npm - mulmocast - Versions diffs - 0.0.1 → 0.0.3 - Mend

mulmocast 0.0.1 → 0.0.3

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (115)

package/README.md +129 -15
package/assets/font/NotoSansJP-Regular.ttf +0 -0
package/assets/html/chart.html +38 -0
package/assets/html/mermaid.html +51 -0
package/assets/templates/business.json +57 -14
package/assets/templates/children_book.json +1 -3
package/assets/templates/coding.json +140 -0
package/lib/actions/audio.d.ts +2 -2
package/lib/actions/audio.js +88 -101
package/lib/actions/images.d.ts +1 -1
package/lib/actions/images.js +50 -88
package/lib/actions/index.d.ts +5 -0
package/lib/actions/index.js +5 -0
package/lib/actions/movie.d.ts +9 -1
package/lib/actions/movie.js +124 -65
package/lib/actions/pdf.d.ts +2 -0
package/lib/actions/pdf.js +211 -0
package/lib/actions/pdf2.d.ts +2 -0
package/lib/actions/pdf2.js +203 -0
package/lib/actions/translate.d.ts +1 -1
package/lib/actions/translate.js +38 -61
package/lib/agents/add_bgm_agent.d.ts +1 -1
package/lib/agents/add_bgm_agent.js +10 -14
package/lib/agents/anthropic_agent.d.ts +23 -0
package/lib/agents/anthropic_agent.js +162 -0
package/lib/agents/combine_audio_files_agent.d.ts +1 -1
package/lib/agents/combine_audio_files_agent.js +33 -32
package/lib/agents/image_google_agent.d.ts +1 -1
package/lib/agents/image_google_agent.js +8 -11
package/lib/agents/image_openai_agent.js +7 -14
package/lib/agents/index.d.ts +8 -8
package/lib/agents/index.js +13 -30
package/lib/agents/mulmo_prompts_agent.d.ts +1 -1
package/lib/agents/mulmo_prompts_agent.js +7 -11
package/lib/agents/nested_agent.d.ts +9 -0
package/lib/agents/nested_agent.js +138 -0
package/lib/agents/prompts_data.js +1 -4
package/lib/agents/tts_nijivoice_agent.d.ts +1 -1
package/lib/agents/tts_nijivoice_agent.js +8 -12
package/lib/agents/tts_openai_agent.js +9 -16
package/lib/agents/validate_mulmo_script_agent.d.ts +1 -1
package/lib/agents/validate_mulmo_script_agent.js +6 -10
package/lib/cli/args.d.ts +5 -2
package/lib/cli/args.js +52 -35
package/lib/cli/cli.d.ts +14 -0
package/lib/cli/cli.js +74 -57
package/lib/cli/common.js +1 -5
package/lib/cli/tool-args.d.ts +4 -1
package/lib/cli/tool-args.js +29 -18
package/lib/cli/tool-cli.js +34 -51
package/lib/methods/index.d.ts +4 -3
package/lib/methods/index.js +4 -19
package/lib/methods/mulmo_media_source.d.ts +4 -0
package/lib/methods/mulmo_media_source.js +21 -0
package/lib/methods/mulmo_script.d.ts +6 -5
package/lib/methods/mulmo_script.js +29 -16
package/lib/methods/mulmo_script_template.d.ts +1 -1
package/lib/methods/mulmo_script_template.js +4 -10
package/lib/methods/mulmo_studio_context.d.ts +1 -1
package/lib/methods/mulmo_studio_context.js +3 -9
package/lib/tools/create_mulmo_script_from_url.d.ts +3 -0
package/lib/tools/create_mulmo_script_from_url.js +152 -0
package/lib/tools/create_mulmo_script_interactively.d.ts +3 -0
package/lib/tools/create_mulmo_script_interactively.js +258 -0
package/lib/tools/dump_prompt.js +5 -8
package/lib/tools/prompt.js +9 -11
package/lib/tools/seed_from_url2.d.ts +3 -0
package/lib/tools/seed_from_url2.js +154 -0
package/lib/types/index.d.ts +2 -1
package/lib/types/index.js +2 -17
package/lib/types/schema.d.ts +3624 -2798
package/lib/types/schema.js +172 -123
package/lib/types/type.d.ts +34 -3
package/lib/types/type.js +1 -2
package/lib/utils/const.d.ts +4 -1
package/lib/utils/const.js +6 -6
package/lib/utils/file.d.ts +22 -4
package/lib/utils/file.js +100 -79
package/lib/utils/filters.d.ts +1 -0
package/lib/utils/filters.js +47 -26
package/lib/utils/image_plugins/chart.d.ts +3 -0
package/lib/utils/image_plugins/chart.js +18 -0
package/lib/utils/image_plugins/image.d.ts +2 -0
package/lib/utils/image_plugins/image.js +3 -0
package/lib/utils/image_plugins/index.d.ts +7 -0
package/lib/utils/image_plugins/index.js +7 -0
package/lib/utils/image_plugins/markdown.d.ts +3 -0
package/lib/utils/image_plugins/markdown.js +11 -0
package/lib/utils/image_plugins/mermaid.d.ts +3 -0
package/lib/utils/image_plugins/mermaid.js +21 -0
package/lib/utils/image_plugins/movie.d.ts +2 -0
package/lib/utils/image_plugins/movie.js +3 -0
package/lib/utils/image_plugins/source.d.ts +4 -0
package/lib/utils/image_plugins/source.js +15 -0
package/lib/utils/image_plugins/text_slide.d.ts +3 -0
package/lib/utils/image_plugins/text_slide.js +12 -0
package/lib/utils/image_plugins/type_guards.d.ts +6 -0
package/lib/utils/image_plugins/type_guards.js +21 -0
package/lib/utils/image_preprocess.d.ts +14 -0
package/lib/utils/image_preprocess.js +52 -0
package/lib/utils/inquirer.d.ts +2 -0
package/lib/utils/inquirer.js +33 -0
package/lib/utils/markdown.d.ts +3 -1
package/lib/utils/markdown.js +20 -19
package/lib/utils/pdf.d.ts +8 -0
package/lib/utils/pdf.js +75 -0
package/lib/utils/plugins.d.ts +5 -0
package/lib/utils/plugins.js +11 -0
package/lib/utils/preprocess.d.ts +70 -123
package/lib/utils/preprocess.js +37 -43
package/lib/utils/string.js +4 -10
package/lib/utils/text_hash.js +2 -39
package/lib/utils/utils.d.ts +12 -0
package/lib/utils/utils.js +34 -0
package/package.json +23 -8

package/lib/actions/audio.js CHANGED Viewed

@@ -1,88 +1,67 @@
-"use strict";
-var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
-    if (k2 === undefined) k2 = k;
-    var desc = Object.getOwnPropertyDescriptor(m, k);
-    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
-      desc = { enumerable: true, get: function() { return m[k]; } };
+import "dotenv/config";
+import { GraphAI } from "graphai";
+import * as agents from "@graphai/vanilla";
+import ttsNijivoiceAgent from "../agents/tts_nijivoice_agent.js";
+import addBGMAgent from "../agents/add_bgm_agent.js";
+import combineAudioFilesAgent from "../agents/combine_audio_files_agent.js";
+import ttsOpenaiAgent from "../agents/tts_openai_agent.js";
+import { fileWriteAgent } from "@graphai/vanilla_node_agents";
+import { MulmoScriptMethods } from "../methods/index.js";
+import { fileCacheAgentFilter } from "../utils/filters.js";
+import { getAudioArtifactFilePath, getAudioSegmentDirPath, getAudioCombinedFilePath, getOutputStudioFilePath, defaultBGMPath, mkdir, writingMessage, getAudioSegmentFilePath, resolveMediaSource, } from "../utils/file.js";
+import { text2hash } from "../utils/utils.js";
+const { default: __, ...vanillaAgents } = agents;
+// const rion_takanashi_voice = "b9277ce3-ba1c-4f6f-9a65-c05ca102ded0"; // たかなし りおん
+// const ben_carter_voice = "bc06c63f-fef6-43b6-92f7-67f919bd5dae"; // ベン・カーター
+const provider_to_agent = {
+    nijivoice: "ttsNijivoiceAgent",
+    openai: "ttsOpenaiAgent",
+};
+const getAudioPath = (context, beat, audioFile, audioDirPath) => {
+    if (beat.audio?.type === "audio") {
+        const path = resolveMediaSource(beat.audio.source, context);
+        if (path) {
+            return path;
+        }
+        throw new Error("Invalid audio source");
     }
-    Object.defineProperty(o, k2, desc);
-}) : (function(o, m, k, k2) {
-    if (k2 === undefined) k2 = k;
-    o[k2] = m[k];
-}));
-var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
-    Object.defineProperty(o, "default", { enumerable: true, value: v });
-}) : function(o, v) {
-    o["default"] = v;
-});
-var __importStar = (this && this.__importStar) || (function () {
-    var ownKeys = function(o) {
-        ownKeys = Object.getOwnPropertyNames || function (o) {
-            var ar = [];
-            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
-            return ar;
-        };
-        return ownKeys(o);
-    };
-    return function (mod) {
-        if (mod && mod.__esModule) return mod;
-        var result = {};
-        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
-        __setModuleDefault(result, mod);
-        return result;
+    return getAudioSegmentFilePath(audioDirPath, context.studio.filename, audioFile);
+};
+const preprocessor = (namedInputs) => {
+    const { beat, index, context, audioDirPath } = namedInputs;
+    const studioBeat = context.studio.beats[index];
+    const voiceId = context.studio.script.speechParams.speakers[beat.speaker].voiceId;
+    const speechOptions = MulmoScriptMethods.getSpeechOptions(context.studio.script, beat);
+    const hash_string = `${beat.text}${voiceId}${speechOptions?.instruction ?? ""}${speechOptions?.speed ?? 1.0}`;
+    const audioFile = `${context.studio.filename}_${index}_${text2hash(hash_string)}`;
+    const audioPath = getAudioPath(context, beat, audioFile, audioDirPath);
+    studioBeat.audioFile = audioPath;
+    return {
+        ttsAgent: provider_to_agent[context.studio.script.speechParams.provider],
+        studioBeat,
+        voiceId,
+        speechOptions,
+        audioPath,
     };
-})();
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
 };
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.audio = void 0;
-require("dotenv/config");
-const graphai_1 = require("graphai");
-const agents = __importStar(require("@graphai/vanilla"));
-const tts_nijivoice_agent_1 = __importDefault(require("../agents/tts_nijivoice_agent"));
-const add_bgm_agent_1 = __importDefault(require("../agents/add_bgm_agent"));
-const combine_audio_files_agent_1 = __importDefault(require("../agents/combine_audio_files_agent"));
-const tts_openai_agent_1 = __importDefault(require("../agents/tts_openai_agent"));
-const vanilla_node_agents_1 = require("@graphai/vanilla_node_agents");
-const methods_1 = require("../methods");
-const filters_1 = require("../utils/filters");
-const file_1 = require("../utils/file");
-// const rion_takanashi_voice = "b9277ce3-ba1c-4f6f-9a65-c05ca102ded0"; // たかなし りおん
-// const ben_carter_voice = "bc06c63f-fef6-43b6-92f7-67f919bd5dae"; // ベン・カーター
 const graph_tts = {
     nodes: {
         preprocessor: {
-            agent: (namedInputs) => {
-                const { beat, script, speakers } = namedInputs;
-                return {
-                    voiceId: speakers[beat.speaker].voiceId,
-                    speechOptions: methods_1.MulmoScriptMethods.getSpeechOptions(script, beat),
-                };
-            },
+            agent: preprocessor,
             inputs: {
                 beat: ":beat",
-                script: ":script",
-                speakers: ":script.speechParams.speakers",
-            },
-        },
-        ttsAgent: {
-            agent: (namedInputs) => {
-                if (namedInputs.provider === "nijivoice") {
-                    return "ttsNijivoiceAgent";
-                }
-                return "ttsOpenaiAgent";
-            },
-            inputs: {
-                provider: ":script.speechParams.provider",
+                index: ":__mapIndex",
+                context: ":context",
+                audioDirPath: ":audioDirPath",
             },
         },
         tts: {
             unless: ":beat.audio",
-            agent: ":ttsAgent",
+            agent: ":preprocessor.ttsAgent",
             inputs: {
                 text: ":beat.text",
-                file: "${:scratchpadDirPath}/${:beat.audioFile}.mp3", // TODO
+                file: ":preprocessor.audioPath",
+                force: ":context.force",
             },
             params: {
                 voice: ":preprocessor.voiceId",
@@ -97,13 +76,20 @@ const graph_data = {
     concurrency: 8,
     nodes: {
         context: {},
-        outputBGMFilePath: {},
-        outputAudioFilePath: {},
+        audioArtifactFilePath: {},
+        audioCombinedFilePath: {},
         outputStudioFilePath: {},
-        scratchpadDirPath: {},
+        audioDirPath: {},
+        audioSegmentDirPath: {},
         map: {
             agent: "mapAgent",
-            inputs: { rows: ":context.studio.beats", script: ":context.studio.script", scratchpadDirPath: ":scratchpadDirPath" },
+            inputs: {
+                rows: ":context.studio.script.beats",
+                studio: ":context.studio",
+                audioDirPath: ":audioDirPath",
+                audioSegmentDirPath: ":audioSegmentDirPath",
+                context: ":context",
+            },
             params: {
                 rowKey: "beat",
             },
@@ -114,8 +100,8 @@ const graph_data = {
             inputs: {
                 map: ":map",
                 context: ":context",
-                combinedFileName: ":outputAudioFilePath",
-                scratchpadDirPath: ":scratchpadDirPath",
+                combinedFileName: ":audioCombinedFilePath",
+                audioDirPath: ":audioDirPath",
             },
             isResult: true,
         },
@@ -129,12 +115,12 @@ const graph_data = {
         addBGM: {
             agent: "addBGMAgent",
             params: {
-                musicFile: process.env.PATH_BGM ?? file_1.defaultBGMPath,
+                musicFile: process.env.PATH_BGM ?? defaultBGMPath,
             },
             inputs: {
                 wait: ":combineFiles",
-                voiceFile: ":outputAudioFilePath",
-                outputFile: ":outputBGMFilePath",
+                voiceFile: ":audioCombinedFilePath",
+                outputFile: ":audioArtifactFilePath",
                 script: ":context.studio.script",
             },
             isResult: true,
@@ -154,33 +140,34 @@ const graph_data = {
 const agentFilters = [
     {
         name: "fileCacheAgentFilter",
-        agent: filters_1.fileCacheAgentFilter,
+        agent: fileCacheAgentFilter,
         nodeIds: ["tts"],
     },
 ];
-const audio = async (context, concurrency) => {
+export const audio = async (context) => {
     const { studio, fileDirs } = context;
-    const { outDirPath, scratchpadDirPath } = fileDirs;
-    const outputBGMFilePath = (0, file_1.getOutputBGMFilePath)(outDirPath, studio.filename);
-    const outputAudioFilePath = (0, file_1.getOutputAudioFilePath)(outDirPath, studio.filename);
-    const outputStudioFilePath = (0, file_1.getOutputStudioFilePath)(outDirPath, studio.filename);
-    (0, file_1.mkdir)(outDirPath);
-    (0, file_1.mkdir)(scratchpadDirPath);
-    graph_data.concurrency = concurrency;
-    const graph = new graphai_1.GraphAI(graph_data, {
-        ...agents,
-        fileWriteAgent: vanilla_node_agents_1.fileWriteAgent,
-        ttsOpenaiAgent: tts_openai_agent_1.default,
-        ttsNijivoiceAgent: tts_nijivoice_agent_1.default,
-        addBGMAgent: add_bgm_agent_1.default,
-        combineAudioFilesAgent: combine_audio_files_agent_1.default,
+    const { outDirPath, audioDirPath } = fileDirs;
+    const audioArtifactFilePath = getAudioArtifactFilePath(outDirPath, studio.filename);
+    const audioSegmentDirPath = getAudioSegmentDirPath(audioDirPath, studio.filename);
+    const audioCombinedFilePath = getAudioCombinedFilePath(audioDirPath, studio.filename);
+    const outputStudioFilePath = getOutputStudioFilePath(outDirPath, studio.filename);
+    mkdir(outDirPath);
+    mkdir(audioSegmentDirPath);
+    graph_data.concurrency = MulmoScriptMethods.getSpeechProvider(studio.script) === "nijivoice" ? 1 : 8;
+    const graph = new GraphAI(graph_data, {
+        ...vanillaAgents,
+        fileWriteAgent,
+        ttsOpenaiAgent,
+        ttsNijivoiceAgent,
+        addBGMAgent,
+        combineAudioFilesAgent,
     }, { agentFilters });
     graph.injectValue("context", context);
-    graph.injectValue("outputBGMFilePath", outputBGMFilePath);
-    graph.injectValue("outputAudioFilePath", outputAudioFilePath);
+    graph.injectValue("audioArtifactFilePath", audioArtifactFilePath);
+    graph.injectValue("audioCombinedFilePath", audioCombinedFilePath);
     graph.injectValue("outputStudioFilePath", outputStudioFilePath);
-    graph.injectValue("scratchpadDirPath", scratchpadDirPath);
+    graph.injectValue("audioSegmentDirPath", audioSegmentDirPath);
+    graph.injectValue("audioDirPath", audioDirPath);
     await graph.run();
-    (0, file_1.writingMessage)(outputAudioFilePath);
+    writingMessage(audioCombinedFilePath);
 };
-exports.audio = audio;

package/lib/actions/images.d.ts CHANGED Viewed

@@ -1,2 +1,2 @@
-import { MulmoStudioContext } from "../types";
+import { MulmoStudioContext } from "../types/index.js";
 export declare const images: (context: MulmoStudioContext) => Promise<void>;

package/lib/actions/images.js CHANGED Viewed

@@ -1,83 +1,42 @@
-"use strict";
-var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
-    if (k2 === undefined) k2 = k;
-    var desc = Object.getOwnPropertyDescriptor(m, k);
-    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
-      desc = { enumerable: true, get: function() { return m[k]; } };
-    }
-    Object.defineProperty(o, k2, desc);
-}) : (function(o, m, k, k2) {
-    if (k2 === undefined) k2 = k;
-    o[k2] = m[k];
-}));
-var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
-    Object.defineProperty(o, "default", { enumerable: true, value: v });
-}) : function(o, v) {
-    o["default"] = v;
-});
-var __importStar = (this && this.__importStar) || (function () {
-    var ownKeys = function(o) {
-        ownKeys = Object.getOwnPropertyNames || function (o) {
-            var ar = [];
-            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
-            return ar;
-        };
-        return ownKeys(o);
-    };
-    return function (mod) {
-        if (mod && mod.__esModule) return mod;
-        var result = {};
-        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
-        __setModuleDefault(result, mod);
-        return result;
+import dotenv from "dotenv";
+import { GraphAI, GraphAILogger } from "graphai";
+import * as agents from "@graphai/vanilla";
+import { fileWriteAgent } from "@graphai/vanilla_node_agents";
+import { getOutputStudioFilePath, mkdir } from "../utils/file.js";
+import { fileCacheAgentFilter } from "../utils/filters.js";
+import imageGoogleAgent from "../agents/image_google_agent.js";
+import imageOpenaiAgent from "../agents/image_openai_agent.js";
+import { MulmoScriptMethods } from "../methods/index.js";
+import { imagePlugins } from "../utils/image_plugins/index.js";
+const { default: __, ...vanillaAgents } = agents;
+dotenv.config();
+// const openai = new OpenAI();
+import { GoogleAuth } from "google-auth-library";
+const htmlStyle = (script, beat) => {
+    return {
+        canvasSize: MulmoScriptMethods.getCanvasSize(script),
+        textSlideStyle: MulmoScriptMethods.getTextSlideStyle(script, beat),
     };
-})();
-var __importDefault = (this && this.__importDefault) || function (mod) {
-    return (mod && mod.__esModule) ? mod : { "default": mod };
 };
-Object.defineProperty(exports, "__esModule", { value: true });
-exports.images = void 0;
-const dotenv_1 = __importDefault(require("dotenv"));
-const graphai_1 = require("graphai");
-const agents = __importStar(require("@graphai/vanilla"));
-const vanilla_node_agents_1 = require("@graphai/vanilla_node_agents");
-const file_1 = require("../utils/file");
-const filters_1 = require("../utils/filters");
-const markdown_1 = require("../utils/markdown");
-const image_google_agent_1 = __importDefault(require("../agents/image_google_agent"));
-const image_openai_agent_1 = __importDefault(require("../agents/image_openai_agent"));
-const methods_1 = require("../methods");
-dotenv_1.default.config();
-// const openai = new OpenAI();
-const google_auth_library_1 = require("google-auth-library");
-const preprocess_agent = async (namedInputs) => {
-    const { context, beat, index, suffix, imageDirPath } = namedInputs;
-    const imageParams = { ...context.studio.script.imageParams, ...beat.imageParams };
-    const prompt = (beat.imagePrompt || beat.text) + "\n" + (imageParams.style || "");
+const imagePreprocessAgent = async (namedInputs) => {
+    const { context, beat, index, suffix, imageDirPath, imageAgentInfo } = namedInputs;
+    const imageParams = { ...imageAgentInfo.imageParams, ...beat.imageParams };
     const imagePath = `${imageDirPath}/${context.studio.filename}/${index}${suffix}.png`;
-    const aspectRatio = methods_1.MulmoScriptMethods.getAspectRatio(context.studio.script);
+    const returnValue = {
+        aspectRatio: MulmoScriptMethods.getAspectRatio(context.studio.script),
+        imageParams,
+    };
     if (beat.image) {
-        if (beat.image.type === "textSlide") {
-            const slide = beat.image.slide;
-            const markdown = `# ${slide.title}` + slide.bullets.map((text) => `- ${text}`).join("\n");
-            await (0, markdown_1.convertMarkdownToImage)(markdown, methods_1.MulmoScriptMethods.getTextSlideStyle(context.studio.script, beat), imagePath);
-        }
-        else if (beat.image.type === "markdown") {
-            const markdown = Array.isArray(beat.image.markdown) ? beat.image.markdown.join("\n") : beat.image.markdown;
-            await (0, markdown_1.convertMarkdownToImage)(markdown, methods_1.MulmoScriptMethods.getTextSlideStyle(context.studio.script, beat), imagePath);
-        }
-        else if (beat.image.type === "image") {
-            if (beat.image.source.kind === "url") {
-                // undefined prompt indicates "no need to generate image"
-                return { path: beat.image.source.url, prompt: undefined, imageParams, aspectRatio };
-            }
-            else if (beat.image.source.kind === "path") {
-                const path = methods_1.MulmoStudioContextMethods.resolveAssetPath(context, beat.image.source.path);
-                return { path, prompt: undefined, imageParams, aspectRatio };
-            }
+        const plugin = imagePlugins.find((plugin) => plugin.imageType === beat?.image?.type);
+        if (plugin) {
+            const processorParams = { beat, context, imagePath, ...htmlStyle(context.studio.script, beat) };
+            const path = await plugin.process(processorParams);
+            // undefined prompt indicates that image generation is not needed
+            return { path, ...returnValue };
         }
     }
-    return { path: imagePath, prompt, imageParams, aspectRatio };
+    const prompt = (beat.imagePrompt || beat.text) + "\n" + (imageParams.style || "");
+    return { path: imagePath, prompt, ...returnValue };
 };
 const graph_data = {
     version: 0.5,
@@ -85,11 +44,11 @@ const graph_data = {
     nodes: {
         context: {},
         imageDirPath: {},
-        text2imageAgent: {},
+        imageAgentInfo: {},
         outputStudioFilePath: {},
         map: {
             agent: "mapAgent",
-            inputs: { rows: ":context.studio.beats", context: ":context", text2imageAgent: ":text2imageAgent", imageDirPath: ":imageDirPath" },
+            inputs: { rows: ":context.studio.script.beats", context: ":context", imageAgentInfo: ":imageAgentInfo", imageDirPath: ":imageDirPath" },
             isResult: true,
             params: {
                 rowKey: "beat",
@@ -98,18 +57,19 @@ const graph_data = {
             graph: {
                 nodes: {
                     preprocessor: {
-                        agent: preprocess_agent,
+                        agent: imagePreprocessAgent,
                         inputs: {
                             context: ":context",
                             beat: ":beat",
                             index: ":__mapIndex",
                             suffix: "p",
                             imageDirPath: ":imageDirPath",
+                            imageAgentInfo: ":imageAgentInfo",
                         },
                     },
                     imageGenerator: {
                         if: ":preprocessor.prompt",
-                        agent: ":text2imageAgent",
+                        agent: ":imageAgentInfo.agent",
                         params: {
                             model: ":preprocessor.imageParams.model",
                             size: ":preprocessor.imageParams.size",
@@ -120,6 +80,7 @@ const graph_data = {
                             prompt: ":preprocessor.prompt",
                             file: ":preprocessor.path", // only for fileCacheAgentFilter
                             text: ":preprocessor.prompt", // only for fileCacheAgentFilter
+                            force: ":context.force",
                         },
                         defaultValue: {},
                     },
@@ -164,30 +125,31 @@ const graph_data = {
     },
 };
 const googleAuth = async () => {
-    const auth = new google_auth_library_1.GoogleAuth({
+    const auth = new GoogleAuth({
         scopes: ["https://www.googleapis.com/auth/cloud-platform"],
     });
     const client = await auth.getClient();
     const accessToken = await client.getAccessToken();
     return accessToken.token;
 };
-const images = async (context) => {
+export const images = async (context) => {
     const { studio, fileDirs } = context;
     const { outDirPath, imageDirPath } = fileDirs;
-    (0, file_1.mkdir)(`${imageDirPath}/${studio.filename}`);
+    mkdir(`${imageDirPath}/${studio.filename}`);
     const agentFilters = [
         {
             name: "fileCacheAgentFilter",
-            agent: filters_1.fileCacheAgentFilter,
+            agent: fileCacheAgentFilter,
             nodeIds: ["imageGenerator"],
         },
     ];
     const options = {
         agentFilters,
     };
+    const imageAgentInfo = MulmoScriptMethods.getImageAgentInfo(studio.script);
     // We need to get google's auth token only if the google is the text2image provider.
-    if (methods_1.MulmoScriptMethods.getImageProvider(studio.script) === "google") {
-        console.log("google was specified as text2image engine");
+    if (imageAgentInfo.provider === "google") {
+        GraphAILogger.log("google was specified as text2image engine");
         const token = await googleAuth();
         options.config = {
             imageGoogleAgent: {
@@ -196,16 +158,16 @@ const images = async (context) => {
             },
         };
     }
+    GraphAILogger.info(`text2image: provider=${imageAgentInfo.provider} model=${imageAgentInfo.imageParams.model}`);
     const injections = {
         context,
-        text2imageAgent: methods_1.MulmoScriptMethods.getText2imageAgent(studio.script),
-        outputStudioFilePath: (0, file_1.getOutputStudioFilePath)(outDirPath, studio.filename),
+        imageAgentInfo,
+        outputStudioFilePath: getOutputStudioFilePath(outDirPath, studio.filename),
         imageDirPath,
     };
-    const graph = new graphai_1.GraphAI(graph_data, { ...agents, imageGoogleAgent: image_google_agent_1.default, imageOpenaiAgent: image_openai_agent_1.default, fileWriteAgent: vanilla_node_agents_1.fileWriteAgent }, options);
+    const graph = new GraphAI(graph_data, { ...vanillaAgents, imageGoogleAgent, imageOpenaiAgent, fileWriteAgent }, options);
     Object.keys(injections).forEach((key) => {
         graph.injectValue(key, injections[key]);
     });
     await graph.run();
 };
-exports.images = images;

package/lib/actions/index.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+export * from "./audio.js";
+export * from "./images.js";
+export * from "./movie.js";
+export * from "./pdf.js";
+export * from "./translate.js";

package/lib/actions/index.js ADDED Viewed

@@ -0,0 +1,5 @@
+export * from "./audio.js";
+export * from "./images.js";
+export * from "./movie.js";
+export * from "./pdf.js";
+export * from "./translate.js";

package/lib/actions/movie.d.ts CHANGED Viewed

@@ -1,2 +1,10 @@
-import { MulmoStudioContext } from "../types";
+import { MulmoStudioContext, MulmoCanvasDimension, BeatMediaType } from "../types/index.js";
+export declare const getVideoPart: (inputIndex: number, mediaType: BeatMediaType, duration: number, canvasInfo: MulmoCanvasDimension) => {
+    videoId: string;
+    videoPart: string;
+};
+export declare const getAudioPart: (inputIndex: number, duration: number, delay: number) => {
+    audioId: string;
+    audioPart: string;
+};
 export declare const movie: (context: MulmoStudioContext) => Promise<void>;