npm - mulmocast - Versions diffs - 2.0.6 → 2.0.8 - Mend

mulmocast 2.0.6 → 2.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (40)

package/lib/actions/audio.js +3 -1
package/lib/agents/image_genai_agent.js +62 -56
package/lib/agents/image_replicate_agent.js +9 -1
package/lib/agents/index.d.ts +2 -1
package/lib/agents/index.js +2 -1
package/lib/agents/movie_genai_agent.d.ts +0 -4
package/lib/agents/movie_genai_agent.js +3 -12
package/lib/agents/test.d.ts +1 -0
package/lib/agents/test.js +12 -0
package/lib/agents/tts_elevenlabs_agent.js +42 -32
package/lib/agents/tts_gemini_agent.js +8 -2
package/lib/agents/tts_kotodama_agent.d.ts +5 -0
package/lib/agents/tts_kotodama_agent.js +76 -0
package/lib/agents/tts_openai_agent.js +1 -1
package/lib/agents/utils.d.ts +1 -0
package/lib/agents/utils.js +1 -0
package/lib/types/agent.d.ts +3 -0
package/lib/types/schema.d.ts +21 -0
package/lib/types/schema.js +3 -2
package/lib/utils/const.d.ts +1 -0
package/lib/utils/const.js +1 -0
package/lib/utils/context.d.ts +8 -0
package/lib/utils/error_cause.d.ts +10 -0
package/lib/utils/error_cause.js +22 -0
package/lib/utils/provider2agent.d.ts +7 -0
package/lib/utils/provider2agent.js +7 -0
package/lib/utils/utils.d.ts +4 -0
package/lib/utils/utils.js +21 -6
package/package.json +4 -4
package/scripts/test/README.md +161 -0
package/scripts/test/test_all_elevenlabs_tts_model.json +111 -0
package/scripts/test/test_all_gemini_tts_model.json +433 -0
package/scripts/test/test_all_image.json +40 -0
package/scripts/test/test_all_image.json~ +45 -0
package/scripts/test/test_all_movie.json +33 -0
package/scripts/test/test_all_movie.json~ +37 -0
package/scripts/test/test_all_tts.json +83 -0
package/scripts/test/test_all_tts.json~ +83 -0
package/scripts/test/test_kotodama.json +57 -0
package/scripts/test/test_kotodama.json~ +0 -0

package/lib/types/schema.d.ts CHANGED Viewed

@@ -19,6 +19,7 @@ export declare const multiLingualTextsSchema: z.ZodRecord<z.ZodString, z.ZodObje
 export declare const speechOptionsSchema: z.ZodObject<{
     speed: z.ZodOptional<z.ZodNumber>;
     instruction: z.ZodOptional<z.ZodString>;
+    decoration: z.ZodOptional<z.ZodString>;
 }, z.core.$strict>;
 export declare const defaultSpeaker = "Presenter";
 export declare const text2SpeechProviderSchema: z.ZodDefault<z.ZodEnum<{
@@ -31,6 +32,7 @@ export declare const speakerDataSchema: z.ZodObject<{
     speechOptions: z.ZodOptional<z.ZodObject<{
         speed: z.ZodOptional<z.ZodNumber>;
         instruction: z.ZodOptional<z.ZodString>;
+        decoration: z.ZodOptional<z.ZodString>;
     }, z.core.$strict>>;
     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
         [x: string]: string;
@@ -44,6 +46,7 @@ export declare const speakerSchema: z.ZodObject<{
     speechOptions: z.ZodOptional<z.ZodObject<{
         speed: z.ZodOptional<z.ZodNumber>;
         instruction: z.ZodOptional<z.ZodString>;
+        decoration: z.ZodOptional<z.ZodString>;
     }, z.core.$strict>>;
     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
         [x: string]: string;
@@ -56,6 +59,7 @@ export declare const speakerSchema: z.ZodObject<{
         speechOptions: z.ZodOptional<z.ZodObject<{
             speed: z.ZodOptional<z.ZodNumber>;
             instruction: z.ZodOptional<z.ZodString>;
+            decoration: z.ZodOptional<z.ZodString>;
         }, z.core.$strict>>;
         provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
             [x: string]: string;
@@ -70,6 +74,7 @@ export declare const speakerDictionarySchema: z.ZodRecord<z.ZodString, z.ZodObje
     speechOptions: z.ZodOptional<z.ZodObject<{
         speed: z.ZodOptional<z.ZodNumber>;
         instruction: z.ZodOptional<z.ZodString>;
+        decoration: z.ZodOptional<z.ZodString>;
     }, z.core.$strict>>;
     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
         [x: string]: string;
@@ -82,6 +87,7 @@ export declare const speakerDictionarySchema: z.ZodRecord<z.ZodString, z.ZodObje
         speechOptions: z.ZodOptional<z.ZodObject<{
             speed: z.ZodOptional<z.ZodNumber>;
             instruction: z.ZodOptional<z.ZodString>;
+            decoration: z.ZodOptional<z.ZodString>;
         }, z.core.$strict>>;
         provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
             [x: string]: string;
@@ -97,6 +103,7 @@ export declare const mulmoSpeechParamsSchema: z.ZodDefault<z.ZodObject<{
         speechOptions: z.ZodOptional<z.ZodObject<{
             speed: z.ZodOptional<z.ZodNumber>;
             instruction: z.ZodOptional<z.ZodString>;
+            decoration: z.ZodOptional<z.ZodString>;
         }, z.core.$strict>>;
         provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
             [x: string]: string;
@@ -109,6 +116,7 @@ export declare const mulmoSpeechParamsSchema: z.ZodDefault<z.ZodObject<{
             speechOptions: z.ZodOptional<z.ZodObject<{
                 speed: z.ZodOptional<z.ZodNumber>;
                 instruction: z.ZodOptional<z.ZodString>;
+                decoration: z.ZodOptional<z.ZodString>;
             }, z.core.$strict>>;
             provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                 [x: string]: string;
@@ -629,6 +637,7 @@ export declare const mulmoBeatSchema: z.ZodObject<{
     speechOptions: z.ZodOptional<z.ZodObject<{
         speed: z.ZodOptional<z.ZodNumber>;
         instruction: z.ZodOptional<z.ZodString>;
+        decoration: z.ZodOptional<z.ZodString>;
     }, z.core.$strict>>;
     textSlideParams: z.ZodOptional<z.ZodObject<{
         cssStyles: z.ZodUnion<readonly [z.ZodString, z.ZodArray<z.ZodString>]>;
@@ -716,6 +725,7 @@ export declare const mulmoPresentationStyleSchema: z.ZodObject<{
             speechOptions: z.ZodOptional<z.ZodObject<{
                 speed: z.ZodOptional<z.ZodNumber>;
                 instruction: z.ZodOptional<z.ZodString>;
+                decoration: z.ZodOptional<z.ZodString>;
             }, z.core.$strict>>;
             provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                 [x: string]: string;
@@ -728,6 +738,7 @@ export declare const mulmoPresentationStyleSchema: z.ZodObject<{
                 speechOptions: z.ZodOptional<z.ZodObject<{
                     speed: z.ZodOptional<z.ZodNumber>;
                     instruction: z.ZodOptional<z.ZodString>;
+                    decoration: z.ZodOptional<z.ZodString>;
                 }, z.core.$strict>>;
                 provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                     [x: string]: string;
@@ -852,6 +863,7 @@ export declare const mulmoScriptSchema: z.ZodObject<{
             speechOptions: z.ZodOptional<z.ZodObject<{
                 speed: z.ZodOptional<z.ZodNumber>;
                 instruction: z.ZodOptional<z.ZodString>;
+                decoration: z.ZodOptional<z.ZodString>;
             }, z.core.$strict>>;
             provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                 [x: string]: string;
@@ -864,6 +876,7 @@ export declare const mulmoScriptSchema: z.ZodObject<{
                 speechOptions: z.ZodOptional<z.ZodObject<{
                     speed: z.ZodOptional<z.ZodNumber>;
                     instruction: z.ZodOptional<z.ZodString>;
+                    decoration: z.ZodOptional<z.ZodString>;
                 }, z.core.$strict>>;
                 provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                     [x: string]: string;
@@ -1133,6 +1146,7 @@ export declare const mulmoScriptSchema: z.ZodObject<{
         speechOptions: z.ZodOptional<z.ZodObject<{
             speed: z.ZodOptional<z.ZodNumber>;
             instruction: z.ZodOptional<z.ZodString>;
+            decoration: z.ZodOptional<z.ZodString>;
         }, z.core.$strict>>;
         textSlideParams: z.ZodOptional<z.ZodObject<{
             cssStyles: z.ZodUnion<readonly [z.ZodString, z.ZodArray<z.ZodString>]>;
@@ -1264,6 +1278,7 @@ export declare const mulmoStudioSchema: z.ZodObject<{
                 speechOptions: z.ZodOptional<z.ZodObject<{
                     speed: z.ZodOptional<z.ZodNumber>;
                     instruction: z.ZodOptional<z.ZodString>;
+                    decoration: z.ZodOptional<z.ZodString>;
                 }, z.core.$strict>>;
                 provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                     [x: string]: string;
@@ -1276,6 +1291,7 @@ export declare const mulmoStudioSchema: z.ZodObject<{
                     speechOptions: z.ZodOptional<z.ZodObject<{
                         speed: z.ZodOptional<z.ZodNumber>;
                         instruction: z.ZodOptional<z.ZodString>;
+                        decoration: z.ZodOptional<z.ZodString>;
                     }, z.core.$strict>>;
                     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                         [x: string]: string;
@@ -1545,6 +1561,7 @@ export declare const mulmoStudioSchema: z.ZodObject<{
             speechOptions: z.ZodOptional<z.ZodObject<{
                 speed: z.ZodOptional<z.ZodNumber>;
                 instruction: z.ZodOptional<z.ZodString>;
+                decoration: z.ZodOptional<z.ZodString>;
             }, z.core.$strict>>;
             textSlideParams: z.ZodOptional<z.ZodObject<{
                 cssStyles: z.ZodUnion<readonly [z.ZodString, z.ZodArray<z.ZodString>]>;
@@ -1612,6 +1629,7 @@ export declare const mulmoPromptTemplateSchema: z.ZodObject<{
                 speechOptions: z.ZodOptional<z.ZodObject<{
                     speed: z.ZodOptional<z.ZodNumber>;
                     instruction: z.ZodOptional<z.ZodString>;
+                    decoration: z.ZodOptional<z.ZodString>;
                 }, z.core.$strict>>;
                 provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                     [x: string]: string;
@@ -1624,6 +1642,7 @@ export declare const mulmoPromptTemplateSchema: z.ZodObject<{
                     speechOptions: z.ZodOptional<z.ZodObject<{
                         speed: z.ZodOptional<z.ZodNumber>;
                         instruction: z.ZodOptional<z.ZodString>;
+                        decoration: z.ZodOptional<z.ZodString>;
                     }, z.core.$strict>>;
                     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                         [x: string]: string;
@@ -1742,6 +1761,7 @@ export declare const mulmoPromptTemplateFileSchema: z.ZodObject<{
                 speechOptions: z.ZodOptional<z.ZodObject<{
                     speed: z.ZodOptional<z.ZodNumber>;
                     instruction: z.ZodOptional<z.ZodString>;
+                    decoration: z.ZodOptional<z.ZodString>;
                 }, z.core.$strict>>;
                 provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                     [x: string]: string;
@@ -1754,6 +1774,7 @@ export declare const mulmoPromptTemplateFileSchema: z.ZodObject<{
                     speechOptions: z.ZodOptional<z.ZodObject<{
                         speed: z.ZodOptional<z.ZodNumber>;
                         instruction: z.ZodOptional<z.ZodString>;
+                        decoration: z.ZodOptional<z.ZodString>;
                     }, z.core.$strict>>;
                     provider: z.ZodOptional<z.ZodDefault<z.ZodEnum<{
                         [x: string]: string;

package/lib/types/schema.js CHANGED Viewed

@@ -18,8 +18,9 @@ export const localizedTextSchema = z
 export const multiLingualTextsSchema = z.record(langSchema, localizedTextSchema);
 export const speechOptionsSchema = z
     .object({
-    speed: z.number().optional(), // default: 1.0
-    instruction: z.string().optional(),
+    speed: z.number().optional(), // default: 1.0 for google and niji voice
+    instruction: z.string().optional(), // for tts openai
+    decoration: z.string().optional(), // for kotodama. default: neutral
 })
     .strict();
 const speakerIdSchema = z.string();

package/lib/utils/const.d.ts CHANGED Viewed

@@ -11,3 +11,4 @@ export declare const storyToScriptGenerateMode: {
     oneStep: string;
 };
 export declare const bundleTargetLang: string[];
+export declare const ASPECT_RATIOS: string[];

package/lib/utils/const.js CHANGED Viewed

@@ -11,3 +11,4 @@ export const storyToScriptGenerateMode = {
     oneStep: "one_step",
 };
 export const bundleTargetLang = ["ja", "en"];
+export const ASPECT_RATIOS = ["1:1", "9:16", "16:9"];

package/lib/utils/context.d.ts CHANGED Viewed

@@ -17,6 +17,7 @@ export declare const createStudioData: (_mulmoScript: MulmoScript, fileName: str
                 speechOptions?: {
                     speed?: number | undefined;
                     instruction?: string | undefined;
+                    decoration?: string | undefined;
                 } | undefined;
                 provider?: string | undefined;
                 model?: string | undefined;
@@ -27,6 +28,7 @@ export declare const createStudioData: (_mulmoScript: MulmoScript, fileName: str
                     speechOptions?: {
                         speed?: number | undefined;
                         instruction?: string | undefined;
+                        decoration?: string | undefined;
                     } | undefined;
                     provider?: string | undefined;
                     model?: string | undefined;
@@ -242,6 +244,7 @@ export declare const createStudioData: (_mulmoScript: MulmoScript, fileName: str
             speechOptions?: {
                 speed?: number | undefined;
                 instruction?: string | undefined;
+                decoration?: string | undefined;
             } | undefined;
             textSlideParams?: {
                 cssStyles: string | string[];
@@ -332,6 +335,7 @@ export declare const initializeContextFromFiles: (files: FileObject, raiseError:
                     speechOptions?: {
                         speed?: number | undefined;
                         instruction?: string | undefined;
+                        decoration?: string | undefined;
                     } | undefined;
                     provider?: string | undefined;
                     model?: string | undefined;
@@ -342,6 +346,7 @@ export declare const initializeContextFromFiles: (files: FileObject, raiseError:
                         speechOptions?: {
                             speed?: number | undefined;
                             instruction?: string | undefined;
+                            decoration?: string | undefined;
                         } | undefined;
                         provider?: string | undefined;
                         model?: string | undefined;
@@ -557,6 +562,7 @@ export declare const initializeContextFromFiles: (files: FileObject, raiseError:
                 speechOptions?: {
                     speed?: number | undefined;
                     instruction?: string | undefined;
+                    decoration?: string | undefined;
                 } | undefined;
                 textSlideParams?: {
                     cssStyles: string | string[];
@@ -654,6 +660,7 @@ export declare const initializeContextFromFiles: (files: FileObject, raiseError:
                 speechOptions?: {
                     speed?: number | undefined;
                     instruction?: string | undefined;
+                    decoration?: string | undefined;
                 } | undefined;
                 provider?: string | undefined;
                 model?: string | undefined;
@@ -664,6 +671,7 @@ export declare const initializeContextFromFiles: (files: FileObject, raiseError:
                     speechOptions?: {
                         speed?: number | undefined;
                         instruction?: string | undefined;
+                        decoration?: string | undefined;
                     } | undefined;
                     provider?: string | undefined;
                     model?: string | undefined;

package/lib/utils/error_cause.d.ts CHANGED Viewed

@@ -197,3 +197,13 @@ export declare const translateApiKeyMissingError: () => {
 export declare const hasCause: (err: unknown) => err is Error & {
     cause: unknown;
 };
+type Result<T> = {
+    ok: true;
+    value: T;
+} | {
+    ok: false;
+    error: Error;
+};
+export declare function resultify<T>(fn: () => Promise<T>): Promise<Result<T>>;
+export declare const getGenAIErrorReason: (error: Error) => any;
+export {};

package/lib/utils/error_cause.js CHANGED Viewed

@@ -226,3 +226,25 @@ export const translateApiKeyMissingError = () => {
 export const hasCause = (err) => {
     return err instanceof Error && "cause" in err;
 };
+export async function resultify(fn) {
+    try {
+        return { ok: true, value: await fn() };
+    }
+    catch (error) {
+        return { ok: false, error: error };
+    }
+}
+export const getGenAIErrorReason = (error) => {
+    try {
+        if (error instanceof Error && error.message && error.message[0] === "{") {
+            const reasonDetail = JSON.parse(error.message).error.details.find((detail) => detail.reason);
+            if (reasonDetail) {
+                return reasonDetail;
+            }
+        }
+    }
+    catch (__error) {
+        // nothing.
+    }
+    return undefined;
+};

package/lib/utils/provider2agent.d.ts CHANGED Viewed

@@ -29,6 +29,13 @@ export declare const provider2TTSAgent: {
         models: string[];
         keyName: string;
     };
+    kotodama: {
+        agentName: string;
+        hasLimitedConcurrency: boolean;
+        defaultVoice: string;
+        defaultDecoration: string;
+        keyName: string;
+    };
     mock: {
         agentName: string;
         hasLimitedConcurrency: boolean;

package/lib/utils/provider2agent.js CHANGED Viewed

@@ -32,6 +32,13 @@ export const provider2TTSAgent = {
         models: ["eleven_multilingual_v2", "eleven_turbo_v2_5", "eleven_turbo_v2", "eleven_flash_v2_5", "eleven_flash_v2"],
         keyName: "ELEVENLABS_API_KEY",
     },
+    kotodama: {
+        agentName: "ttsKotodamaAgent",
+        hasLimitedConcurrency: true,
+        defaultVoice: "Atla",
+        defaultDecoration: "neutral",
+        keyName: "KOTODAMA_API_KEY",
+    },
     mock: {
         agentName: "mediaMockAgent",
         hasLimitedConcurrency: true,

package/lib/utils/utils.d.ts CHANGED Viewed

@@ -35,4 +35,8 @@ export declare const multiLingualObjectToArray: (multiLingual: MulmoStudioMultiL
     }>;
     cacheKey?: string | undefined;
 }[];
+export declare const getAspectRatio: (canvasSize: {
+    width: number;
+    height: number;
+}, ASPECT_RATIOS: string[]) => string;
 export {};

package/lib/utils/utils.js CHANGED Viewed

@@ -47,9 +47,8 @@ export const settings2GraphAIConfig = (settings, env) => {
             apiKey: getKey("LLM", "OPENAI_API_KEY"),
             baseURL: getKey("LLM", "OPENAI_BASE_URL"),
         },
-        ttsOpenaiAgent: {
-            apiKey: getKey("TTS", "OPENAI_API_KEY"),
-            baseURL: getKey("TTS", "OPENAI_BASE_URL"),
+        anthropicAgent: {
+            apiKey: getKey("LLM", "ANTHROPIC_API_TOKEN"),
         },
         imageOpenaiAgent: {
             apiKey: getKey("IMAGE", "OPENAI_API_KEY"),
@@ -61,24 +60,31 @@ export const settings2GraphAIConfig = (settings, env) => {
         imageGenAIAgent: {
             apiKey: getKey("IMAGE", "GEMINI_API_KEY"),
         },
-        anthropicAgent: {
-            apiKey: getKey("LLM", "ANTHROPIC_API_TOKEN"),
-        },
         movieReplicateAgent: {
             apiKey: getKey("MOVIE", "REPLICATE_API_TOKEN"),
         },
         movieGenAIAgent: {
             apiKey: getKey("MOVIE", "GEMINI_API_KEY"),
         },
+        ttsOpenaiAgent: {
+            apiKey: getKey("TTS", "OPENAI_API_KEY"),
+            baseURL: getKey("TTS", "OPENAI_BASE_URL"),
+        },
         ttsNijivoiceAgent: {
             apiKey: getKey("TTS", "NIJIVOICE_API_KEY"),
         },
+        ttsGoogleAgent: {
+            apiKey: getKey("TTS", "GEMINI_API_KEY"),
+        },
         ttsGeminiAgent: {
             apiKey: getKey("TTS", "GEMINI_API_KEY"),
         },
         ttsElevenlabsAgent: {
             apiKey: getKey("TTS", "ELEVENLABS_API_KEY"),
         },
+        ttsKotodamaAgent: {
+            apiKey: getKey("TTS", "KOTODAMA_API_KEY"),
+        },
         soundEffectReplicateAgent: {
             apiKey: getKey("SOUND_EFFECT", "REPLICATE_API_TOKEN"),
         },
@@ -126,3 +132,12 @@ export const multiLingualObjectToArray = (multiLingual, beats) => {
         return { multiLingualTexts: {} };
     });
 };
+export const getAspectRatio = (canvasSize, ASPECT_RATIOS) => {
+    const target = canvasSize.width / canvasSize.height;
+    return ASPECT_RATIOS.reduce((best, ratio) => {
+        const [w, h] = ratio.split(":").map(Number);
+        const r = w / h;
+        const diff = Math.abs(target - r);
+        return diff < best.diff ? { ratio, diff } : best;
+    }, { ratio: ASPECT_RATIOS[0], diff: Infinity }).ratio;
+};

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "mulmocast",
-  "version": "2.0.6",
+  "version": "2.0.8",
   "description": "",
   "type": "module",
   "main": "lib/index.node.js",
@@ -75,12 +75,12 @@
   "dependencies": {
     "@google-cloud/text-to-speech": "^6.4.0",
     "@google/genai": "^1.30.0",
-    "@graphai/anthropic_agent": "^2.0.11",
+    "@graphai/anthropic_agent": "^2.0.12",
     "@graphai/browserless_agent": "^2.0.1",
     "@graphai/gemini_agent": "^2.0.1",
     "@graphai/groq_agent": "^2.0.2",
     "@graphai/input_agents": "^1.0.2",
-    "@graphai/openai_agent": "^2.0.7",
+    "@graphai/openai_agent": "^2.0.8",
     "@graphai/stream_agent_filter": "^2.0.2",
     "@graphai/vanilla": "^2.0.12",
     "@graphai/vanilla_node_agents": "^2.0.4",
@@ -114,7 +114,7 @@
     "eslint-config-prettier": "^10.1.8",
     "eslint-plugin-prettier": "^5.5.4",
     "eslint-plugin-sonarjs": "^3.0.5",
-    "prettier": "^3.6.2",
+    "prettier": "^3.7.1",
     "tsx": "^4.20.6",
     "typescript": "^5.9.3",
     "typescript-eslint": "^8.48.0"

package/scripts/test/README.md ADDED Viewed

@@ -0,0 +1,161 @@
+# MulmoCast Test Scripts
+このディレクトリには、MulmoCastの機能テスト用のMulmoScriptサンプルが含まれています。
+This directory contains MulmoScript samples for testing MulmoCast features.
+## 📋 テストカテゴリ / Test Categories
+### 🎯 基本テスト / Basic Tests
+**シンプルな動作確認用のテストスクリプト**
+Simple test scripts for basic functionality verification
+- **test_hello.json** - 最もシンプルなHello Worldテスト / Simplest Hello World test
+- **test.json** - 基本的な動作テスト / Basic functionality test
+- **test1.json**, **test2.json** - 追加の基本テスト / Additional basic tests
+- **test_beats.json** - Beatの基本機能テスト / Beat basic features test
+### 🎤 TTS（音声合成）テスト / TTS (Text-to-Speech) Tests
+**各種音声合成プロバイダーのテスト**
+Tests for various TTS providers
+- **test_all_tts.json** - 全TTSプロバイダーのテスト（OpenAI, Gemini, Google, ElevenLabs, Nijivoice） / All TTS providers test
+- **test_audio.json** - 音声パラメータのテスト（padding, duration, movieVolumeなど） / Audio parameters test
+- **test_audio_gemini.json** - Gemini TTSの個別テスト / Gemini TTS specific test
+- **test_audio_instructions.json** - OpenAI TTS instructionsのテスト / OpenAI TTS instructions test
+- **test_elevenlabs_models.json** - ElevenLabsの複数モデルテスト / ElevenLabs multiple models test
+- **test_voices.json** - 複数の音声設定テスト / Multiple voice settings test
+- **test_mixed_providers.json** - 複数のTTSプロバイダー混在テスト / Mixed TTS providers test
+### 🖼️ 画像生成テスト / Image Generation Tests
+**画像生成機能のテスト**
+Image generation feature tests
+- **test_images.json** - 画像生成の基本テスト / Basic image generation test
+- **test_hello_image.json** - Hello World画像テスト / Hello World image test
+- **test_image_refs.json** - 参照画像を使った生成テスト / Image generation with references
+- **test_markdown.json** - Markdown形式の画像テスト / Markdown format image test
+- **test_html.json** - HTMLから画像生成テスト / HTML to image test
+- **test_vision.json** - Vision APIを使った画像生成テスト / Vision API image test
+- **test_layout.json** - レイアウト機能のテスト / Layout features test
+### 🎬 動画生成テスト / Video Generation Tests
+**動画生成機能のテスト**
+Video generation feature tests
+- **test_movie.json** - 動画生成の基本テスト（imagePrompt + moviePrompt） / Basic video generation test
+- **test_movie2.json** - 動画生成の追加テスト / Additional video generation test
+- **test_genai_movie.json** - GenAI動画生成テスト / GenAI video generation test
+- **test_genai.json** - GenAI機能テスト / GenAI features test
+- **test_replicate.json** - Replicate動画生成テスト / Replicate video generation test
+- **test_mv.json** - ミュージックビデオ形式のテスト / Music video format test
+### 🎭 高度な機能テスト / Advanced Feature Tests
+**特殊機能や複雑なシナリオのテスト**
+Special features and complex scenario tests
+- **test_spillover.json** - 音声スピルオーバー機能テスト / Audio spillover feature test
+- **test_lipsync.json** - リップシンク機能テスト / Lip-sync feature test
+- **test_transition.json** - トランジション効果テスト / Transition effects test
+- **test_transition_no_audio.json** - 音声なしトランジションテスト / Transition without audio test
+- **test_slideout_left_no_audio.json** - スライドアウト効果テスト / Slide-out effect test
+- **test_sound_effect.json** - サウンドエフェクトテスト / Sound effect test
+- **test_voice_over.json** - ボイスオーバー機能テスト / Voice-over feature test
+- **test_captions.json** - 字幕機能テスト / Caption feature test
+- **test_hello_caption.json** - Hello World字幕テスト / Hello World caption test
+- **test_loop.json** - ループ再生テスト / Loop playback test
+- **test_video_speed.json** - 動画速度調整テスト / Video speed adjustment test
+### 🔧 特殊条件テスト / Special Condition Tests
+**エッジケースや特殊な条件のテスト**
+Edge cases and special condition tests
+- **test_no_audio.json** - 音声なし動画テスト / Video without audio test
+- **test_no_audio_with_credit.json** - クレジット付き音声なしテスト / No audio with credits test
+- **test_hello_nobgm.json** - BGMなしテスト / Test without BGM
+- **test_size_error.json** - サイズエラーテスト / Size error test
+- **test_media.json** - メディアファイル処理テスト / Media file processing test
+- **test_order.json** - 順序処理テスト / Order processing test
+- **test_order_portrait.json** - 縦向き順序テスト / Portrait order test
+### 🌍 多言語テスト / Multi-language Tests
+**言語設定のテスト**
+Language setting tests
+- **test_lang.json** - 多言語サポートテスト / Multi-language support test
+- **test_en.json** - 英語専用テスト / English-only test
+### 🎯 プロバイダー別テスト / Provider-Specific Tests
+**特定プロバイダーの機能テスト**
+Provider-specific feature tests
+- **test_hello_google.json** - Google TTS専用テスト / Google TTS specific test
+- **gpt.json** - GPTモデルテスト / GPT model test
+- **mulmo_story.json** - ストーリー形式テスト / Story format test
+- **nano_banana.json** - カスタムサンプル / Custom sample
+## 🚀 使い方 / Usage
+### 基本的な実行方法 / Basic Execution
+```bash
+# 動画生成
+# Generate video
+yarn movie scripts/test/test_hello.json
+# 音声のみ生成
+# Generate audio only
+yarn audio scripts/test/test_audio.json
+# 画像のみ生成
+# Generate images only
+yarn images scripts/test/test_images.json
+```
+### 強制再生成 / Force Regeneration
+キャッシュを無視して再生成する場合は `-f` フラグを使用:
+Use the `-f` flag to ignore cache and regenerate:
+```bash
+yarn movie scripts/test/test_hello.json -f
+```
+## 📝 テストスクリプト作成のヒント / Tips for Creating Test Scripts
+1. **シンプルから始める** - `test_hello.json` を参考に基本構造を理解
+2. **機能を段階的に追加** - 一度に複数の機能をテストせず、段階的に追加
+3. **既存のテストを参考にする** - 同じカテゴリのテストスクリプトを参考に
+4. **適切な命名** - `test_<feature>.json` の形式で目的が分かりやすい名前を付ける
+---
+1. **Start simple** - Refer to `test_hello.json` to understand basic structure
+2. **Add features incrementally** - Don't test multiple features at once
+3. **Reference existing tests** - Look at tests in the same category
+4. **Use descriptive naming** - Use `test_<feature>.json` format for clarity
+## 🔗 関連ドキュメント / Related Documentation
+- [メインREADME](../../README.md)
+- [MulmoScript Schema](../../docs/schema.md)
+- [TTS Provider追加手順](../../docs/tts.md)
+- [Image Plugin仕様](../../docs/image_plugin.md)
+- [音声スピルオーバー](../../docs/sound_and_voice.md)