npm - omnius - Versions diffs - 1.0.20 → 1.0.21 - Mend

omnius 1.0.20 → 1.0.21

This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/dist/index.js CHANGED Viewed

@@ -250375,6 +250375,22 @@ function optionalNumberArg(value2) {
   const n2 = Number(value2);
   return Number.isFinite(n2) ? n2 : void 0;
 }
+function booleanArg(value2, fallback) {
+  if (typeof value2 === "boolean")
+    return value2;
+  if (typeof value2 === "string") {
+    if (/^(1|true|yes|on)$/i.test(value2.trim()))
+      return true;
+    if (/^(0|false|no|off)$/i.test(value2.trim()))
+      return false;
+  }
+  return fallback;
+}
+function generationFallbackEnabled(args) {
+  if (booleanArg(args["strict_model"] ?? args["strictModel"] ?? args["strict"], false))
+    return false;
+  return booleanArg(args["fallback"] ?? args["allow_fallback"] ?? args["allowFallback"], true);
+}
 function isBackend(value2) {
   return value2 === "auto" || value2 === "ollama" || value2 === "diffusers" || value2 === "sdcpp";
 }
@@ -250383,6 +250399,9 @@ function getImageGenerationPreset(model) {
     return void 0;
   return IMAGE_GENERATION_MODEL_PRESETS.find((preset) => preset.id === model);
 }
+function imageGenerationQualityLadder() {
+  return IMAGE_GENERATION_QUALITY_LADDER.map((id) => getImageGenerationPreset(id)).filter((preset) => Boolean(preset));
+}
 function inferImageGenerationBackend(model, requested) {
   if (requested && isBackend(requested))
     return requested;
@@ -250399,6 +250418,40 @@ function inferImageGenerationBackend(model, requested) {
     return "sdcpp";
   return "diffusers";
 }
+function imageCandidateFor(model, requestedBackend) {
+  let backend = inferImageGenerationBackend(model, requestedBackend);
+  if (backend === "auto")
+    backend = "diffusers";
+  return {
+    model,
+    backend,
+    preset: getImageGenerationPreset(model)
+  };
+}
+function imageGenerationFallbackCandidates(requestedModel, requestedBackend, allowFallback = true) {
+  const ladder = imageGenerationQualityLadder();
+  const candidates = [];
+  const add2 = (candidate) => {
+    const key = `${candidate.backend}:${candidate.model}`;
+    if (!candidates.some((existing) => `${existing.backend}:${existing.model}` === key))
+      candidates.push(candidate);
+  };
+  if (requestedModel) {
+    add2(imageCandidateFor(requestedModel, requestedBackend));
+  } else if (requestedBackend && requestedBackend !== "auto") {
+    const firstForBackend = ladder.find((preset) => preset.backend === requestedBackend);
+    add2(imageCandidateFor(firstForBackend?.id ?? (requestedBackend === "ollama" ? DEFAULT_OLLAMA_IMAGE_MODEL : DEFAULT_DIFFUSERS_IMAGE_MODEL), requestedBackend));
+  } else if (!allowFallback) {
+    add2(imageCandidateFor(DEFAULT_DIFFUSERS_IMAGE_MODEL, requestedBackend));
+  }
+  if (!allowFallback)
+    return candidates.length ? candidates : [imageCandidateFor(DEFAULT_DIFFUSERS_IMAGE_MODEL, requestedBackend)];
+  const primaryIndex = requestedModel ? ladder.findIndex((preset) => preset.id === requestedModel) : requestedBackend && requestedBackend !== "auto" ? ladder.findIndex((preset) => preset.backend === requestedBackend) : 0;
+  const fallbackTail = primaryIndex >= 0 ? ladder.slice(primaryIndex) : ladder;
+  for (const preset of fallbackTail)
+    add2(imageCandidateFor(preset.id));
+  return candidates;
+}
 function imageGenerationDir(repoRoot = ".") {
   return join36(repoRoot, ".omnius", "image-gen");
 }
@@ -250653,6 +250706,33 @@ function formatSuccessOutput(args) {
     `  Prompt: "${prompt}"`
   ].filter(Boolean).join("\n");
 }
+function summarizeToolResult(result) {
+  return trimProcessText(String(result.error || result.output || "unknown error"), 700).replace(/\s+/g, " ").trim();
+}
+function formatImageAttempt(candidate, reason, index) {
+  return `${index + 1}. ${candidate.model} [${candidate.backend}] - ${reason}`;
+}
+function formatImageFallbackFailure(failed) {
+  return [
+    "No image generation model in the fallback ladder completed successfully.",
+    "Attempted, highest quality to lowest:",
+    ...failed.map((attempt, index) => `  ${formatImageAttempt(attempt.candidate, attempt.reason, index)}`)
+  ].join("\n");
+}
+function annotateImageFallbackSuccess(result, failed, winner) {
+  if (failed.length === 0)
+    return result;
+  const prefix = [
+    `Fallback ladder succeeded with ${winner.model} [${winner.backend}] after ${failed.length} failed attempt(s).`,
+    "Failed attempts:",
+    ...failed.map((attempt, index) => `  ${formatImageAttempt(attempt.candidate, attempt.reason, index)}`),
+    ""
+  ].join("\n");
+  return {
+    ...result,
+    output: prefix + result.output
+  };
+}
 function parseRunnerJson(stdout) {
   const lines = stdout.trim().split(/\r?\n/).reverse();
   for (const line of lines) {
@@ -250665,7 +250745,7 @@ function parseRunnerJson(stdout) {
   }
   return null;
 }
-var DEFAULT_DIFFUSERS_IMAGE_MODEL, DEFAULT_OLLAMA_IMAGE_MODEL, DIFFUSERS_PYTHON_PACKAGES, SDCPP_PYTHON_PACKAGES, IMAGE_GENERATION_MODEL_PRESETS, OLLAMA_IMAGE_MODELS, DIFFUSERS_RUNNER, SDCPP_RUNNER, ImageGenerateTool;
+var DEFAULT_DIFFUSERS_IMAGE_MODEL, DEFAULT_OLLAMA_IMAGE_MODEL, DIFFUSERS_PYTHON_PACKAGES, SDCPP_PYTHON_PACKAGES, IMAGE_GENERATION_MODEL_PRESETS, IMAGE_GENERATION_QUALITY_LADDER, OLLAMA_IMAGE_MODELS, DIFFUSERS_RUNNER, SDCPP_RUNNER, ImageGenerateTool;
 var init_image_generate = __esm({
   "packages/execution/dist/tools/image-generate.js"() {
     "use strict";
@@ -250989,6 +251069,21 @@ var init_image_generate = __esm({
         note: "CPU/GGUF/checkpoint route; requires a local model path."
       }
     ];
+    IMAGE_GENERATION_QUALITY_LADDER = [
+      "black-forest-labs/FLUX.1-dev",
+      "stabilityai/stable-diffusion-3.5-large",
+      DEFAULT_OLLAMA_IMAGE_MODEL,
+      "black-forest-labs/FLUX.1-schnell",
+      "stabilityai/stable-diffusion-3.5-large-turbo",
+      "Tongyi-MAI/Z-Image-Turbo",
+      "black-forest-labs/FLUX.2-klein-4B",
+      DEFAULT_DIFFUSERS_IMAGE_MODEL,
+      "Efficient-Large-Model/Sana_Sprint_0.6B_1024px_diffusers",
+      "SimianLuo/LCM_Dreamshaper_v7",
+      "stabilityai/sd-turbo",
+      "segmind/tiny-sd",
+      "nota-ai/bk-sdm-tiny-2m"
+    ];
     OLLAMA_IMAGE_MODELS = IMAGE_GENERATION_MODEL_PRESETS.filter((preset) => preset.backend === "ollama").map((preset) => preset.id);
     DIFFUSERS_RUNNER = String.raw`#!/usr/bin/env python3
 import argparse
@@ -251170,7 +251265,7 @@ if __name__ == "__main__":
 `;
     ImageGenerateTool = class {
       name = "generate_image";
-      description = "Generate an image from a text prompt using a local image-generation backend. Supports Ollama image models (x/z-image-turbo, x/flux2-klein), Python Diffusers models (SDXL Turbo default, FLUX.1 dev, SD3.5 Large, Tiny-SD, LCM, Sana Sprint), and stable-diffusion.cpp local checkpoints/GGUF. Saves a PNG under .omnius/images and returns the file path.";
+      description = "Generate an image from a text prompt using a local image-generation backend. Supports Ollama image models (x/z-image-turbo, x/flux2-klein), Python Diffusers models (SDXL Turbo default, FLUX.1 dev, SD3.5 Large, Tiny-SD, LCM, Sana Sprint), and stable-diffusion.cpp local checkpoints/GGUF. When fallback is enabled, auto generation tries ranked high-quality candidates first and falls back to smaller models if setup, download, or generation fails. Saves a PNG under .omnius/images and returns the file path.";
       parameters = {
         type: "object",
         properties: {
@@ -251215,6 +251310,14 @@ if __name__ == "__main__":
             type: "string",
             enum: ["generate", "list_models", "setup"],
             description: "Optional utility action. Default is generate."
+          },
+          fallback: {
+            type: "boolean",
+            description: "Whether to try the ranked quality ladder if the selected model/backend fails. Defaults true."
+          },
+          strict_model: {
+            type: "boolean",
+            description: "When true, use only the requested model/backend and do not fall back. Defaults false."
           }
         },
         required: ["prompt"]
@@ -251257,7 +251360,7 @@ if __name__ == "__main__":
         if (action === "list_models") {
           return {
             success: true,
-            output: IMAGE_GENERATION_MODEL_PRESETS.map((preset2) => `${preset2.id} [${preset2.backend}] - ${preset2.note}`).join("\n"),
+            output: IMAGE_GENERATION_MODEL_PRESETS.map((preset) => `${preset.id} [${preset.backend}] - ${preset.note}`).join("\n"),
             durationMs: performance.now() - start2
           };
         }
@@ -251281,19 +251384,8 @@ if __name__ == "__main__":
           const rawModel2 = args["model_path"] ? String(args["model_path"]) : args["model"] ? String(args["model"]) : this.defaultModel;
           const requestedModel2 = rawModel2 === "auto" ? void 0 : rawModel2;
           const requestedBackend2 = args["backend"] ? String(args["backend"]) : this.defaultBackend;
-          let backend = inferImageGenerationBackend(requestedModel2, requestedBackend2);
-          if (backend === "auto") {
-            backend = inferImageGenerationBackend(requestedModel2, void 0);
-            if (backend === "auto")
-              backend = "diffusers";
-          }
-          const model = requestedModel2 ?? (backend === "diffusers" ? DEFAULT_DIFFUSERS_IMAGE_MODEL : DEFAULT_OLLAMA_IMAGE_MODEL);
-          this.emitProgress({ stage: "setup", message: `Preparing image model ${model} (${backend})` });
-          if (backend === "ollama")
-            return await this.prewarmOllama({ model, start: start2 });
-          if (backend === "sdcpp")
-            return await this.prewarmSdCpp({ model, start: start2, python: args["python"] });
-          return await this.prewarmDiffusers({ model, start: start2, python: args["python"] });
+          const candidates2 = imageGenerationFallbackCandidates(requestedModel2, requestedBackend2, generationFallbackEnabled(args));
+          return await this.prewarmCandidateLadder({ candidates: candidates2, args, start: start2 });
         }
         const prompt = String(args["prompt"] ?? "").trim();
         if (!prompt) {
@@ -251302,31 +251394,10 @@ if __name__ == "__main__":
         const rawModel = args["model_path"] ? String(args["model_path"]) : args["model"] ? String(args["model"]) : this.defaultModel;
         const requestedModel = rawModel === "auto" ? void 0 : rawModel;
         const requestedBackend = args["backend"] ? String(args["backend"]) : this.defaultBackend;
-        const preset = getImageGenerationPreset(requestedModel);
-        const width = numberArg(args["width"], preset?.width ?? 1024);
-        const height = numberArg(args["height"], preset?.height ?? 1024);
-        const steps = optionalNumberArg(args["steps"]) ?? preset?.steps;
-        const guidance = optionalNumberArg(args["guidance"]) ?? preset?.guidance;
         const seed = optionalNumberArg(args["seed"]);
+        const candidates = imageGenerationFallbackCandidates(requestedModel, requestedBackend, generationFallbackEnabled(args));
         try {
-          let backend = inferImageGenerationBackend(requestedModel, requestedBackend);
-          let model = requestedModel;
-          if (backend === "auto") {
-            backend = inferImageGenerationBackend(model, void 0);
-            if (backend === "auto")
-              backend = "diffusers";
-          }
-          if (!model) {
-            model = backend === "diffusers" ? DEFAULT_DIFFUSERS_IMAGE_MODEL : DEFAULT_OLLAMA_IMAGE_MODEL;
-          }
-          this.emitProgress({ stage: "setup", message: `Using image model ${model} (${backend})` });
-          if (backend === "ollama") {
-            return await this.generateWithOllama({ prompt, model, width, height, steps, start: start2 });
-          }
-          if (backend === "sdcpp") {
-            return await this.generateWithSdCpp({ prompt, model, width, height, steps, seed, start: start2, python: args["python"] });
-          }
-          return await this.generateWithDiffusers({ prompt, model, width, height, steps, guidance, seed, start: start2, python: args["python"] });
+          return await this.generateCandidateLadder({ candidates, prompt, args, seed, start: start2 });
         } catch (err) {
           return {
             success: false,
@@ -251335,6 +251406,64 @@ if __name__ == "__main__":
           };
         }
       }
+      async prewarmCandidateLadder(args) {
+        const failed = [];
+        for (let index = 0; index < args.candidates.length; index++) {
+          const candidate = args.candidates[index];
+          this.emitProgress({
+            stage: "setup",
+            message: `Preparing image model ${candidate.model} (${candidate.backend}) [${index + 1}/${args.candidates.length}]`
+          });
+          const result = candidate.backend === "ollama" ? await this.prewarmOllama({ model: candidate.model, start: args.start }) : candidate.backend === "sdcpp" ? await this.prewarmSdCpp({ model: candidate.model, start: args.start, python: args.args["python"] }) : await this.prewarmDiffusers({ model: candidate.model, start: args.start, python: args.args["python"] });
+          if (result.success)
+            return annotateImageFallbackSuccess(result, failed, candidate);
+          failed.push({ candidate, reason: summarizeToolResult(result) });
+          if (index < args.candidates.length - 1) {
+            this.emitProgress({
+              stage: "setup",
+              message: `${candidate.model} failed; trying ${args.candidates[index + 1].model}`
+            });
+          }
+        }
+        const output = formatImageFallbackFailure(failed);
+        return {
+          success: false,
+          output,
+          error: output,
+          durationMs: performance.now() - args.start
+        };
+      }
+      async generateCandidateLadder(args) {
+        const failed = [];
+        for (let index = 0; index < args.candidates.length; index++) {
+          const candidate = args.candidates[index];
+          const width = numberArg(args.args["width"], candidate.preset?.width ?? 1024);
+          const height = numberArg(args.args["height"], candidate.preset?.height ?? 1024);
+          const steps = optionalNumberArg(args.args["steps"]) ?? candidate.preset?.steps;
+          const guidance = optionalNumberArg(args.args["guidance"]) ?? candidate.preset?.guidance;
+          this.emitProgress({
+            stage: "setup",
+            message: `Using image model ${candidate.model} (${candidate.backend}) [${index + 1}/${args.candidates.length}]`
+          });
+          const result = candidate.backend === "ollama" ? await this.generateWithOllama({ prompt: args.prompt, model: candidate.model, width, height, steps, start: args.start }) : candidate.backend === "sdcpp" ? await this.generateWithSdCpp({ prompt: args.prompt, model: candidate.model, width, height, steps, seed: args.seed, start: args.start, python: args.args["python"] }) : await this.generateWithDiffusers({ prompt: args.prompt, model: candidate.model, width, height, steps, guidance, seed: args.seed, start: args.start, python: args.args["python"] });
+          if (result.success)
+            return annotateImageFallbackSuccess(result, failed, candidate);
+          failed.push({ candidate, reason: summarizeToolResult(result) });
+          if (index < args.candidates.length - 1) {
+            this.emitProgress({
+              stage: "setup",
+              message: `${candidate.model} failed; falling back to ${args.candidates[index + 1].model}`
+            });
+          }
+        }
+        const output = formatImageFallbackFailure(failed);
+        return {
+          success: false,
+          output,
+          error: output,
+          durationMs: performance.now() - args.start
+        };
+      }
       async prewarmOllama(args) {
         const model = args.model || DEFAULT_OLLAMA_IMAGE_MODEL;
         if (await this.ollamaHasModel(model)) {
@@ -251830,7 +251959,7 @@ function backendImportCheck(backend) {
   if (backend === "audiocraft")
     return "import torch, torchaudio, audiocraft\nfrom audiocraft.models import MusicGen, AudioGen\n";
   if (backend === "stable-audio")
-    return "import torch, torchaudio, stable_audio_tools\n";
+    return "import torch, torchaudio, diffusers, scipy\nfrom diffusers import StableAudioPipeline\n";
   if (backend === "tangoflux")
     return "import torch, torchaudio\nfrom tangoflux import TangoFluxInference\n";
   return "import torch, diffusers, scipy\nfrom diffusers import AudioLDMPipeline\n";
@@ -252160,11 +252289,31 @@ function playbackRequested(args) {
     return false;
   return true;
 }
+function booleanArg2(value2, fallback) {
+  if (typeof value2 === "boolean")
+    return value2;
+  if (typeof value2 === "string") {
+    if (/^(1|true|yes|on)$/i.test(value2.trim()))
+      return true;
+    if (/^(0|false|no|off)$/i.test(value2.trim()))
+      return false;
+  }
+  return fallback;
+}
+function generationFallbackEnabled2(args) {
+  if (booleanArg2(args["strict_model"] ?? args["strictModel"] ?? args["strict"], false))
+    return false;
+  return booleanArg2(args["fallback"] ?? args["allow_fallback"] ?? args["allowFallback"], true);
+}
 function getAudioGenerationPreset(model, kind) {
   if (!model)
     return void 0;
   return AUDIO_GENERATION_MODEL_PRESETS.find((preset) => preset.id === model && (!kind || preset.kind === kind)) ?? AUDIO_GENERATION_MODEL_PRESETS.find((preset) => preset.id === model);
 }
+function audioGenerationQualityLadder(kind) {
+  const ids = kind === "music" ? MUSIC_GENERATION_QUALITY_LADDER : SOUND_GENERATION_QUALITY_LADDER;
+  return ids.map((id) => getAudioGenerationPreset(id, kind)).filter((preset) => Boolean(preset));
+}
 function inferAudioGenerationBackend(model, requested) {
   if (requested && requested !== "auto") {
     if (requested === "diffusers" || requested === "transformers" || requested === "audiocraft" || requested === "stable-audio" || requested === "tangoflux" || requested === "project")
@@ -252188,6 +252337,41 @@ function inferAudioGenerationBackend(model, requested) {
     return "project";
   return "diffusers";
 }
+function audioCandidateFor(kind, model, requestedBackend) {
+  const backend = inferAudioGenerationBackend(model, requestedBackend);
+  const resolvedBackend = backend === "auto" ? kind === "music" ? "transformers" : "diffusers" : backend;
+  return {
+    kind,
+    model,
+    backend: resolvedBackend,
+    preset: getAudioGenerationPreset(model, kind)
+  };
+}
+function audioGenerationFallbackCandidates(kind, requestedModel, requestedBackend, allowFallback = true) {
+  const ladder = audioGenerationQualityLadder(kind);
+  const candidates = [];
+  const add2 = (candidate) => {
+    const key = `${candidate.kind}:${candidate.backend}:${candidate.model}`;
+    if (!candidates.some((existing) => `${existing.kind}:${existing.backend}:${existing.model}` === key)) {
+      candidates.push(candidate);
+    }
+  };
+  if (requestedModel) {
+    add2(audioCandidateFor(kind, requestedModel, requestedBackend));
+  } else if (requestedBackend && requestedBackend !== "auto") {
+    const firstForBackend = ladder.find((preset) => preset.backend === requestedBackend);
+    add2(audioCandidateFor(kind, firstForBackend?.id ?? (kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL), requestedBackend));
+  } else if (!allowFallback) {
+    add2(audioCandidateFor(kind, kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL, requestedBackend));
+  }
+  if (!allowFallback)
+    return candidates.length ? candidates : [audioCandidateFor(kind, kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL, requestedBackend)];
+  const primaryIndex = requestedModel ? ladder.findIndex((preset) => preset.id === requestedModel) : requestedBackend && requestedBackend !== "auto" ? ladder.findIndex((preset) => preset.backend === requestedBackend) : 0;
+  const fallbackTail = primaryIndex >= 0 ? ladder.slice(primaryIndex) : ladder;
+  for (const preset of fallbackTail)
+    add2(audioCandidateFor(kind, preset.id));
+  return candidates;
+}
 function audioGenerationSetupPlan(kind, backend, repoRoot = ".", model) {
   const commandName = kind === "music" ? "music" : "sound";
   const fallback = kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL;
@@ -252261,6 +252445,7 @@ function audioGenerationSetupPlan(kind, backend, repoRoot = ".", model) {
       ],
       notes: [
         "Use this path for Stable Audio Open 1.0, the serious stereo audio/music baseline.",
+        "Omnius uses Diffusers StableAudioPipeline here; stable-audio-tools is intentionally not installed because it often pulls build-from-source dependencies.",
         "Expect larger model downloads and higher VRAM pressure than AudioLDM or MusicGen small."
       ]
     };
@@ -252296,7 +252481,34 @@ function audioGenerationSetupPlan(kind, backend, repoRoot = ".", model) {
     ]
   };
 }
-var DEFAULT_SOUND_MODEL, DEFAULT_MUSIC_MODEL, DIFFUSERS_AUDIO_PACKAGES, TRANSFORMERS_AUDIO_PACKAGES, AUDIOCRAFT_PACKAGES, STABLE_AUDIO_PACKAGES, TANGOFLUX_PACKAGES, AUDIO_GENERATION_MODEL_PRESETS, DIFFUSERS_AUDIO_RUNNER, AUDIOCRAFT_RUNNER, TRANSFORMERS_AUDIO_RUNNER, TANGOFLUX_RUNNER, AudioGenerateTool;
+function summarizeToolResult2(result) {
+  return trimProcessText2(String(result.error || result.output || "unknown error"), 700).replace(/\s+/g, " ").trim();
+}
+function formatAudioAttempt(candidate, reason, index) {
+  return `${index + 1}. ${candidate.model} [${candidate.backend}] - ${reason}`;
+}
+function formatAudioFallbackFailure(kind, failed) {
+  return [
+    `No ${kind} generation model in the fallback ladder completed successfully.`,
+    "Attempted, highest quality to lowest:",
+    ...failed.map((attempt, index) => `  ${formatAudioAttempt(attempt.candidate, attempt.reason, index)}`)
+  ].join("\n");
+}
+function annotateAudioFallbackSuccess(result, failed, winner) {
+  if (failed.length === 0)
+    return result;
+  const prefix = [
+    `Fallback ladder succeeded with ${winner.model} [${winner.backend}] after ${failed.length} failed attempt(s).`,
+    "Failed attempts:",
+    ...failed.map((attempt, index) => `  ${formatAudioAttempt(attempt.candidate, attempt.reason, index)}`),
+    ""
+  ].join("\n");
+  return {
+    ...result,
+    output: prefix + result.output
+  };
+}
+var DEFAULT_SOUND_MODEL, DEFAULT_MUSIC_MODEL, DIFFUSERS_AUDIO_PACKAGES, TRANSFORMERS_AUDIO_PACKAGES, AUDIOCRAFT_PACKAGES, STABLE_AUDIO_PACKAGES, TANGOFLUX_PACKAGES, AUDIO_GENERATION_MODEL_PRESETS, SOUND_GENERATION_QUALITY_LADDER, MUSIC_GENERATION_QUALITY_LADDER, DIFFUSERS_AUDIO_RUNNER, AUDIOCRAFT_RUNNER, TRANSFORMERS_AUDIO_RUNNER, TANGOFLUX_RUNNER, AudioGenerateTool;
 var init_audio_generate = __esm({
   "packages/execution/dist/tools/audio-generate.js"() {
     "use strict";
@@ -252338,7 +252550,6 @@ var init_audio_generate = __esm({
       "accelerate",
       "scipy",
       "soundfile",
-      "stable-audio-tools",
       "einops"
     ];
     TANGOFLUX_PACKAGES = [
@@ -252644,6 +252855,21 @@ var init_audio_generate = __esm({
         note: "Legacy specialized music-generation path."
       }
     ];
+    SOUND_GENERATION_QUALITY_LADDER = [
+      "stabilityai/stable-audio-open-1.0",
+      "cvssp/audioldm2-large",
+      "cvssp/audioldm2",
+      "facebook/audiogen-medium",
+      "declare-lab/TangoFlux",
+      DEFAULT_SOUND_MODEL
+    ];
+    MUSIC_GENERATION_QUALITY_LADDER = [
+      "stabilityai/stable-audio-open-1.0",
+      "facebook/musicgen-stereo-large",
+      "facebook/musicgen-large",
+      "facebook/musicgen-medium",
+      DEFAULT_MUSIC_MODEL
+    ];
     DIFFUSERS_AUDIO_RUNNER = String.raw`#!/usr/bin/env python3
 import argparse, json, sys, time
 from pathlib import Path
@@ -253030,7 +253256,7 @@ if __name__ == "__main__":
 `;
     AudioGenerateTool = class {
       name = "generate_audio";
-      description = "Generate a sound effect or music clip from a text prompt using local audio-generation backends. Supports Diffusers AudioLDM/AudioLDM2, Transformers MusicGen, AudioCraft AudioGen, Stable Audio Open deployment paths, and explicit research-project profiles. Saves WAV files under .omnius/audio and returns the file path.";
+      description = "Generate a sound effect or music clip from a text prompt using local audio-generation backends. Supports Diffusers AudioLDM/AudioLDM2, Transformers MusicGen, AudioCraft AudioGen, Stable Audio Open deployment paths, and explicit research-project profiles. When fallback is enabled, auto generation tries ranked high-quality candidates first and gracefully falls back to smaller models if setup, download, or generation fails. Saves WAV files under .omnius/audio and returns the file path.";
       parameters = {
         type: "object",
         properties: {
@@ -253044,6 +253270,14 @@ if __name__ == "__main__":
           playback: {
             type: "boolean",
             description: "Whether the TUI should play generated audio after saving it. Defaults true; set false for silent generation."
+          },
+          fallback: {
+            type: "boolean",
+            description: "Whether to try the ranked quality ladder if the selected model/backend fails. Defaults true."
+          },
+          strict_model: {
+            type: "boolean",
+            description: "When true, use only the requested model/backend and do not fall back. Defaults false."
           }
         },
         required: ["prompt"]
@@ -253147,14 +253381,14 @@ if __name__ == "__main__":
         if (action === "list_models") {
           return {
             success: true,
-            output: AUDIO_GENERATION_MODEL_PRESETS.filter((preset2) => preset2.kind === kind).map((preset2) => `${preset2.id} [${preset2.backend}] - ${preset2.note}`).join("\n"),
+            output: AUDIO_GENERATION_MODEL_PRESETS.filter((preset) => preset.kind === kind).map((preset) => `${preset.id} [${preset.backend}] - ${preset.note}`).join("\n"),
             durationMs: performance.now() - start2
           };
         }
         if (action === "setup") {
           const requested = String(args["backend"] ?? (kind === "music" ? this.defaults.musicBackend : this.defaults.soundBackend) ?? (kind === "music" ? "transformers" : "diffusers"));
-          const backend2 = inferAudioGenerationBackend(typeof args["model"] === "string" ? args["model"] : void 0, requested);
-          const resolvedBackend = backend2 === "auto" ? kind === "music" ? "transformers" : "diffusers" : backend2;
+          const backend = inferAudioGenerationBackend(typeof args["model"] === "string" ? args["model"] : void 0, requested);
+          const resolvedBackend = backend === "auto" ? kind === "music" ? "transformers" : "diffusers" : backend;
           const plan = audioGenerationSetupPlan(kind, resolvedBackend, this.cwd, typeof args["model"] === "string" ? args["model"] : void 0);
           return {
             success: true,
@@ -253173,37 +253407,9 @@ if __name__ == "__main__":
           const defaultBackend2 = kind === "music" ? this.defaults.musicBackend : this.defaults.soundBackend;
           const rawModel2 = args["model"] ? String(args["model"]) : defaultModel2;
           const requestedModel2 = rawModel2 === "auto" ? void 0 : rawModel2;
-          let backend2 = inferAudioGenerationBackend(requestedModel2, args["backend"] ? String(args["backend"]) : defaultBackend2);
-          if (backend2 === "auto")
-            backend2 = kind === "music" ? "transformers" : "diffusers";
-          const model2 = requestedModel2 ?? (kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL);
-          const preset2 = getAudioGenerationPreset(model2, kind);
-          const duration2 = numberArg2(args["duration"], preset2?.defaultDurationSec ?? (kind === "music" ? 20 : 8));
-          if (backend2 === "project") {
-            const plan = audioGenerationSetupPlan(kind, "project", this.cwd, model2);
-            return {
-              success: false,
-              output: [
-                `${preset2?.label ?? model2} is a project deployment profile, not an automatic generic runner.`,
-                "",
-                "Setup path:",
-                ...plan.commands.map((cmd) => `  ${cmd}`),
-                "",
-                ...plan.notes.map((note) => `- ${note}`)
-              ].join("\n"),
-              durationMs: performance.now() - start2
-            };
-          }
-          this.emitProgress({ stage: "setup", message: `Preparing ${kind} model ${model2} (${backend2})` });
-          return await this.prewarmPythonBackend({
-            kind,
-            backend: backend2,
-            runnerBackend: backend2,
-            model: model2,
-            duration: duration2,
-            start: start2,
-            python: args["python"]
-          });
+          const requestedBackend2 = args["backend"] ? String(args["backend"]) : defaultBackend2;
+          const candidates2 = audioGenerationFallbackCandidates(kind, requestedModel2, requestedBackend2, generationFallbackEnabled2(args));
+          return await this.prewarmCandidateLadder({ kind, candidates: candidates2, args, start: start2 });
         }
         const prompt = String(args["prompt"] ?? "").trim();
         if (!prompt) {
@@ -253213,45 +253419,12 @@ if __name__ == "__main__":
         const defaultBackend = kind === "music" ? this.defaults.musicBackend : this.defaults.soundBackend;
         const rawModel = args["model"] ? String(args["model"]) : defaultModel;
         const requestedModel = rawModel === "auto" ? void 0 : rawModel;
-        let backend = inferAudioGenerationBackend(requestedModel, args["backend"] ? String(args["backend"]) : defaultBackend);
-        if (backend === "auto")
-          backend = kind === "music" ? "transformers" : "diffusers";
-        const model = requestedModel ?? (kind === "music" ? DEFAULT_MUSIC_MODEL : DEFAULT_SOUND_MODEL);
-        const preset = getAudioGenerationPreset(model, kind);
-        const duration = numberArg2(args["duration"], preset?.defaultDurationSec ?? (kind === "music" ? 20 : 8));
-        const steps = optionalNumberArg2(args["steps"]) ?? preset?.defaultSteps;
+        const requestedBackend = args["backend"] ? String(args["backend"]) : defaultBackend;
+        const candidates = audioGenerationFallbackCandidates(kind, requestedModel, requestedBackend, generationFallbackEnabled2(args));
         const seed = optionalNumberArg2(args["seed"]);
         const playback = playbackRequested(args);
         try {
-          this.emitProgress({ stage: "setup", message: `Using ${kind} model ${model} (${backend})` });
-          if (backend === "project") {
-            const plan = audioGenerationSetupPlan(kind, "project", this.cwd, model);
-            return {
-              success: false,
-              output: [
-                `${preset?.label ?? model} is a project deployment profile, not an automatic generic runner.`,
-                "",
-                "Setup path:",
-                ...plan.commands.map((cmd) => `  ${cmd}`),
-                "",
-                ...plan.notes.map((note) => `- ${note}`)
-              ].join("\n"),
-              durationMs: performance.now() - start2
-            };
-          }
-          if (backend === "tangoflux") {
-            return await this.generateWithPythonBackend({ kind, backend, runnerBackend: "tangoflux", prompt, model, duration, steps, seed, playback, start: start2, python: args["python"] });
-          }
-          if (backend === "transformers") {
-            return await this.generateWithPythonBackend({ kind, backend, runnerBackend: "transformers", prompt, model, duration, steps, seed, playback, start: start2, python: args["python"] });
-          }
-          if (backend === "audiocraft") {
-            return await this.generateWithPythonBackend({ kind, backend, runnerBackend: "audiocraft", prompt, model, duration, steps, seed, playback, start: start2, python: args["python"] });
-          }
-          if (backend === "stable-audio") {
-            return await this.generateWithPythonBackend({ kind, backend, runnerBackend: "stable-audio", prompt, model, duration, steps, seed, playback, start: start2, python: args["python"] });
-          }
-          return await this.generateWithPythonBackend({ kind, backend: "diffusers", runnerBackend: "diffusers", prompt, model, duration, steps, seed, playback, start: start2, python: args["python"] });
+          return await this.generateCandidateLadder({ kind, candidates, prompt, args, seed, playback, start: start2 });
         } catch (err) {
           return {
             success: false,
@@ -253260,6 +253433,96 @@ if __name__ == "__main__":
           };
         }
       }
+      /**
+       * Prewarm each candidate model in ladder order and stop at the first one that succeeds.
+       *
+       * @param {object} args - Reads `kind`, `candidates`, `args` (the raw tool arguments) and
+       *   `start` (the timestamp subtracted from `performance.now()` to report `durationMs`).
+       * @returns {Promise<object>} The first successful result, passed through
+       *   `annotateAudioFallbackSuccess` together with the earlier failures; otherwise a failed
+       *   result whose `output` and `error` both carry the formatted failure list.
+       */
+      async prewarmCandidateLadder(args) {
+        const { kind, candidates } = args;
+        const total = candidates.length;
+        const failed = [];
+        for (let index = 0; index < total; index++) {
+          const candidate = candidates[index];
+          const duration = numberArg2(args.args["duration"], candidate.preset?.defaultDurationSec ?? (kind === "music" ? 20 : 8));
+          this.emitProgress({
+            stage: "setup",
+            message: `Preparing ${kind} model ${candidate.model} (${candidate.backend}) [${index + 1}/${total}]`
+          });
+          // "project" candidates never reach the Python runner; they yield the setup-plan result instead.
+          const result = candidate.backend === "project" ? this.projectProfileResult(kind, candidate, args.start) : await this.prewarmPythonBackend({
+            kind,
+            backend: candidate.backend,
+            runnerBackend: candidate.backend,
+            model: candidate.model,
+            duration,
+            start: args.start,
+            python: args.args["python"]
+          });
+          if (result.success) {
+            return annotateAudioFallbackSuccess(result, failed, candidate);
+          }
+          failed.push({ candidate, reason: summarizeToolResult2(result) });
+          if (index < total - 1) {
+            this.emitProgress({
+              stage: "setup",
+              message: `${candidate.model} failed; trying ${candidates[index + 1].model}`
+            });
+          }
+        }
+        // Format the failure list once; the same text is reported as both output and error.
+        const failureText = formatAudioFallbackFailure(kind, failed);
+        return {
+          success: false,
+          output: failureText,
+          error: failureText,
+          durationMs: performance.now() - args.start
+        };
+      }
+      /**
+       * Generate audio with each candidate in ladder order and stop at the first one that succeeds.
+       *
+       * Per candidate, `numberArg2` receives the raw `duration` argument with the preset default
+       * (or 20 for "music" / 8 otherwise) as its fallback, and the step count is the raw `steps`
+       * argument when `optionalNumberArg2` accepts it, else the preset's `defaultSteps`.
+       *
+       * @param {object} args - Reads `kind`, `candidates`, `prompt`, `args` (the raw tool arguments),
+       *   `seed`, `playback` and `start` (the timestamp used to report `durationMs`).
+       * @returns {Promise<object>} The first successful result, passed through
+       *   `annotateAudioFallbackSuccess` together with the earlier failures; otherwise a failed
+       *   result whose `output` and `error` both carry the formatted failure list.
+       */
+      async generateCandidateLadder(args) {
+        const { kind, candidates } = args;
+        const total = candidates.length;
+        const failed = [];
+        for (let index = 0; index < total; index++) {
+          const candidate = candidates[index];
+          const duration = numberArg2(args.args["duration"], candidate.preset?.defaultDurationSec ?? (kind === "music" ? 20 : 8));
+          const steps = optionalNumberArg2(args.args["steps"]) ?? candidate.preset?.defaultSteps;
+          this.emitProgress({
+            stage: "setup",
+            message: `Using ${kind} model ${candidate.model} (${candidate.backend}) [${index + 1}/${total}]`
+          });
+          // "project" candidates never reach the Python runner; they yield the setup-plan result instead.
+          const result = candidate.backend === "project" ? this.projectProfileResult(kind, candidate, args.start) : await this.generateWithPythonBackend({
+            kind,
+            backend: candidate.backend,
+            runnerBackend: candidate.backend,
+            prompt: args.prompt,
+            model: candidate.model,
+            duration,
+            steps,
+            seed: args.seed,
+            playback: args.playback,
+            start: args.start,
+            python: args.args["python"]
+          });
+          if (result.success) {
+            return annotateAudioFallbackSuccess(result, failed, candidate);
+          }
+          failed.push({ candidate, reason: summarizeToolResult2(result) });
+          if (index < total - 1) {
+            this.emitProgress({
+              stage: "setup",
+              message: `${candidate.model} failed; falling back to ${candidates[index + 1].model}`
+            });
+          }
+        }
+        // Format the failure list once; the same text is reported as both output and error.
+        const failureText = formatAudioFallbackFailure(kind, failed);
+        return {
+          success: false,
+          output: failureText,
+          error: failureText,
+          durationMs: performance.now() - args.start
+        };
+      }
+      /**
+       * Build the (always unsuccessful) result for a "project" candidate: a message saying the
+       * profile is not an automatic runner, followed by the commands and notes of its setup plan.
+       *
+       * @param {string} kind - Audio kind forwarded to `audioGenerationSetupPlan`.
+       * @param {object} candidate - Reads `model` and, when present, `preset.label`.
+       * @param {number} start2 - Timestamp subtracted from `performance.now()` for `durationMs`.
+       * @returns {object} `{ success: false, output, durationMs }`.
+       */
+      projectProfileResult(kind, candidate, start2) {
+        const { commands, notes } = audioGenerationSetupPlan(kind, "project", this.cwd, candidate.model);
+        const label = candidate.preset?.label ?? candidate.model;
+        const lines = [
+          `${label} is a project deployment profile, not an automatic generic runner.`,
+          "",
+          "Setup path:"
+        ];
+        for (const cmd of commands) {
+          lines.push(`  ${cmd}`);
+        }
+        lines.push("");
+        for (const note of notes) {
+          lines.push(`- ${note}`);
+        }
+        const output = lines.join("\n");
+        return { success: false, output, durationMs: performance.now() - start2 };
+      }
       async generateWithPythonBackend(args) {
         const runner = await ensureAudioRunner(this.cwd, args.runnerBackend);
         await mkdir12(audioOutputDir(this.cwd), { recursive: true });
@@ -507359,6 +507622,18 @@ function supertonicInferScript() {
 function mlxVenvPy() {
   return process.platform === "win32" ? join58(voiceDir(), "mlx-venv", "Scripts", "python.exe") : join58(voiceDir(), "mlx-venv", "bin", "python3");
 }
+/** Path of the `luxtts-venv` directory inside `voiceDir()`. */
+function luxttsVenvDir() {
+  const voiceRoot = voiceDir();
+  return join58(voiceRoot, "luxtts-venv");
+}
+/**
+ * Path of the Python interpreter inside the LuxTTS venv directory:
+ * `Scripts/python.exe` on win32, `bin/python3` on every other platform.
+ */
+function luxttsVenvPy() {
+  if (process.platform === "win32") {
+    return join58(luxttsVenvDir(), "Scripts", "python.exe");
+  }
+  return join58(luxttsVenvDir(), "bin", "python3");
+}
+/** Path of the `LuxTTS` directory inside `voiceDir()`. */
+function luxttsRepoDir() {
+  const voiceRoot = voiceDir();
+  return join58(voiceRoot, "LuxTTS");
+}
+/** Path of `luxtts-infer.py` inside `voiceDir()`. */
+function luxttsInferScript() {
+  const voiceRoot = voiceDir();
+  return join58(voiceRoot, "luxtts-infer.py");
+}
 function piperVenvDir() {
   return join58(voiceDir(), "piper-venv");
 }
@@ -507385,7 +507660,7 @@ function ensureSupertonicInstalled() {
 }
 function ensureMlxInstalled() {
   if (process.platform !== "darwin" || process.arch !== "arm64") {
-    throw new Error("MLX TTS requires macOS on Apple Silicon. Use luxtts, supertonic, onnx/piper, or espeak on this machine.");
+    throw new Error("MLX TTS requires macOS on Apple Silicon. Use luxtts, supertonic, onnx/piper, or backend=auto on this machine.");
   }
   const venvPy = mlxVenvPy();
   if (!existsSync40(venvPy)) {
@@ -507402,6 +507677,81 @@ function ensureMlxInstalled() {
   }
   return venvPy;
 }
+/**
+ * Check whether the given interpreter can import `LuxTTS` from `zipvoice.luxvoice`.
+ *
+ * The probe runs `python -c ...` with `LUXTTS_REPO_PATH` set to `luxttsRepoDir()` and a
+ * 30 s timeout; any thrown error (non-zero exit, timeout, missing binary) counts as "no".
+ *
+ * @param {string} venvPy - Python executable to probe.
+ * @returns {boolean} `true` when the probe command completes without throwing.
+ */
+function pythonCanImportLuxTts(venvPy) {
+  const probe = "import sys, os; sys.path.insert(0, os.environ['LUXTTS_REPO_PATH']); from zipvoice.luxvoice import LuxTTS; print('ok')";
+  try {
+    const probeEnv = { ...process.env, LUXTTS_REPO_PATH: luxttsRepoDir() };
+    execFileSync2(venvPy, ["-c", probe], { stdio: "pipe", timeout: 3e4, env: probeEnv });
+  } catch {
+    return false;
+  }
+  return true;
+}
+/**
+ * Run `python -m pip install --prefer-binary <packages...>` synchronously.
+ *
+ * @param {string} venvPy - Python executable whose pip is used.
+ * @param {string[]} packages - Arguments appended after `--prefer-binary` (requirement specs or pip flags).
+ * @param {number} [timeout2=9e5] - Timeout in milliseconds passed to the child process.
+ * @throws Whatever `execFileSync2` throws when the command fails or times out.
+ */
+function pipInstall(venvPy, packages, timeout2 = 9e5) {
+  const pipArgs = ["-m", "pip", "install", "--prefer-binary", ...packages];
+  const options = { stdio: "pipe", timeout: timeout2, env: process.env };
+  execFileSync2(venvPy, pipArgs, options);
+}
+/**
+ * Make sure the LuxTTS venv, repository checkout and daemon script exist, installing
+ * whatever is missing, and return the venv's Python executable.
+ *
+ * Fast path: when the venv interpreter exists, the checkout contains `zipvoice/luxvoice.py`
+ * and the import probe passes, only the daemon script is rewritten.
+ * Otherwise the venv is created (if absent), pip tooling and dependencies are installed, the
+ * repository is cloned (if absent), and the import probe is run again as the final gate.
+ * Every step is synchronous.
+ *
+ * @returns {string} Path of the venv Python executable.
+ * @throws {Error} When python3 or git is unavailable, when a required install step fails,
+ *   or when the import probe still fails after setup.
+ */
+function ensureLuxttsInstalled() {
+  const venvPy = luxttsVenvPy();
+  const repoDir = luxttsRepoDir();
+  const repoHasLuxvoice = () => existsSync40(join58(repoDir, "zipvoice", "luxvoice.py"));
+  const writeDaemonScript = () => writeFileSync16(luxttsInferScript(), LUXTTS_DAEMON_PY, "utf-8");
+  mkdirSync16(voiceDir(), { recursive: true });
+  const alreadyUsable = existsSync40(venvPy) && repoHasLuxvoice() && pythonCanImportLuxTts(venvPy);
+  if (alreadyUsable) {
+    writeDaemonScript();
+    return venvPy;
+  }
+  const py = findPython32();
+  if (!py) {
+    throw new Error("python3 is required to set up LuxTTS voice cloning.");
+  }
+  if (!existsSync40(venvPy)) {
+    execFileSync2(py, ["-m", "venv", luxttsVenvDir()], { stdio: "pipe", timeout: 18e4 });
+  }
+  // Upgrade the packaging tools before installing anything else into the venv.
+  const bootstrapArgs = ["-m", "pip", "install", "--upgrade", "pip", "wheel", "setuptools<81"];
+  execFileSync2(venvPy, bootstrapArgs, { stdio: "pipe", timeout: 3e5 });
+  pipInstall(venvPy, ["torch", "torchaudio"], 12e5);
+  if (!repoHasLuxvoice()) {
+    if (!hasCommand3("git")) {
+      throw new Error("git is required to set up LuxTTS voice cloning.");
+    }
+    const cloneArgs = ["clone", "--depth", "1", "https://github.com/ysharma3501/LuxTTS.git", repoDir];
+    execFileSync2("git", cloneArgs, { stdio: "pipe", timeout: 3e5 });
+  }
+  const runtimeDeps = [
+    "lhotse",
+    "huggingface_hub",
+    "safetensors",
+    "pydub",
+    "onnxruntime",
+    "librosa",
+    "transformers<=4.57.6",
+    "inflect",
+    "numpy",
+    "vocos",
+    "jieba",
+    "pypinyin",
+    "cn2an"
+  ];
+  pipInstall(venvPy, runtimeDeps, 12e5);
+  try {
+    pipInstall(venvPy, ["git+https://github.com/ysharma3501/LinaCodec.git"], 12e5);
+  } catch {
+    // Best effort: a failed LinaCodec install is ignored here; the import probe below
+    // decides whether the environment is actually usable.
+  }
+  pipInstall(venvPy, ["-e", repoDir], 6e5);
+  writeDaemonScript();
+  if (!pythonCanImportLuxTts(venvPy)) {
+    throw new Error(`LuxTTS setup completed but import still fails in ${luxttsVenvDir()}.`);
+  }
+  return venvPy;
+}
 function ensurePiperInstalled() {
   if (hasCommand3("piper"))
     return "piper";
@@ -507435,6 +507785,28 @@ function saveCloneRefFromSample(sample, cloneName) {
   copyFileSync2(source, dest);
   return dest;
 }
+/**
+ * Return the clone source clip given in the tool arguments.
+ *
+ * The alias keys are checked in a fixed order and the first one holding a non-blank
+ * string wins.
+ *
+ * @param {object} args - Raw tool arguments.
+ * @returns {string} The trimmed value of the first matching key, or "" when none matches.
+ */
+function cloneSampleArg(args) {
+  const aliases = ["sample", "source_audio", "voice_sample", "reference_audio", "ref_audio", "clone_sample"];
+  const match = aliases.find((key) => typeof args[key] === "string" && args[key].trim() !== "");
+  return match === undefined ? "" : args[match].trim();
+}
+/**
+ * Decide whether the tool arguments ask for voice cloning.
+ *
+ * True when a clone source clip is supplied, when `clone_ref` is a non-blank string, or when
+ * `voice` looks like a file path: it ends in .wav/.mp3/.flac/.ogg/.m4a (case-insensitive) or
+ * starts with "/", "./", "../" or "~/".
+ *
+ * @param {object} args - Raw tool arguments.
+ * @returns {boolean}
+ */
+function wantsVoiceClone(args) {
+  if (cloneSampleArg(args)) {
+    return true;
+  }
+  const cloneRef = args["clone_ref"];
+  if (typeof cloneRef === "string" && cloneRef.trim()) {
+    return true;
+  }
+  const rawVoice = args["voice"];
+  const voice = typeof rawVoice === "string" ? rawVoice.trim() : "";
+  if (/\.(wav|mp3|flac|ogg|m4a)$/i.test(voice)) {
+    return true;
+  }
+  return ["/", "./", "../", "~/"].some((prefix) => voice.startsWith(prefix));
+}
+/**
+ * Resolve the clone reference to use for a synthesis call.
+ *
+ * A supplied source clip is passed to `saveCloneRefFromSample` (with `clone_name` when it is
+ * a string); without one, `clone_ref` (or, failing that, `voice`) goes to `resolveCloneRef`.
+ *
+ * @param {object} args - Raw tool arguments.
+ * @returns {*} Whatever the chosen helper returns.
+ */
+function cloneRefForSynthesis(args) {
+  const sample = cloneSampleArg(args);
+  if (!sample) {
+    return resolveCloneRef(args["clone_ref"] ?? args["voice"]);
+  }
+  const cloneName = typeof args["clone_name"] === "string" ? args["clone_name"] : void 0;
+  return saveCloneRefFromSample(sample, cloneName);
+}
 function ensureLuxttsDaemon() {
   if (_luxttsDaemon && !_luxttsDaemon.killed && _luxttsReady)
     return Promise.resolve(true);
@@ -507448,14 +507820,23 @@ function ensureLuxttsDaemon() {
   }
   if (_luxttsStarting)
     return Promise.resolve(false);
-  const venvPy = join58(homedir14(), ".omnius", "voice", "luxtts-venv", "bin", "python3");
-  const inferScript = join58(homedir14(), ".omnius", "voice", "luxtts-infer.py");
-  const repoDir = join58(homedir14(), ".omnius", "voice", "LuxTTS");
+  const venvPy = luxttsVenvPy();
+  const inferScript = luxttsInferScript();
+  const repoDir = luxttsRepoDir();
   if (!existsSync40(venvPy) || !existsSync40(inferScript))
     return Promise.resolve(false);
   _luxttsStarting = true;
   return new Promise((resolve48) => {
-    const timeout2 = setTimeout(() => {
+    let settled = false;
+    let timeout2;
+    const finish = (ready) => {
+      if (settled)
+        return;
+      settled = true;
+      clearTimeout(timeout2);
+      resolve48(ready);
+    };
+    timeout2 = setTimeout(() => {
       _luxttsStarting = false;
       if (_luxttsDaemon && !_luxttsReady) {
         try {
@@ -507464,7 +507845,7 @@ function ensureLuxttsDaemon() {
         }
         _luxttsDaemon = null;
       }
-      resolve48(false);
+      finish(false);
     }, 12e4);
     const daemon = spawn16(venvPy, [inferScript], {
       stdio: ["pipe", "pipe", "pipe"],
@@ -507486,8 +507867,7 @@ function ensureLuxttsDaemon() {
           if (msg.type === "ready") {
             _luxttsReady = true;
             _luxttsStarting = false;
-            clearTimeout(timeout2);
-            resolve48(true);
+            finish(true);
           } else if (msg.type === "result" && msg.id) {
             const pending = _luxttsPending.get(msg.id);
             if (pending) {
@@ -507509,13 +507889,13 @@ function ensureLuxttsDaemon() {
       _luxttsDaemon = null;
       _luxttsReady = false;
       _luxttsStarting = false;
+      finish(false);
     });
     daemon.on("error", () => {
       _luxttsDaemon = null;
       _luxttsReady = false;
       _luxttsStarting = false;
-      clearTimeout(timeout2);
-      resolve48(false);
+      finish(false);
     });
   });
 }
@@ -507545,7 +507925,7 @@ function luxttsSynthesize(text, cloneRef, outputPath2, speed = 1) {
     _luxttsDaemon.stdin.write(req2 + "\n");
   });
 }
-var _luxttsDaemon, _luxttsReady, _luxttsRequestId, _luxttsPending, _luxttsBuffer, _luxttsStarting, SUPERTONIC_INFER_PY, AudioPlaybackTool, TtsGenerateTool, SoundPlaybackTool;
+var _luxttsDaemon, _luxttsReady, _luxttsRequestId, _luxttsPending, _luxttsBuffer, _luxttsStarting, SUPERTONIC_INFER_PY, LUXTTS_DAEMON_PY, AudioPlaybackTool, TtsGenerateTool, SoundPlaybackTool;
 var init_audio_playback = __esm({
   "packages/execution/dist/tools/audio-playback.js"() {
     "use strict";
@@ -507585,10 +507965,45 @@ try:
 except Exception as exc:
     print(json.dumps({"ok": False, "error": str(exc), "trace": traceback.format_exc(limit=3)}))
     sys.exit(1)
+`;
+    // Python source of the LuxTTS daemon: it prints a JSON "ready" line once the model is
+    // loaded, then handles one JSON request per stdin line and prints a JSON "result" or
+    // "error" line for each.
+    LUXTTS_DAEMON_PY = String.raw`
+import json, os, sys, traceback, wave
+import numpy as np
+import torch
+repo = os.environ.get("LUXTTS_REPO_PATH") or ""
+if repo:
+    sys.path.insert(0, repo)
+from zipvoice.luxvoice import LuxTTS
+device = "cuda" if torch.cuda.is_available() else "cpu"
+tts = LuxTTS(model_path="YatharthS/LuxTTS", device=device, threads=4)
+print(json.dumps({"type": "ready", "device": device}), flush=True)
+for line in sys.stdin:
+    if not line.strip():
+        continue
+    rid = None
+    try:
+        # Parse inside the try block so a malformed request is reported as an error
+        # instead of raising out of the loop and terminating the daemon.
+        req = json.loads(line)
+        if req.get("action") == "quit":
+            break
+        rid = req.get("id")
+        text = str(req.get("text") or "").strip()
+        clone_ref = str(req.get("clone_ref") or "")
+        output = str(req.get("output_path") or "")
+        speed = float(req.get("speed") or 1.0)
+        enc = tts.encode_prompt(clone_ref, duration=5, rms=0.001)
+        wav = tts.generate_speech(text, enc, num_steps=4, guidance_scale=3.0, t_shift=0.5, speed=speed)
+        data = (np.clip(wav.cpu().numpy().squeeze(), -1, 1) * 32767).astype(np.int16)
+        with wave.open(output, "wb") as f:
+            f.setnchannels(1)
+            f.setsampwidth(2)
+            f.setframerate(48000)
+            f.writeframes(data.tobytes())
+        print(json.dumps({"type": "result", "id": rid, "path": output}), flush=True)
+    except Exception as exc:
+        print(json.dumps({"type": "error", "id": rid, "error": str(exc), "trace": traceback.format_exc(limit=3)}), flush=True)
 `;
     AudioPlaybackTool = class {
       name = "audio_playback";
-      description = "Play audio through speakers, synthesize text-to-speech, and manage TTS clone voices. Actions: 'play' to play an audio file (WAV/MP3/OGG — including recordings from memory episodes), 'speak' to synthesize and play text, 'synthesize' to save TTS to a WAV file, 'clone' to register a voice-clone sample, 'list_voices' to inspect available clone refs/backends, 'volume' to get or set system volume, 'list' to enumerate audio output devices. TTS backends are explicit: auto, luxtts, supertonic, mlx, onnx/piper, or espeak. Neural TTS backends self-provision into ~/.omnius/voice on first use where supported. Use generate_tts when the task is specifically to create a TTS file; do not use shell speech commands or generate_audio for spoken TTS.";
+      description = "Play audio through speakers, synthesize text-to-speech, and manage TTS clone voices. Actions: 'play' to play an audio file (WAV/MP3/OGG — including recordings from memory episodes), 'speak' to synthesize and play text, 'synthesize' to save TTS to a WAV file, 'clone' to register a voice-clone source clip, 'list_voices' to inspect available clone refs/backends, 'volume' to get or set system volume, 'list' to enumerate audio output devices. TTS backends include auto, LuxTTS voice cloning, Supertonic, MLX, ONNX/Piper, and a local fallback. Neural TTS backends self-provision into ~/.omnius/voice on first use where supported. For cloned speech from a source clip, call generate_tts or audio_playback action=synthesize with sample/source_audio/voice_sample and backend=auto or luxtts. Use generate_tts when the task is specifically to create a TTS file; do not use shell speech commands or generate_audio for spoken TTS.";
       parameters = {
         type: "object",
         properties: {
@@ -507615,8 +508030,8 @@ except Exception as exc:
           },
           backend: {
             type: "string",
-            enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper", "espeak"],
-            description: "TTS backend. auto tries LuxTTS clone, Supertonic, MLX on Apple Silicon, Piper/ONNX, then espeak."
+            enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper"],
+            description: "TTS backend. auto tries LuxTTS clone, Supertonic, MLX on Apple Silicon, Piper/ONNX, then a local fallback."
           },
           output: {
             type: "string",
@@ -507632,11 +508047,31 @@ except Exception as exc:
           },
           sample: {
             type: "string",
-            description: "Audio sample path to register as a clone voice for action=clone."
+            description: "Audio source clip path to register or use as a LuxTTS clone voice."
+          },
+          source_audio: {
+            type: "string",
+            description: "Alias for sample. Use this for cloned speech from a source voice clip."
+          },
+          voice_sample: {
+            type: "string",
+            description: "Alias for sample/source_audio."
+          },
+          reference_audio: {
+            type: "string",
+            description: "Alias for sample/source_audio."
+          },
+          ref_audio: {
+            type: "string",
+            description: "Alias for sample/source_audio."
+          },
+          clone_sample: {
+            type: "string",
+            description: "Alias for sample/source_audio."
           },
           clone_name: {
             type: "string",
-            description: "Friendly filename stem for action=clone."
+            description: "Friendly filename stem for action=clone or for registering a source clip during synthesis."
           },
           model: {
             type: "string",
@@ -507652,11 +508087,11 @@ except Exception as exc:
           },
           speed: {
             type: "number",
-            description: "Speech speed. espeak uses words per minute; neural backends use a multiplier."
+            description: "Speech speed. Neural backends use a multiplier; local fallback uses its backend-specific rate."
           },
           voice: {
             type: "string",
-            description: "Voice id/name. Examples: Supertonic voice M4, MLX voice af_heart, espeak voice en-us, or Piper/ONNX model path."
+            description: "Voice id/name. Examples: Supertonic voice M4, MLX voice af_heart, a source audio path for cloning, or Piper/ONNX model path."
           },
           lang: {
             type: "string",
@@ -507720,9 +508155,9 @@ except Exception as exc:
         return await this.synthesizeText(args, start2, true);
       }
       cloneVoice(args, start2) {
-        const sample = typeof args["sample"] === "string" ? args["sample"] : typeof args["file"] === "string" ? args["file"] : "";
+        const sample = cloneSampleArg(args) || (typeof args["file"] === "string" ? args["file"] : "");
         if (!sample.trim()) {
-          return { success: false, output: "", error: "Missing 'sample' parameter. Provide a local audio sample to register as a clone voice.", durationMs: performance.now() - start2 };
+          return { success: false, output: "", error: "Missing source audio. Provide sample=<file> or source_audio=<file> to register as a clone voice.", durationMs: performance.now() - start2 };
         }
         const saved = saveCloneRefFromSample(sample, typeof args["clone_name"] === "string" ? args["clone_name"] : void 0);
         return {
@@ -507739,10 +508174,11 @@ except Exception as exc:
         const lines = [
           "TTS backends:",
           `  luxtts: ${existsSync40(join58(voiceDir(), "luxtts-venv", "bin", "python3")) ? "installed" : "not installed"}; clone refs: ${refs.length}`,
+          "    clone from source clip: generate_tts text=<words> source_audio=<wav/mp3/flac/ogg/m4a> backend=auto",
           `  supertonic: ${existsSync40(supertonicVenvPy()) ? "installed" : "not installed"}; voices include M1, M2, M3, M4 when package assets are available`,
           `  mlx: ${existsSync40(mlxVenvPy()) ? "installed" : "not installed"}; Apple Silicon only; default model mlx-community/Kokoro-82M-bf16`,
           `  piper/onnx: ${hasCommand3("piper") || existsSync40(piperVenvBin()) ? "available" : "not installed"}; first use installs piper-tts into ${piperVenvDir()}; pass model=<path.onnx> for raw ONNX voices`,
-          `  espeak: ${hasCommand3("espeak-ng") ? "available" : "not found"}`,
+          `  local fallback: ${hasCommand3("espeak-ng") ? "available" : "not found"}`,
           "",
           "Registered clone refs:",
           ...refs.length ? refs.map((ref) => `  ${ref}`) : ["  none"]
@@ -507756,11 +508192,20 @@ except Exception as exc:
         }
         const requestedBackend = normalizeTtsBackend(args["backend"]);
         const strictBackend = boolArg(args["strict_backend"] ?? args["strictBackend"], false);
+        const cloneRequested = wantsVoiceClone(args);
+        if (cloneRequested && requestedBackend !== "auto" && requestedBackend !== "luxtts") {
+          return {
+            success: false,
+            output: "",
+            error: "Voice cloning from a source clip requires backend=auto or backend=luxtts.",
+            durationMs: performance.now() - start2
+          };
+        }
         const playback = playbackArg(args, speakDefault);
         const outputPath2 = ttsOutputPath(args, requestedBackend);
         const device = typeof args["device"] === "string" ? args["device"] : "default";
         const tried = [];
-        const autoCandidates = ["luxtts", "supertonic", ...process.platform === "darwin" && process.arch === "arm64" ? ["mlx"] : [], "piper", "espeak"];
+        const autoCandidates = cloneRequested ? ["luxtts"] : ["luxtts", "supertonic", ...process.platform === "darwin" && process.arch === "arm64" ? ["mlx"] : [], "piper", "espeak"];
         const candidates = requestedBackend === "auto" ? autoCandidates : strictBackend ? [requestedBackend] : [requestedBackend, ...autoCandidates.filter((backend) => backend !== requestedBackend)];
         let usedBackend = "";
         let voiceSummary = "";
@@ -507823,21 +508268,19 @@ ${tried.map((line) => `- ${line}`).join("\n")}`,
         };
       }
       async synthesizeLuxtts(text, outputPath2, args) {
-        const cloneRef = resolveCloneRef(args["clone_ref"] ?? args["voice"] ?? args["sample"]);
+        const cloneRef = cloneRefForSynthesis(args);
         if (!cloneRef)
-          throw new Error(`No LuxTTS clone reference found. Register one with audio_playback action=clone sample=<file>.`);
+          throw new Error(`No LuxTTS clone source found. Provide source_audio=<voice clip> or clone_ref=<registered clip>.`);
         const speed = numberArg3(args["speed"], 1);
+        ensureLuxttsInstalled();
         const daemonReady = await ensureLuxttsDaemon();
         if (daemonReady) {
           await luxttsSynthesize(text, cloneRef, outputPath2, speed);
           if (existsSync40(outputPath2))
             return `${basename12(cloneRef)} (LuxTTS daemon)`;
         }
-        const venvPy = join58(voiceDir(), "luxtts-venv", "bin", "python3");
-        const repoDir = join58(voiceDir(), "LuxTTS");
-        if (!existsSync40(venvPy) || !existsSync40(repoDir)) {
-          throw new Error("LuxTTS is not installed in the managed voice environment yet.");
-        }
+        const venvPy = luxttsVenvPy();
+        const repoDir = luxttsRepoDir();
         const pyScript = [
           "import json, sys, wave",
           "import numpy as np, torch",
@@ -507913,7 +508356,7 @@ ${tried.map((line) => `- ${line}`).join("\n")}`,
       }
       synthesizeEspeak(text, outputPath2, args) {
         if (!hasCommand3("espeak-ng"))
-          throw new Error("espeak-ng command not found.");
+          throw new Error("Local fallback TTS command not found.");
         const voice = typeof args["voice"] === "string" ? args["voice"] : "en";
         const speed = Math.round(numberArg3(args["speed"], 160));
         execFileSync2("espeak-ng", ["-v", voice, "-s", String(speed), "-w", outputPath2, text], {
@@ -507995,20 +508438,27 @@ ${devices.join("\n")}`,
     };
     TtsGenerateTool = class {
       name = "generate_tts";
-      description = "Generate text-to-speech audio as a WAV file, optionally playing it after synthesis. Supports explicit backends: auto, luxtts voice cloning, supertonic, mlx, onnx/piper, and espeak. Neural TTS backends self-provision into ~/.omnius/voice on first use where supported. Use clone_ref to select a registered LuxTTS voice, sample+clone_name to register a clone sample via audio_playback action=clone, and playback=false for silent file generation. Use this tool for speech/TTS requests; do not use shell commands or generate_audio as a TTS fallback.";
+      description = "Generate text-to-speech audio as a WAV file, optionally playing it after synthesis. Supports explicit backends: auto, LuxTTS voice cloning, Supertonic, MLX, ONNX/Piper, and local fallback. Neural TTS backends self-provision into ~/.omnius/voice on first use where supported. For voice cloning, pass source_audio/sample/voice_sample with the reference clip and backend=auto or luxtts; clone_name can register it for reuse. Use clone_ref to select a registered LuxTTS voice and playback=false for silent file generation. Use this tool for speech/TTS requests; do not use shell commands or generate_audio as a TTS fallback.";
       parameters = {
         type: "object",
         properties: {
           text: { type: "string", description: "Text to synthesize" },
           input: { type: "string", description: "Alias for text." },
           prompt: { type: "string", description: "Alias for text." },
-          backend: { type: "string", enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper", "espeak"] },
+          backend: { type: "string", enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper"] },
           output: { type: "string", description: "Output WAV path. Defaults to ~/.omnius/voice/generated/tts-*.wav." },
           path: { type: "string", description: "Alias for output." },
           playback: { type: "boolean", description: "Whether to play after generating. Defaults false for generate_tts." },
           strict_backend: { type: "boolean", description: "When true, fail instead of falling back if the requested backend is unavailable. Defaults false." },
           voice: { type: "string", description: "Voice id/name, or raw Piper/ONNX path when backend=onnx/piper." },
           clone_ref: { type: "string", description: "LuxTTS clone reference path, filename, or registered clone name." },
+          sample: { type: "string", description: "Voice source clip path for cloned speech. Alias: source_audio." },
+          source_audio: { type: "string", description: "Voice source clip path for cloned speech." },
+          voice_sample: { type: "string", description: "Alias for source_audio." },
+          reference_audio: { type: "string", description: "Alias for source_audio." },
+          ref_audio: { type: "string", description: "Alias for source_audio." },
+          clone_sample: { type: "string", description: "Alias for source_audio." },
+          clone_name: { type: "string", description: "Optional name to register the source clip for later reuse." },
           model: { type: "string", description: "Backend model id or raw ONNX/Piper model path." },
           lang: { type: "string", description: "Language code for Supertonic/MLX where supported." },
           speed: { type: "number", description: "Speech speed multiplier or backend-specific rate." },
@@ -575357,19 +575807,19 @@ function modelOnnxPath(id) {
 function modelConfigPath(id) {
   return join109(modelDir(id), "config.json");
 }
-function luxttsVenvDir() {
+function luxttsVenvDir2() {
   return join109(voiceDir2(), "luxtts-venv");
 }
-function luxttsVenvPy() {
-  return platform5() === "win32" ? join109(luxttsVenvDir(), "Scripts", "python.exe") : join109(luxttsVenvDir(), "bin", "python3");
+function luxttsVenvPy2() {
+  return platform5() === "win32" ? join109(luxttsVenvDir2(), "Scripts", "python.exe") : join109(luxttsVenvDir2(), "bin", "python3");
 }
-function luxttsRepoDir() {
+function luxttsRepoDir2() {
   return join109(voiceDir2(), "LuxTTS");
 }
 function luxttsCloneRefsDir() {
   return join109(voiceDir2(), "clone-refs");
 }
-function luxttsInferScript() {
+function luxttsInferScript2() {
   return join109(voiceDir2(), "luxtts-infer.py");
 }
 function supertonicVenvDir() {
@@ -577936,12 +578386,12 @@ Error: ${err2 instanceof Error ? err2.message : String(err2)}`
             "python3 not found. LuxTTS requires Python 3.10+. Try: apt install python3 / brew install python3"
           );
         }
-        const venvDir = luxttsVenvDir();
-        const venvPy = luxttsVenvPy();
+        const venvDir = luxttsVenvDir2();
+        const venvPy = luxttsVenvPy2();
         if (existsSync95(venvPy)) {
           try {
             const quotedPy = `"${venvPy}"`;
-            const repoPath = luxttsRepoDir().replace(/\\/g, "/");
+            const repoPath = luxttsRepoDir2().replace(/\\/g, "/");
             await this.asyncShell(
               `${quotedPy} -c "import sys; sys.path.insert(0, '${repoPath}'); from zipvoice.luxvoice import LuxTTS; print('ok')"`,
               3e4
@@ -578055,7 +578505,7 @@ Error: ${err2 instanceof Error ? err2.message : String(err2)}`
             }
           }
         }
-        const repoDir = luxttsRepoDir();
+        const repoDir = luxttsRepoDir2();
         if (!existsSync95(join109(repoDir, "zipvoice", "luxvoice.py"))) {
           renderInfo("  Cloning LuxTTS repository...");
           try {
@@ -578479,18 +578929,18 @@ def main():
 if __name__ == '__main__':
     main()
 `;
-        const scriptPath2 = luxttsInferScript();
+        const scriptPath2 = luxttsInferScript2();
         mkdirSync52(voiceDir2(), { recursive: true });
         writeFileSync49(scriptPath2, script);
       }
       /** Ensure the LuxTTS daemon is running, spawn if needed */
       async ensureLuxttsDaemon() {
         if (this._luxttsDaemon && !this._luxttsDaemon.killed) return true;
-        const venvPy = luxttsVenvPy();
+        const venvPy = luxttsVenvPy2();
         if (!existsSync95(venvPy)) return false;
         return new Promise((resolve48) => {
-          const env2 = { ...process.env, LUXTTS_REPO_PATH: luxttsRepoDir() };
-          const daemon = nodeSpawn(venvPy, [luxttsInferScript()], {
+          const env2 = { ...process.env, LUXTTS_REPO_PATH: luxttsRepoDir2() };
+          const daemon = nodeSpawn(venvPy, [luxttsInferScript2()], {
             stdio: ["pipe", "pipe", "pipe"],
             cwd: tmpdir20(),
             env: env2
@@ -596500,6 +596950,7 @@ function scopedTool(base3, root, mode) {
     async execute(args) {
       const next = { ...args };
       if (base3.name === "generate_image" || base3.name === "generate_audio" || base3.name === "generate_tts") {
+        const cleanup = [];
         const localModel = typeof next["model_path"] === "string" ? String(next["model_path"]) : typeof next["model"] === "string" && looksLikeLocalPath(String(next["model"])) ? String(next["model"]) : "";
         if (localModel) {
           const guarded = guardPath(rootAbs, localModel);
@@ -596508,6 +596959,22 @@ function scopedTool(base3, root, mode) {
           else next["model"] = guarded.path.abs;
         }
         if (base3.name === "generate_tts") {
+          for (const key of TTS_CLONE_SOURCE_KEYS) {
+            const value2 = next[key];
+            if (typeof value2 !== "string" || !value2.trim()) continue;
+            const materialized = materializeTelegramCreativeArtifactForSend(rootAbs, value2.trim());
+            if (!materialized.ok) return denied(materialized.error);
+            next[key] = materialized.path;
+            if (materialized.cleanup) cleanup.push(materialized.cleanup);
+          }
+          for (const key of ["clone_ref", "voice"]) {
+            const value2 = next[key];
+            if (typeof value2 !== "string" || !value2.trim() || !looksLikeAudioPath(value2.trim())) continue;
+            const materialized = materializeTelegramCreativeArtifactForSend(rootAbs, value2.trim());
+            if (!materialized.ok) return denied(materialized.error);
+            next[key] = materialized.path;
+            if (materialized.cleanup) cleanup.push(materialized.cleanup);
+          }
           const rawOutput = typeof next["output"] === "string" && String(next["output"]).trim() ? String(next["output"]) : typeof next["output_path"] === "string" && String(next["output_path"]).trim() ? String(next["output_path"]) : `tts-${Date.now()}.wav`;
           const guardedOutput = guardPath(rootAbs, rawOutput);
           if (!guardedOutput.ok) return denied(guardedOutput.error);
@@ -596517,16 +596984,20 @@ function scopedTool(base3, root, mode) {
           next["output"] = guardedOutput.path.abs;
           next["playback"] = false;
         }
-        const result2 = await base3.execute(next);
-        if (result2.success) {
-          if (base3.name === "generate_tts" && typeof next["output"] === "string") {
-            rememberCreated(rootAbs, String(next["output"]));
-          }
-          for (const path11 of collectGeneratedArtifactPathsFromText(result2.output, rootAbs)) {
-            rememberCreated(rootAbs, path11);
+        try {
+          const result2 = await base3.execute(next);
+          if (result2.success) {
+            if (base3.name === "generate_tts" && typeof next["output"] === "string") {
+              rememberCreated(rootAbs, String(next["output"]));
+            }
+            for (const path11 of collectGeneratedArtifactPathsFromText(result2.output, rootAbs)) {
+              rememberCreated(rootAbs, path11);
+            }
           }
+          return result2;
+        } finally {
+          for (const fn of cleanup) fn();
         }
-        return result2;
       }
       const pathKey = PATH_KEYS.find((key) => typeof next[key] === "string" && String(next[key]).trim());
       if (pathKey) {
@@ -596591,6 +597062,9 @@ function isInside(root, path11) {
 function looksLikeLocalPath(value2) {
   // A value counts as a local path when it begins with an absolute ("/")
   // or explicitly relative ("./", "../") prefix.
   const localPrefixes = ["/", "./", "../"];
   return localPrefixes.some((prefix) => value2.startsWith(prefix));
 }
+function looksLikeAudioPath(value2) { // Heuristic: does the string value2 look like an audio file path? Gates whether "clone_ref"/"voice" values are materialized as files.
+  return looksLikeLocalPath(value2) || value2.startsWith("~/") || /\.(wav|mp3|flac|ogg|m4a)$/i.test(value2); // true for a local-path prefix, a "~/" prefix, or a case-insensitive .wav/.mp3/.flac/.ogg/.m4a suffix
+}
 function manifestPath(root) {
   // Join the given root with the manifest file name (MANIFEST_FILE).
   const manifestLocation = join119(root, MANIFEST_FILE);
   return manifestLocation;
 }
@@ -596753,7 +597227,7 @@ function denied(error) {
     mutatedFiles: []
   };
 }
-var MANIFEST_FILE, OBJECTS_DIR, SEND_DIR, PATH_KEYS, MEDIA_PATH_RE, PUBLIC_EXECUTABLE_ARTIFACT_EXTENSIONS, CreativeAudioFileTool;
+var MANIFEST_FILE, OBJECTS_DIR, SEND_DIR, PATH_KEYS, TTS_CLONE_SOURCE_KEYS, MEDIA_PATH_RE, PUBLIC_EXECUTABLE_ARTIFACT_EXTENSIONS, CreativeAudioFileTool;
 var init_telegram_creative_tools = __esm({
   "packages/cli/src/tui/telegram-creative-tools.ts"() {
     "use strict";
@@ -596762,6 +597236,7 @@ var init_telegram_creative_tools = __esm({
     OBJECTS_DIR = ".objects";
     SEND_DIR = ".send";
     PATH_KEYS = ["path", "file", "file_path", "filename", "filepath", "filePath"];
+    TTS_CLONE_SOURCE_KEYS = ["sample", "source_audio", "voice_sample", "reference_audio", "ref_audio", "clone_sample"];
     MEDIA_PATH_RE = /(?:^|[\s([])(\/[^\s<>"')\]]+\.[A-Za-z0-9]{1,12})(?:$|[\s),.\]])/g;
     PUBLIC_EXECUTABLE_ARTIFACT_EXTENSIONS = /* @__PURE__ */ new Set([
       ".sh",
@@ -596836,9 +597311,16 @@ var init_telegram_creative_tools = __esm({
           input: { type: "string", description: "Alias for text" },
           prompt: { type: "string", description: "Alias for text" },
           path: { type: "string", description: "Output .wav path inside the creative workspace" },
-          backend: { type: "string", enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper", "espeak"], description: "TTS backend. Defaults to auto." },
-          voice: { type: "string", description: "Voice id/name for the selected TTS backend" },
+          backend: { type: "string", enum: ["auto", "luxtts", "supertonic", "mlx", "onnx", "piper"], description: "TTS backend. Defaults to auto." },
+          voice: { type: "string", description: "Voice id/name for the selected TTS backend, or a scoped source audio path for cloning" },
           clone_ref: { type: "string", description: "Optional LuxTTS clone reference" },
+          sample: { type: "string", description: "Voice source clip path inside the creative workspace" },
+          source_audio: { type: "string", description: "Alias for sample" },
+          voice_sample: { type: "string", description: "Alias for sample" },
+          reference_audio: { type: "string", description: "Alias for sample" },
+          ref_audio: { type: "string", description: "Alias for sample" },
+          clone_sample: { type: "string", description: "Alias for sample" },
+          clone_name: { type: "string", description: "Optional name to register the source clip for later reuse" },
           model: { type: "string", description: "Optional backend model id or raw Piper/ONNX path" },
           speed: { type: "number", description: "Speech speed multiplier or backend-specific rate" }
         },
@@ -596857,26 +597339,57 @@ var init_telegram_creative_tools = __esm({
         if (!guarded.path.abs.toLowerCase().endsWith(".wav")) {
           return denied("create_audio_file currently writes WAV files; use a .wav output path.");
         }
-        await mkdir17(dirname33(guarded.path.abs), { recursive: true });
-        const tts = new TtsGenerateTool();
-        const result = await tts.execute({
-          text,
-          output: guarded.path.abs,
-          playback: false,
-          backend: args["backend"],
-          voice: args["voice"],
-          clone_ref: args["clone_ref"],
-          model: args["model"],
-          speed: args["speed"]
-        });
-        if (!result.success || !existsSync104(guarded.path.abs)) {
-          return {
-            success: false,
-            output: "",
-            error: `Audio synthesis failed through generate_tts.
+        const cloneArgs = {};
+        const cleanup = [];
+        for (const key of TTS_CLONE_SOURCE_KEYS) {
+          const value2 = args[key];
+          if (typeof value2 !== "string" || !value2.trim()) continue;
+          const materialized = materializeTelegramCreativeArtifactForSend(this.root, value2.trim());
+          if (!materialized.ok) return denied(materialized.error);
+          cloneArgs[key] = materialized.path;
+          if (materialized.cleanup) cleanup.push(materialized.cleanup);
+        }
+        for (const key of ["clone_ref", "voice"]) {
+          const value2 = args[key];
+          if (typeof value2 !== "string" || !value2.trim() || !looksLikeAudioPath(value2.trim())) continue;
+          const materialized = materializeTelegramCreativeArtifactForSend(this.root, value2.trim());
+          if (!materialized.ok) return denied(materialized.error);
+          cloneArgs[key] = materialized.path;
+          if (materialized.cleanup) cleanup.push(materialized.cleanup);
+        }
+        let result;
+        try {
+          await mkdir17(dirname33(guarded.path.abs), { recursive: true });
+          const tts = new TtsGenerateTool();
+          result = await tts.execute({
+            text,
+            output: guarded.path.abs,
+            playback: false,
+            backend: args["backend"],
+            voice: cloneArgs["voice"] ?? args["voice"],
+            clone_ref: cloneArgs["clone_ref"] ?? args["clone_ref"],
+            ...cloneArgs,
+            sample: cloneArgs["sample"],
+            source_audio: cloneArgs["source_audio"],
+            voice_sample: cloneArgs["voice_sample"],
+            reference_audio: cloneArgs["reference_audio"],
+            ref_audio: cloneArgs["ref_audio"],
+            clone_sample: cloneArgs["clone_sample"],
+            clone_name: args["clone_name"],
+            model: args["model"],
+            speed: args["speed"]
+          });
+          if (!result.success || !existsSync104(guarded.path.abs)) {
+            return {
+              success: false,
+              output: "",
+              error: `Audio synthesis failed through generate_tts.
 ${(result.error || result.output || "").slice(0, 1200)}`,
-            durationMs: performance.now() - start2
-          };
+              durationMs: performance.now() - start2
+            };
+          }
+        } finally {
+          for (const fn of cleanup) fn();
         }
         rememberCreated(this.root, guarded.path.abs);
         const sizeKB = Math.round(statSync35(guarded.path.abs).size / 1024);