npm - @glissade/narrate - Versions diffs - 0.6.0 → 0.7.0-pre.0 - Mend

@glissade/narrate 0.6.0 → 0.7.0-pre.0

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/providers.d.ts CHANGED Viewed

@@ -50,8 +50,21 @@ declare function openaiProvider(opts?: {
  * (`{ noiseScale: 0.667, noiseWScale: 0.8 }`) and wire via `providerImpl`.
  * The noise mode is part of `version()`, so changing it invalidates the cache.
  */
+/**
+ * Resolve a piper voice to something piper-tts 1.x can actually open. piper's
+ * `--model` wants a filesystem PATH to the `.onnx`, or a downloadable voice KEY
+ * — it does NOT search for a bare `.onnx` filename. So: an existing path is used
+ * as-is (absolutized); a bare `<name>`/`<name>.onnx` is looked up under the
+ * voices dir (`voicesDir` option → `PIPER_VOICES` env → `~/.local/share/piper-voices`);
+ * a `.onnx` name that resolves nowhere is a clear error; a bare key with no
+ * `.onnx` is passed through so piper can resolve/download it.
+ */
+declare function resolvePiperVoice(model: string, voicesDir?: string): string;
+/** Surface the TAIL of a child's stderr — Python tracebacks put the real exception last. */
+declare function stderrTail(stderr: unknown, max?: number): string;
 declare function piperProvider(opts?: {
   model?: string;
+  voicesDir?: string;
   noiseScale?: number;
   noiseWScale?: number;
 }): TtsProvider;
@@ -186,4 +199,4 @@ declare function synthesizeScript(scriptPath: string, opts?: SynthesizeOptions):
 /** Resolve `<scene>.narration.json` for a scene-module path (or accept the script itself). */
 declare function scriptPathFor(input: string): string;
 //#endregion
-export { AlignRequest, Aligner, SynthesizeOptions, SynthesizeResult, TtsProvider, TtsRequest, TtsResult, VoskAlignWord, alignerById, cacheKey, espeakProvider, fakeProvider, heuristicAligner, heuristicWords, interpolateMissing, mapAsrToScript, openaiProvider, piperProvider, providerById, scriptPathFor, synthesizeScript, voskAligner, wavDuration };
+export { AlignRequest, Aligner, SynthesizeOptions, SynthesizeResult, TtsProvider, TtsRequest, TtsResult, VoskAlignWord, alignerById, cacheKey, espeakProvider, fakeProvider, heuristicAligner, heuristicWords, interpolateMissing, mapAsrToScript, openaiProvider, piperProvider, providerById, resolvePiperVoice, scriptPathFor, stderrTail, synthesizeScript, voskAligner, wavDuration };

package/dist/providers.js CHANGED Viewed

@@ -1,8 +1,8 @@
 import { NarrationError, isPause } from "./index.js";
 import { createHash } from "node:crypto";
 import { existsSync, mkdirSync, readFileSync, unlinkSync, writeFileSync } from "node:fs";
-import { basename, dirname, join } from "node:path";
-import { tmpdir } from "node:os";
+import { basename, dirname, isAbsolute, join, resolve } from "node:path";
+import { homedir, tmpdir } from "node:os";
 import { spawnSync } from "node:child_process";
 //#region src/providers.ts
 /**
@@ -147,6 +147,30 @@ function openaiProvider(opts = {}) {
 * (`{ noiseScale: 0.667, noiseWScale: 0.8 }`) and wire via `providerImpl`.
 * The noise mode is part of `version()`, so changing it invalidates the cache.
 */
+/**
+* Resolve a piper voice to something piper-tts 1.x can actually open. piper's
+* `--model` wants a filesystem PATH to the `.onnx`, or a downloadable voice KEY
+* — it does NOT search for a bare `.onnx` filename. So: an existing path is used
+* as-is (absolutized); a bare `<name>`/`<name>.onnx` is looked up under the
+* voices dir (`voicesDir` option → `PIPER_VOICES` env → `~/.local/share/piper-voices`);
+* a `.onnx` name that resolves nowhere is a clear error; a bare key with no
+* `.onnx` is passed through so piper can resolve/download it.
+*/
+function resolvePiperVoice(model, voicesDir) {
+	if (existsSync(model)) return resolve(model);
+	if (isAbsolute(model)) return model;
+	const dir = voicesDir ?? process.env["PIPER_VOICES"] ?? join(homedir(), ".local", "share", "piper-voices");
+	const named = model.endsWith(".onnx") ? model : `${model}.onnx`;
+	for (const cand of [join(dir, model), join(dir, named)]) if (existsSync(cand)) return resolve(cand);
+	if (model.endsWith(".onnx")) throw new NarrationError(`piper voice '${model}' not found — it is not a path and is absent from the voices dir '${dir}'. Put the .onnx there, pass an absolute path as the voice, or set PIPER_VOICES / { voicesDir }.`);
+	return model;
+}
+/** Surface the TAIL of a child's stderr — Python tracebacks put the real exception last. */
+function stderrTail(stderr, max = 400) {
+	const s = (stderr == null ? "" : String(stderr)).trim();
+	if (!s) return "no output";
+	return s.length > max ? `…${s.slice(-max)}` : s;
+}
 function piperProvider(opts = {}) {
 	const noiseScale = opts.noiseScale ?? 0;
 	const noiseWScale = opts.noiseWScale ?? 0;
@@ -168,8 +192,9 @@ function piperProvider(opts = {}) {
 			].filter(Boolean).join(" "));
 		},
 		synthesize: (req) => {
-			const model = req.voice ?? opts.model;
-			if (!model) throw new NarrationError("piper needs a voice model (.onnx) — pass { model }, or set the segment voice to its path");
+			const raw = req.voice ?? opts.model;
+			if (!raw) throw new NarrationError("piper needs a voice model (.onnx) — pass { model }, or set the segment voice to its path or name");
+			const model = resolvePiperVoice(raw, opts.voicesDir);
 			const tag = createHash("sha256").update(req.text).digest("hex").slice(0, 8);
 			const out = join(tmpdir(), `glissade-piper-${process.pid}-${tag}.wav`);
 			const args = [
@@ -188,7 +213,7 @@ function piperProvider(opts = {}) {
 				maxBuffer: 64 * 1024 * 1024
 			});
 			try {
-				if (r.status !== 0 || !existsSync(out)) throw new NarrationError(`piper failed: ${r.stderr?.toString().slice(0, 300) ?? "no output"}`);
+				if (r.status !== 0 || !existsSync(out)) throw new NarrationError(`piper failed: ${stderrTail(r.stderr)}`);
 				const wav = readFileSync(out);
 				return Promise.resolve({
 					wav,
@@ -533,4 +558,4 @@ function scriptPathFor(input) {
 	return candidate;
 }
 //#endregion
-export { alignerById, cacheKey, espeakProvider, fakeProvider, heuristicAligner, heuristicWords, interpolateMissing, mapAsrToScript, openaiProvider, piperProvider, providerById, scriptPathFor, synthesizeScript, voskAligner, wavDuration };
+export { alignerById, cacheKey, espeakProvider, fakeProvider, heuristicAligner, heuristicWords, interpolateMissing, mapAsrToScript, openaiProvider, piperProvider, providerById, resolvePiperVoice, scriptPathFor, stderrTail, synthesizeScript, voskAligner, wavDuration };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@glissade/narrate",
-  "version": "0.6.0",
+  "version": "0.7.0-pre.0",
   "description": "glissade narration + captions: TTS at prepare time (gs narrate), deterministic caching, narration-anchored timeline beats, and captions as plain tracks. Render stays offline.",
   "license": "Apache-2.0",
   "type": "module",
@@ -19,8 +19,8 @@
     "dist"
   ],
   "dependencies": {
-    "@glissade/core": "0.6.0",
-    "@glissade/scene": "0.6.0"
+    "@glissade/core": "0.7.0-pre.0",
+    "@glissade/scene": "0.7.0-pre.0"
   },
   "repository": {
     "type": "git",