@tryhamster/gerbil 1.0.0-rc.5 → 1.0.0-rc.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/browser/index.js +6 -6
- package/dist/cli.mjs +7 -7
- package/dist/cli.mjs.map +1 -1
- package/dist/frameworks/express.mjs +1 -1
- package/dist/frameworks/fastify.mjs +1 -1
- package/dist/frameworks/hono.mjs +1 -1
- package/dist/frameworks/next.mjs +1 -1
- package/dist/frameworks/trpc.mjs +1 -1
- package/dist/{gerbil-CocYaJhE.mjs → gerbil-CgLjZy0K.mjs} +5 -5
- package/dist/{gerbil-CocYaJhE.mjs.map → gerbil-CgLjZy0K.mjs.map} +1 -1
- package/dist/gerbil-IwhB_Sip.mjs +4 -0
- package/dist/index.d.mts.map +1 -1
- package/dist/index.mjs +4 -4
- package/dist/integrations/ai-sdk.mjs +3 -3
- package/dist/integrations/langchain.mjs +1 -1
- package/dist/integrations/llamaindex.mjs +1 -1
- package/dist/integrations/mcp.mjs +4 -4
- package/dist/{kokoro-BSHqCbNW.js → kokoro-DFRQ1OeM.js} +2 -2
- package/dist/{kokoro-BSHqCbNW.js.map → kokoro-DFRQ1OeM.js.map} +1 -1
- package/dist/{mcp-m9BkEngp.mjs → mcp-DGK69gbU.mjs} +3 -3
- package/dist/{mcp-m9BkEngp.mjs.map → mcp-DGK69gbU.mjs.map} +1 -1
- package/dist/{one-liner-BBbeCywj.mjs → one-liner-BJ7hDVlY.mjs} +2 -2
- package/dist/{one-liner-BBbeCywj.mjs.map → one-liner-BJ7hDVlY.mjs.map} +1 -1
- package/dist/{repl-DX6JI6fo.mjs → repl-BTq1JyH7.mjs} +3 -3
- package/dist/skills/index.d.mts +4 -4
- package/dist/skills/index.d.mts.map +1 -1
- package/dist/skills/index.mjs +3 -3
- package/dist/{skills-CBpAWeKy.mjs → skills-Hf3iEkq4.mjs} +2 -2
- package/dist/{skills-CBpAWeKy.mjs.map → skills-Hf3iEkq4.mjs.map} +1 -1
- package/dist/{stt-CkfJswka.mjs → stt-CpLYbGFd.mjs} +2 -8
- package/dist/stt-CpLYbGFd.mjs.map +1 -0
- package/dist/stt-DRPLEEHB.mjs +3 -0
- package/dist/{stt-BN46nKJd.js → stt-Te8Qz-Ay.js} +2 -8
- package/dist/stt-Te8Qz-Ay.js.map +1 -0
- package/dist/transformers.web-DokyH3rP.js +3 -0
- package/dist/{transformers.web-BschYzqZ.js → transformers.web-M6mCnEYJ.js} +2 -2
- package/dist/{transformers.web-BschYzqZ.js.map → transformers.web-M6mCnEYJ.js.map} +1 -1
- package/dist/{tts-Bn_zwjoM.js → tts-C0xx3CtE.js} +3 -13
- package/dist/tts-C0xx3CtE.js.map +1 -0
- package/dist/{tts-CmaC0yA9.mjs → tts-D5hrNcGD.mjs} +3 -13
- package/dist/tts-D5hrNcGD.mjs.map +1 -0
- package/dist/{tts-C8NaF1jo.mjs → tts-DzJDBsFR.mjs} +1 -1
- package/package.json +1 -1
- package/dist/gerbil-CjnM4Pra.mjs +0 -4
- package/dist/stt-BN46nKJd.js.map +0 -1
- package/dist/stt-BT4Rt49f.mjs +0 -3
- package/dist/stt-CkfJswka.mjs.map +0 -1
- package/dist/transformers.web-BFh4CnBR.js +0 -3
- package/dist/tts-Bn_zwjoM.js.map +0 -1
- package/dist/tts-CmaC0yA9.mjs.map +0 -1
|
@@ -338,10 +338,7 @@ var KokoroTTS = class {
|
|
|
338
338
|
const { onProgress, device = "auto" } = options;
|
|
339
339
|
onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });
|
|
340
340
|
try {
|
|
341
|
-
const { KokoroTTS: KokoroJS } = await import(
|
|
342
|
-
/* webpackIgnore: true */
|
|
343
|
-
"./kokoro-BSHqCbNW.js"
|
|
344
|
-
);
|
|
341
|
+
const { KokoroTTS: KokoroJS } = await import("./kokoro-DFRQ1OeM.js");
|
|
345
342
|
const isBrowser = typeof window !== "undefined";
|
|
346
343
|
let dtype = "fp32";
|
|
347
344
|
if (device === "webgpu" || device === "auto" && isBrowser && "gpu" in navigator) {
|
|
@@ -574,14 +571,7 @@ var SupertonicTTS = class {
|
|
|
574
571
|
onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });
|
|
575
572
|
try {
|
|
576
573
|
const isBrowser = typeof window !== "undefined";
|
|
577
|
-
const
|
|
578
|
-
let transformersModule;
|
|
579
|
-
if (isNode) transformersModule = await import(
|
|
580
|
-
/* webpackIgnore: true */
|
|
581
|
-
"./transformers.web-BFh4CnBR.js"
|
|
582
|
-
);
|
|
583
|
-
else transformersModule = await import("https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.8.1");
|
|
584
|
-
const { pipeline } = transformersModule;
|
|
574
|
+
const { pipeline } = await import("./transformers.web-DokyH3rP.js");
|
|
585
575
|
if (device === "webgpu" || device === "auto" && isBrowser && "gpu" in navigator) this._deviceMode = "webgpu";
|
|
586
576
|
else this._deviceMode = "cpu";
|
|
587
577
|
onProgress?.({ status: `Loading Supertonic model...` });
|
|
@@ -731,4 +721,4 @@ function createTTS(modelId = "kokoro-82m") {
|
|
|
731
721
|
|
|
732
722
|
//#endregion
|
|
733
723
|
export { createTTS };
|
|
734
|
-
//# sourceMappingURL=tts-
|
|
724
|
+
//# sourceMappingURL=tts-C0xx3CtE.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts-C0xx3CtE.js","names":["KOKORO_VOICES: VoiceInfo[]","SUPERTONIC_VOICES: VoiceInfo[]","TTS_MODELS: Record<string, TTSModelConfig>","dtype: \"fp32\" | \"fp16\" | \"q8\" | \"q4\" | \"q4f16\"","allAudio: Float32Array[]","chunk: AudioChunk"],"sources":["../src/core/tts.ts"],"sourcesContent":["/**\n * Text-to-Speech with Kokoro-82M\n *\n * Provides local TTS using the Kokoro-82M model with multiple voice options.\n * Uses kokoro-js for proper phoneme conversion (G2P) and audio generation.\n * Supports streaming audio generation and works in both Node.js and browser.\n *\n * @example\n * ```ts\n * const tts = new KokoroTTS();\n * await tts.load({ onProgress: (p) => console.log(p.status) });\n *\n * // List available voices\n * const voices = tts.listVoices();\n *\n * // Generate audio\n * const result = await tts.speak(\"Hello world\", { voice: \"af_bella\" });\n * // result.audio = Float32Array, result.sampleRate = 24000\n *\n * // Stream audio chunks\n * for await (const chunk of tts.speakStream(\"Long text...\")) {\n * playAudioChunk(chunk);\n * }\n * ```\n */\n\nimport type {\n AudioChunk,\n LoadTTSOptions,\n SpeakOptions,\n SpeakResult,\n TTSModelConfig,\n VoiceInfo,\n} from \"./types.js\";\n\n// Regex for sentence splitting (defined at module level for performance)\nconst SENTENCE_SPLIT_REGEX = /(?<=[.!?])\\s+/;\n\n// ============================================\n// Voice Registry\n// ============================================\n\n/**\n * Kokoro voice definitions\n * Voice IDs follow pattern: {language}{gender}_{name}\n * - a = American English\n * - b = British English\n * - f = female, m = male\n */\nexport const KOKORO_VOICES: VoiceInfo[] = [\n // American English - Female (ordered by quality)\n {\n id: \"af_heart\",\n name: \"Heart\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, highest quality voice (Grade A)\",\n embeddingFile: \"voices/af_heart.bin\",\n },\n {\n id: \"af_bella\",\n name: \"Bella\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, warm and friendly (Grade A-)\",\n embeddingFile: \"voices/af_bella.bin\",\n },\n {\n id: \"af_nicole\",\n name: \"Nicole\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, soft and gentle (Grade B-)\",\n embeddingFile: \"voices/af_nicole.bin\",\n },\n {\n id: \"af_sarah\",\n name: \"Sarah\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, clear and professional (Grade C+)\",\n embeddingFile: \"voices/af_sarah.bin\",\n },\n {\n id: \"af_sky\",\n name: \"Sky\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, young and energetic (Grade C-)\",\n embeddingFile: \"voices/af_sky.bin\",\n },\n {\n id: \"af_alloy\",\n name: \"Alloy\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C)\",\n embeddingFile: \"voices/af_alloy.bin\",\n },\n {\n id: \"af_aoede\",\n name: \"Aoede\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C+)\",\n embeddingFile: \"voices/af_aoede.bin\",\n },\n {\n id: \"af_kore\",\n name: \"Kore\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C+)\",\n embeddingFile: \"voices/af_kore.bin\",\n },\n {\n id: \"af_nova\",\n name: \"Nova\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C)\",\n embeddingFile: \"voices/af_nova.bin\",\n },\n {\n id: \"af_river\",\n name: \"River\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade D)\",\n embeddingFile: \"voices/af_river.bin\",\n },\n {\n id: \"af_jessica\",\n name: \"Jessica\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade D)\",\n embeddingFile: \"voices/af_jessica.bin\",\n },\n // American English - Male\n {\n id: \"am_fenrir\",\n name: \"Fenrir\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, best quality (Grade C+)\",\n embeddingFile: \"voices/am_fenrir.bin\",\n },\n {\n id: \"am_michael\",\n name: \"Michael\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, warm and friendly (Grade C+)\",\n embeddingFile: \"voices/am_michael.bin\",\n },\n {\n id: \"am_puck\",\n name: \"Puck\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade C+)\",\n embeddingFile: \"voices/am_puck.bin\",\n },\n {\n id: \"am_adam\",\n name: \"Adam\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, deep voice (Grade F+)\",\n embeddingFile: \"voices/am_adam.bin\",\n },\n {\n id: \"am_echo\",\n name: \"Echo\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_echo.bin\",\n },\n {\n id: \"am_eric\",\n name: \"Eric\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_eric.bin\",\n },\n {\n id: \"am_liam\",\n name: \"Liam\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_liam.bin\",\n },\n {\n id: \"am_onyx\",\n name: \"Onyx\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_onyx.bin\",\n },\n {\n id: \"am_santa\",\n name: \"Santa\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, festive (Grade D-)\",\n embeddingFile: \"voices/am_santa.bin\",\n },\n // British English - Female\n {\n id: \"bf_emma\",\n name: \"Emma\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female, elegant and clear (Grade B-)\",\n embeddingFile: \"voices/bf_emma.bin\",\n },\n {\n id: \"bf_isabella\",\n name: \"Isabella\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female, sophisticated (Grade C)\",\n embeddingFile: \"voices/bf_isabella.bin\",\n },\n {\n id: \"bf_alice\",\n name: \"Alice\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female (Grade D)\",\n embeddingFile: \"voices/bf_alice.bin\",\n },\n {\n id: \"bf_lily\",\n name: \"Lily\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female (Grade D)\",\n embeddingFile: \"voices/bf_lily.bin\",\n },\n // British English - Male\n {\n id: \"bm_george\",\n name: \"George\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male, distinguished (Grade C)\",\n embeddingFile: \"voices/bm_george.bin\",\n },\n {\n id: \"bm_fable\",\n name: \"Fable\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male (Grade C)\",\n embeddingFile: \"voices/bm_fable.bin\",\n },\n {\n id: \"bm_lewis\",\n name: \"Lewis\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male, friendly (Grade D+)\",\n embeddingFile: \"voices/bm_lewis.bin\",\n },\n {\n id: \"bm_daniel\",\n name: \"Daniel\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male (Grade D)\",\n embeddingFile: \"voices/bm_daniel.bin\",\n },\n];\n\n// ============================================\n// Supertonic Voice Registry\n// ============================================\n\n/**\n * Supertonic voice definitions\n * 4 built-in voices: F1, F2 (female), M1, M2 (male)\n */\nexport const SUPERTONIC_VOICES: VoiceInfo[] = [\n {\n id: \"F1\",\n name: \"Female 1\",\n gender: \"female\",\n language: \"en\",\n description: \"Female voice 1 - Clear and natural\",\n embeddingFile: \"voices/F1.bin\",\n },\n {\n id: \"F2\",\n name: \"Female 2\",\n gender: \"female\",\n language: \"en\",\n description: \"Female voice 2 - Warm and expressive\",\n embeddingFile: \"voices/F2.bin\",\n },\n {\n id: \"M1\",\n name: \"Male 1\",\n gender: \"male\",\n language: \"en\",\n description: \"Male voice 1 - Deep and confident\",\n embeddingFile: \"voices/M1.bin\",\n },\n {\n id: \"M2\",\n name: \"Male 2\",\n gender: \"male\",\n language: \"en\",\n description: \"Male voice 2 - Friendly and casual\",\n embeddingFile: \"voices/M2.bin\",\n },\n];\n\n// ============================================\n// TTS Model Registry\n// ============================================\n\nexport const TTS_MODELS: Record<string, TTSModelConfig> = {\n \"kokoro-82m\": {\n id: \"kokoro-82m\",\n repo: \"onnx-community/Kokoro-82M-v1.0-ONNX\",\n description: \"Kokoro 82M - High-quality multilingual TTS\",\n size: \"~330MB\",\n sampleRate: 24000,\n voices: KOKORO_VOICES,\n defaultVoice: \"af_heart\",\n languages: [\"en-us\", \"en-gb\"],\n },\n \"supertonic-66m\": {\n id: \"supertonic-66m\",\n repo: \"onnx-community/Supertonic-TTS-ONNX\",\n description: \"Supertonic 66M - Fast on-device TTS (167x realtime)\",\n size: \"~250MB\",\n sampleRate: 44100,\n voices: SUPERTONIC_VOICES,\n defaultVoice: \"F1\",\n languages: [\"en\"],\n },\n};\n\n/**\n * Get TTS model config by ID\n */\nexport function getTTSModelConfig(modelId: string): TTSModelConfig | null {\n return TTS_MODELS[modelId] || null;\n}\n\n/**\n * List all available TTS models\n */\nexport function listTTSModels(): TTSModelConfig[] {\n return Object.values(TTS_MODELS);\n}\n\n// ============================================\n// Kokoro TTS Class (wraps kokoro-js)\n// ============================================\n\n// kokoro-js types\ninterface KokoroJSAudio {\n audio: Float32Array;\n sampling_rate: number;\n}\n\ninterface KokoroJSInstance {\n generate(text: string, options?: { voice?: string; speed?: number }): Promise<KokoroJSAudio>;\n list_voices(): Array<{\n name: string;\n language: string;\n gender: string;\n traits: string;\n targetQuality: string;\n overallGrade: string;\n }>;\n}\n\n/**\n * Kokoro TTS - Local text-to-speech with voice selection\n *\n * Uses kokoro-js (official Kokoro library by xenova) for high-quality speech synthesis.\n * Includes proper G2P (grapheme-to-phoneme) conversion for accurate pronunciation.\n */\nexport class KokoroTTS {\n private kokoroInstance: KokoroJSInstance | null = null;\n private modelConfig: TTSModelConfig;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n\n constructor(modelId = \"kokoro-82m\") {\n const config = getTTSModelConfig(modelId);\n if (!config) {\n throw new Error(\n `Unknown TTS model: ${modelId}. Available: ${Object.keys(TTS_MODELS).join(\", \")}`,\n );\n }\n this.modelConfig = config;\n }\n\n // ============================================\n // Model Loading\n // ============================================\n\n /**\n * Load the TTS model\n *\n * @example\n * ```ts\n * const tts = new KokoroTTS();\n * await tts.load({\n * onProgress: (p) => console.log(p.status, p.progress),\n * device: \"webgpu\",\n * });\n * ```\n */\n async load(options: LoadTTSOptions = {}): Promise<void> {\n if (this._isLoaded) {\n return;\n }\n\n // Prevent duplicate loads\n if (this.loadPromise) {\n return this.loadPromise;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadTTSOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });\n\n try {\n // Dynamically import kokoro-js\n // tsdown handles resolution: Node.js = external, Browser = bundled\n const kokoroModule = await import(\"kokoro-js\");\n const { KokoroTTS: KokoroJS } = kokoroModule;\n\n // Determine device/dtype\n const isBrowser = typeof window !== \"undefined\";\n let dtype: \"fp32\" | \"fp16\" | \"q8\" | \"q4\" | \"q4f16\" = \"fp32\";\n\n if (device === \"webgpu\" || (device === \"auto\" && isBrowser && \"gpu\" in navigator)) {\n dtype = \"fp16\";\n this._deviceMode = \"webgpu\";\n } else {\n dtype = \"fp32\";\n this._deviceMode = \"cpu\";\n }\n\n onProgress?.({ status: `Loading model with ${dtype} precision...` });\n\n // Load the model using kokoro-js\n // kokoro-js handles:\n // - Model loading with proper quantization\n // - Phoneme tokenization (G2P) via phonemizer\n // - Voice embeddings\n this.kokoroInstance = (await KokoroJS.from_pretrained(this.modelConfig.repo, {\n dtype,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n } else if (progress.status === \"ready\") {\n onProgress?.({ status: \"Model ready\" });\n }\n },\n })) as unknown as KokoroJSInstance;\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${this._deviceMode.toUpperCase()})!` });\n } catch (error) {\n this.loadPromise = null;\n throw error;\n }\n }\n\n /**\n * Ensure model is loaded (lazy loading)\n */\n async ensureLoaded(options?: LoadTTSOptions): Promise<void> {\n if (!this._isLoaded) {\n await this.load(options);\n }\n }\n\n // ============================================\n // Voice Management\n // ============================================\n\n /**\n * Get list of available voices\n *\n * @example\n * ```ts\n * const voices = tts.listVoices();\n * // [{ id: \"af_heart\", name: \"Heart\", gender: \"female\", ... }, ...]\n * ```\n */\n listVoices(): VoiceInfo[] {\n return [...this.modelConfig.voices];\n }\n\n /**\n * Get a specific voice by ID\n */\n getVoice(voiceId: string): VoiceInfo | null {\n return this.modelConfig.voices.find((v) => v.id === voiceId) || null;\n }\n\n /**\n * Get voices by gender\n */\n getVoicesByGender(gender: \"male\" | \"female\"): VoiceInfo[] {\n return this.modelConfig.voices.filter((v) => v.gender === gender);\n }\n\n /**\n * Get voices by language\n */\n getVoicesByLanguage(language: string): VoiceInfo[] {\n return this.modelConfig.voices.filter(\n (v) => v.language === language || v.language.startsWith(language),\n );\n }\n\n // ============================================\n // Speech Generation\n // ============================================\n\n /**\n * Generate speech from text\n *\n * @example\n * ```ts\n * const result = await tts.speak(\"Hello world\", {\n * voice: \"af_heart\",\n * speed: 1.0,\n * });\n *\n * // Play in browser\n * const audioContext = new AudioContext();\n * const buffer = audioContext.createBuffer(1, result.audio.length, result.sampleRate);\n * buffer.copyToChannel(result.audio, 0);\n * const source = audioContext.createBufferSource();\n * source.buffer = buffer;\n * source.connect(audioContext.destination);\n * source.start();\n * ```\n */\n async speak(text: string, options: SpeakOptions = {}): Promise<SpeakResult> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n // Validate voice exists in our registry\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.kokoroInstance) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Generate audio using kokoro-js\n const result = await this.kokoroInstance.generate(text, {\n voice,\n speed,\n });\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: result.audio,\n sampleRate: result.sampling_rate,\n duration: result.audio.length / result.sampling_rate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Stream speech generation (yields audio chunks as they're generated)\n *\n * @example\n * ```ts\n * for await (const chunk of tts.speakStream(\"Long text...\")) {\n * // chunk.samples = Float32Array\n * // chunk.sampleRate = 24000\n * // chunk.isFinal = boolean\n * playChunk(chunk);\n * }\n * ```\n */\n async *speakStream(\n text: string,\n options: SpeakOptions = {},\n ): AsyncGenerator<AudioChunk, SpeakResult, unknown> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n // Validate voice\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.kokoroInstance) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Split text into sentences for streaming\n const sentences = this.splitIntoSentences(text);\n const allAudio: Float32Array[] = [];\n let chunkIndex = 0;\n let sampleRate = this.modelConfig.sampleRate;\n\n for (let i = 0; i < sentences.length; i++) {\n const sentence = sentences[i];\n if (!sentence.trim()) {\n continue;\n }\n\n const result = await this.kokoroInstance.generate(sentence, {\n voice,\n speed,\n });\n\n sampleRate = result.sampling_rate;\n allAudio.push(result.audio);\n\n const chunk: AudioChunk = {\n samples: result.audio,\n sampleRate: result.sampling_rate,\n index: chunkIndex++,\n isFinal: i === sentences.length - 1,\n };\n\n yield chunk;\n options.onAudioChunk?.(chunk);\n }\n\n // Concatenate all audio\n const totalLength = allAudio.reduce((sum, arr) => sum + arr.length, 0);\n const fullAudio = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of allAudio) {\n fullAudio.set(chunk, offset);\n offset += chunk.length;\n }\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: fullAudio,\n sampleRate,\n duration: fullAudio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Split text into sentences for streaming\n */\n private splitIntoSentences(text: string): string[] {\n // Split on sentence boundaries while preserving the delimiters\n return text.split(SENTENCE_SPLIT_REGEX).filter((s) => s.trim());\n }\n\n // ============================================\n // Status & Info\n // ============================================\n\n /**\n * Check if model is loaded\n */\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n /**\n * Get current device mode\n */\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n /**\n * Get model configuration\n */\n getModelInfo(): TTSModelConfig {\n return { ...this.modelConfig };\n }\n\n /**\n * Get sample rate\n */\n getSampleRate(): number {\n return this.modelConfig.sampleRate;\n }\n\n // ============================================\n // Cleanup\n // ============================================\n\n /**\n * Dispose of resources\n */\n async dispose(): Promise<void> {\n // kokoro-js doesn't expose a dispose method currently\n // but we clear our reference\n this.kokoroInstance = null;\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n\n// ============================================\n// Supertonic TTS Class (uses transformers.js)\n// ============================================\n\n/**\n * Supertonic TTS - Fast on-device text-to-speech\n *\n * Uses transformers.js with the Supertonic-TTS-ONNX model.\n * Generates speech at 167x realtime with 66M parameters.\n * Outputs at 44100 Hz sample rate.\n */\nexport class SupertonicTTS {\n private pipeline: any = null;\n private modelConfig: TTSModelConfig;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n private voiceEmbeddings: Map<string, Float32Array> = new Map();\n\n constructor(modelId = \"supertonic-66m\") {\n const config = getTTSModelConfig(modelId);\n if (!config) {\n throw new Error(\n `Unknown TTS model: ${modelId}. Available: ${Object.keys(TTS_MODELS).join(\", \")}`,\n );\n }\n this.modelConfig = config;\n }\n\n /**\n * Load the TTS model\n */\n async load(options: LoadTTSOptions = {}): Promise<void> {\n if (this._isLoaded) {\n return;\n }\n\n if (this.loadPromise) {\n return this.loadPromise;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadTTSOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });\n\n try {\n // Determine device\n const isBrowser = typeof window !== \"undefined\";\n\n // Dynamically import transformers.js\n // tsdown handles resolution: Node.js = external, Browser = bundled\n const { pipeline } = await import(\"@huggingface/transformers\");\n if (device === \"webgpu\" || (device === \"auto\" && isBrowser && \"gpu\" in navigator)) {\n this._deviceMode = \"webgpu\";\n } else {\n this._deviceMode = \"cpu\";\n }\n\n onProgress?.({ status: `Loading Supertonic model...` });\n\n // Create TTS pipeline\n this.pipeline = await pipeline(\"text-to-speech\", this.modelConfig.repo, {\n dtype: \"fp32\", // Supertonic works best with fp32\n device: this._deviceMode,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n }\n },\n });\n\n // Load voice embeddings\n onProgress?.({ status: \"Loading voice embeddings...\" });\n await this.loadVoiceEmbeddings();\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${this._deviceMode.toUpperCase()})!` });\n } catch (error) {\n this.loadPromise = null;\n throw error;\n }\n }\n\n /**\n * Load speaker embeddings for all voices\n * Supertonic uses 101x128 = 12,928 floats per voice\n */\n private async loadVoiceEmbeddings(): Promise<void> {\n // In browser, we'd fetch from HuggingFace Hub\n // In Node.js, we'd load from cache\n // For now, we'll lazy-load embeddings when needed\n // The pipeline handles this internally when we pass speaker_embeddings\n }\n\n async ensureLoaded(options?: LoadTTSOptions): Promise<void> {\n if (!this._isLoaded) {\n await this.load(options);\n }\n }\n\n listVoices(): VoiceInfo[] {\n return [...this.modelConfig.voices];\n }\n\n getVoice(voiceId: string): VoiceInfo | null {\n return this.modelConfig.voices.find((v) => v.id === voiceId) || null;\n }\n\n getVoicesByGender(gender: \"male\" | \"female\"): VoiceInfo[] {\n return this.modelConfig.voices.filter((v) => v.gender === gender);\n }\n\n /**\n * Generate speech from text\n */\n async speak(text: string, options: SpeakOptions = {}): Promise<SpeakResult> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice } = options;\n\n // Validate voice\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.pipeline) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Get or create speaker embedding\n // Supertonic expects [101, 128] = 12,928 floats\n let speakerEmbedding = this.voiceEmbeddings.get(voice);\n if (!speakerEmbedding) {\n // Load from HuggingFace Hub via fetch\n try {\n const voiceUrl = `https://huggingface.co/${this.modelConfig.repo}/resolve/main/voices/${voice}.bin`;\n const response = await fetch(voiceUrl);\n if (response.ok) {\n const buffer = await response.arrayBuffer();\n speakerEmbedding = new Float32Array(buffer);\n this.voiceEmbeddings.set(voice, speakerEmbedding);\n } else {\n throw new Error(`Failed to load voice: ${response.status}`);\n }\n } catch {\n // Fallback: create neutral embedding (not ideal but works)\n speakerEmbedding = new Float32Array(101 * 128).fill(0.1);\n this.voiceEmbeddings.set(voice, speakerEmbedding);\n }\n }\n\n // Generate audio\n const result = await this.pipeline(text, {\n speaker_embeddings: speakerEmbedding,\n });\n\n const totalTime = performance.now() - startTime;\n const audio = result.audio as Float32Array;\n const sampleRate = result.sampling_rate as number;\n\n return {\n audio,\n sampleRate,\n duration: audio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Stream speech generation\n */\n async *speakStream(\n text: string,\n options: SpeakOptions = {},\n ): AsyncGenerator<AudioChunk, SpeakResult, unknown> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n const startTime = performance.now();\n\n // Split text into sentences for streaming\n const sentences = text.split(SENTENCE_SPLIT_REGEX).filter((s) => s.trim());\n const allAudio: Float32Array[] = [];\n let chunkIndex = 0;\n let sampleRate = this.modelConfig.sampleRate;\n\n for (let i = 0; i < sentences.length; i++) {\n const sentence = sentences[i];\n if (!sentence.trim()) continue;\n\n const result = await this.speak(sentence, { voice, speed });\n sampleRate = result.sampleRate;\n allAudio.push(result.audio);\n\n const chunk: AudioChunk = {\n samples: result.audio,\n sampleRate: result.sampleRate,\n index: chunkIndex++,\n isFinal: i === sentences.length - 1,\n };\n\n yield chunk;\n options.onAudioChunk?.(chunk);\n }\n\n // Concatenate all audio\n const totalLength = allAudio.reduce((sum, arr) => sum + arr.length, 0);\n const fullAudio = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of allAudio) {\n fullAudio.set(chunk, offset);\n offset += chunk.length;\n }\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: fullAudio,\n sampleRate,\n duration: fullAudio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n getModelInfo(): TTSModelConfig {\n return { ...this.modelConfig };\n }\n\n getSampleRate(): number {\n return this.modelConfig.sampleRate;\n }\n\n async dispose(): Promise<void> {\n this.pipeline = null;\n this.voiceEmbeddings.clear();\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n\n// ============================================\n// Unified TTS Factory\n// ============================================\n\nexport type TTSBackend = KokoroTTS | SupertonicTTS;\n\n/**\n * Create a TTS instance based on model ID\n */\nexport function createTTS(modelId: string = \"kokoro-82m\"): TTSBackend {\n if (modelId.startsWith(\"supertonic\")) {\n return new SupertonicTTS(modelId);\n }\n return new KokoroTTS(modelId);\n}\n\nexport default KokoroTTS;\n"],"mappings":";AAoCA,MAAM,uBAAuB;;;;;;;;AAa7B,MAAaA,gBAA6B;CAExC;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACF;;;;;AAUD,MAAaC,oBAAiC;CAC5C;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACF;AAMD,MAAaC,aAA6C;CACxD,cAAc;EACZ,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,YAAY;EACZ,QAAQ;EACR,cAAc;EACd,WAAW,CAAC,SAAS,QAAQ;EAC9B;CACD,kBAAkB;EAChB,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,YAAY;EACZ,QAAQ;EACR,cAAc;EACd,WAAW,CAAC,KAAK;EAClB;CACF;;;;AAKD,SAAgB,kBAAkB,SAAwC;AACxE,QAAO,WAAW,YAAY;;;;;;;;AAsChC,IAAa,YAAb,MAAuB;CACrB,AAAQ,iBAA0C;CAClD,AAAQ;CACR,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CAExC,YAAY,UAAU,cAAc;EAClC,MAAM,SAAS,kBAAkB,QAAQ;AACzC,MAAI,CAAC,OACH,OAAM,IAAI,MACR,sBAAsB,QAAQ,eAAe,OAAO,KAAK,WAAW,CAAC,KAAK,KAAK,GAChF;AAEH,OAAK,cAAc;;;;;;;;;;;;;;CAmBrB,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UACP;AAIF,MAAI,KAAK,YACP,QAAO,KAAK;AAGd,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,sBAAsB,KAAK,YAAY,GAAG,OAAO,CAAC;AAEzE,MAAI;GAIF,MAAM,EAAE,WAAW,aADE,MAAM,OAAO;GAIlC,MAAM,YAAY,OAAO,WAAW;GACpC,IAAIC,QAAiD;AAErD,OAAI,WAAW,YAAa,WAAW,UAAU,aAAa,SAAS,WAAY;AACjF,YAAQ;AACR,SAAK,cAAc;UACd;AACL,YAAQ;AACR,SAAK,cAAc;;AAGrB,gBAAa,EAAE,QAAQ,sBAAsB,MAAM,gBAAgB,CAAC;AAOpE,QAAK,iBAAkB,MAAM,SAAS,gBAAgB,KAAK,YAAY,MAAM;IAC3E;IACA,oBAAoB,aAAkB;AACpC,SAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;MACX,QAAQ,eAAe,SAAS;MAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;MAC5C,MAAM,SAAS;MAChB,CAAC;cACO,SAAS,WAAW,QAC7B,cAAa,EAAE,QAAQ,eAAe,CAAC;;IAG5C,CAAC;AAEF,QAAK,YAAY;AACjB,gBAAa,EAAE,QAAQ,UAAU,KAAK,YAAY,aAAa,CAAC,KAAK,CAAC;WAC/D,OAAO;AACd,QAAK,cAAc;AACnB,SAAM;;;;;;CAOV,MAAM,aAAa,SAAyC;AAC1D,MAAI,CAAC,KAAK,UACR,OAAM,KAAK,KAAK,QAAQ;;;;;;;;;;;CAiB5B,aAA0B;AACxB,SAAO,CAAC,GAAG,KAAK,YAAY,OAAO;;;;;CAMrC,SAAS,SAAmC;AAC1C,SAAO,KAAK,YAAY,OAAO,MAAM,MAAM,EAAE,OAAO,QAAQ,IAAI;;;;;CAMlE,kBAAkB,QAAwC;AACxD,SAAO,KAAK,YAAY,OAAO,QAAQ,MAAM,EAAE,WAAW,OAAO;;;;;CAMnE,oBAAoB,UAA+B;AACjD,SAAO,KAAK,YAAY,OAAO,QAC5B,MAAM,EAAE,aAAa,YAAY,EAAE,SAAS,WAAW,SAAS,CAClE;;;;;;;;;;;;;;;;;;;;;;CA2BH,MAAM,MAAM,MAAc,UAAwB,EAAE,EAAwB;AAC1E,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAI/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,eACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,SAAS,MAAM,KAAK,eAAe,SAAS,MAAM;GACtD;GACA;GACD,CAAC;EAEF,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO,OAAO;GACd,YAAY,OAAO;GACnB,UAAU,OAAO,MAAM,SAAS,OAAO;GACvC;GACA;GACD;;;;;;;;;;;;;;;CAgBH,OAAO,YACL,MACA,UAAwB,EAAE,EACwB;AAClD,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAI/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,eACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,YAAY,KAAK,mBAAmB,KAAK;EAC/C,MAAMC,WAA2B,EAAE;EACnC,IAAI,aAAa;EACjB,IAAI,aAAa,KAAK,YAAY;AAElC,OAAK,IAAI,IAAI,GAAG,IAAI,UAAU,QAAQ,KAAK;GACzC,MAAM,WAAW,UAAU;AAC3B,OAAI,CAAC,SAAS,MAAM,CAClB;GAGF,MAAM,SAAS,MAAM,KAAK,eAAe,SAAS,UAAU;IAC1D;IACA;IACD,CAAC;AAEF,gBAAa,OAAO;AACpB,YAAS,KAAK,OAAO,MAAM;GAE3B,MAAMC,QAAoB;IACxB,SAAS,OAAO;IAChB,YAAY,OAAO;IACnB,OAAO;IACP,SAAS,MAAM,UAAU,SAAS;IACnC;AAED,SAAM;AACN,WAAQ,eAAe,MAAM;;EAI/B,MAAM,cAAc,SAAS,QAAQ,KAAK,QAAQ,MAAM,IAAI,QAAQ,EAAE;EACtE,MAAM,YAAY,IAAI,aAAa,YAAY;EAC/C,IAAI,SAAS;AACb,OAAK,MAAM,SAAS,UAAU;AAC5B,aAAU,IAAI,OAAO,OAAO;AAC5B,aAAU,MAAM;;EAGlB,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO;GACP;GACA,UAAU,UAAU,SAAS;GAC7B;GACA;GACD;;;;;CAMH,AAAQ,mBAAmB,MAAwB;AAEjD,SAAO,KAAK,MAAM,qBAAqB,CAAC,QAAQ,MAAM,EAAE,MAAM,CAAC;;;;;CAUjE,WAAoB;AAClB,SAAO,KAAK;;;;;CAMd,gBAAkC;AAChC,SAAO,KAAK;;;;;CAMd,eAA+B;AAC7B,SAAO,EAAE,GAAG,KAAK,aAAa;;;;;CAMhC,gBAAwB;AACtB,SAAO,KAAK,YAAY;;;;;CAU1B,MAAM,UAAyB;AAG7B,OAAK,iBAAiB;AACtB,OAAK,YAAY;AACjB,OAAK,cAAc;;;;;;;;;;AAevB,IAAa,gBAAb,MAA2B;CACzB,AAAQ,WAAgB;CACxB,AAAQ;CACR,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CACxC,AAAQ,kCAA6C,IAAI,KAAK;CAE9D,YAAY,UAAU,kBAAkB;EACtC,MAAM,SAAS,kBAAkB,QAAQ;AACzC,MAAI,CAAC,OACH,OAAM,IAAI,MACR,sBAAsB,QAAQ,eAAe,OAAO,KAAK,WAAW,CAAC,KAAK,KAAK,GAChF;AAEH,OAAK,cAAc;;;;;CAMrB,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UACP;AAGF,MAAI,KAAK,YACP,QAAO,KAAK;AAGd,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,sBAAsB,KAAK,YAAY,GAAG,OAAO,CAAC;AAEzE,MAAI;GAEF,MAAM,YAAY,OAAO,WAAW;GAIpC,MAAM,EAAE,aAAa,MAAM,OAAO;AAClC,OAAI,WAAW,YAAa,WAAW,UAAU,aAAa,SAAS,UACrE,MAAK,cAAc;OAEnB,MAAK,cAAc;AAGrB,gBAAa,EAAE,QAAQ,+BAA+B,CAAC;AAGvD,QAAK,WAAW,MAAM,SAAS,kBAAkB,KAAK,YAAY,MAAM;IACtE,OAAO;IACP,QAAQ,KAAK;IACb,oBAAoB,aAAkB;AACpC,SAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;MACX,QAAQ,eAAe,SAAS;MAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;MAC5C,MAAM,SAAS;MAChB,CAAC;;IAGP,CAAC;AAGF,gBAAa,EAAE,QAAQ,+BAA+B,CAAC;AACvD,SAAM,KAAK,qBAAqB;AAEhC,QAAK,YAAY;AACjB,gBAAa,EAAE,QAAQ,UAAU,KAAK,YAAY,aAAa,CAAC,KAAK,CAAC;WAC/D,OAAO;AACd,QAAK,cAAc;AACnB,SAAM;;;;;;;CAQV,MAAc,sBAAqC;CAOnD,MAAM,aAAa,SAAyC;AAC1D,MAAI,CAAC,KAAK,UACR,OAAM,KAAK,KAAK,QAAQ;;CAI5B,aAA0B;AACxB,SAAO,CAAC,GAAG,KAAK,YAAY,OAAO;;CAGrC,SAAS,SAAmC;AAC1C,SAAO,KAAK,YAAY,OAAO,MAAM,MAAM,EAAE,OAAO,QAAQ,IAAI;;CAGlE,kBAAkB,QAAwC;AACxD,SAAO,KAAK,YAAY,OAAO,QAAQ,MAAM,EAAE,WAAW,OAAO;;;;;CAMnE,MAAM,MAAM,MAAc,UAAwB,EAAE,EAAwB;AAC1E,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,iBAAiB;AAIlD,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,SACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAInC,IAAI,mBAAmB,KAAK,gBAAgB,IAAI,MAAM;AACtD,MAAI,CAAC,iBAEH,KAAI;GACF,MAAM,WAAW,0BAA0B,KAAK,YAAY,KAAK,uBAAuB,MAAM;GAC9F,MAAM,WAAW,MAAM,MAAM,SAAS;AACtC,OAAI,SAAS,IAAI;IACf,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,uBAAmB,IAAI,aAAa,OAAO;AAC3C,SAAK,gBAAgB,IAAI,OAAO,iBAAiB;SAEjD,OAAM,IAAI,MAAM,yBAAyB,SAAS,SAAS;UAEvD;AAEN,sBAAmB,IAAI,aAAa,MAAU,CAAC,KAAK,GAAI;AACxD,QAAK,gBAAgB,IAAI,OAAO,iBAAiB;;EAKrD,MAAM,SAAS,MAAM,KAAK,SAAS,MAAM,EACvC,oBAAoB,kBACrB,CAAC;EAEF,MAAM,YAAY,YAAY,KAAK,GAAG;EACtC,MAAM,QAAQ,OAAO;EACrB,MAAM,aAAa,OAAO;AAE1B,SAAO;GACL;GACA;GACA,UAAU,MAAM,SAAS;GACzB;GACA;GACD;;;;;CAMH,OAAO,YACL,MACA,UAAwB,EAAE,EACwB;AAClD,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAG/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;EAGxF,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,YAAY,KAAK,MAAM,qBAAqB,CAAC,QAAQ,MAAM,EAAE,MAAM,CAAC;EAC1E,MAAMD,WAA2B,EAAE;EACnC,IAAI,aAAa;EACjB,IAAI,aAAa,KAAK,YAAY;AAElC,OAAK,IAAI,IAAI,GAAG,IAAI,UAAU,QAAQ,KAAK;GACzC,MAAM,WAAW,UAAU;AAC3B,OAAI,CAAC,SAAS,MAAM,CAAE;GAEtB,MAAM,SAAS,MAAM,KAAK,MAAM,UAAU;IAAE;IAAO;IAAO,CAAC;AAC3D,gBAAa,OAAO;AACpB,YAAS,KAAK,OAAO,MAAM;GAE3B,MAAMC,QAAoB;IACxB,SAAS,OAAO;IAChB,YAAY,OAAO;IACnB,OAAO;IACP,SAAS,MAAM,UAAU,SAAS;IACnC;AAED,SAAM;AACN,WAAQ,eAAe,MAAM;;EAI/B,MAAM,cAAc,SAAS,QAAQ,KAAK,QAAQ,MAAM,IAAI,QAAQ,EAAE;EACtE,MAAM,YAAY,IAAI,aAAa,YAAY;EAC/C,IAAI,SAAS;AACb,OAAK,MAAM,SAAS,UAAU;AAC5B,aAAU,IAAI,OAAO,OAAO;AAC5B,aAAU,MAAM;;EAGlB,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO;GACP;GACA,UAAU,UAAU,SAAS;GAC7B;GACA;GACD;;CAGH,WAAoB;AAClB,SAAO,KAAK;;CAGd,gBAAkC;AAChC,SAAO,KAAK;;CAGd,eAA+B;AAC7B,SAAO,EAAE,GAAG,KAAK,aAAa;;CAGhC,gBAAwB;AACtB,SAAO,KAAK,YAAY;;CAG1B,MAAM,UAAyB;AAC7B,OAAK,WAAW;AAChB,OAAK,gBAAgB,OAAO;AAC5B,OAAK,YAAY;AACjB,OAAK,cAAc;;;;;;AAavB,SAAgB,UAAU,UAAkB,cAA0B;AACpE,KAAI,QAAQ,WAAW,aAAa,CAClC,QAAO,IAAI,cAAc,QAAQ;AAEnC,QAAO,IAAI,UAAU,QAAQ"}
|
|
@@ -344,10 +344,7 @@ var KokoroTTS = class {
|
|
|
344
344
|
const { onProgress, device = "auto" } = options;
|
|
345
345
|
onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });
|
|
346
346
|
try {
|
|
347
|
-
const { KokoroTTS: KokoroJS } = await import(
|
|
348
|
-
/* webpackIgnore: true */
|
|
349
|
-
"kokoro-js"
|
|
350
|
-
);
|
|
347
|
+
const { KokoroTTS: KokoroJS } = await import("kokoro-js");
|
|
351
348
|
const isBrowser = typeof window !== "undefined";
|
|
352
349
|
let dtype = "fp32";
|
|
353
350
|
if (device === "webgpu" || device === "auto" && isBrowser && "gpu" in navigator) {
|
|
@@ -580,14 +577,7 @@ var SupertonicTTS = class {
|
|
|
580
577
|
onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });
|
|
581
578
|
try {
|
|
582
579
|
const isBrowser = typeof window !== "undefined";
|
|
583
|
-
const
|
|
584
|
-
let transformersModule;
|
|
585
|
-
if (isNode) transformersModule = await import(
|
|
586
|
-
/* webpackIgnore: true */
|
|
587
|
-
"@huggingface/transformers"
|
|
588
|
-
);
|
|
589
|
-
else transformersModule = await import("https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.8.1");
|
|
590
|
-
const { pipeline } = transformersModule;
|
|
580
|
+
const { pipeline } = await import("@huggingface/transformers");
|
|
591
581
|
if (device === "webgpu" || device === "auto" && isBrowser && "gpu" in navigator) this._deviceMode = "webgpu";
|
|
592
582
|
else this._deviceMode = "cpu";
|
|
593
583
|
onProgress?.({ status: `Loading Supertonic model...` });
|
|
@@ -737,4 +727,4 @@ function createTTS(modelId = "kokoro-82m") {
|
|
|
737
727
|
|
|
738
728
|
//#endregion
|
|
739
729
|
export { TTS_MODELS as a, listTTSModels as c, SupertonicTTS as i, KokoroTTS as n, createTTS as o, SUPERTONIC_VOICES as r, getTTSModelConfig as s, KOKORO_VOICES as t };
|
|
740
|
-
//# sourceMappingURL=tts-
|
|
730
|
+
//# sourceMappingURL=tts-D5hrNcGD.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tts-D5hrNcGD.mjs","names":["KOKORO_VOICES: VoiceInfo[]","SUPERTONIC_VOICES: VoiceInfo[]","TTS_MODELS: Record<string, TTSModelConfig>","dtype: \"fp32\" | \"fp16\" | \"q8\" | \"q4\" | \"q4f16\"","allAudio: Float32Array[]","chunk: AudioChunk"],"sources":["../src/core/tts.ts"],"sourcesContent":["/**\n * Text-to-Speech with Kokoro-82M\n *\n * Provides local TTS using the Kokoro-82M model with multiple voice options.\n * Uses kokoro-js for proper phoneme conversion (G2P) and audio generation.\n * Supports streaming audio generation and works in both Node.js and browser.\n *\n * @example\n * ```ts\n * const tts = new KokoroTTS();\n * await tts.load({ onProgress: (p) => console.log(p.status) });\n *\n * // List available voices\n * const voices = tts.listVoices();\n *\n * // Generate audio\n * const result = await tts.speak(\"Hello world\", { voice: \"af_bella\" });\n * // result.audio = Float32Array, result.sampleRate = 24000\n *\n * // Stream audio chunks\n * for await (const chunk of tts.speakStream(\"Long text...\")) {\n * playAudioChunk(chunk);\n * }\n * ```\n */\n\nimport type {\n AudioChunk,\n LoadTTSOptions,\n SpeakOptions,\n SpeakResult,\n TTSModelConfig,\n VoiceInfo,\n} from \"./types.js\";\n\n// Regex for sentence splitting (defined at module level for performance)\nconst SENTENCE_SPLIT_REGEX = /(?<=[.!?])\\s+/;\n\n// ============================================\n// Voice Registry\n// ============================================\n\n/**\n * Kokoro voice definitions\n * Voice IDs follow pattern: {language}{gender}_{name}\n * - a = American English\n * - b = British English\n * - f = female, m = male\n */\nexport const KOKORO_VOICES: VoiceInfo[] = [\n // American English - Female (ordered by quality)\n {\n id: \"af_heart\",\n name: \"Heart\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, highest quality voice (Grade A)\",\n embeddingFile: \"voices/af_heart.bin\",\n },\n {\n id: \"af_bella\",\n name: \"Bella\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, warm and friendly (Grade A-)\",\n embeddingFile: \"voices/af_bella.bin\",\n },\n {\n id: \"af_nicole\",\n name: \"Nicole\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, soft and gentle (Grade B-)\",\n embeddingFile: \"voices/af_nicole.bin\",\n },\n {\n id: \"af_sarah\",\n name: \"Sarah\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, clear and professional (Grade C+)\",\n embeddingFile: \"voices/af_sarah.bin\",\n },\n {\n id: \"af_sky\",\n name: \"Sky\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female, young and energetic (Grade C-)\",\n embeddingFile: \"voices/af_sky.bin\",\n },\n {\n id: \"af_alloy\",\n name: \"Alloy\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C)\",\n embeddingFile: \"voices/af_alloy.bin\",\n },\n {\n id: \"af_aoede\",\n name: \"Aoede\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C+)\",\n embeddingFile: \"voices/af_aoede.bin\",\n },\n {\n id: \"af_kore\",\n name: \"Kore\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C+)\",\n embeddingFile: \"voices/af_kore.bin\",\n },\n {\n id: \"af_nova\",\n name: \"Nova\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade C)\",\n embeddingFile: \"voices/af_nova.bin\",\n },\n {\n id: \"af_river\",\n name: \"River\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade D)\",\n embeddingFile: \"voices/af_river.bin\",\n },\n {\n id: \"af_jessica\",\n name: \"Jessica\",\n gender: \"female\",\n language: \"en-us\",\n description: \"American female (Grade D)\",\n embeddingFile: \"voices/af_jessica.bin\",\n },\n // American English - Male\n {\n id: \"am_fenrir\",\n name: \"Fenrir\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, best quality (Grade C+)\",\n embeddingFile: \"voices/am_fenrir.bin\",\n },\n {\n id: \"am_michael\",\n name: \"Michael\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, warm and friendly (Grade C+)\",\n embeddingFile: \"voices/am_michael.bin\",\n },\n {\n id: \"am_puck\",\n name: \"Puck\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade C+)\",\n embeddingFile: \"voices/am_puck.bin\",\n },\n {\n id: \"am_adam\",\n name: \"Adam\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, deep voice (Grade F+)\",\n embeddingFile: \"voices/am_adam.bin\",\n },\n {\n id: \"am_echo\",\n name: \"Echo\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_echo.bin\",\n },\n {\n id: \"am_eric\",\n name: \"Eric\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_eric.bin\",\n },\n {\n id: \"am_liam\",\n name: \"Liam\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_liam.bin\",\n },\n {\n id: \"am_onyx\",\n name: \"Onyx\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male (Grade D)\",\n embeddingFile: \"voices/am_onyx.bin\",\n },\n {\n id: \"am_santa\",\n name: \"Santa\",\n gender: \"male\",\n language: \"en-us\",\n description: \"American male, festive (Grade D-)\",\n embeddingFile: \"voices/am_santa.bin\",\n },\n // British English - Female\n {\n id: \"bf_emma\",\n name: \"Emma\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female, elegant and clear (Grade B-)\",\n embeddingFile: \"voices/bf_emma.bin\",\n },\n {\n id: \"bf_isabella\",\n name: \"Isabella\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female, sophisticated (Grade C)\",\n embeddingFile: \"voices/bf_isabella.bin\",\n },\n {\n id: \"bf_alice\",\n name: \"Alice\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female (Grade D)\",\n embeddingFile: \"voices/bf_alice.bin\",\n },\n {\n id: \"bf_lily\",\n name: \"Lily\",\n gender: \"female\",\n language: \"en-gb\",\n description: \"British female (Grade D)\",\n embeddingFile: \"voices/bf_lily.bin\",\n },\n // British English - Male\n {\n id: \"bm_george\",\n name: \"George\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male, distinguished (Grade C)\",\n embeddingFile: \"voices/bm_george.bin\",\n },\n {\n id: \"bm_fable\",\n name: \"Fable\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male (Grade C)\",\n embeddingFile: \"voices/bm_fable.bin\",\n },\n {\n id: \"bm_lewis\",\n name: \"Lewis\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male, friendly (Grade D+)\",\n embeddingFile: \"voices/bm_lewis.bin\",\n },\n {\n id: \"bm_daniel\",\n name: \"Daniel\",\n gender: \"male\",\n language: \"en-gb\",\n description: \"British male (Grade D)\",\n embeddingFile: \"voices/bm_daniel.bin\",\n },\n];\n\n// ============================================\n// Supertonic Voice Registry\n// ============================================\n\n/**\n * Supertonic voice definitions\n * 4 built-in voices: F1, F2 (female), M1, M2 (male)\n */\nexport const SUPERTONIC_VOICES: VoiceInfo[] = [\n {\n id: \"F1\",\n name: \"Female 1\",\n gender: \"female\",\n language: \"en\",\n description: \"Female voice 1 - Clear and natural\",\n embeddingFile: \"voices/F1.bin\",\n },\n {\n id: \"F2\",\n name: \"Female 2\",\n gender: \"female\",\n language: \"en\",\n description: \"Female voice 2 - Warm and expressive\",\n embeddingFile: \"voices/F2.bin\",\n },\n {\n id: \"M1\",\n name: \"Male 1\",\n gender: \"male\",\n language: \"en\",\n description: \"Male voice 1 - Deep and confident\",\n embeddingFile: \"voices/M1.bin\",\n },\n {\n id: \"M2\",\n name: \"Male 2\",\n gender: \"male\",\n language: \"en\",\n description: \"Male voice 2 - Friendly and casual\",\n embeddingFile: \"voices/M2.bin\",\n },\n];\n\n// ============================================\n// TTS Model Registry\n// ============================================\n\nexport const TTS_MODELS: Record<string, TTSModelConfig> = {\n \"kokoro-82m\": {\n id: \"kokoro-82m\",\n repo: \"onnx-community/Kokoro-82M-v1.0-ONNX\",\n description: \"Kokoro 82M - High-quality multilingual TTS\",\n size: \"~330MB\",\n sampleRate: 24000,\n voices: KOKORO_VOICES,\n defaultVoice: \"af_heart\",\n languages: [\"en-us\", \"en-gb\"],\n },\n \"supertonic-66m\": {\n id: \"supertonic-66m\",\n repo: \"onnx-community/Supertonic-TTS-ONNX\",\n description: \"Supertonic 66M - Fast on-device TTS (167x realtime)\",\n size: \"~250MB\",\n sampleRate: 44100,\n voices: SUPERTONIC_VOICES,\n defaultVoice: \"F1\",\n languages: [\"en\"],\n },\n};\n\n/**\n * Get TTS model config by ID\n */\nexport function getTTSModelConfig(modelId: string): TTSModelConfig | null {\n return TTS_MODELS[modelId] || null;\n}\n\n/**\n * List all available TTS models\n */\nexport function listTTSModels(): TTSModelConfig[] {\n return Object.values(TTS_MODELS);\n}\n\n// ============================================\n// Kokoro TTS Class (wraps kokoro-js)\n// ============================================\n\n// kokoro-js types\ninterface KokoroJSAudio {\n audio: Float32Array;\n sampling_rate: number;\n}\n\ninterface KokoroJSInstance {\n generate(text: string, options?: { voice?: string; speed?: number }): Promise<KokoroJSAudio>;\n list_voices(): Array<{\n name: string;\n language: string;\n gender: string;\n traits: string;\n targetQuality: string;\n overallGrade: string;\n }>;\n}\n\n/**\n * Kokoro TTS - Local text-to-speech with voice selection\n *\n * Uses kokoro-js (official Kokoro library by xenova) for high-quality speech synthesis.\n * Includes proper G2P (grapheme-to-phoneme) conversion for accurate pronunciation.\n */\nexport class KokoroTTS {\n private kokoroInstance: KokoroJSInstance | null = null;\n private modelConfig: TTSModelConfig;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n\n constructor(modelId = \"kokoro-82m\") {\n const config = getTTSModelConfig(modelId);\n if (!config) {\n throw new Error(\n `Unknown TTS model: ${modelId}. Available: ${Object.keys(TTS_MODELS).join(\", \")}`,\n );\n }\n this.modelConfig = config;\n }\n\n // ============================================\n // Model Loading\n // ============================================\n\n /**\n * Load the TTS model\n *\n * @example\n * ```ts\n * const tts = new KokoroTTS();\n * await tts.load({\n * onProgress: (p) => console.log(p.status, p.progress),\n * device: \"webgpu\",\n * });\n * ```\n */\n async load(options: LoadTTSOptions = {}): Promise<void> {\n if (this._isLoaded) {\n return;\n }\n\n // Prevent duplicate loads\n if (this.loadPromise) {\n return this.loadPromise;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadTTSOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });\n\n try {\n // Dynamically import kokoro-js\n // tsdown handles resolution: Node.js = external, Browser = bundled\n const kokoroModule = await import(\"kokoro-js\");\n const { KokoroTTS: KokoroJS } = kokoroModule;\n\n // Determine device/dtype\n const isBrowser = typeof window !== \"undefined\";\n let dtype: \"fp32\" | \"fp16\" | \"q8\" | \"q4\" | \"q4f16\" = \"fp32\";\n\n if (device === \"webgpu\" || (device === \"auto\" && isBrowser && \"gpu\" in navigator)) {\n dtype = \"fp16\";\n this._deviceMode = \"webgpu\";\n } else {\n dtype = \"fp32\";\n this._deviceMode = \"cpu\";\n }\n\n onProgress?.({ status: `Loading model with ${dtype} precision...` });\n\n // Load the model using kokoro-js\n // kokoro-js handles:\n // - Model loading with proper quantization\n // - Phoneme tokenization (G2P) via phonemizer\n // - Voice embeddings\n this.kokoroInstance = (await KokoroJS.from_pretrained(this.modelConfig.repo, {\n dtype,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n } else if (progress.status === \"ready\") {\n onProgress?.({ status: \"Model ready\" });\n }\n },\n })) as unknown as KokoroJSInstance;\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${this._deviceMode.toUpperCase()})!` });\n } catch (error) {\n this.loadPromise = null;\n throw error;\n }\n }\n\n /**\n * Ensure model is loaded (lazy loading)\n */\n async ensureLoaded(options?: LoadTTSOptions): Promise<void> {\n if (!this._isLoaded) {\n await this.load(options);\n }\n }\n\n // ============================================\n // Voice Management\n // ============================================\n\n /**\n * Get list of available voices\n *\n * @example\n * ```ts\n * const voices = tts.listVoices();\n * // [{ id: \"af_heart\", name: \"Heart\", gender: \"female\", ... }, ...]\n * ```\n */\n listVoices(): VoiceInfo[] {\n return [...this.modelConfig.voices];\n }\n\n /**\n * Get a specific voice by ID\n */\n getVoice(voiceId: string): VoiceInfo | null {\n return this.modelConfig.voices.find((v) => v.id === voiceId) || null;\n }\n\n /**\n * Get voices by gender\n */\n getVoicesByGender(gender: \"male\" | \"female\"): VoiceInfo[] {\n return this.modelConfig.voices.filter((v) => v.gender === gender);\n }\n\n /**\n * Get voices by language\n */\n getVoicesByLanguage(language: string): VoiceInfo[] {\n return this.modelConfig.voices.filter(\n (v) => v.language === language || v.language.startsWith(language),\n );\n }\n\n // ============================================\n // Speech Generation\n // ============================================\n\n /**\n * Generate speech from text\n *\n * @example\n * ```ts\n * const result = await tts.speak(\"Hello world\", {\n * voice: \"af_heart\",\n * speed: 1.0,\n * });\n *\n * // Play in browser\n * const audioContext = new AudioContext();\n * const buffer = audioContext.createBuffer(1, result.audio.length, result.sampleRate);\n * buffer.copyToChannel(result.audio, 0);\n * const source = audioContext.createBufferSource();\n * source.buffer = buffer;\n * source.connect(audioContext.destination);\n * source.start();\n * ```\n */\n async speak(text: string, options: SpeakOptions = {}): Promise<SpeakResult> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n // Validate voice exists in our registry\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.kokoroInstance) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Generate audio using kokoro-js\n const result = await this.kokoroInstance.generate(text, {\n voice,\n speed,\n });\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: result.audio,\n sampleRate: result.sampling_rate,\n duration: result.audio.length / result.sampling_rate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Stream speech generation (yields audio chunks as they're generated)\n *\n * @example\n * ```ts\n * for await (const chunk of tts.speakStream(\"Long text...\")) {\n * // chunk.samples = Float32Array\n * // chunk.sampleRate = 24000\n * // chunk.isFinal = boolean\n * playChunk(chunk);\n * }\n * ```\n */\n async *speakStream(\n text: string,\n options: SpeakOptions = {},\n ): AsyncGenerator<AudioChunk, SpeakResult, unknown> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n // Validate voice\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.kokoroInstance) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Split text into sentences for streaming\n const sentences = this.splitIntoSentences(text);\n const allAudio: Float32Array[] = [];\n let chunkIndex = 0;\n let sampleRate = this.modelConfig.sampleRate;\n\n for (let i = 0; i < sentences.length; i++) {\n const sentence = sentences[i];\n if (!sentence.trim()) {\n continue;\n }\n\n const result = await this.kokoroInstance.generate(sentence, {\n voice,\n speed,\n });\n\n sampleRate = result.sampling_rate;\n allAudio.push(result.audio);\n\n const chunk: AudioChunk = {\n samples: result.audio,\n sampleRate: result.sampling_rate,\n index: chunkIndex++,\n isFinal: i === sentences.length - 1,\n };\n\n yield chunk;\n options.onAudioChunk?.(chunk);\n }\n\n // Concatenate all audio\n const totalLength = allAudio.reduce((sum, arr) => sum + arr.length, 0);\n const fullAudio = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of allAudio) {\n fullAudio.set(chunk, offset);\n offset += chunk.length;\n }\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: fullAudio,\n sampleRate,\n duration: fullAudio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Split text into sentences for streaming\n */\n private splitIntoSentences(text: string): string[] {\n // Split on sentence boundaries while preserving the delimiters\n return text.split(SENTENCE_SPLIT_REGEX).filter((s) => s.trim());\n }\n\n // ============================================\n // Status & Info\n // ============================================\n\n /**\n * Check if model is loaded\n */\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n /**\n * Get current device mode\n */\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n /**\n * Get model configuration\n */\n getModelInfo(): TTSModelConfig {\n return { ...this.modelConfig };\n }\n\n /**\n * Get sample rate\n */\n getSampleRate(): number {\n return this.modelConfig.sampleRate;\n }\n\n // ============================================\n // Cleanup\n // ============================================\n\n /**\n * Dispose of resources\n */\n async dispose(): Promise<void> {\n // kokoro-js doesn't expose a dispose method currently\n // but we clear our reference\n this.kokoroInstance = null;\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n\n// ============================================\n// Supertonic TTS Class (uses transformers.js)\n// ============================================\n\n/**\n * Supertonic TTS - Fast on-device text-to-speech\n *\n * Uses transformers.js with the Supertonic-TTS-ONNX model.\n * Generates speech at 167x realtime with 66M parameters.\n * Outputs at 44100 Hz sample rate.\n */\nexport class SupertonicTTS {\n private pipeline: any = null;\n private modelConfig: TTSModelConfig;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n private voiceEmbeddings: Map<string, Float32Array> = new Map();\n\n constructor(modelId = \"supertonic-66m\") {\n const config = getTTSModelConfig(modelId);\n if (!config) {\n throw new Error(\n `Unknown TTS model: ${modelId}. Available: ${Object.keys(TTS_MODELS).join(\", \")}`,\n );\n }\n this.modelConfig = config;\n }\n\n /**\n * Load the TTS model\n */\n async load(options: LoadTTSOptions = {}): Promise<void> {\n if (this._isLoaded) {\n return;\n }\n\n if (this.loadPromise) {\n return this.loadPromise;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadTTSOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: `Loading TTS model (${this.modelConfig.id})...` });\n\n try {\n // Determine device\n const isBrowser = typeof window !== \"undefined\";\n\n // Dynamically import transformers.js\n // tsdown handles resolution: Node.js = external, Browser = bundled\n const { pipeline } = await import(\"@huggingface/transformers\");\n if (device === \"webgpu\" || (device === \"auto\" && isBrowser && \"gpu\" in navigator)) {\n this._deviceMode = \"webgpu\";\n } else {\n this._deviceMode = \"cpu\";\n }\n\n onProgress?.({ status: `Loading Supertonic model...` });\n\n // Create TTS pipeline\n this.pipeline = await pipeline(\"text-to-speech\", this.modelConfig.repo, {\n dtype: \"fp32\", // Supertonic works best with fp32\n device: this._deviceMode,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n }\n },\n });\n\n // Load voice embeddings\n onProgress?.({ status: \"Loading voice embeddings...\" });\n await this.loadVoiceEmbeddings();\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${this._deviceMode.toUpperCase()})!` });\n } catch (error) {\n this.loadPromise = null;\n throw error;\n }\n }\n\n /**\n * Load speaker embeddings for all voices\n * Supertonic uses 101x128 = 12,928 floats per voice\n */\n private async loadVoiceEmbeddings(): Promise<void> {\n // In browser, we'd fetch from HuggingFace Hub\n // In Node.js, we'd load from cache\n // For now, we'll lazy-load embeddings when needed\n // The pipeline handles this internally when we pass speaker_embeddings\n }\n\n async ensureLoaded(options?: LoadTTSOptions): Promise<void> {\n if (!this._isLoaded) {\n await this.load(options);\n }\n }\n\n listVoices(): VoiceInfo[] {\n return [...this.modelConfig.voices];\n }\n\n getVoice(voiceId: string): VoiceInfo | null {\n return this.modelConfig.voices.find((v) => v.id === voiceId) || null;\n }\n\n getVoicesByGender(gender: \"male\" | \"female\"): VoiceInfo[] {\n return this.modelConfig.voices.filter((v) => v.gender === gender);\n }\n\n /**\n * Generate speech from text\n */\n async speak(text: string, options: SpeakOptions = {}): Promise<SpeakResult> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice } = options;\n\n // Validate voice\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n if (!this.pipeline) {\n throw new Error(\"Model not loaded\");\n }\n\n const startTime = performance.now();\n\n // Get or create speaker embedding\n // Supertonic expects [101, 128] = 12,928 floats\n let speakerEmbedding = this.voiceEmbeddings.get(voice);\n if (!speakerEmbedding) {\n // Load from HuggingFace Hub via fetch\n try {\n const voiceUrl = `https://huggingface.co/${this.modelConfig.repo}/resolve/main/voices/${voice}.bin`;\n const response = await fetch(voiceUrl);\n if (response.ok) {\n const buffer = await response.arrayBuffer();\n speakerEmbedding = new Float32Array(buffer);\n this.voiceEmbeddings.set(voice, speakerEmbedding);\n } else {\n throw new Error(`Failed to load voice: ${response.status}`);\n }\n } catch {\n // Fallback: create neutral embedding (not ideal but works)\n speakerEmbedding = new Float32Array(101 * 128).fill(0.1);\n this.voiceEmbeddings.set(voice, speakerEmbedding);\n }\n }\n\n // Generate audio\n const result = await this.pipeline(text, {\n speaker_embeddings: speakerEmbedding,\n });\n\n const totalTime = performance.now() - startTime;\n const audio = result.audio as Float32Array;\n const sampleRate = result.sampling_rate as number;\n\n return {\n audio,\n sampleRate,\n duration: audio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n /**\n * Stream speech generation\n */\n async *speakStream(\n text: string,\n options: SpeakOptions = {},\n ): AsyncGenerator<AudioChunk, SpeakResult, unknown> {\n await this.ensureLoaded({ onProgress: options.onProgress });\n\n const { voice = this.modelConfig.defaultVoice, speed = 1.0 } = options;\n\n const voiceInfo = this.getVoice(voice);\n if (!voiceInfo) {\n throw new Error(`Unknown voice: ${voice}. Use listVoices() to see available options.`);\n }\n\n const startTime = performance.now();\n\n // Split text into sentences for streaming\n const sentences = text.split(SENTENCE_SPLIT_REGEX).filter((s) => s.trim());\n const allAudio: Float32Array[] = [];\n let chunkIndex = 0;\n let sampleRate = this.modelConfig.sampleRate;\n\n for (let i = 0; i < sentences.length; i++) {\n const sentence = sentences[i];\n if (!sentence.trim()) continue;\n\n const result = await this.speak(sentence, { voice, speed });\n sampleRate = result.sampleRate;\n allAudio.push(result.audio);\n\n const chunk: AudioChunk = {\n samples: result.audio,\n sampleRate: result.sampleRate,\n index: chunkIndex++,\n isFinal: i === sentences.length - 1,\n };\n\n yield chunk;\n options.onAudioChunk?.(chunk);\n }\n\n // Concatenate all audio\n const totalLength = allAudio.reduce((sum, arr) => sum + arr.length, 0);\n const fullAudio = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of allAudio) {\n fullAudio.set(chunk, offset);\n offset += chunk.length;\n }\n\n const totalTime = performance.now() - startTime;\n\n return {\n audio: fullAudio,\n sampleRate,\n duration: fullAudio.length / sampleRate,\n voice,\n totalTime,\n };\n }\n\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n getModelInfo(): TTSModelConfig {\n return { ...this.modelConfig };\n }\n\n getSampleRate(): number {\n return this.modelConfig.sampleRate;\n }\n\n async dispose(): Promise<void> {\n this.pipeline = null;\n this.voiceEmbeddings.clear();\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n\n// ============================================\n// Unified TTS Factory\n// ============================================\n\nexport type TTSBackend = KokoroTTS | SupertonicTTS;\n\n/**\n * Create a TTS instance based on model ID\n */\nexport function createTTS(modelId: string = \"kokoro-82m\"): TTSBackend {\n if (modelId.startsWith(\"supertonic\")) {\n return new SupertonicTTS(modelId);\n }\n return new KokoroTTS(modelId);\n}\n\nexport default KokoroTTS;\n"],"mappings":";AAoCA,MAAM,uBAAuB;;;;;;;;AAa7B,MAAaA,gBAA6B;CAExC;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CAED;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACF;;;;;AAUD,MAAaC,oBAAiC;CAC5C;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACD;EACE,IAAI;EACJ,MAAM;EACN,QAAQ;EACR,UAAU;EACV,aAAa;EACb,eAAe;EAChB;CACF;AAMD,MAAaC,aAA6C;CACxD,cAAc;EACZ,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,YAAY;EACZ,QAAQ;EACR,cAAc;EACd,WAAW,CAAC,SAAS,QAAQ;EAC9B;CACD,kBAAkB;EAChB,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,YAAY;EACZ,QAAQ;EACR,cAAc;EACd,WAAW,CAAC,KAAK;EAClB;CACF;;;;AAKD,SAAgB,kBAAkB,SAAwC;AACxE,QAAO,WAAW,YAAY;;;;;AAMhC,SAAgB,gBAAkC;AAChD,QAAO,OAAO,OAAO,WAAW;;;;;;;;AA+BlC,IAAa,YAAb,MAAuB;CACrB,AAAQ,iBAA0C;CAClD,AAAQ;CACR,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CAExC,YAAY,UAAU,cAAc;EAClC,MAAM,SAAS,kBAAkB,QAAQ;AACzC,MAAI,CAAC,OACH,OAAM,IAAI,MACR,sBAAsB,QAAQ,eAAe,OAAO,KAAK,WAAW,CAAC,KAAK,KAAK,GAChF;AAEH,OAAK,cAAc;;;;;;;;;;;;;;CAmBrB,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UACP;AAIF,MAAI,KAAK,YACP,QAAO,KAAK;AAGd,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,sBAAsB,KAAK,YAAY,GAAG,OAAO,CAAC;AAEzE,MAAI;GAIF,MAAM,EAAE,WAAW,aADE,MAAM,OAAO;GAIlC,MAAM,YAAY,OAAO,WAAW;GACpC,IAAIC,QAAiD;AAErD,OAAI,WAAW,YAAa,WAAW,UAAU,aAAa,SAAS,WAAY;AACjF,YAAQ;AACR,SAAK,cAAc;UACd;AACL,YAAQ;AACR,SAAK,cAAc;;AAGrB,gBAAa,EAAE,QAAQ,sBAAsB,MAAM,gBAAgB,CAAC;AAOpE,QAAK,iBAAkB,MAAM,SAAS,gBAAgB,KAAK,YAAY,MAAM;IAC3E;IACA,oBAAoB,aAAkB;AACpC,SAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;MACX,QAAQ,eAAe,SAAS;MAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;MAC5C,MAAM,SAAS;MAChB,CAAC;cACO,SAAS,WAAW,QAC7B,cAAa,EAAE,QAAQ,eAAe,CAAC;;IAG5C,CAAC;AAEF,QAAK,YAAY;AACjB,gBAAa,EAAE,QAAQ,UAAU,KAAK,YAAY,aAAa,CAAC,KAAK,CAAC;WAC/D,OAAO;AACd,QAAK,cAAc;AACnB,SAAM;;;;;;CAOV,MAAM,aAAa,SAAyC;AAC1D,MAAI,CAAC,KAAK,UACR,OAAM,KAAK,KAAK,QAAQ;;;;;;;;;;;CAiB5B,aAA0B;AACxB,SAAO,CAAC,GAAG,KAAK,YAAY,OAAO;;;;;CAMrC,SAAS,SAAmC;AAC1C,SAAO,KAAK,YAAY,OAAO,MAAM,MAAM,EAAE,OAAO,QAAQ,IAAI;;;;;CAMlE,kBAAkB,QAAwC;AACxD,SAAO,KAAK,YAAY,OAAO,QAAQ,MAAM,EAAE,WAAW,OAAO;;;;;CAMnE,oBAAoB,UAA+B;AACjD,SAAO,KAAK,YAAY,OAAO,QAC5B,MAAM,EAAE,aAAa,YAAY,EAAE,SAAS,WAAW,SAAS,CAClE;;;;;;;;;;;;;;;;;;;;;;CA2BH,MAAM,MAAM,MAAc,UAAwB,EAAE,EAAwB;AAC1E,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAI/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,eACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,SAAS,MAAM,KAAK,eAAe,SAAS,MAAM;GACtD;GACA;GACD,CAAC;EAEF,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO,OAAO;GACd,YAAY,OAAO;GACnB,UAAU,OAAO,MAAM,SAAS,OAAO;GACvC;GACA;GACD;;;;;;;;;;;;;;;CAgBH,OAAO,YACL,MACA,UAAwB,EAAE,EACwB;AAClD,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAI/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,eACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,YAAY,KAAK,mBAAmB,KAAK;EAC/C,MAAMC,WAA2B,EAAE;EACnC,IAAI,aAAa;EACjB,IAAI,aAAa,KAAK,YAAY;AAElC,OAAK,IAAI,IAAI,GAAG,IAAI,UAAU,QAAQ,KAAK;GACzC,MAAM,WAAW,UAAU;AAC3B,OAAI,CAAC,SAAS,MAAM,CAClB;GAGF,MAAM,SAAS,MAAM,KAAK,eAAe,SAAS,UAAU;IAC1D;IACA;IACD,CAAC;AAEF,gBAAa,OAAO;AACpB,YAAS,KAAK,OAAO,MAAM;GAE3B,MAAMC,QAAoB;IACxB,SAAS,OAAO;IAChB,YAAY,OAAO;IACnB,OAAO;IACP,SAAS,MAAM,UAAU,SAAS;IACnC;AAED,SAAM;AACN,WAAQ,eAAe,MAAM;;EAI/B,MAAM,cAAc,SAAS,QAAQ,KAAK,QAAQ,MAAM,IAAI,QAAQ,EAAE;EACtE,MAAM,YAAY,IAAI,aAAa,YAAY;EAC/C,IAAI,SAAS;AACb,OAAK,MAAM,SAAS,UAAU;AAC5B,aAAU,IAAI,OAAO,OAAO;AAC5B,aAAU,MAAM;;EAGlB,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO;GACP;GACA,UAAU,UAAU,SAAS;GAC7B;GACA;GACD;;;;;CAMH,AAAQ,mBAAmB,MAAwB;AAEjD,SAAO,KAAK,MAAM,qBAAqB,CAAC,QAAQ,MAAM,EAAE,MAAM,CAAC;;;;;CAUjE,WAAoB;AAClB,SAAO,KAAK;;;;;CAMd,gBAAkC;AAChC,SAAO,KAAK;;;;;CAMd,eAA+B;AAC7B,SAAO,EAAE,GAAG,KAAK,aAAa;;;;;CAMhC,gBAAwB;AACtB,SAAO,KAAK,YAAY;;;;;CAU1B,MAAM,UAAyB;AAG7B,OAAK,iBAAiB;AACtB,OAAK,YAAY;AACjB,OAAK,cAAc;;;;;;;;;;AAevB,IAAa,gBAAb,MAA2B;CACzB,AAAQ,WAAgB;CACxB,AAAQ;CACR,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CACxC,AAAQ,kCAA6C,IAAI,KAAK;CAE9D,YAAY,UAAU,kBAAkB;EACtC,MAAM,SAAS,kBAAkB,QAAQ;AACzC,MAAI,CAAC,OACH,OAAM,IAAI,MACR,sBAAsB,QAAQ,eAAe,OAAO,KAAK,WAAW,CAAC,KAAK,KAAK,GAChF;AAEH,OAAK,cAAc;;;;;CAMrB,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UACP;AAGF,MAAI,KAAK,YACP,QAAO,KAAK;AAGd,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,sBAAsB,KAAK,YAAY,GAAG,OAAO,CAAC;AAEzE,MAAI;GAEF,MAAM,YAAY,OAAO,WAAW;GAIpC,MAAM,EAAE,aAAa,MAAM,OAAO;AAClC,OAAI,WAAW,YAAa,WAAW,UAAU,aAAa,SAAS,UACrE,MAAK,cAAc;OAEnB,MAAK,cAAc;AAGrB,gBAAa,EAAE,QAAQ,+BAA+B,CAAC;AAGvD,QAAK,WAAW,MAAM,SAAS,kBAAkB,KAAK,YAAY,MAAM;IACtE,OAAO;IACP,QAAQ,KAAK;IACb,oBAAoB,aAAkB;AACpC,SAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;MACX,QAAQ,eAAe,SAAS;MAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;MAC5C,MAAM,SAAS;MAChB,CAAC;;IAGP,CAAC;AAGF,gBAAa,EAAE,QAAQ,+BAA+B,CAAC;AACvD,SAAM,KAAK,qBAAqB;AAEhC,QAAK,YAAY;AACjB,gBAAa,EAAE,QAAQ,UAAU,KAAK,YAAY,aAAa,CAAC,KAAK,CAAC;WAC/D,OAAO;AACd,QAAK,cAAc;AACnB,SAAM;;;;;;;CAQV,MAAc,sBAAqC;CAOnD,MAAM,aAAa,SAAyC;AAC1D,MAAI,CAAC,KAAK,UACR,OAAM,KAAK,KAAK,QAAQ;;CAI5B,aAA0B;AACxB,SAAO,CAAC,GAAG,KAAK,YAAY,OAAO;;CAGrC,SAAS,SAAmC;AAC1C,SAAO,KAAK,YAAY,OAAO,MAAM,MAAM,EAAE,OAAO,QAAQ,IAAI;;CAGlE,kBAAkB,QAAwC;AACxD,SAAO,KAAK,YAAY,OAAO,QAAQ,MAAM,EAAE,WAAW,OAAO;;;;;CAMnE,MAAM,MAAM,MAAc,UAAwB,EAAE,EAAwB;AAC1E,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,iBAAiB;AAIlD,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;AAGxF,MAAI,CAAC,KAAK,SACR,OAAM,IAAI,MAAM,mBAAmB;EAGrC,MAAM,YAAY,YAAY,KAAK;EAInC,IAAI,mBAAmB,KAAK,gBAAgB,IAAI,MAAM;AACtD,MAAI,CAAC,iBAEH,KAAI;GACF,MAAM,WAAW,0BAA0B,KAAK,YAAY,KAAK,uBAAuB,MAAM;GAC9F,MAAM,WAAW,MAAM,MAAM,SAAS;AACtC,OAAI,SAAS,IAAI;IACf,MAAM,SAAS,MAAM,SAAS,aAAa;AAC3C,uBAAmB,IAAI,aAAa,OAAO;AAC3C,SAAK,gBAAgB,IAAI,OAAO,iBAAiB;SAEjD,OAAM,IAAI,MAAM,yBAAyB,SAAS,SAAS;UAEvD;AAEN,sBAAmB,IAAI,aAAa,MAAU,CAAC,KAAK,GAAI;AACxD,QAAK,gBAAgB,IAAI,OAAO,iBAAiB;;EAKrD,MAAM,SAAS,MAAM,KAAK,SAAS,MAAM,EACvC,oBAAoB,kBACrB,CAAC;EAEF,MAAM,YAAY,YAAY,KAAK,GAAG;EACtC,MAAM,QAAQ,OAAO;EACrB,MAAM,aAAa,OAAO;AAE1B,SAAO;GACL;GACA;GACA,UAAU,MAAM,SAAS;GACzB;GACA;GACD;;;;;CAMH,OAAO,YACL,MACA,UAAwB,EAAE,EACwB;AAClD,QAAM,KAAK,aAAa,EAAE,YAAY,QAAQ,YAAY,CAAC;EAE3D,MAAM,EAAE,QAAQ,KAAK,YAAY,cAAc,QAAQ,MAAQ;AAG/D,MAAI,CADc,KAAK,SAAS,MAAM,CAEpC,OAAM,IAAI,MAAM,kBAAkB,MAAM,8CAA8C;EAGxF,MAAM,YAAY,YAAY,KAAK;EAGnC,MAAM,YAAY,KAAK,MAAM,qBAAqB,CAAC,QAAQ,MAAM,EAAE,MAAM,CAAC;EAC1E,MAAMD,WAA2B,EAAE;EACnC,IAAI,aAAa;EACjB,IAAI,aAAa,KAAK,YAAY;AAElC,OAAK,IAAI,IAAI,GAAG,IAAI,UAAU,QAAQ,KAAK;GACzC,MAAM,WAAW,UAAU;AAC3B,OAAI,CAAC,SAAS,MAAM,CAAE;GAEtB,MAAM,SAAS,MAAM,KAAK,MAAM,UAAU;IAAE;IAAO;IAAO,CAAC;AAC3D,gBAAa,OAAO;AACpB,YAAS,KAAK,OAAO,MAAM;GAE3B,MAAMC,QAAoB;IACxB,SAAS,OAAO;IAChB,YAAY,OAAO;IACnB,OAAO;IACP,SAAS,MAAM,UAAU,SAAS;IACnC;AAED,SAAM;AACN,WAAQ,eAAe,MAAM;;EAI/B,MAAM,cAAc,SAAS,QAAQ,KAAK,QAAQ,MAAM,IAAI,QAAQ,EAAE;EACtE,MAAM,YAAY,IAAI,aAAa,YAAY;EAC/C,IAAI,SAAS;AACb,OAAK,MAAM,SAAS,UAAU;AAC5B,aAAU,IAAI,OAAO,OAAO;AAC5B,aAAU,MAAM;;EAGlB,MAAM,YAAY,YAAY,KAAK,GAAG;AAEtC,SAAO;GACL,OAAO;GACP;GACA,UAAU,UAAU,SAAS;GAC7B;GACA;GACD;;CAGH,WAAoB;AAClB,SAAO,KAAK;;CAGd,gBAAkC;AAChC,SAAO,KAAK;;CAGd,eAA+B;AAC7B,SAAO,EAAE,GAAG,KAAK,aAAa;;CAGhC,gBAAwB;AACtB,SAAO,KAAK,YAAY;;CAG1B,MAAM,UAAyB;AAC7B,OAAK,WAAW;AAChB,OAAK,gBAAgB,OAAO;AAC5B,OAAK,YAAY;AACjB,OAAK,cAAc;;;;;;AAavB,SAAgB,UAAU,UAAkB,cAA0B;AACpE,KAAI,QAAQ,WAAW,aAAa,CAClC,QAAO,IAAI,cAAc,QAAQ;AAEnC,QAAO,IAAI,UAAU,QAAQ"}
|
|
@@ -1,3 +1,3 @@
|
|
|
1
|
-
import { a as TTS_MODELS, c as listTTSModels, i as SupertonicTTS, n as KokoroTTS, o as createTTS, r as SUPERTONIC_VOICES, s as getTTSModelConfig, t as KOKORO_VOICES } from "./tts-
|
|
1
|
+
import { a as TTS_MODELS, c as listTTSModels, i as SupertonicTTS, n as KokoroTTS, o as createTTS, r as SUPERTONIC_VOICES, s as getTTSModelConfig, t as KOKORO_VOICES } from "./tts-D5hrNcGD.mjs";
|
|
2
2
|
|
|
3
3
|
export { TTS_MODELS, createTTS };
|
package/package.json
CHANGED
package/dist/gerbil-CjnM4Pra.mjs
DELETED
package/dist/stt-BN46nKJd.js.map
DELETED
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"stt-BN46nKJd.js","names":["WHISPER_MODELS: STTModelConfig[]","transformers: any","tfDevice: \"webgpu\" | \"cpu\" | \"wasm\"","audioData: Float32Array","pipelineOptions: any","transcribeResult: TranscribeResult","audioBuffer: Float32Array[]","intervalId: ReturnType<typeof setInterval> | null","e: any"],"sources":["../src/core/stt.ts"],"sourcesContent":["/**\n * Speech-to-Text with Whisper\n *\n * Provides local speech recognition using Whisper ONNX models via transformers.js.\n * Supports multiple model sizes and languages.\n *\n * @example\n * ```ts\n * const stt = new WhisperSTT();\n * await stt.load({ onProgress: (p) => console.log(p.status) });\n *\n * // Transcribe audio (Float32Array at 16kHz)\n * const result = await stt.transcribe(audioData);\n * console.log(result.text);\n *\n * // With timestamps\n * const result = await stt.transcribe(audioData, { timestamps: true });\n * for (const seg of result.segments) {\n * console.log(`[${seg.start.toFixed(1)}s] ${seg.text}`);\n * }\n * ```\n */\n\nimport type {\n LoadSTTOptions,\n ProgressInfo,\n STTModelConfig,\n StreamingTranscriptionOptions,\n StreamingTranscriptionSession,\n TranscribeOptions,\n TranscribeResult,\n TranscribeSegment,\n} from \"./types.js\";\n\n// ============================================\n// Model Registry\n// ============================================\n\n/**\n * Available Whisper models\n * Ordered by size (smallest first)\n */\nexport const WHISPER_MODELS: STTModelConfig[] = [\n {\n id: \"whisper-tiny.en\",\n repo: \"onnx-community/whisper-tiny.en\",\n description: \"Tiny English-only model, fastest\",\n size: \"39M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-tiny\",\n repo: \"onnx-community/whisper-tiny\",\n description: \"Tiny multilingual model\",\n size: \"39M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-base.en\",\n repo: \"onnx-community/whisper-base.en\",\n description: \"Base English-only model, good balance\",\n size: \"74M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-base\",\n repo: \"onnx-community/whisper-base\",\n description: \"Base multilingual model\",\n size: \"74M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-small.en\",\n repo: \"onnx-community/whisper-small.en\",\n description: \"Small English-only model, high quality\",\n size: \"244M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-small\",\n repo: \"onnx-community/whisper-small\",\n description: \"Small multilingual model\",\n size: \"244M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-large-v3-turbo\",\n repo: \"onnx-community/whisper-large-v3-turbo\",\n description: \"Large Turbo model, 5.4x faster, 80+ languages\",\n size: \"809M\",\n multilingual: true,\n languages: [\n \"en\",\n \"es\",\n \"fr\",\n \"de\",\n \"it\",\n \"pt\",\n \"nl\",\n \"ru\",\n \"zh\",\n \"ja\",\n \"ko\",\n \"ar\",\n \"hi\",\n \"vi\",\n \"th\",\n ],\n sampleRate: 16000,\n },\n];\n\n// Default model\nconst DEFAULT_MODEL = \"whisper-tiny.en\";\n\n// ============================================\n// Audio Utilities\n// ============================================\n\n/**\n * Decode WAV file to Float32Array\n * Handles stereo to mono conversion\n */\nexport function decodeWav(buffer: Uint8Array): { audio: Float32Array; sampleRate: number } {\n const view = new DataView(buffer.buffer, buffer.byteOffset, buffer.byteLength);\n\n // Validate RIFF header\n const riff = String.fromCharCode(buffer[0], buffer[1], buffer[2], buffer[3]);\n if (riff !== \"RIFF\") {\n throw new Error(\"Invalid WAV file: missing RIFF header\");\n }\n\n // Get format details\n const numChannels = view.getUint16(22, true);\n const sampleRate = view.getUint32(24, true);\n const bitsPerSample = view.getUint16(34, true);\n\n if (bitsPerSample !== 16) {\n throw new Error(`Unsupported bit depth: ${bitsPerSample}. Only 16-bit WAV is supported.`);\n }\n\n // Find data chunk\n let dataOffset = 12;\n while (dataOffset < buffer.length - 8) {\n const chunkId = String.fromCharCode(\n buffer[dataOffset],\n buffer[dataOffset + 1],\n buffer[dataOffset + 2],\n buffer[dataOffset + 3],\n );\n const chunkSize = view.getUint32(dataOffset + 4, true);\n if (chunkId === \"data\") {\n dataOffset += 8;\n break;\n }\n dataOffset += 8 + chunkSize;\n }\n\n const dataSize = buffer.length - dataOffset;\n const bytesPerSample = bitsPerSample / 8;\n const totalSamples = Math.floor(dataSize / bytesPerSample);\n const samplesPerChannel = Math.floor(totalSamples / numChannels);\n\n // Convert to mono Float32Array\n const audio = new Float32Array(samplesPerChannel);\n\n for (let i = 0; i < samplesPerChannel; i++) {\n if (numChannels === 2) {\n const left = view.getInt16(dataOffset + i * 4, true);\n const right = view.getInt16(dataOffset + i * 4 + 2, true);\n audio[i] = (left + right) / 2 / 32768;\n } else {\n const sample = view.getInt16(dataOffset + i * 2, true);\n audio[i] = sample / 32768;\n }\n }\n\n return { audio, sampleRate };\n}\n\n/**\n * Resample audio to target sample rate using linear interpolation\n */\nexport function resampleAudio(audio: Float32Array, fromRate: number, toRate: number): Float32Array {\n if (fromRate === toRate) return audio;\n\n const ratio = toRate / fromRate;\n const newLength = Math.round(audio.length * ratio);\n const result = new Float32Array(newLength);\n\n for (let i = 0; i < newLength; i++) {\n const srcIndex = i / ratio;\n const floor = Math.floor(srcIndex);\n const ceil = Math.min(floor + 1, audio.length - 1);\n const t = srcIndex - floor;\n result[i] = audio[floor] * (1 - t) + audio[ceil] * t;\n }\n\n return result;\n}\n\n// ============================================\n// WhisperSTT Class\n// ============================================\n\n/**\n * Speech-to-Text using Whisper ONNX models\n */\nexport class WhisperSTT {\n private modelConfig: STTModelConfig;\n private pipeline: any = null;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n\n constructor(modelId: string = DEFAULT_MODEL) {\n const config = WHISPER_MODELS.find((m) => m.id === modelId);\n if (!config) {\n const available = WHISPER_MODELS.map((m) => m.id).join(\", \");\n throw new Error(`Unknown STT model: ${modelId}. Available: ${available}`);\n }\n this.modelConfig = config;\n }\n\n /**\n * Check if model is loaded\n */\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n /**\n * Get model configuration\n */\n getModelConfig(): STTModelConfig {\n return this.modelConfig;\n }\n\n /**\n * Get model info (alias for getModelConfig)\n */\n getModelInfo(): STTModelConfig {\n return this.modelConfig;\n }\n\n /**\n * Get current device mode\n */\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n /**\n * List available models\n */\n static listModels(): STTModelConfig[] {\n return [...WHISPER_MODELS];\n }\n\n /**\n * Load the STT model\n */\n async load(options: LoadSTTOptions = {}): Promise<void> {\n if (this._isLoaded) return;\n if (this.loadPromise) {\n await this.loadPromise;\n return;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadSTTOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: \"Loading transformers.js...\" });\n\n // Check if we're in Node.js or browser\n const isNode = typeof process !== \"undefined\" && process.versions?.node;\n\n // Import transformers.js dynamically\n // Both paths use webpackIgnore to prevent bundler static analysis\n // Node.js: uses npm package, Browser: uses CDN\n let transformers: any;\n if (isNode) {\n transformers = await import(/* webpackIgnore: true */ \"@huggingface/transformers\");\n } else {\n const cdnUrl = \"https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.8.1\";\n transformers = await import(/* webpackIgnore: true */ cdnUrl);\n }\n const { pipeline, env } = transformers;\n\n // Configure environment based on runtime\n if (isNode) {\n // Node.js: allow local models (for CLI/server use)\n env.allowLocalModels = true;\n env.allowRemoteModels = true;\n } else {\n // Browser: use IndexedDB cache, fetch from HuggingFace CDN\n env.useBrowserCache = true;\n env.allowLocalModels = false;\n }\n\n // Determine device\n // Note: Whisper ONNX models work best with fp32 on CPU/WASM\n // WebGPU support for ASR is limited, so we use CPU for reliability\n let tfDevice: \"webgpu\" | \"cpu\" | \"wasm\" = \"cpu\";\n\n // In browser, use WASM for better compatibility\n if (!isNode) {\n tfDevice = \"wasm\";\n }\n\n // Store device mode\n this._deviceMode = \"cpu\"; // STT always reports as CPU since WASM is CPU-based\n\n onProgress?.({ status: `Loading ${this.modelConfig.id}...` });\n\n // Load the ASR pipeline\n // Always use fp32 for Whisper models (fp16 not available for ONNX ASR)\n this.pipeline = await pipeline(\"automatic-speech-recognition\", this.modelConfig.repo, {\n dtype: \"fp32\",\n device: tfDevice,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n }\n },\n });\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${tfDevice.toUpperCase()})!` });\n }\n\n /**\n * Transcribe audio to text\n *\n * @param audio - Audio data as Float32Array (mono, 16kHz preferred) or Uint8Array (WAV file)\n * @param options - Transcription options\n * @returns Transcription result with text and optional timestamps\n */\n async transcribe(\n audio: Float32Array | Uint8Array,\n options: TranscribeOptions = {},\n ): Promise<TranscribeResult> {\n if (!this._isLoaded) {\n throw new Error(\"STT model not loaded. Call load() first.\");\n }\n\n const { language, timestamps = false, onProgress } = options;\n const startTime = performance.now();\n\n // Convert Uint8Array (WAV) to Float32Array\n let audioData: Float32Array;\n let inputSampleRate = 16000;\n\n if (audio instanceof Uint8Array) {\n onProgress?.({ status: \"Decoding audio...\" });\n const decoded = decodeWav(audio);\n audioData = decoded.audio;\n inputSampleRate = decoded.sampleRate;\n } else {\n audioData = audio;\n }\n\n // Resample to 16kHz if needed\n if (inputSampleRate !== 16000) {\n onProgress?.({ status: \"Resampling to 16kHz...\" });\n audioData = resampleAudio(audioData, inputSampleRate, 16000);\n }\n\n const audioDuration = audioData.length / 16000;\n onProgress?.({ status: `Transcribing ${audioDuration.toFixed(1)}s of audio...` });\n\n // Build pipeline options\n const pipelineOptions: any = {};\n\n // Only set language for multilingual models\n if (language && this.modelConfig.multilingual) {\n pipelineOptions.language = language;\n pipelineOptions.task = \"transcribe\";\n }\n\n // Enable timestamps if requested\n if (timestamps) {\n pipelineOptions.return_timestamps = true;\n }\n\n // Run transcription\n const result = await this.pipeline(audioData, pipelineOptions);\n\n const totalTime = performance.now() - startTime;\n\n // Build result\n let text = result.text?.trim() || \"\";\n\n // Filter out Whisper artifacts\n if (text === \"[BLANK_AUDIO]\" || text === \"(blank audio)\" || text === \"[BLANK AUDIO]\") {\n text = \"\";\n }\n\n const transcribeResult: TranscribeResult = {\n text,\n language: language || (this.modelConfig.multilingual ? \"auto\" : \"en\"),\n duration: audioDuration,\n totalTime,\n };\n\n // Add segments if timestamps were requested\n if (timestamps && result.chunks) {\n transcribeResult.segments = result.chunks.map(\n (chunk: any): TranscribeSegment => ({\n text: chunk.text?.trim() || \"\",\n start: chunk.timestamp?.[0] || 0,\n end: chunk.timestamp?.[1] || 0,\n }),\n );\n }\n\n onProgress?.({ status: \"Done!\" });\n\n return transcribeResult;\n }\n\n /**\n * Create a streaming transcription session\n *\n * Transcribes audio in real-time by processing chunks at regular intervals.\n * Perfect for live captioning, call transcription, or real-time subtitles.\n *\n * @param options - Streaming options\n * @returns Streaming session controller\n *\n * @example\n * ```ts\n * const session = stt.createStreamingSession({\n * chunkDuration: 3000, // Transcribe every 3 seconds\n * onChunk: (text, idx) => console.log(`Chunk ${idx}: ${text}`),\n * onTranscript: (fullText) => console.log(\"Full:\", fullText),\n * });\n *\n * // Feed audio data as it comes in (Float32Array at 16kHz)\n * session.feedAudio(audioChunk);\n *\n * // Or manually trigger transcription\n * await session.flush();\n *\n * // Stop and get final transcript\n * const finalText = await session.stop();\n * ```\n */\n createStreamingSession(\n options: StreamingTranscriptionOptions = {},\n ): StreamingTranscriptionSession {\n const {\n chunkDuration = 3000,\n minChunkSize = 8000, // ~0.5 seconds at 16kHz\n onChunk,\n onTranscript,\n onError,\n language,\n } = options;\n\n let audioBuffer: Float32Array[] = [];\n let fullTranscript = \"\";\n let chunkIndex = 0;\n let intervalId: ReturnType<typeof setInterval> | null = null;\n let isRunning = false;\n\n const getBufferSize = (): number => {\n return audioBuffer.reduce((sum, chunk) => sum + chunk.length, 0);\n };\n\n const mergeBuffer = (): Float32Array => {\n const totalLength = getBufferSize();\n const merged = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of audioBuffer) {\n merged.set(chunk, offset);\n offset += chunk.length;\n }\n return merged;\n };\n\n const transcribeBuffer = async (): Promise<string> => {\n if (!this._isLoaded || getBufferSize() < minChunkSize) {\n return \"\";\n }\n\n const audio = mergeBuffer();\n audioBuffer = []; // Clear buffer\n\n try {\n const result = await this.transcribe(audio, { language });\n const text = result.text.trim();\n\n if (text) {\n chunkIndex++;\n onChunk?.(text, chunkIndex);\n\n // Append to full transcript\n fullTranscript = fullTranscript + (fullTranscript ? \" \" : \"\") + text;\n onTranscript?.(fullTranscript);\n }\n\n return text;\n } catch (e: any) {\n onError?.(e.message || \"Transcription failed\");\n return \"\";\n }\n };\n\n let aborted = false;\n\n const session: StreamingTranscriptionSession = {\n feedAudio: (audio: Float32Array) => {\n if (!aborted) {\n audioBuffer.push(audio);\n }\n },\n\n flush: async () => {\n if (aborted) return \"\";\n return transcribeBuffer();\n },\n\n start: () => {\n if (isRunning || aborted) return;\n isRunning = true;\n\n intervalId = setInterval(async () => {\n if (isRunning && !aborted) {\n await transcribeBuffer();\n }\n }, chunkDuration);\n },\n\n stop: async () => {\n isRunning = false;\n\n if (intervalId) {\n clearInterval(intervalId);\n intervalId = null;\n }\n\n // Transcribe any remaining audio (unless aborted)\n if (!aborted && getBufferSize() >= minChunkSize) {\n await transcribeBuffer();\n }\n\n return fullTranscript;\n },\n\n abort: () => {\n // Immediately stop without final transcription\n aborted = true;\n isRunning = false;\n\n if (intervalId) {\n clearInterval(intervalId);\n intervalId = null;\n }\n\n audioBuffer = [];\n },\n\n isRunning: () => isRunning,\n\n getTranscript: () => fullTranscript,\n\n getChunkCount: () => chunkIndex,\n\n reset: () => {\n audioBuffer = [];\n fullTranscript = \"\";\n chunkIndex = 0;\n },\n };\n\n return session;\n }\n\n /**\n * Dispose of resources\n */\n dispose(): void {\n this.pipeline = null;\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n"],"mappings":";;;;;AA0CA,MAAaA,iBAAmC;CAC9C;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GACT;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACD;EACD,YAAY;EACb;CACF;AAGD,MAAM,gBAAgB;;;;;AAUtB,SAAgB,UAAU,QAAiE;CACzF,MAAM,OAAO,IAAI,SAAS,OAAO,QAAQ,OAAO,YAAY,OAAO,WAAW;AAI9E,KADa,OAAO,aAAa,OAAO,IAAI,OAAO,IAAI,OAAO,IAAI,OAAO,GAAG,KAC/D,OACX,OAAM,IAAI,MAAM,wCAAwC;CAI1D,MAAM,cAAc,KAAK,UAAU,IAAI,KAAK;CAC5C,MAAM,aAAa,KAAK,UAAU,IAAI,KAAK;CAC3C,MAAM,gBAAgB,KAAK,UAAU,IAAI,KAAK;AAE9C,KAAI,kBAAkB,GACpB,OAAM,IAAI,MAAM,0BAA0B,cAAc,iCAAiC;CAI3F,IAAI,aAAa;AACjB,QAAO,aAAa,OAAO,SAAS,GAAG;EACrC,MAAM,UAAU,OAAO,aACrB,OAAO,aACP,OAAO,aAAa,IACpB,OAAO,aAAa,IACpB,OAAO,aAAa,GACrB;EACD,MAAM,YAAY,KAAK,UAAU,aAAa,GAAG,KAAK;AACtD,MAAI,YAAY,QAAQ;AACtB,iBAAc;AACd;;AAEF,gBAAc,IAAI;;CAGpB,MAAM,WAAW,OAAO,SAAS;CACjC,MAAM,iBAAiB,gBAAgB;CACvC,MAAM,eAAe,KAAK,MAAM,WAAW,eAAe;CAC1D,MAAM,oBAAoB,KAAK,MAAM,eAAe,YAAY;CAGhE,MAAM,QAAQ,IAAI,aAAa,kBAAkB;AAEjD,MAAK,IAAI,IAAI,GAAG,IAAI,mBAAmB,IACrC,KAAI,gBAAgB,EAGlB,OAAM,MAFO,KAAK,SAAS,aAAa,IAAI,GAAG,KAAK,GACtC,KAAK,SAAS,aAAa,IAAI,IAAI,GAAG,KAAK,IAC7B,IAAI;KAGhC,OAAM,KADS,KAAK,SAAS,aAAa,IAAI,GAAG,KAAK,GAClC;AAIxB,QAAO;EAAE;EAAO;EAAY;;;;;AAM9B,SAAgB,cAAc,OAAqB,UAAkB,QAA8B;AACjG,KAAI,aAAa,OAAQ,QAAO;CAEhC,MAAM,QAAQ,SAAS;CACvB,MAAM,YAAY,KAAK,MAAM,MAAM,SAAS,MAAM;CAClD,MAAM,SAAS,IAAI,aAAa,UAAU;AAE1C,MAAK,IAAI,IAAI,GAAG,IAAI,WAAW,KAAK;EAClC,MAAM,WAAW,IAAI;EACrB,MAAM,QAAQ,KAAK,MAAM,SAAS;EAClC,MAAM,OAAO,KAAK,IAAI,QAAQ,GAAG,MAAM,SAAS,EAAE;EAClD,MAAM,IAAI,WAAW;AACrB,SAAO,KAAK,MAAM,UAAU,IAAI,KAAK,MAAM,QAAQ;;AAGrD,QAAO;;;;;AAUT,IAAa,aAAb,MAAwB;CACtB,AAAQ;CACR,AAAQ,WAAgB;CACxB,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CAExC,YAAY,UAAkB,eAAe;EAC3C,MAAM,SAAS,eAAe,MAAM,MAAM,EAAE,OAAO,QAAQ;AAC3D,MAAI,CAAC,QAAQ;GACX,MAAM,YAAY,eAAe,KAAK,MAAM,EAAE,GAAG,CAAC,KAAK,KAAK;AAC5D,SAAM,IAAI,MAAM,sBAAsB,QAAQ,eAAe,YAAY;;AAE3E,OAAK,cAAc;;;;;CAMrB,WAAoB;AAClB,SAAO,KAAK;;;;;CAMd,iBAAiC;AAC/B,SAAO,KAAK;;;;;CAMd,eAA+B;AAC7B,SAAO,KAAK;;;;;CAMd,gBAAkC;AAChC,SAAO,KAAK;;;;;CAMd,OAAO,aAA+B;AACpC,SAAO,CAAC,GAAG,eAAe;;;;;CAM5B,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UAAW;AACpB,MAAI,KAAK,aAAa;AACpB,SAAM,KAAK;AACX;;AAGF,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,8BAA8B,CAAC;EAGtD,MAAM,SAAS,OAAO,YAAY,eAAe,QAAQ,UAAU;EAKnE,IAAIC;AACJ,MAAI,OACF,gBAAe,MAAM;;GAAiC;;MAGtD,gBAAe,MAAM,OADN;EAGjB,MAAM,EAAE,UAAU,QAAQ;AAG1B,MAAI,QAAQ;AAEV,OAAI,mBAAmB;AACvB,OAAI,oBAAoB;SACnB;AAEL,OAAI,kBAAkB;AACtB,OAAI,mBAAmB;;EAMzB,IAAIC,WAAsC;AAG1C,MAAI,CAAC,OACH,YAAW;AAIb,OAAK,cAAc;AAEnB,eAAa,EAAE,QAAQ,WAAW,KAAK,YAAY,GAAG,MAAM,CAAC;AAI7D,OAAK,WAAW,MAAM,SAAS,gCAAgC,KAAK,YAAY,MAAM;GACpF,OAAO;GACP,QAAQ;GACR,oBAAoB,aAAkB;AACpC,QAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;KACX,QAAQ,eAAe,SAAS;KAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;KAC5C,MAAM,SAAS;KAChB,CAAC;;GAGP,CAAC;AAEF,OAAK,YAAY;AACjB,eAAa,EAAE,QAAQ,UAAU,SAAS,aAAa,CAAC,KAAK,CAAC;;;;;;;;;CAUhE,MAAM,WACJ,OACA,UAA6B,EAAE,EACJ;AAC3B,MAAI,CAAC,KAAK,UACR,OAAM,IAAI,MAAM,2CAA2C;EAG7D,MAAM,EAAE,UAAU,aAAa,OAAO,eAAe;EACrD,MAAM,YAAY,YAAY,KAAK;EAGnC,IAAIC;EACJ,IAAI,kBAAkB;AAEtB,MAAI,iBAAiB,YAAY;AAC/B,gBAAa,EAAE,QAAQ,qBAAqB,CAAC;GAC7C,MAAM,UAAU,UAAU,MAAM;AAChC,eAAY,QAAQ;AACpB,qBAAkB,QAAQ;QAE1B,aAAY;AAId,MAAI,oBAAoB,MAAO;AAC7B,gBAAa,EAAE,QAAQ,0BAA0B,CAAC;AAClD,eAAY,cAAc,WAAW,iBAAiB,KAAM;;EAG9D,MAAM,gBAAgB,UAAU,SAAS;AACzC,eAAa,EAAE,QAAQ,gBAAgB,cAAc,QAAQ,EAAE,CAAC,gBAAgB,CAAC;EAGjF,MAAMC,kBAAuB,EAAE;AAG/B,MAAI,YAAY,KAAK,YAAY,cAAc;AAC7C,mBAAgB,WAAW;AAC3B,mBAAgB,OAAO;;AAIzB,MAAI,WACF,iBAAgB,oBAAoB;EAItC,MAAM,SAAS,MAAM,KAAK,SAAS,WAAW,gBAAgB;EAE9D,MAAM,YAAY,YAAY,KAAK,GAAG;EAGtC,IAAI,OAAO,OAAO,MAAM,MAAM,IAAI;AAGlC,MAAI,SAAS,mBAAmB,SAAS,mBAAmB,SAAS,gBACnE,QAAO;EAGT,MAAMC,mBAAqC;GACzC;GACA,UAAU,aAAa,KAAK,YAAY,eAAe,SAAS;GAChE,UAAU;GACV;GACD;AAGD,MAAI,cAAc,OAAO,OACvB,kBAAiB,WAAW,OAAO,OAAO,KACvC,WAAmC;GAClC,MAAM,MAAM,MAAM,MAAM,IAAI;GAC5B,OAAO,MAAM,YAAY,MAAM;GAC/B,KAAK,MAAM,YAAY,MAAM;GAC9B,EACF;AAGH,eAAa,EAAE,QAAQ,SAAS,CAAC;AAEjC,SAAO;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA8BT,uBACE,UAAyC,EAAE,EACZ;EAC/B,MAAM,EACJ,gBAAgB,KAChB,eAAe,KACf,SACA,cACA,SACA,aACE;EAEJ,IAAIC,cAA8B,EAAE;EACpC,IAAI,iBAAiB;EACrB,IAAI,aAAa;EACjB,IAAIC,aAAoD;EACxD,IAAI,YAAY;EAEhB,MAAM,sBAA8B;AAClC,UAAO,YAAY,QAAQ,KAAK,UAAU,MAAM,MAAM,QAAQ,EAAE;;EAGlE,MAAM,oBAAkC;GACtC,MAAM,cAAc,eAAe;GACnC,MAAM,SAAS,IAAI,aAAa,YAAY;GAC5C,IAAI,SAAS;AACb,QAAK,MAAM,SAAS,aAAa;AAC/B,WAAO,IAAI,OAAO,OAAO;AACzB,cAAU,MAAM;;AAElB,UAAO;;EAGT,MAAM,mBAAmB,YAA6B;AACpD,OAAI,CAAC,KAAK,aAAa,eAAe,GAAG,aACvC,QAAO;GAGT,MAAM,QAAQ,aAAa;AAC3B,iBAAc,EAAE;AAEhB,OAAI;IAEF,MAAM,QADS,MAAM,KAAK,WAAW,OAAO,EAAE,UAAU,CAAC,EACrC,KAAK,MAAM;AAE/B,QAAI,MAAM;AACR;AACA,eAAU,MAAM,WAAW;AAG3B,sBAAiB,kBAAkB,iBAAiB,MAAM,MAAM;AAChE,oBAAe,eAAe;;AAGhC,WAAO;YACAC,GAAQ;AACf,cAAU,EAAE,WAAW,uBAAuB;AAC9C,WAAO;;;EAIX,IAAI,UAAU;AAmEd,SAjE+C;GAC7C,YAAY,UAAwB;AAClC,QAAI,CAAC,QACH,aAAY,KAAK,MAAM;;GAI3B,OAAO,YAAY;AACjB,QAAI,QAAS,QAAO;AACpB,WAAO,kBAAkB;;GAG3B,aAAa;AACX,QAAI,aAAa,QAAS;AAC1B,gBAAY;AAEZ,iBAAa,YAAY,YAAY;AACnC,SAAI,aAAa,CAAC,QAChB,OAAM,kBAAkB;OAEzB,cAAc;;GAGnB,MAAM,YAAY;AAChB,gBAAY;AAEZ,QAAI,YAAY;AACd,mBAAc,WAAW;AACzB,kBAAa;;AAIf,QAAI,CAAC,WAAW,eAAe,IAAI,aACjC,OAAM,kBAAkB;AAG1B,WAAO;;GAGT,aAAa;AAEX,cAAU;AACV,gBAAY;AAEZ,QAAI,YAAY;AACd,mBAAc,WAAW;AACzB,kBAAa;;AAGf,kBAAc,EAAE;;GAGlB,iBAAiB;GAEjB,qBAAqB;GAErB,qBAAqB;GAErB,aAAa;AACX,kBAAc,EAAE;AAChB,qBAAiB;AACjB,iBAAa;;GAEhB;;;;;CAQH,UAAgB;AACd,OAAK,WAAW;AAChB,OAAK,YAAY;AACjB,OAAK,cAAc"}
|
package/dist/stt-BT4Rt49f.mjs
DELETED
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"stt-CkfJswka.mjs","names":["WHISPER_MODELS: STTModelConfig[]","transformers: any","tfDevice: \"webgpu\" | \"cpu\" | \"wasm\"","audioData: Float32Array","pipelineOptions: any","transcribeResult: TranscribeResult","audioBuffer: Float32Array[]","intervalId: ReturnType<typeof setInterval> | null","e: any"],"sources":["../src/core/stt.ts"],"sourcesContent":["/**\n * Speech-to-Text with Whisper\n *\n * Provides local speech recognition using Whisper ONNX models via transformers.js.\n * Supports multiple model sizes and languages.\n *\n * @example\n * ```ts\n * const stt = new WhisperSTT();\n * await stt.load({ onProgress: (p) => console.log(p.status) });\n *\n * // Transcribe audio (Float32Array at 16kHz)\n * const result = await stt.transcribe(audioData);\n * console.log(result.text);\n *\n * // With timestamps\n * const result = await stt.transcribe(audioData, { timestamps: true });\n * for (const seg of result.segments) {\n * console.log(`[${seg.start.toFixed(1)}s] ${seg.text}`);\n * }\n * ```\n */\n\nimport type {\n LoadSTTOptions,\n ProgressInfo,\n STTModelConfig,\n StreamingTranscriptionOptions,\n StreamingTranscriptionSession,\n TranscribeOptions,\n TranscribeResult,\n TranscribeSegment,\n} from \"./types.js\";\n\n// ============================================\n// Model Registry\n// ============================================\n\n/**\n * Available Whisper models\n * Ordered by size (smallest first)\n */\nexport const WHISPER_MODELS: STTModelConfig[] = [\n {\n id: \"whisper-tiny.en\",\n repo: \"onnx-community/whisper-tiny.en\",\n description: \"Tiny English-only model, fastest\",\n size: \"39M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-tiny\",\n repo: \"onnx-community/whisper-tiny\",\n description: \"Tiny multilingual model\",\n size: \"39M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-base.en\",\n repo: \"onnx-community/whisper-base.en\",\n description: \"Base English-only model, good balance\",\n size: \"74M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-base\",\n repo: \"onnx-community/whisper-base\",\n description: \"Base multilingual model\",\n size: \"74M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-small.en\",\n repo: \"onnx-community/whisper-small.en\",\n description: \"Small English-only model, high quality\",\n size: \"244M\",\n multilingual: false,\n languages: [\"en\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-small\",\n repo: \"onnx-community/whisper-small\",\n description: \"Small multilingual model\",\n size: \"244M\",\n multilingual: true,\n languages: [\"en\", \"es\", \"fr\", \"de\", \"it\", \"pt\", \"nl\", \"ru\", \"zh\", \"ja\", \"ko\"],\n sampleRate: 16000,\n },\n {\n id: \"whisper-large-v3-turbo\",\n repo: \"onnx-community/whisper-large-v3-turbo\",\n description: \"Large Turbo model, 5.4x faster, 80+ languages\",\n size: \"809M\",\n multilingual: true,\n languages: [\n \"en\",\n \"es\",\n \"fr\",\n \"de\",\n \"it\",\n \"pt\",\n \"nl\",\n \"ru\",\n \"zh\",\n \"ja\",\n \"ko\",\n \"ar\",\n \"hi\",\n \"vi\",\n \"th\",\n ],\n sampleRate: 16000,\n },\n];\n\n// Default model\nconst DEFAULT_MODEL = \"whisper-tiny.en\";\n\n// ============================================\n// Audio Utilities\n// ============================================\n\n/**\n * Decode WAV file to Float32Array\n * Handles stereo to mono conversion\n */\nexport function decodeWav(buffer: Uint8Array): { audio: Float32Array; sampleRate: number } {\n const view = new DataView(buffer.buffer, buffer.byteOffset, buffer.byteLength);\n\n // Validate RIFF header\n const riff = String.fromCharCode(buffer[0], buffer[1], buffer[2], buffer[3]);\n if (riff !== \"RIFF\") {\n throw new Error(\"Invalid WAV file: missing RIFF header\");\n }\n\n // Get format details\n const numChannels = view.getUint16(22, true);\n const sampleRate = view.getUint32(24, true);\n const bitsPerSample = view.getUint16(34, true);\n\n if (bitsPerSample !== 16) {\n throw new Error(`Unsupported bit depth: ${bitsPerSample}. Only 16-bit WAV is supported.`);\n }\n\n // Find data chunk\n let dataOffset = 12;\n while (dataOffset < buffer.length - 8) {\n const chunkId = String.fromCharCode(\n buffer[dataOffset],\n buffer[dataOffset + 1],\n buffer[dataOffset + 2],\n buffer[dataOffset + 3],\n );\n const chunkSize = view.getUint32(dataOffset + 4, true);\n if (chunkId === \"data\") {\n dataOffset += 8;\n break;\n }\n dataOffset += 8 + chunkSize;\n }\n\n const dataSize = buffer.length - dataOffset;\n const bytesPerSample = bitsPerSample / 8;\n const totalSamples = Math.floor(dataSize / bytesPerSample);\n const samplesPerChannel = Math.floor(totalSamples / numChannels);\n\n // Convert to mono Float32Array\n const audio = new Float32Array(samplesPerChannel);\n\n for (let i = 0; i < samplesPerChannel; i++) {\n if (numChannels === 2) {\n const left = view.getInt16(dataOffset + i * 4, true);\n const right = view.getInt16(dataOffset + i * 4 + 2, true);\n audio[i] = (left + right) / 2 / 32768;\n } else {\n const sample = view.getInt16(dataOffset + i * 2, true);\n audio[i] = sample / 32768;\n }\n }\n\n return { audio, sampleRate };\n}\n\n/**\n * Resample audio to target sample rate using linear interpolation\n */\nexport function resampleAudio(audio: Float32Array, fromRate: number, toRate: number): Float32Array {\n if (fromRate === toRate) return audio;\n\n const ratio = toRate / fromRate;\n const newLength = Math.round(audio.length * ratio);\n const result = new Float32Array(newLength);\n\n for (let i = 0; i < newLength; i++) {\n const srcIndex = i / ratio;\n const floor = Math.floor(srcIndex);\n const ceil = Math.min(floor + 1, audio.length - 1);\n const t = srcIndex - floor;\n result[i] = audio[floor] * (1 - t) + audio[ceil] * t;\n }\n\n return result;\n}\n\n// ============================================\n// WhisperSTT Class\n// ============================================\n\n/**\n * Speech-to-Text using Whisper ONNX models\n */\nexport class WhisperSTT {\n private modelConfig: STTModelConfig;\n private pipeline: any = null;\n private loadPromise: Promise<void> | null = null;\n private _isLoaded = false;\n private _deviceMode: \"webgpu\" | \"cpu\" = \"cpu\";\n\n constructor(modelId: string = DEFAULT_MODEL) {\n const config = WHISPER_MODELS.find((m) => m.id === modelId);\n if (!config) {\n const available = WHISPER_MODELS.map((m) => m.id).join(\", \");\n throw new Error(`Unknown STT model: ${modelId}. Available: ${available}`);\n }\n this.modelConfig = config;\n }\n\n /**\n * Check if model is loaded\n */\n isLoaded(): boolean {\n return this._isLoaded;\n }\n\n /**\n * Get model configuration\n */\n getModelConfig(): STTModelConfig {\n return this.modelConfig;\n }\n\n /**\n * Get model info (alias for getModelConfig)\n */\n getModelInfo(): STTModelConfig {\n return this.modelConfig;\n }\n\n /**\n * Get current device mode\n */\n getDeviceMode(): \"webgpu\" | \"cpu\" {\n return this._deviceMode;\n }\n\n /**\n * List available models\n */\n static listModels(): STTModelConfig[] {\n return [...WHISPER_MODELS];\n }\n\n /**\n * Load the STT model\n */\n async load(options: LoadSTTOptions = {}): Promise<void> {\n if (this._isLoaded) return;\n if (this.loadPromise) {\n await this.loadPromise;\n return;\n }\n\n this.loadPromise = this._load(options);\n await this.loadPromise;\n }\n\n private async _load(options: LoadSTTOptions = {}): Promise<void> {\n const { onProgress, device = \"auto\" } = options;\n\n onProgress?.({ status: \"Loading transformers.js...\" });\n\n // Check if we're in Node.js or browser\n const isNode = typeof process !== \"undefined\" && process.versions?.node;\n\n // Import transformers.js dynamically\n // Both paths use webpackIgnore to prevent bundler static analysis\n // Node.js: uses npm package, Browser: uses CDN\n let transformers: any;\n if (isNode) {\n transformers = await import(/* webpackIgnore: true */ \"@huggingface/transformers\");\n } else {\n const cdnUrl = \"https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.8.1\";\n transformers = await import(/* webpackIgnore: true */ cdnUrl);\n }\n const { pipeline, env } = transformers;\n\n // Configure environment based on runtime\n if (isNode) {\n // Node.js: allow local models (for CLI/server use)\n env.allowLocalModels = true;\n env.allowRemoteModels = true;\n } else {\n // Browser: use IndexedDB cache, fetch from HuggingFace CDN\n env.useBrowserCache = true;\n env.allowLocalModels = false;\n }\n\n // Determine device\n // Note: Whisper ONNX models work best with fp32 on CPU/WASM\n // WebGPU support for ASR is limited, so we use CPU for reliability\n let tfDevice: \"webgpu\" | \"cpu\" | \"wasm\" = \"cpu\";\n\n // In browser, use WASM for better compatibility\n if (!isNode) {\n tfDevice = \"wasm\";\n }\n\n // Store device mode\n this._deviceMode = \"cpu\"; // STT always reports as CPU since WASM is CPU-based\n\n onProgress?.({ status: `Loading ${this.modelConfig.id}...` });\n\n // Load the ASR pipeline\n // Always use fp32 for Whisper models (fp16 not available for ONNX ASR)\n this.pipeline = await pipeline(\"automatic-speech-recognition\", this.modelConfig.repo, {\n dtype: \"fp32\",\n device: tfDevice,\n progress_callback: (progress: any) => {\n if (progress.status === \"progress\" && progress.file) {\n onProgress?.({\n status: `Downloading ${progress.file}`,\n progress: Math.round(progress.progress || 0),\n file: progress.file,\n });\n }\n },\n });\n\n this._isLoaded = true;\n onProgress?.({ status: `Ready (${tfDevice.toUpperCase()})!` });\n }\n\n /**\n * Transcribe audio to text\n *\n * @param audio - Audio data as Float32Array (mono, 16kHz preferred) or Uint8Array (WAV file)\n * @param options - Transcription options\n * @returns Transcription result with text and optional timestamps\n */\n async transcribe(\n audio: Float32Array | Uint8Array,\n options: TranscribeOptions = {},\n ): Promise<TranscribeResult> {\n if (!this._isLoaded) {\n throw new Error(\"STT model not loaded. Call load() first.\");\n }\n\n const { language, timestamps = false, onProgress } = options;\n const startTime = performance.now();\n\n // Convert Uint8Array (WAV) to Float32Array\n let audioData: Float32Array;\n let inputSampleRate = 16000;\n\n if (audio instanceof Uint8Array) {\n onProgress?.({ status: \"Decoding audio...\" });\n const decoded = decodeWav(audio);\n audioData = decoded.audio;\n inputSampleRate = decoded.sampleRate;\n } else {\n audioData = audio;\n }\n\n // Resample to 16kHz if needed\n if (inputSampleRate !== 16000) {\n onProgress?.({ status: \"Resampling to 16kHz...\" });\n audioData = resampleAudio(audioData, inputSampleRate, 16000);\n }\n\n const audioDuration = audioData.length / 16000;\n onProgress?.({ status: `Transcribing ${audioDuration.toFixed(1)}s of audio...` });\n\n // Build pipeline options\n const pipelineOptions: any = {};\n\n // Only set language for multilingual models\n if (language && this.modelConfig.multilingual) {\n pipelineOptions.language = language;\n pipelineOptions.task = \"transcribe\";\n }\n\n // Enable timestamps if requested\n if (timestamps) {\n pipelineOptions.return_timestamps = true;\n }\n\n // Run transcription\n const result = await this.pipeline(audioData, pipelineOptions);\n\n const totalTime = performance.now() - startTime;\n\n // Build result\n let text = result.text?.trim() || \"\";\n\n // Filter out Whisper artifacts\n if (text === \"[BLANK_AUDIO]\" || text === \"(blank audio)\" || text === \"[BLANK AUDIO]\") {\n text = \"\";\n }\n\n const transcribeResult: TranscribeResult = {\n text,\n language: language || (this.modelConfig.multilingual ? \"auto\" : \"en\"),\n duration: audioDuration,\n totalTime,\n };\n\n // Add segments if timestamps were requested\n if (timestamps && result.chunks) {\n transcribeResult.segments = result.chunks.map(\n (chunk: any): TranscribeSegment => ({\n text: chunk.text?.trim() || \"\",\n start: chunk.timestamp?.[0] || 0,\n end: chunk.timestamp?.[1] || 0,\n }),\n );\n }\n\n onProgress?.({ status: \"Done!\" });\n\n return transcribeResult;\n }\n\n /**\n * Create a streaming transcription session\n *\n * Transcribes audio in real-time by processing chunks at regular intervals.\n * Perfect for live captioning, call transcription, or real-time subtitles.\n *\n * @param options - Streaming options\n * @returns Streaming session controller\n *\n * @example\n * ```ts\n * const session = stt.createStreamingSession({\n * chunkDuration: 3000, // Transcribe every 3 seconds\n * onChunk: (text, idx) => console.log(`Chunk ${idx}: ${text}`),\n * onTranscript: (fullText) => console.log(\"Full:\", fullText),\n * });\n *\n * // Feed audio data as it comes in (Float32Array at 16kHz)\n * session.feedAudio(audioChunk);\n *\n * // Or manually trigger transcription\n * await session.flush();\n *\n * // Stop and get final transcript\n * const finalText = await session.stop();\n * ```\n */\n createStreamingSession(\n options: StreamingTranscriptionOptions = {},\n ): StreamingTranscriptionSession {\n const {\n chunkDuration = 3000,\n minChunkSize = 8000, // ~0.5 seconds at 16kHz\n onChunk,\n onTranscript,\n onError,\n language,\n } = options;\n\n let audioBuffer: Float32Array[] = [];\n let fullTranscript = \"\";\n let chunkIndex = 0;\n let intervalId: ReturnType<typeof setInterval> | null = null;\n let isRunning = false;\n\n const getBufferSize = (): number => {\n return audioBuffer.reduce((sum, chunk) => sum + chunk.length, 0);\n };\n\n const mergeBuffer = (): Float32Array => {\n const totalLength = getBufferSize();\n const merged = new Float32Array(totalLength);\n let offset = 0;\n for (const chunk of audioBuffer) {\n merged.set(chunk, offset);\n offset += chunk.length;\n }\n return merged;\n };\n\n const transcribeBuffer = async (): Promise<string> => {\n if (!this._isLoaded || getBufferSize() < minChunkSize) {\n return \"\";\n }\n\n const audio = mergeBuffer();\n audioBuffer = []; // Clear buffer\n\n try {\n const result = await this.transcribe(audio, { language });\n const text = result.text.trim();\n\n if (text) {\n chunkIndex++;\n onChunk?.(text, chunkIndex);\n\n // Append to full transcript\n fullTranscript = fullTranscript + (fullTranscript ? \" \" : \"\") + text;\n onTranscript?.(fullTranscript);\n }\n\n return text;\n } catch (e: any) {\n onError?.(e.message || \"Transcription failed\");\n return \"\";\n }\n };\n\n let aborted = false;\n\n const session: StreamingTranscriptionSession = {\n feedAudio: (audio: Float32Array) => {\n if (!aborted) {\n audioBuffer.push(audio);\n }\n },\n\n flush: async () => {\n if (aborted) return \"\";\n return transcribeBuffer();\n },\n\n start: () => {\n if (isRunning || aborted) return;\n isRunning = true;\n\n intervalId = setInterval(async () => {\n if (isRunning && !aborted) {\n await transcribeBuffer();\n }\n }, chunkDuration);\n },\n\n stop: async () => {\n isRunning = false;\n\n if (intervalId) {\n clearInterval(intervalId);\n intervalId = null;\n }\n\n // Transcribe any remaining audio (unless aborted)\n if (!aborted && getBufferSize() >= minChunkSize) {\n await transcribeBuffer();\n }\n\n return fullTranscript;\n },\n\n abort: () => {\n // Immediately stop without final transcription\n aborted = true;\n isRunning = false;\n\n if (intervalId) {\n clearInterval(intervalId);\n intervalId = null;\n }\n\n audioBuffer = [];\n },\n\n isRunning: () => isRunning,\n\n getTranscript: () => fullTranscript,\n\n getChunkCount: () => chunkIndex,\n\n reset: () => {\n audioBuffer = [];\n fullTranscript = \"\";\n chunkIndex = 0;\n },\n };\n\n return session;\n }\n\n /**\n * Dispose of resources\n */\n dispose(): void {\n this.pipeline = null;\n this._isLoaded = false;\n this.loadPromise = null;\n }\n}\n"],"mappings":";;;;;AA0CA,MAAaA,iBAAmC;CAC9C;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW,CAAC,KAAK;EACjB,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GAAC;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAM;GAAK;EAC7E,YAAY;EACb;CACD;EACE,IAAI;EACJ,MAAM;EACN,aAAa;EACb,MAAM;EACN,cAAc;EACd,WAAW;GACT;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACA;GACD;EACD,YAAY;EACb;CACF;AAGD,MAAM,gBAAgB;;;;;AAUtB,SAAgB,UAAU,QAAiE;CACzF,MAAM,OAAO,IAAI,SAAS,OAAO,QAAQ,OAAO,YAAY,OAAO,WAAW;AAI9E,KADa,OAAO,aAAa,OAAO,IAAI,OAAO,IAAI,OAAO,IAAI,OAAO,GAAG,KAC/D,OACX,OAAM,IAAI,MAAM,wCAAwC;CAI1D,MAAM,cAAc,KAAK,UAAU,IAAI,KAAK;CAC5C,MAAM,aAAa,KAAK,UAAU,IAAI,KAAK;CAC3C,MAAM,gBAAgB,KAAK,UAAU,IAAI,KAAK;AAE9C,KAAI,kBAAkB,GACpB,OAAM,IAAI,MAAM,0BAA0B,cAAc,iCAAiC;CAI3F,IAAI,aAAa;AACjB,QAAO,aAAa,OAAO,SAAS,GAAG;EACrC,MAAM,UAAU,OAAO,aACrB,OAAO,aACP,OAAO,aAAa,IACpB,OAAO,aAAa,IACpB,OAAO,aAAa,GACrB;EACD,MAAM,YAAY,KAAK,UAAU,aAAa,GAAG,KAAK;AACtD,MAAI,YAAY,QAAQ;AACtB,iBAAc;AACd;;AAEF,gBAAc,IAAI;;CAGpB,MAAM,WAAW,OAAO,SAAS;CACjC,MAAM,iBAAiB,gBAAgB;CACvC,MAAM,eAAe,KAAK,MAAM,WAAW,eAAe;CAC1D,MAAM,oBAAoB,KAAK,MAAM,eAAe,YAAY;CAGhE,MAAM,QAAQ,IAAI,aAAa,kBAAkB;AAEjD,MAAK,IAAI,IAAI,GAAG,IAAI,mBAAmB,IACrC,KAAI,gBAAgB,EAGlB,OAAM,MAFO,KAAK,SAAS,aAAa,IAAI,GAAG,KAAK,GACtC,KAAK,SAAS,aAAa,IAAI,IAAI,GAAG,KAAK,IAC7B,IAAI;KAGhC,OAAM,KADS,KAAK,SAAS,aAAa,IAAI,GAAG,KAAK,GAClC;AAIxB,QAAO;EAAE;EAAO;EAAY;;;;;AAM9B,SAAgB,cAAc,OAAqB,UAAkB,QAA8B;AACjG,KAAI,aAAa,OAAQ,QAAO;CAEhC,MAAM,QAAQ,SAAS;CACvB,MAAM,YAAY,KAAK,MAAM,MAAM,SAAS,MAAM;CAClD,MAAM,SAAS,IAAI,aAAa,UAAU;AAE1C,MAAK,IAAI,IAAI,GAAG,IAAI,WAAW,KAAK;EAClC,MAAM,WAAW,IAAI;EACrB,MAAM,QAAQ,KAAK,MAAM,SAAS;EAClC,MAAM,OAAO,KAAK,IAAI,QAAQ,GAAG,MAAM,SAAS,EAAE;EAClD,MAAM,IAAI,WAAW;AACrB,SAAO,KAAK,MAAM,UAAU,IAAI,KAAK,MAAM,QAAQ;;AAGrD,QAAO;;;;;AAUT,IAAa,aAAb,MAAwB;CACtB,AAAQ;CACR,AAAQ,WAAgB;CACxB,AAAQ,cAAoC;CAC5C,AAAQ,YAAY;CACpB,AAAQ,cAAgC;CAExC,YAAY,UAAkB,eAAe;EAC3C,MAAM,SAAS,eAAe,MAAM,MAAM,EAAE,OAAO,QAAQ;AAC3D,MAAI,CAAC,QAAQ;GACX,MAAM,YAAY,eAAe,KAAK,MAAM,EAAE,GAAG,CAAC,KAAK,KAAK;AAC5D,SAAM,IAAI,MAAM,sBAAsB,QAAQ,eAAe,YAAY;;AAE3E,OAAK,cAAc;;;;;CAMrB,WAAoB;AAClB,SAAO,KAAK;;;;;CAMd,iBAAiC;AAC/B,SAAO,KAAK;;;;;CAMd,eAA+B;AAC7B,SAAO,KAAK;;;;;CAMd,gBAAkC;AAChC,SAAO,KAAK;;;;;CAMd,OAAO,aAA+B;AACpC,SAAO,CAAC,GAAG,eAAe;;;;;CAM5B,MAAM,KAAK,UAA0B,EAAE,EAAiB;AACtD,MAAI,KAAK,UAAW;AACpB,MAAI,KAAK,aAAa;AACpB,SAAM,KAAK;AACX;;AAGF,OAAK,cAAc,KAAK,MAAM,QAAQ;AACtC,QAAM,KAAK;;CAGb,MAAc,MAAM,UAA0B,EAAE,EAAiB;EAC/D,MAAM,EAAE,YAAY,SAAS,WAAW;AAExC,eAAa,EAAE,QAAQ,8BAA8B,CAAC;EAGtD,MAAM,SAAS,OAAO,YAAY,eAAe,QAAQ,UAAU;EAKnE,IAAIC;AACJ,MAAI,OACF,gBAAe,MAAM;;GAAiC;;MAGtD,gBAAe,MAAM,OADN;EAGjB,MAAM,EAAE,UAAU,QAAQ;AAG1B,MAAI,QAAQ;AAEV,OAAI,mBAAmB;AACvB,OAAI,oBAAoB;SACnB;AAEL,OAAI,kBAAkB;AACtB,OAAI,mBAAmB;;EAMzB,IAAIC,WAAsC;AAG1C,MAAI,CAAC,OACH,YAAW;AAIb,OAAK,cAAc;AAEnB,eAAa,EAAE,QAAQ,WAAW,KAAK,YAAY,GAAG,MAAM,CAAC;AAI7D,OAAK,WAAW,MAAM,SAAS,gCAAgC,KAAK,YAAY,MAAM;GACpF,OAAO;GACP,QAAQ;GACR,oBAAoB,aAAkB;AACpC,QAAI,SAAS,WAAW,cAAc,SAAS,KAC7C,cAAa;KACX,QAAQ,eAAe,SAAS;KAChC,UAAU,KAAK,MAAM,SAAS,YAAY,EAAE;KAC5C,MAAM,SAAS;KAChB,CAAC;;GAGP,CAAC;AAEF,OAAK,YAAY;AACjB,eAAa,EAAE,QAAQ,UAAU,SAAS,aAAa,CAAC,KAAK,CAAC;;;;;;;;;CAUhE,MAAM,WACJ,OACA,UAA6B,EAAE,EACJ;AAC3B,MAAI,CAAC,KAAK,UACR,OAAM,IAAI,MAAM,2CAA2C;EAG7D,MAAM,EAAE,UAAU,aAAa,OAAO,eAAe;EACrD,MAAM,YAAY,YAAY,KAAK;EAGnC,IAAIC;EACJ,IAAI,kBAAkB;AAEtB,MAAI,iBAAiB,YAAY;AAC/B,gBAAa,EAAE,QAAQ,qBAAqB,CAAC;GAC7C,MAAM,UAAU,UAAU,MAAM;AAChC,eAAY,QAAQ;AACpB,qBAAkB,QAAQ;QAE1B,aAAY;AAId,MAAI,oBAAoB,MAAO;AAC7B,gBAAa,EAAE,QAAQ,0BAA0B,CAAC;AAClD,eAAY,cAAc,WAAW,iBAAiB,KAAM;;EAG9D,MAAM,gBAAgB,UAAU,SAAS;AACzC,eAAa,EAAE,QAAQ,gBAAgB,cAAc,QAAQ,EAAE,CAAC,gBAAgB,CAAC;EAGjF,MAAMC,kBAAuB,EAAE;AAG/B,MAAI,YAAY,KAAK,YAAY,cAAc;AAC7C,mBAAgB,WAAW;AAC3B,mBAAgB,OAAO;;AAIzB,MAAI,WACF,iBAAgB,oBAAoB;EAItC,MAAM,SAAS,MAAM,KAAK,SAAS,WAAW,gBAAgB;EAE9D,MAAM,YAAY,YAAY,KAAK,GAAG;EAGtC,IAAI,OAAO,OAAO,MAAM,MAAM,IAAI;AAGlC,MAAI,SAAS,mBAAmB,SAAS,mBAAmB,SAAS,gBACnE,QAAO;EAGT,MAAMC,mBAAqC;GACzC;GACA,UAAU,aAAa,KAAK,YAAY,eAAe,SAAS;GAChE,UAAU;GACV;GACD;AAGD,MAAI,cAAc,OAAO,OACvB,kBAAiB,WAAW,OAAO,OAAO,KACvC,WAAmC;GAClC,MAAM,MAAM,MAAM,MAAM,IAAI;GAC5B,OAAO,MAAM,YAAY,MAAM;GAC/B,KAAK,MAAM,YAAY,MAAM;GAC9B,EACF;AAGH,eAAa,EAAE,QAAQ,SAAS,CAAC;AAEjC,SAAO;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA8BT,uBACE,UAAyC,EAAE,EACZ;EAC/B,MAAM,EACJ,gBAAgB,KAChB,eAAe,KACf,SACA,cACA,SACA,aACE;EAEJ,IAAIC,cAA8B,EAAE;EACpC,IAAI,iBAAiB;EACrB,IAAI,aAAa;EACjB,IAAIC,aAAoD;EACxD,IAAI,YAAY;EAEhB,MAAM,sBAA8B;AAClC,UAAO,YAAY,QAAQ,KAAK,UAAU,MAAM,MAAM,QAAQ,EAAE;;EAGlE,MAAM,oBAAkC;GACtC,MAAM,cAAc,eAAe;GACnC,MAAM,SAAS,IAAI,aAAa,YAAY;GAC5C,IAAI,SAAS;AACb,QAAK,MAAM,SAAS,aAAa;AAC/B,WAAO,IAAI,OAAO,OAAO;AACzB,cAAU,MAAM;;AAElB,UAAO;;EAGT,MAAM,mBAAmB,YAA6B;AACpD,OAAI,CAAC,KAAK,aAAa,eAAe,GAAG,aACvC,QAAO;GAGT,MAAM,QAAQ,aAAa;AAC3B,iBAAc,EAAE;AAEhB,OAAI;IAEF,MAAM,QADS,MAAM,KAAK,WAAW,OAAO,EAAE,UAAU,CAAC,EACrC,KAAK,MAAM;AAE/B,QAAI,MAAM;AACR;AACA,eAAU,MAAM,WAAW;AAG3B,sBAAiB,kBAAkB,iBAAiB,MAAM,MAAM;AAChE,oBAAe,eAAe;;AAGhC,WAAO;YACAC,GAAQ;AACf,cAAU,EAAE,WAAW,uBAAuB;AAC9C,WAAO;;;EAIX,IAAI,UAAU;AAmEd,SAjE+C;GAC7C,YAAY,UAAwB;AAClC,QAAI,CAAC,QACH,aAAY,KAAK,MAAM;;GAI3B,OAAO,YAAY;AACjB,QAAI,QAAS,QAAO;AACpB,WAAO,kBAAkB;;GAG3B,aAAa;AACX,QAAI,aAAa,QAAS;AAC1B,gBAAY;AAEZ,iBAAa,YAAY,YAAY;AACnC,SAAI,aAAa,CAAC,QAChB,OAAM,kBAAkB;OAEzB,cAAc;;GAGnB,MAAM,YAAY;AAChB,gBAAY;AAEZ,QAAI,YAAY;AACd,mBAAc,WAAW;AACzB,kBAAa;;AAIf,QAAI,CAAC,WAAW,eAAe,IAAI,aACjC,OAAM,kBAAkB;AAG1B,WAAO;;GAGT,aAAa;AAEX,cAAU;AACV,gBAAY;AAEZ,QAAI,YAAY;AACd,mBAAc,WAAW;AACzB,kBAAa;;AAGf,kBAAc,EAAE;;GAGlB,iBAAiB;GAEjB,qBAAqB;GAErB,qBAAqB;GAErB,aAAa;AACX,kBAAc,EAAE;AAChB,qBAAiB;AACjB,iBAAa;;GAEhB;;;;;CAQH,UAAgB;AACd,OAAK,WAAW;AAChB,OAAK,YAAY;AACjB,OAAK,cAAc"}
|