npm - n8n-nodes-tts-bigboss - Versions diffs - 1.0.6 → 1.0.8 - Mend

n8n-nodes-tts-bigboss 1.0.6 → 1.0.8

This diff shows the differences between the contents of two publicly available package versions, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (3)

package/dist/TTSBigBoss.node.js +281 -92
package/nodes/TTSBigBoss/TTSBigBoss.node.ts +321 -131
package/package.json +1 -1

package/dist/TTSBigBoss.node.js CHANGED Viewed

@@ -73,6 +73,16 @@ const PIPER_MODELS = [
     { name: 'German - Thorsten (Male) - Low', value: 'de_DE-thorsten-low' },
 ];
 const EDGE_URL = 'wss://speech.platform.bing.com/consumer/speech/synthesize/readaloud/edge/v1?TrustedClientToken=6A5AA1D4EAFF4E9FB37E23D68491D6F4';
+const EDGE_HEADERS = {
+    'Authority': 'speech.platform.bing.com',
+    'Sec-CH-UA': '"Not_A Brand";v="8", "Chromium";v="120", "Microsoft Edge";v="120"',
+    'Sec-CH-UA-Mobile': '?0',
+    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36 Edg/120.0.0.0',
+    'Sec-CH-UA-Platform': '"Windows"',
+    'Accept-Encoding': 'gzip, deflate, br',
+    'Accept-Language': 'en-US,en;q=0.9',
+    'Origin': 'chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold'
+};
 const EDGE_VOICES = [
     { name: 'Arabic (Egypt) - Salma', value: 'ar-EG-SalmaNeural' },
     { name: 'Arabic (Egypt) - Shakir', value: 'ar-EG-ShakirNeural' },
@@ -125,7 +135,12 @@ class TTSBigBoss {
                         {
                             name: 'Coqui TTS (Local Server)',
                             value: 'coqui',
-                            description: 'Connect to a running Coqui TTS/XTTS server (e.g. python3 coqui_server.py).',
+                            description: 'Connect to a running Coqui TTS/XTTS server.',
+                        },
+                        {
+                            name: 'Kokoro TTS (Local OpenAI API)',
+                            value: 'kokoro',
+                            description: 'Connect to a local Kokoro server compatible with OpenAI API (e.g. /v1/audio/speech).',
                         },
                         {
                             name: 'System Command (Custom)',
@@ -277,11 +292,46 @@ class TTSBigBoss {
                     description: 'Name from Hugging Face (e.g. en_US-bryce-medium) or full URL to .onnx file.',
                 },
                 {
-                    displayName: 'Server URL',
+                    displayName: 'API URL',
+                    name: 'kokoroUrl',
+                    type: 'string',
+                    default: 'http://localhost:8880/v1/audio/speech',
+                    description: 'Endpoint URL for Kokoro generation (OpenAI compatible).',
+                    displayOptions: {
+                        show: {
+                            engine: ['kokoro'],
+                        },
+                    },
+                },
+                {
+                    displayName: 'Voice / Model',
+                    name: 'kokoroVoice',
+                    type: 'string',
+                    default: 'af_bella',
+                    description: 'Voice ID (e.g. af_bella, af_sarah, am_adam). Arabic might require specific model ID.',
+                    displayOptions: {
+                        show: {
+                            engine: ['kokoro'],
+                        },
+                    },
+                },
+                {
+                    displayName: 'Speed',
+                    name: 'kokoroSpeed',
+                    type: 'number',
+                    default: 1.0,
+                    displayOptions: {
+                        show: {
+                            engine: ['kokoro'],
+                        },
+                    },
+                },
+                {
+                    displayName: 'Base Server URL',
                     name: 'coquiUrl',
                     type: 'string',
-                    default: 'http://localhost:5002/api/tts',
-                    description: 'URL of the running Coqui server endpoint (usually /api/tts or /tts_stream).',
+                    default: 'http://localhost:5002',
+                    description: 'Base URL of Coqui server (e.g. http://localhost:5002 or http://host.docker.internal:5002).',
                     displayOptions: {
                         show: {
                             engine: ['coqui'],
@@ -289,23 +339,56 @@ class TTSBigBoss {
                     },
                 },
                 {
-                    displayName: 'Speaker ID / Wav Path',
+                    displayName: 'Speaker',
                     name: 'coquiSpeaker',
+                    type: 'options',
+                    typeOptions: {
+                        loadOptionsMethod: 'getCoquiSpeakers',
+                        loadOptionsDependsOn: ['coquiUrl'],
+                    },
+                    default: '',
+                    description: 'Select a speaker ID loaded from the server.',
+                    displayOptions: {
+                        show: {
+                            engine: ['coqui'],
+                        },
+                    },
+                },
+                {
+                    displayName: 'Use Custom WAV Path',
+                    name: 'coquiUseWav',
+                    type: 'boolean',
+                    default: false,
+                    description: 'Check to use a local WAV file path instead of a Speaker ID (for cloning).',
+                    displayOptions: {
+                        show: {
+                            engine: ['coqui'],
+                        },
+                    },
+                },
+                {
+                    displayName: 'WAV Path',
+                    name: 'coquiWavPath',
                     type: 'string',
                     default: '',
-                    description: 'Speaker ID (if multi-speaker) or path to reference wav (for cloning).',
+                    description: 'Absolute path to the reference WAV file on the server.',
                     displayOptions: {
                         show: {
                             engine: ['coqui'],
+                            coquiUseWav: [true],
                         },
                     },
                 },
                 {
                     displayName: 'Language',
                     name: 'coquiLang',
-                    type: 'string',
+                    type: 'options',
+                    typeOptions: {
+                        loadOptionsMethod: 'getCoquiLanguages',
+                        loadOptionsDependsOn: ['coquiUrl'],
+                    },
                     default: 'en',
-                    description: 'Language code (e.g. en, ar, fr).',
+                    description: 'Select language.',
                     displayOptions: {
                         show: {
                             engine: ['coqui'],
@@ -314,6 +397,60 @@ class TTSBigBoss {
                 },
             ],
         };
+        this.methods = {
+            loadOptions: {
+                async getCoquiSpeakers() {
+                    const baseUrl = this.getNodeParameter('coquiUrl');
+                    const cleanUrl = baseUrl.replace(/\/$/, '');
+                    const targetUrl = `${cleanUrl}/api/speakers`;
+                    try {
+                        const data = await httpRequest(targetUrl);
+                        const json = JSON.parse(data.toString());
+                        let speakers = [];
+                        if (Array.isArray(json))
+                            speakers = json;
+                        else if (json.speakers)
+                            speakers = json.speakers;
+                        else if (typeof json === 'object')
+                            speakers = Object.keys(json);
+                        return speakers.map((s) => {
+                            const name = typeof s === 'string' ? s : (s.name || s.id);
+                            const value = typeof s === 'string' ? s : (s.id || s.name);
+                            return { name, value };
+                        });
+                    }
+                    catch (e) {
+                        return [{ name: `Error loading: ${e.message}. Check URL & Connection.`, value: '' }];
+                    }
+                },
+                async getCoquiLanguages() {
+                    const baseUrl = this.getNodeParameter('coquiUrl');
+                    const cleanUrl = baseUrl.replace(/\/$/, '');
+                    const targetUrl = `${cleanUrl}/api/languages`;
+                    try {
+                        const data = await httpRequest(targetUrl);
+                        const json = JSON.parse(data.toString());
+                        let langs = [];
+                        if (Array.isArray(json))
+                            langs = json;
+                        else if (json.languages)
+                            langs = json.languages;
+                        return langs.map((l) => {
+                            const name = typeof l === 'string' ? l : (l.name || l.code);
+                            const value = typeof l === 'string' ? l : (l.code || l.name);
+                            return { name, value };
+                        });
+                    }
+                    catch (e) {
+                        return [
+                            { name: 'English (en)', value: 'en' },
+                            { name: 'Arabic (ar)', value: 'ar' },
+                            { name: 'Examples (Fix URL to load)', value: 'en' }
+                        ];
+                    }
+                },
+            },
+        };
     }
     async execute() {
         const items = this.getInputData();
@@ -347,6 +484,21 @@ class TTSBigBoss {
                         srtBuffer = Buffer.from(result.srt, 'utf8');
                     }
                 }
+                else if (engine === 'kokoro') {
+                    const url = this.getNodeParameter('kokoroUrl', i);
+                    const voice = this.getNodeParameter('kokoroVoice', i);
+                    const speed = this.getNodeParameter('kokoroSpeed', i);
+                    const payload = {
+                        model: 'kokoro',
+                        input: text,
+                        voice: voice,
+                        speed: speed,
+                        response_format: 'mp3'
+                    };
+                    audioBuffer = await httpRequest(url, 'POST', payload);
+                    const duration = getAudioDuration(audioBuffer, 'mp3');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
+                }
                 else if (engine === 'piper_local') {
                     let piperModel = this.getNodeParameter('piperModel', i);
                     if (piperModel === 'custom') {
@@ -369,7 +521,7 @@ class TTSBigBoss {
                             if (code === 0)
                                 resolve();
                             if (errData.includes('json.exception.parse_error')) {
-                                reject(new Error(`Piper Config Error: The downloaded JSON configuration for model '${piperModel}' seems corrupted (HTML instead of JSON?). Try deleting the file at ${configPath} and running again.`));
+                                reject(new Error(`Piper Config Error: The downloaded JSON configuration for model '${piperModel}' seems corrupted. Try deleting the file at ${configPath}.`));
                             }
                             else {
                                 reject(new Error(`Piper failed (exit ${code}): ${errData}`));
@@ -380,43 +532,30 @@ class TTSBigBoss {
                     if (!fs.existsSync(outFile))
                         throw new Error('Piper did not produce output file');
                     audioBuffer = fs.readFileSync(outFile);
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    const duration = getAudioDuration(audioBuffer, 'wav');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                     fs.unlinkSync(outFile);
                 }
                 else if (engine === 'coqui') {
-                    const url = this.getNodeParameter('coquiUrl', i);
-                    const speaker = this.getNodeParameter('coquiSpeaker', i);
+                    let url = this.getNodeParameter('coquiUrl', i);
+                    url = url.replace(/\/$/, '') + '/api/tts';
+                    const speakerSelection = this.getNodeParameter('coquiSpeaker', i);
+                    const useWav = this.getNodeParameter('coquiUseWav', i, false);
+                    const wavPath = this.getNodeParameter('coquiWavPath', i, '');
                     const lang = this.getNodeParameter('coquiLang', i);
                     const payload = {
                         text: text,
                         language_id: lang,
                     };
-                    if (speaker)
-                        payload.speaker_id = speaker;
-                    const requestModule = url.startsWith('https') ? https : http;
-                    audioBuffer = await new Promise((resolve, reject) => {
-                        const req = requestModule.request(url, {
-                            method: 'POST',
-                            headers: {
-                                'Content-Type': 'application/json',
-                            }
-                        }, (res) => {
-                            const chunks = [];
-                            res.on('data', (d) => chunks.push(d));
-                            res.on('end', () => {
-                                if (res.statusCode >= 200 && res.statusCode < 300) {
-                                    resolve(Buffer.concat(chunks));
-                                }
-                                else {
-                                    reject(new Error(`Coqui Server Error ${res.statusCode}: ${Buffer.concat(chunks).toString()}`));
-                                }
-                            });
-                        });
-                        req.on('error', reject);
-                        req.write(JSON.stringify(payload));
-                        req.end();
-                    });
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    if (useWav && wavPath) {
+                        payload.speaker_wav = wavPath;
+                    }
+                    else if (speakerSelection) {
+                        payload.speaker_id = speakerSelection;
+                    }
+                    audioBuffer = await httpRequest(url, 'POST', payload);
+                    const duration = getAudioDuration(audioBuffer, 'wav');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                 }
                 else {
                     const commandTpl = this.getNodeParameter('systemCommand', i);
@@ -450,7 +589,8 @@ class TTSBigBoss {
                         throw new Error('System command did not produce output file at expected path');
                     }
                     audioBuffer = fs.readFileSync(outFile);
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    const duration = getAudioDuration(audioBuffer);
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                     if (fs.existsSync(outFile))
                         fs.unlinkSync(outFile);
                 }
@@ -481,7 +621,7 @@ async function runEdgeTTS(text, voice, rate, pitch) {
     return new Promise((resolve, reject) => {
         const ws = new ws_1.default(EDGE_URL, {
             headers: {
-                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
+                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/128.0.0.0 Safari/537.36 Edg/128.0.0.0',
                 'Origin': 'chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold',
                 'TrustedClientToken': '6A5AA1D4EAFF4E9FB37E23D68491D6F4'
             }
@@ -595,23 +735,41 @@ function ticksToTime(ticks) {
     const mili = date.getMilliseconds().toString().padStart(3, '0');
     return `${h}:${m}:${s},${mili}`;
 }
-function generateHeuristicSRT(text, byteLength) {
-    const totalDurationSec = text.length / 15;
-    const sentences = text.match(/[^.!?]+[.!?]*/g) || [text];
-    let currentStartTime = 0;
-    let srt = '';
-    let counter = 1;
-    const msToSrt = (ms) => {
-        const date = new Date(0, 0, 0, 0, 0, 0, ms);
-        return `${date.getHours().toString().padStart(2, '0')}:${date.getMinutes().toString().padStart(2, '0')}:${date.getSeconds().toString().padStart(2, '0')},${date.getMilliseconds().toString().padStart(3, '0')}`;
-    };
-    for (const sentence of sentences) {
-        const sentenceDuration = (sentence.length / text.length) * (totalDurationSec * 1000);
-        const endTime = currentStartTime + sentenceDuration;
-        srt += `${counter++}\n${msToSrt(currentStartTime)} --> ${msToSrt(endTime)}\n${sentence.trim()}\n\n`;
-        currentStartTime = endTime;
-    }
-    return srt;
+async function downloadFile(url, dest) {
+    return new Promise((resolve, reject) => {
+        const file = fs.createWriteStream(dest);
+        file.on('error', (err) => {
+            fs.unlink(dest, () => { });
+            reject(new Error(`File write error: ${err.message}`));
+        });
+        const request = https.get(url, (response) => {
+            if (response.statusCode === 302 || response.statusCode === 301) {
+                file.close();
+                downloadFile(response.headers.location, dest).then(resolve).catch(reject);
+                return;
+            }
+            if (response.statusCode && response.statusCode !== 200) {
+                file.close();
+                fs.unlink(dest, () => { });
+                reject(new Error(`Download failed with status code: ${response.statusCode} for URL: ${url}`));
+                return;
+            }
+            response.pipe(file);
+            file.on('finish', () => {
+                file.close((err) => {
+                    if (err)
+                        reject(err);
+                    else
+                        resolve();
+                });
+            });
+        });
+        request.on('error', (err) => {
+            file.close();
+            fs.unlink(dest, () => { });
+            reject(new Error(`Network error: ${err.message}`));
+        });
+    });
 }
 async function ensurePiperBinary(binDir) {
     const platform = os.platform();
@@ -663,15 +821,15 @@ async function ensurePiperModel(binDir, modelNameOrUrl) {
     else {
         const parts = modelNameOrUrl.split('-');
         if (parts.length >= 3) {
-            const langRegion = parts[0] + '_' + parts[1];
-            const voice = parts[2];
-            const quality = parts[3] || 'medium';
-            const lang = parts[0];
+            const langRegion = parts[0];
+            const voice = parts[1];
+            const quality = parts[2];
+            const lang = langRegion.split('_')[0];
             modelFilename = modelNameOrUrl + '.onnx';
             modelUrl = `https://huggingface.co/rhasspy/piper-voices/resolve/main/${lang}/${langRegion}/${voice}/${quality}/${modelFilename}?download=true`;
         }
         else {
-            throw new Error(`Invalid model name format: ${modelNameOrUrl}. Use format lang_REGION-voice-quality`);
+            throw new Error(`Invalid model name format: ${modelNameOrUrl}.`);
         }
     }
     const modelPath = path.join(binDir, modelFilename);
@@ -700,39 +858,70 @@ async function ensurePiperModel(binDir, modelNameOrUrl) {
     }
     return { modelPath, configPath };
 }
-async function downloadFile(url, dest) {
-    return new Promise((resolve, reject) => {
-        const file = fs.createWriteStream(dest);
-        file.on('error', (err) => {
-            fs.unlink(dest, () => { });
-            reject(new Error(`File write error: ${err.message}`));
-        });
-        const request = https.get(url, (response) => {
-            if (response.statusCode === 302 || response.statusCode === 301) {
-                file.close();
-                downloadFile(response.headers.location, dest).then(resolve).catch(reject);
-                return;
+function getAudioDuration(buffer, hint = null) {
+    if (!buffer || buffer.length === 0)
+        return -1;
+    if ((hint === 'wav') || (buffer.length > 12 && buffer.toString('ascii', 0, 4) === 'RIFF' && buffer.toString('ascii', 8, 12) === 'WAVE')) {
+        try {
+            const byteRate = buffer.readUInt32LE(28);
+            if (byteRate > 0) {
+                const dataSize = buffer.length - 44;
+                return dataSize / byteRate;
             }
-            if (response.statusCode && response.statusCode !== 200) {
-                file.close();
-                fs.unlink(dest, () => { });
-                reject(new Error(`Download failed with status code: ${response.statusCode} for URL: ${url}`));
-                return;
+        }
+        catch (e) { }
+    }
+    return -1;
+}
+function generateHeuristicSRT(text, durationSeconds) {
+    if (durationSeconds <= 0) {
+        durationSeconds = text.length / 14;
+    }
+    const sentences = text.match(/[^.!?]+[.!?]*/g) || [text];
+    const totalContentLen = text.length;
+    let currentStartTime = 0;
+    let srt = '';
+    let counter = 1;
+    const msToSrt = (ms) => {
+        const totalSec = Math.floor(ms / 1000);
+        const mili = Math.floor(ms % 1000);
+        const h = Math.floor(totalSec / 3600);
+        const m = Math.floor((totalSec % 3600) / 60);
+        const s = totalSec % 60;
+        return `${h.toString().padStart(2, '0')}:${m.toString().padStart(2, '0')}:${s.toString().padStart(2, '0')},${mili.toString().padStart(3, '0')}`;
+    };
+    for (const sentence of sentences) {
+        const sentenceRatio = sentence.length / totalContentLen;
+        const sentenceDuration = sentenceRatio * durationSeconds;
+        const endTime = currentStartTime + sentenceDuration;
+        srt += `${counter++}\n${msToSrt(currentStartTime * 1000)} --> ${msToSrt(endTime * 1000)}\n${sentence.trim()}\n\n`;
+        currentStartTime = endTime;
+    }
+    return srt;
+}
+async function httpRequest(url, method = 'GET', body = null) {
+    const requestModule = url.startsWith('https') ? https : http;
+    return new Promise((resolve, reject) => {
+        const req = requestModule.request(url, {
+            method: method,
+            headers: {
+                'Content-Type': 'application/json',
             }
-            response.pipe(file);
-            file.on('finish', () => {
-                file.close((err) => {
-                    if (err)
-                        reject(err);
-                    else
-                        resolve();
-                });
+        }, (res) => {
+            const chunks = [];
+            res.on('data', (d) => chunks.push(d));
+            res.on('end', () => {
+                if (res.statusCode >= 200 && res.statusCode < 300) {
+                    resolve(Buffer.concat(chunks));
+                }
+                else {
+                    reject(new Error(`Server Request Failed ${res.statusCode}: ${Buffer.concat(chunks).toString()}`));
+                }
             });
         });
-        request.on('error', (err) => {
-            file.close();
-            fs.unlink(dest, () => { });
-            reject(new Error(`Network error: ${err.message}`));
-        });
+        req.on('error', reject);
+        if (body)
+            req.write(JSON.stringify(body));
+        req.end();
     });
 }

package/nodes/TTSBigBoss/TTSBigBoss.node.ts CHANGED Viewed

@@ -3,6 +3,8 @@ import {
     INodeExecutionData,
     INodeType,
     INodeTypeDescription,
+    ILoadOptionsFunctions,
+    INodePropertyOptions,
 } from 'n8n-workflow';
 import { v4 as uuidv4 } from 'uuid';
 import * as fs from 'fs';
@@ -59,6 +61,16 @@ const PIPER_MODELS = [
 // Edge TTS Constants
 const EDGE_URL = 'wss://speech.platform.bing.com/consumer/speech/synthesize/readaloud/edge/v1?TrustedClientToken=6A5AA1D4EAFF4E9FB37E23D68491D6F4';
+const EDGE_HEADERS = {
+    'Authority': 'speech.platform.bing.com',
+    'Sec-CH-UA': '"Not_A Brand";v="8", "Chromium";v="120", "Microsoft Edge";v="120"',
+    'Sec-CH-UA-Mobile': '?0',
+    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36 Edg/120.0.0.0',
+    'Sec-CH-UA-Platform': '"Windows"',
+    'Accept-Encoding': 'gzip, deflate, br',
+    'Accept-Language': 'en-US,en;q=0.9',
+    'Origin': 'chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold'
+};
 const EDGE_VOICES = [
     // Arabic
     { name: 'Arabic (Egypt) - Salma', value: 'ar-EG-SalmaNeural' },
@@ -123,7 +135,12 @@ export class TTSBigBoss implements INodeType {
                     {
                         name: 'Coqui TTS (Local Server)',
                         value: 'coqui',
-                        description: 'Connect to a running Coqui TTS/XTTS server (e.g. python3 coqui_server.py).',
+                        description: 'Connect to a running Coqui TTS/XTTS server.',
+                    },
+                    {
+                        name: 'Kokoro TTS (Local OpenAI API)',
+                        value: 'kokoro',
+                        description: 'Connect to a local Kokoro server compatible with OpenAI API (e.g. /v1/audio/speech).',
                     },
                     {
                         name: 'System Command (Custom)',
@@ -287,14 +304,52 @@ export class TTSBigBoss implements INodeType {
                 description: 'Name from Hugging Face (e.g. en_US-bryce-medium) or full URL to .onnx file.',
             },
             // ----------------------------------
+            // Kokoro Settings
+            // ----------------------------------
+            {
+                displayName: 'API URL',
+                name: 'kokoroUrl',
+                type: 'string',
+                default: 'http://localhost:8880/v1/audio/speech',
+                description: 'Endpoint URL for Kokoro generation (OpenAI compatible).',
+                displayOptions: {
+                    show: {
+                        engine: ['kokoro'],
+                    },
+                },
+            },
+            {
+                displayName: 'Voice / Model',
+                name: 'kokoroVoice',
+                type: 'string',
+                default: 'af_bella',
+                description: 'Voice ID (e.g. af_bella, af_sarah, am_adam). Arabic might require specific model ID.',
+                displayOptions: {
+                    show: {
+                        engine: ['kokoro'],
+                    },
+                },
+            },
+            {
+                displayName: 'Speed',
+                name: 'kokoroSpeed',
+                type: 'number',
+                default: 1.0,
+                displayOptions: {
+                    show: {
+                        engine: ['kokoro'],
+                    },
+                },
+            },
+            // ----------------------------------
             // Coqui Server Settings
             // ----------------------------------
             {
-                displayName: 'Server URL',
+                displayName: 'Base Server URL',
                 name: 'coquiUrl',
                 type: 'string',
-                default: 'http://localhost:5002/api/tts',
-                description: 'URL of the running Coqui server endpoint (usually /api/tts or /tts_stream).',
+                default: 'http://localhost:5002',
+                description: 'Base URL of Coqui server (e.g. http://localhost:5002 or http://host.docker.internal:5002).',
                 displayOptions: {
                     show: {
                         engine: ['coqui'],
@@ -302,23 +357,56 @@ export class TTSBigBoss implements INodeType {
                 },
             },
             {
-                displayName: 'Speaker ID / Wav Path',
+                displayName: 'Speaker',
                 name: 'coquiSpeaker',
+                type: 'options',
+                typeOptions: {
+                    loadOptionsMethod: 'getCoquiSpeakers',
+                    loadOptionsDependsOn: ['coquiUrl'],
+                },
+                default: '',
+                description: 'Select a speaker ID loaded from the server.',
+                displayOptions: {
+                    show: {
+                        engine: ['coqui'],
+                    },
+                },
+            },
+            {
+                displayName: 'Use Custom WAV Path',
+                name: 'coquiUseWav',
+                type: 'boolean',
+                default: false,
+                description: 'Check to use a local WAV file path instead of a Speaker ID (for cloning).',
+                displayOptions: {
+                    show: {
+                        engine: ['coqui'],
+                    },
+                },
+            },
+            {
+                displayName: 'WAV Path',
+                name: 'coquiWavPath',
                 type: 'string',
                 default: '',
-                description: 'Speaker ID (if multi-speaker) or path to reference wav (for cloning).',
+                description: 'Absolute path to the reference WAV file on the server.',
                 displayOptions: {
                     show: {
                         engine: ['coqui'],
+                        coquiUseWav: [true],
                     },
                 },
             },
             {
                 displayName: 'Language',
                 name: 'coquiLang',
-                type: 'string',
+                type: 'options',
+                typeOptions: {
+                    loadOptionsMethod: 'getCoquiLanguages',
+                    loadOptionsDependsOn: ['coquiUrl'],
+                },
                 default: 'en',
-                description: 'Language code (e.g. en, ar, fr).',
+                description: 'Select language.',
                 displayOptions: {
                     show: {
                         engine: ['coqui'],
@@ -328,6 +416,63 @@ export class TTSBigBoss implements INodeType {
         ],
     };
+    /**
+     * Dynamic option loaders backing the Coqui speaker and language dropdowns.
+     * Both read the `coquiUrl` parameter and query that server over HTTP.
+     */
+    methods = {
+        loadOptions: {
+            /**
+             * Loads speaker options from `<coquiUrl>/api/speakers`.
+             *
+             * Accepted reply shapes: an array of ids, an array of `{ id, name }`
+             * objects, either of those wrapped as `{ speakers: ... }`, or a plain
+             * object whose keys are the speaker ids.
+             *
+             * @returns One option per usable speaker, or a single placeholder option
+             * carrying the error text when the request or the parsing fails.
+             */
+            async getCoquiSpeakers(this: ILoadOptionsFunctions): Promise<INodePropertyOptions[]> {
+                const baseUrl = this.getNodeParameter('coquiUrl') as string;
+                // Strip every trailing slash so the joined URL never contains "//api".
+                const cleanUrl = baseUrl.trim().replace(/\/+$/, '');
+                const targetUrl = `${cleanUrl}/api/speakers`; // Assumption: the server exposes this endpoint
+                // Only strings and numbers make usable labels/values; anything else becomes ''.
+                const asLabel = (v: unknown): string =>
+                    typeof v === 'string' || typeof v === 'number' ? String(v) : '';
+                try {
+                    const data = await httpRequest(targetUrl);
+                    const json = JSON.parse(data.toString());
+                    // Unwrap `{ speakers: ... }`; otherwise treat the reply itself as the list.
+                    const raw = json && json.speakers ? json.speakers : json;
+                    let speakers: any[] = [];
+                    if (Array.isArray(raw)) speakers = raw;
+                    else if (raw && typeof raw === 'object') speakers = Object.keys(raw);
+                    return speakers
+                        .map((s: any) => {
+                            const isObject = s !== null && typeof s === 'object';
+                            return {
+                                name: asLabel(isObject ? s.name || s.id : s),
+                                value: asLabel(isObject ? s.id || s.name : s),
+                            };
+                        })
+                        // Entries with neither id nor name would otherwise render as "undefined".
+                        .filter((option) => option.name !== '' && option.value !== '');
+                } catch (e: unknown) {
+                    const message = e instanceof Error ? e.message : String(e);
+                    return [{ name: `Error loading: ${message}. Check URL & Connection.`, value: '' }];
+                }
+            },
+            /**
+             * Loads language options from `<coquiUrl>/api/languages`.
+             *
+             * Accepted reply shapes: an array of codes, an array of `{ code, name }`
+             * objects, or either of those wrapped as `{ languages: [...] }`.
+             *
+             * @returns One option per usable language, or a small built-in default
+             * list when the request or the parsing fails.
+             */
+            async getCoquiLanguages(this: ILoadOptionsFunctions): Promise<INodePropertyOptions[]> {
+                const baseUrl = this.getNodeParameter('coquiUrl') as string;
+                // Strip every trailing slash so the joined URL never contains "//api".
+                const cleanUrl = baseUrl.trim().replace(/\/+$/, '');
+                const targetUrl = `${cleanUrl}/api/languages`;
+                // Only strings and numbers make usable labels/values; anything else becomes ''.
+                const asLabel = (v: unknown): string =>
+                    typeof v === 'string' || typeof v === 'number' ? String(v) : '';
+                try {
+                    const data = await httpRequest(targetUrl);
+                    const json = JSON.parse(data.toString());
+                    let langs: any[] = [];
+                    if (Array.isArray(json)) langs = json;
+                    else if (json && Array.isArray(json.languages)) langs = json.languages;
+                    return langs
+                        .map((l: any) => {
+                            const isObject = l !== null && typeof l === 'object';
+                            return {
+                                name: asLabel(isObject ? l.name || l.code : l),
+                                value: asLabel(isObject ? l.code || l.name : l),
+                            };
+                        })
+                        // Entries with neither code nor name would otherwise render as "undefined".
+                        .filter((option) => option.name !== '' && option.value !== '');
+                } catch (e) {
+                    // Fallback defaults if the API call or the JSON parsing fails
+                    return [
+                        { name: 'English (en)', value: 'en' },
+                        { name: 'Arabic (ar)', value: 'ar' },
+                        { name: 'Examples (Fix URL to load)', value: 'en' }
+                    ];
+                }
+            },
+        },
+    };
     async execute(this: IExecuteFunctions): Promise<INodeExecutionData[][]> {
         const items = this.getInputData();
         const returnData: INodeExecutionData[] = [];
@@ -369,6 +514,28 @@ export class TTSBigBoss implements INodeType {
                         srtBuffer = Buffer.from(result.srt, 'utf8');
                     }
+                } else if (engine === 'kokoro') {
+                    // ----------------------------------
+                    // KOKORO EXECUTION
+                    // ----------------------------------
+                    const url = this.getNodeParameter('kokoroUrl', i) as string;
+                    const voice = this.getNodeParameter('kokoroVoice', i) as string;
+                    const speed = this.getNodeParameter('kokoroSpeed', i) as number;
+                    // Standard OpenAI 'createSpeech' payload
+                    const payload = {
+                        model: 'kokoro', // or whatever the server expects
+                        input: text,
+                        voice: voice,
+                        speed: speed,
+                        response_format: 'mp3'
+                    };
+                    audioBuffer = await httpRequest(url, 'POST', payload);
+                    const duration = getAudioDuration(audioBuffer, 'mp3');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                 } else if (engine === 'piper_local') {
                     // ----------------------------------
                     // PIPER LOCAL AUTOMATION
@@ -386,8 +553,6 @@ export class TTSBigBoss implements INodeType {
                     // 3. Execute
                     const outFile = path.join(tempDir, `piper_out_${uuidv4()}.wav`);
-                    // Piper command: echo "text" | piper --model model.onnx --output_file out.wav
-                    // We use child_process.spawn to pipe text safely
                     await new Promise<void>((resolve, reject) => {
                         const piperProc = child_process.spawn(piperBinPath, [
@@ -404,9 +569,8 @@ export class TTSBigBoss implements INodeType {
                         piperProc.on('close', (code) => {
                             if (code === 0) resolve();
-                            // Check for the specific JSON error in stderr
                             if (errData.includes('json.exception.parse_error')) {
-                                reject(new Error(`Piper Config Error: The downloaded JSON configuration for model '${piperModel}' seems corrupted (HTML instead of JSON?). Try deleting the file at ${configPath} and running again.`));
+                                reject(new Error(`Piper Config Error: The downloaded JSON configuration for model '${piperModel}' seems corrupted. Try deleting the file at ${configPath}.`));
                             } else {
                                 reject(new Error(`Piper failed (exit ${code}): ${errData}`));
                             }
@@ -418,7 +582,8 @@ export class TTSBigBoss implements INodeType {
                     if (!fs.existsSync(outFile)) throw new Error('Piper did not produce output file');
                     audioBuffer = fs.readFileSync(outFile);
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    const duration = getAudioDuration(audioBuffer, 'wav');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                     fs.unlinkSync(outFile);
@@ -426,44 +591,28 @@ export class TTSBigBoss implements INodeType {
                     // ----------------------------------
                     // COQUI SEVER EXECUTION
                     // ----------------------------------
-                    const url = this.getNodeParameter('coquiUrl', i) as string;
-                    const speaker = this.getNodeParameter('coquiSpeaker', i) as string;
+                    let url = this.getNodeParameter('coquiUrl', i) as string;
+                    url = url.replace(/\/$/, '') + '/api/tts'; // Append standard endpoint
+                    const speakerSelection = this.getNodeParameter('coquiSpeaker', i) as string;
+                    const useWav = this.getNodeParameter('coquiUseWav', i, false) as boolean;
+                    const wavPath = this.getNodeParameter('coquiWavPath', i, '') as string;
                     const lang = this.getNodeParameter('coquiLang', i) as string;
-                    // Construct Payload
-                    // Standard XTTS/Coqui API expects: text, speaker_id, language_id
                     const payload: any = {
                         text: text,
                         language_id: lang,
                     };
-                    if (speaker) payload.speaker_id = speaker;
-                    // Allow http and https
-                    const requestModule = url.startsWith('https') ? https : http;
-                    audioBuffer = await new Promise((resolve, reject) => {
-                        const req = requestModule.request(url, {
-                            method: 'POST',
-                            headers: {
-                                'Content-Type': 'application/json',
-                            }
-                        }, (res: any) => {
-                            const chunks: any[] = [];
-                            res.on('data', (d: any) => chunks.push(d));
-                            res.on('end', () => {
-                                if (res.statusCode >= 200 && res.statusCode < 300) {
-                                    resolve(Buffer.concat(chunks));
-                                } else {
-                                    reject(new Error(`Coqui Server Error ${res.statusCode}: ${Buffer.concat(chunks).toString()}`));
-                                }
-                            });
-                        });
-                        req.on('error', reject);
-                        req.write(JSON.stringify(payload));
-                        req.end();
-                    });
+                    if (useWav && wavPath) {
+                        payload.speaker_wav = wavPath;
+                    } else if (speakerSelection) {
+                        payload.speaker_id = speakerSelection;
+                    }
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    audioBuffer = await httpRequest(url, 'POST', payload);
+                    const duration = getAudioDuration(audioBuffer, 'wav');
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                 } else {
                     // ----------------------------------
@@ -479,7 +628,6 @@ export class TTSBigBoss implements INodeType {
                         .replace(/"{text}"/g, `"${text.replace(/"/g, '\\"')}"`) // Basic escape
                         .replace(/{text}/g, `"${text.replace(/"/g, '\\"')}"`);
-                    // Handle Clone Input
                     if (useClone) {
                         const cloneProp = this.getNodeParameter('cloneInputProperty', i) as string;
                         const cloneData = await this.helpers.getBinaryDataBuffer(i, cloneProp);
@@ -490,7 +638,6 @@ export class TTSBigBoss implements INodeType {
                             .replace(/{reference_audio}/g, `"${cloneFile}"`);
                     }
-                    // Execute
                     await new Promise((resolve, reject) => {
                         child_process.exec(cmd, (error, stdout, stderr) => {
                             if (error) {
@@ -506,9 +653,8 @@ export class TTSBigBoss implements INodeType {
                     }
                     audioBuffer = fs.readFileSync(outFile);
-                    // Generate Heuristic SRT (Estimate timestamps)
-                    srtBuffer = Buffer.from(generateHeuristicSRT(text, audioBuffer.length), 'utf8');
+                    const duration = getAudioDuration(audioBuffer);
+                    srtBuffer = Buffer.from(generateHeuristicSRT(text, duration), 'utf8');
                     // Cleanup
                     if (fs.existsSync(outFile)) fs.unlinkSync(outFile);
@@ -540,7 +686,7 @@ export class TTSBigBoss implements INodeType {
                 returnData.push(newItem);
-            } catch (error) {
+            } catch (error: any) {
                 if (this.continueOnFail()) {
                     returnData.push({ json: { error: error.message }, binary: {} });
                     continue;
@@ -560,8 +706,8 @@ async function runEdgeTTS(text: string, voice: string, rate: string, pitch: stri
     return new Promise((resolve, reject) => {
         const ws = new WebSocket(EDGE_URL, {
             headers: {
-                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
-                'Origin': 'chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold',
+                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/128.0.0.0 Safari/537.36 Edg/128.0.0.0', // Updated UA to Edge
+                'Origin': 'chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold', // Keep origin for now, usually required
                 'TrustedClientToken': '6A5AA1D4EAFF4E9FB37E23D68491D6F4'
             }
         });
@@ -707,41 +853,43 @@ function ticksToTime(ticks: number): string {
     return `${h}:${m}:${s},${mili}`;
 }
-// --------------------------------------------------------------------------
-// HEURISTIC SRT IMPLEMENTATION (For System Command)
-// --------------------------------------------------------------------------
-function generateHeuristicSRT(text: string, byteLength: number): string {
-    // Estimate duration assuming typical MP3/WAV bitrate.
-    // Actually, system command usually produces WAV (PCM).
-    // Wrapper might produce MP3. Let's assume user command output.
-    // It is safer to assume ~15 chars per second reading speed if we don't know duration.
-    // Or assume 16000 bytes/sec for mono 16khz? Too unreliable.
-    // Let's use text length heuristic: Avg reading speed 150 wpm ~ 2.5 words/sec ~ 15 chars/sec?
-    // Let's try 15 chars / second.
-    const totalDurationSec = text.length / 15;
-    // Ideally we'd use 'ffprobe' to get exact duration, but let's stick to pure TS for now.
-    // If we really wanted to be robust, we'd add 'ffprobe' execution here.
-    const sentences = text.match(/[^.!?]+[.!?]*/g) || [text];
-    let currentStartTime = 0;
-    let srt = '';
-    let counter = 1;
-    const msToSrt = (ms: number) => {
-        const date = new Date(0, 0, 0, 0, 0, 0, ms);
-        return `${date.getHours().toString().padStart(2, '0')}:${date.getMinutes().toString().padStart(2, '0')}:${date.getSeconds().toString().padStart(2, '0')},${date.getMilliseconds().toString().padStart(3, '0')}`;
-    };
-    for (const sentence of sentences) {
-        const sentenceDuration = (sentence.length / text.length) * (totalDurationSec * 1000);
-        const endTime = currentStartTime + sentenceDuration;
-        srt += `${counter++}\n${msToSrt(currentStartTime)} --> ${msToSrt(endTime)}\n${sentence.trim()}\n\n`;
-        currentStartTime = endTime;
-    }
+// ----------------------------------
+// OLD HEURISTIC REMOVED
+// ----------------------------------
-    return srt;
+/**
+ * Streams the resource at `url` into the file `dest` over HTTPS.
+ *
+ * Redirects (301/302/303/307/308) are followed, a relative `Location` value is
+ * resolved against the current URL, and the chain is capped by `redirectsLeft`.
+ * The destination file is only created once a 200 response arrives, and a
+ * partially written file is removed when the transfer fails.
+ *
+ * @param url HTTPS URL to fetch.
+ * @param dest Path of the file to write.
+ * @param redirectsLeft How many more redirects may be followed (default 5).
+ * @returns A promise that resolves once the file has been written and closed; it
+ * rejects on network failure, a non-200 status, an unusable redirect, or a write error.
+ */
+async function downloadFile(url: string, dest: string, redirectsLeft: number = 5): Promise<void> {
+    return new Promise((resolve, reject) => {
+        let file: fs.WriteStream | null = null;
+        // Shared failure path: drop the partial file (if one was started) and reject.
+        const fail = (message: string) => {
+            if (file) {
+                file.destroy();
+                fs.unlink(dest, () => { });
+            }
+            reject(new Error(message));
+        };
+        const request = https.get(url, (response) => {
+            const status = response.statusCode ?? 0;
+            if ([301, 302, 303, 307, 308].includes(status)) {
+                // Discard the redirect body so the socket is released.
+                response.resume();
+                const location = response.headers.location;
+                if (!location) {
+                    fail(`Redirect (${status}) without Location header for URL: ${url}`);
+                    return;
+                }
+                if (redirectsLeft <= 0) {
+                    fail(`Too many redirects for URL: ${url}`);
+                    return;
+                }
+                let nextUrl: string;
+                try {
+                    // Location may be relative; resolve it against the URL that produced it.
+                    nextUrl = new URL(location, url).toString();
+                } catch (err) {
+                    fail(`Invalid redirect target '${location}' for URL: ${url}`);
+                    return;
+                }
+                downloadFile(nextUrl, dest, redirectsLeft - 1).then(resolve, reject);
+                return;
+            }
+            if (status !== 200) {
+                response.resume();
+                fail(`Download failed with status code: ${response.statusCode} for URL: ${url}`);
+                return;
+            }
+            // Open the destination only now, so failed attempts never leave an empty file behind.
+            const out = fs.createWriteStream(dest);
+            file = out;
+            out.on('error', (err) => fail(`File write error: ${err.message}`));
+            // Without this handler a connection dropped mid-transfer would never settle the promise.
+            response.on('error', (err) => fail(`Network error: ${err.message}`));
+            out.on('finish', () => {
+                out.close((err) => {
+                    if (err) reject(err);
+                    else resolve();
+                });
+            });
+            response.pipe(out);
+        });
+        request.on('error', (err) => fail(`Network error: ${err.message}`));
+    });
 }
 // --------------------------------------------------------------------------
@@ -811,25 +959,23 @@ async function ensurePiperModel(binDir: string, modelNameOrUrl: string): Promise
         modelUrl = modelNameOrUrl;
         modelFilename = path.basename(modelNameOrUrl);
     } else {
-        // Construct URL from name
+        // Correct Parsing for 'lang_REGION-voice-quality'
+        // e.g. en_US-lessac-medium -> [en_US, lessac, medium]
+        // e.g. ar_JO-kareem-medium -> [ar_JO, kareem, medium]
         const parts = modelNameOrUrl.split('-');
         if (parts.length >= 3) {
-            const langRegion = parts[0] + '_' + parts[1]; // en_US
-            const voice = parts[2];
-            const quality = parts[3] || 'medium';
-            const lang = parts[0]; // en
+            const langRegion = parts[0]; // 'ar_JO' or 'en_US'
+            const voice = parts[1];      // 'kareem'
+            const quality = parts[2];    // 'medium'
-            // e.g. en_US-lessac-medium
-            // lang=en, region=en_US, voice=lessac, quality=medium
-            // url path: en/en_US/lessac/medium/en_US-lessac-medium.onnx
-            // Handle special case: ar_JO (no lang folder? check repo)
-            // Generally structure is: lang_short/lang_long/voice/quality/filename
+            // Lang code is first part of langRegion (split by _)
+            const lang = langRegion.split('_')[0]; // 'ar' form 'ar_JO'
             modelFilename = modelNameOrUrl + '.onnx';
-            modelUrl = `https://huggingface.co/rhasspy/piper-voices/resolve/main/${lang}/${langRegion}/${voice}/${quality}/${modelFilename}?download=true`; // Add download=true to force direct link
+            modelUrl = `https://huggingface.co/rhasspy/piper-voices/resolve/main/${lang}/${langRegion}/${voice}/${quality}/${modelFilename}?download=true`;
         } else {
-            throw new Error(`Invalid model name format: ${modelNameOrUrl}. Use format lang_REGION-voice-quality`);
+            throw new Error(`Invalid model name format: ${modelNameOrUrl}.`);
         }
     }
@@ -865,45 +1011,89 @@ async function ensurePiperModel(binDir: string, modelNameOrUrl: string): Promise
     return { modelPath, configPath };
 }
-async function downloadFile(url: string, dest: string): Promise<void> {
-    return new Promise((resolve, reject) => {
-        const file = fs.createWriteStream(dest);
-        // Handle file system errors (e.g. permissions)
-        file.on('error', (err) => {
-            fs.unlink(dest, () => { }); // Cleanup
-            reject(new Error(`File write error: ${err.message}`));
-        });
+// --------------------------------------------------------------------------
+// HELPER: Determine Audio Duration for SRT
+// --------------------------------------------------------------------------
+/**
+ * Estimates the playback length of an encoded audio buffer in seconds.
+ *
+ * Only RIFF/WAVE data can be measured. The chunk list is walked to find the
+ * `fmt ` chunk (byte rate) and the `data` chunk (payload size), so headers longer
+ * than the canonical 44 bytes are handled. Anything else, including MP3, yields -1.
+ *
+ * @param buffer Encoded audio bytes.
+ * @param hint Expected container. Advisory only: the RIFF/WAVE signature is always
+ * verified, so a wrong hint can no longer cause arbitrary bytes to be read as a header.
+ * @returns Duration in seconds, or -1 when it cannot be determined (the caller
+ * then estimates the duration from the text length).
+ */
+function getAudioDuration(buffer: Buffer, hint: 'mp3' | 'wav' | null = null): number {
+    // Nothing to measure.
+    if (!buffer || buffer.length === 0) return -1;
+
+    const isRiffWave = buffer.length >= 12
+        && buffer.toString('ascii', 0, 4) === 'RIFF'
+        && buffer.toString('ascii', 8, 12) === 'WAVE';
+    if (!isRiffWave) return -1;
+
+    let byteRate = 0;
+    let offset = 12; // first chunk follows the 12-byte RIFF/WAVE preamble
+    while (offset + 8 <= buffer.length) {
+        const chunkId = buffer.toString('ascii', offset, offset + 4);
+        const declaredSize = buffer.readUInt32LE(offset + 4);
+        const bodyStart = offset + 8;
+        if (chunkId === 'fmt ' && bodyStart + 12 <= buffer.length) {
+            // Byte rate sits 8 bytes into the fmt body (after format, channels, sample rate).
+            byteRate = buffer.readUInt32LE(bodyStart + 8);
+        } else if (chunkId === 'data') {
+            if (byteRate <= 0) return -1;
+            const available = buffer.length - bodyStart;
+            // Streaming encoders may write 0 or 0xFFFFFFFF as a placeholder size;
+            // in that case trust the number of bytes actually present.
+            const dataSize = declaredSize > 0 && declaredSize <= available ? declaredSize : available;
+            return dataSize / byteRate;
+        }
+        // Chunk bodies are padded to an even number of bytes.
+        offset = bodyStart + declaredSize + (declaredSize % 2);
+    }
+
+    // No data chunk found: signal "unknown" so the caller falls back to text length.
+    return -1;
+}
-        const request = https.get(url, (response) => {
-            if (response.statusCode === 302 || response.statusCode === 301) {
-                // Follow redirect
-                file.close();
-                downloadFile(response.headers.location!, dest).then(resolve).catch(reject);
-                return;
-            }
-            if (response.statusCode && response.statusCode !== 200) {
-                file.close();
-                fs.unlink(dest, () => { });
-                reject(new Error(`Download failed with status code: ${response.statusCode} for URL: ${url}`));
-                return;
-            }
-            response.pipe(file);
+// --------------------------------------------------------------------------
+// HEURISTIC SRT IMPLEMENTATION
+// --------------------------------------------------------------------------
+/**
+ * Builds an SRT subtitle track by splitting `text` into sentences and giving each
+ * sentence a share of the total duration proportional to its character count.
+ *
+ * @param text Spoken text.
+ * @param durationSeconds Audio length in seconds. A value that is not a finite
+ * number greater than 0 (for example -1 or NaN) means "unknown"; the length is
+ * then estimated at 14 characters per second.
+ * @returns SRT document text, or an empty string when `text` is empty or blank.
+ */
+function generateHeuristicSRT(text: string, durationSeconds: number): string {
+    // Blank input has no cues; it would also cause a 0/0 division below.
+    if (!text || text.trim().length === 0) return '';
+
+    // If duration unknown, estimate from text length (14 chars/sec)
+    const totalSeconds = Number.isFinite(durationSeconds) && durationSeconds > 0
+        ? durationSeconds
+        : text.length / 14;
+
+    const sentences = text.match(/[^.!?]+[.!?]*/g) || [text];
+    // The regex can skip leading punctuation, so measure what was actually matched;
+    // this keeps the last cue ending exactly at the total duration.
+    const totalContentLen = sentences.reduce((sum, part) => sum + part.length, 0);
+
+    const msToSrt = (ms: number) => {
+        // Round first so float noise (e.g. 4799.999999) does not print as 1 ms short.
+        const wholeMs = Math.round(ms);
+        const totalSec = Math.floor(wholeMs / 1000);
+        const mili = wholeMs % 1000;
+        const h = Math.floor(totalSec / 3600);
+        const m = Math.floor((totalSec % 3600) / 60);
+        const s = totalSec % 60;
+        return `${h.toString().padStart(2, '0')}:${m.toString().padStart(2, '0')}:${s.toString().padStart(2, '0')},${mili.toString().padStart(3, '0')}`;
+    };
+
+    let currentStartTime = 0;
+    let srt = '';
+    let counter = 1;
+    for (const sentence of sentences) {
+        // Proportion of time = Proportion of length
+        const endTime = currentStartTime + (sentence.length / totalContentLen) * totalSeconds;
+        const cueText = sentence.trim();
+        // Whitespace-only fragments still consume their time share but emit no empty cue.
+        if (cueText.length > 0) {
+            srt += `${counter++}\n${msToSrt(currentStartTime * 1000)} --> ${msToSrt(endTime * 1000)}\n${cueText}\n\n`;
+        }
+        currentStartTime = endTime;
+    }
+    return srt;
+}
-            file.on('finish', () => {
-                file.close((err) => {
-                    if (err) reject(err);
-                    else resolve();
-                });
-            });
-        });
-        request.on('error', (err) => {
-            file.close();
-            fs.unlink(dest, () => { });
-            reject(new Error(`Network error: ${err.message}`));
+/**
+ * Sends an HTTP or HTTPS request with an optional JSON body and resolves with the
+ * raw response body.
+ *
+ * @param url Absolute http:// or https:// URL.
+ * @param method HTTP method (default 'GET').
+ * @param body Value to send as JSON; `null`/`undefined` sends no body.
+ * @returns The response body as a Buffer when the status is 2xx; the promise
+ * rejects with the status and response text otherwise, or with the underlying
+ * error on connection or stream failure.
+ */
+async function httpRequest(url: string, method: string = 'GET', body: any = null): Promise<Buffer> {
+    // Anchored, case-insensitive scheme test: accepts "HTTPS://…" and ignores "https" elsewhere in the string.
+    const requestModule = /^https:/i.test(url) ? https : http;
+    const payload = body !== null && body !== undefined
+        ? Buffer.from(JSON.stringify(body), 'utf8')
+        : null;
+    const headers: Record<string, string | number> = {
+        'Content-Type': 'application/json',
+    };
+    if (payload) {
+        // An explicit length makes Node send the body un-chunked; some simple servers
+        // do not accept chunked request bodies.
+        headers['Content-Length'] = payload.length;
+    }
+    return new Promise((resolve, reject) => {
+        const req = requestModule.request(url, { method, headers }, (res: any) => {
+            const chunks: Buffer[] = [];
+            res.on('data', (d: Buffer) => chunks.push(d));
+            // A response stream that fails mid-body must settle the promise too.
+            res.on('error', reject);
+            res.on('end', () => {
+                const responseBody = Buffer.concat(chunks);
+                if (res.statusCode >= 200 && res.statusCode < 300) {
+                    resolve(responseBody);
+                } else {
+                    reject(new Error(`Server Request Failed ${res.statusCode}: ${responseBody.toString()}`));
+                }
+            });
         });
+        req.on('error', reject);
+        if (payload) req.write(payload);
+        req.end();
     });
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "n8n-nodes-tts-bigboss",
-  "version": "1.0.6",
+  "version": "1.0.8",
   "description": "BigBoss TTS node with multi-engine support and automatic SRT generation",
   "keywords": [
     "n8n-community-node-package",