npm - speechflow - Versions diffs - 2.2.0 → 2.3.0 - Mend

speechflow 2.2.0 → 2.3.0

This diff shows the differences between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions exactly as they appear in their respective public registries.

Files changed (238)

package/speechflow-cli/src/speechflow-node-t2a-openai.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -106,9 +106,13 @@ export default class SpeechFlowNodeT2AOpenAI extends SpeechFlowNode {
                 else if (chunk.payload === "")
                     callback()
                 else {
+                    let callbackCalled = false
                     let processTimeout: ReturnType<typeof setTimeout> | null = setTimeout(() => {
                         processTimeout = null
-                        callback(new Error("OpenAI TTS API timeout"))
+                        if (!callbackCalled) {
+                            callbackCalled = true
+                            callback(new Error("OpenAI TTS API timeout"))
+                        }
                     }, 60 * 1000)
                     const clearProcessTimeout = () => {
                         if (processTimeout !== null) {
@@ -119,12 +123,16 @@ export default class SpeechFlowNodeT2AOpenAI extends SpeechFlowNode {
                     try {
                         if (self.closing) {
                             clearProcessTimeout()
+                            callbackCalled = true
                             callback(new Error("stream destroyed during processing"))
                             return
                         }
                         const buffer = await textToSpeech(chunk.payload as string)
+                        clearProcessTimeout()
+                        if (callbackCalled)
+                            return
+                        callbackCalled = true
                         if (self.closing) {
-                            clearProcessTimeout()
                             callback(new Error("stream destroyed during processing"))
                             return
                         }
@@ -138,12 +146,14 @@ export default class SpeechFlowNodeT2AOpenAI extends SpeechFlowNode {
                         chunkNew.type         = "audio"
                         chunkNew.payload      = buffer
                         chunkNew.timestampEnd = Duration.fromMillis(chunkNew.timestampStart.toMillis() + durationMs)
-                        clearProcessTimeout()
                         this.push(chunkNew)
                         callback()
                     }
                     catch (error) {
                         clearProcessTimeout()
+                        if (callbackCalled)
+                            return
+                        callbackCalled = true
                         callback(util.ensureError(error, "OpenAI TTS processing failed"))
                     }
                 }
@@ -166,8 +176,10 @@ export default class SpeechFlowNodeT2AOpenAI extends SpeechFlowNode {
         }
         /*  destroy resampler  */
-        if (this.resampler !== null)
+        if (this.resampler !== null) {
+            this.resampler.destroy()
             this.resampler = null
+        }
         /*  destroy OpenAI API  */
         if (this.openai !== null)

package/speechflow-cli/src/speechflow-node-t2a-supertonic.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -138,8 +138,11 @@ export default class SpeechFlowNodeT2ASupertonic extends SpeechFlowNode {
                 throw new Error("unexpected Supertonic result: sampling_rate is not a number")
             const samples = result.audio
             const outputSampleRate = result.sampling_rate
-            if (outputSampleRate !== this.sampleRate)
-                this.log("warning", `unexpected sample rate ${outputSampleRate}Hz (expected ${this.sampleRate}Hz)`)
+            if (outputSampleRate !== this.sampleRate) {
+                this.log("warning", `unexpected sample rate change ${this.sampleRate}Hz -> ${outputSampleRate}Hz (recreating resampler)`)
+                this.sampleRate = outputSampleRate
+                this.resampler = new SpeexResampler(1, this.sampleRate, this.config.audioSampleRate, 7)
+            }
             /*  calculate duration  */
             const duration = samples.length / outputSampleRate
@@ -169,9 +172,13 @@ export default class SpeechFlowNodeT2ASupertonic extends SpeechFlowNode {
                 else if (chunk.payload === "")
                     callback()
                 else {
+                    let callbackCalled = false
                     let processTimeout: ReturnType<typeof setTimeout> | null = setTimeout(() => {
                         processTimeout = null
-                        callback(new Error("Supertonic TTS timeout"))
+                        if (!callbackCalled) {
+                            callbackCalled = true
+                            callback(new Error("Supertonic TTS timeout"))
+                        }
                     }, 120 * 1000)
                     const clearProcessTimeout = () => {
                         if (processTimeout !== null) {
@@ -180,8 +187,11 @@ export default class SpeechFlowNodeT2ASupertonic extends SpeechFlowNode {
                         }
                     }
                     text2speech(chunk.payload as string).then((buffer) => {
+                        clearProcessTimeout()
+                        if (callbackCalled)
+                            return
+                        callbackCalled = true
                         if (self.closing) {
-                            clearProcessTimeout()
                             callback(new Error("stream destroyed during processing"))
                             return
                         }
@@ -196,11 +206,13 @@ export default class SpeechFlowNodeT2ASupertonic extends SpeechFlowNode {
                         chunkNew.type         = "audio"
                         chunkNew.payload      = buffer
                         chunkNew.timestampEnd = Duration.fromMillis(chunkNew.timestampStart.toMillis() + durationMs)
-                        clearProcessTimeout()
                         this.push(chunkNew)
                         callback()
                     }).catch((error: unknown) => {
                         clearProcessTimeout()
+                        if (callbackCalled)
+                            return
+                        callbackCalled = true
                         callback(util.ensureError(error, "Supertonic processing failed"))
                     })
                 }
@@ -223,8 +235,10 @@ export default class SpeechFlowNodeT2ASupertonic extends SpeechFlowNode {
         }
         /*  destroy resampler  */
-        if (this.resampler !== null)
+        if (this.resampler !== null) {
+            this.resampler.destroy()
             this.resampler = null
+        }
         /*  destroy TTS pipeline  */
         if (this.tts !== null) {

package/speechflow-cli/src/speechflow-node-t2t-amazon.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-deepl.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-format.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-google.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -125,7 +125,9 @@ export default class SpeechFlowNodeT2TGoogle extends SpeechFlowNode {
         /*  shutdown Google Translate client  */
         if (this.client !== null) {
-            this.client.close()
+            await this.client.close().catch((error) => {
+                this.log("warning", `error closing Google Translate client: ${error}`)
+            })
             this.client = null
         }
     }

package/speechflow-cli/src/speechflow-node-t2t-modify.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-opus.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-profanity.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-punctuation.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-sentence.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-spellcheck.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-t2t-subtitle.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -112,6 +112,9 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
                 /*  produce SRT/VTT blocks  */
                 let output = convertSingle(timestampStart, timestampEnd, chunk.payload)
                 if (this.params.words) {
+                    if (words.length === 0)
+                        this.log("warning", "word-level subtitle highlighting requested but no word-level timing data available")
                     /*  produce additional SRT/VTT blocks with each word highlighted  */
                     const occurrences = new Map<string, number>()
                     for (const word of words) {
@@ -166,7 +169,7 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
         else if (this.params.mode === "import") {
             /*  parse timestamp in SRT format ("HH:MM:SS,mmm") or VTT format ("HH:MM:SS.mmm")  */
             const parseTimestamp = (ts: string): Duration => {
-                const match = ts.match(/^(\d{2}):(\d{2}):(\d{2})[,.](\d{3})$/)
+                const match = ts.match(/^(\d{2,}):(\d{2}):(\d{2})[,.](\d{3})$/)
                 if (!match)
                     throw new Error(`invalid timestamp format: "${ts}"`)
                 const hours        = Number.parseInt(match[1], 10)
@@ -202,7 +205,7 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
                     /*  parse timestamp line  */
                     const timeLine  = lines[lineIdx]
-                    const timeMatch = timeLine.match(/^(\d{2}:\d{2}:\d{2},\d{3})\s*-->\s*(\d{2}:\d{2}:\d{2},\d{3})/)
+                    const timeMatch = timeLine.match(/^(\d{2,}:\d{2}:\d{2},\d{3})\s*-->\s*(\d{2,}:\d{2}:\d{2},\d{3})/)
                     if (!timeMatch) {
                         this.log("warning", "SRT contains invalid timestamp line")
                         continue
@@ -230,8 +233,8 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
                 const blocks = content.trim().split(/\r?\n\r?\n+/)
                 for (const block of blocks) {
                     const lines = block.trim().split(/\r?\n/)
-                    if (lines.length < 1) {
-                        this.log("warning", "VTT block contains fewer than 1 line")
+                    if (lines.length < 2) {
+                        this.log("warning", "VTT block contains fewer than 2 lines")
                         continue
                     }
@@ -244,7 +247,7 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
                     /*  parse timestamp line  */
                     const timeLine  = lines[lineIdx]
-                    const timeMatch = timeLine.match(/^(\d{2}:\d{2}:\d{2}\.\d{3})\s*-->\s*(\d{2}:\d{2}:\d{2}\.\d{3})/)
+                    const timeMatch = timeLine.match(/^(\d{2,}:\d{2}:\d{2}\.\d{3})\s*-->\s*(\d{2,}:\d{2}:\d{2}\.\d{3})/)
                     if (!timeMatch) {
                         this.log("warning", "VTT contains invalid timestamp line")
                         continue
@@ -288,25 +291,42 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
                     /*  accumulate input  */
                     buffer += chunk.payload
-                    /*  parse accumulated input  */
+                    /*  find the last double-newline boundary to separate
+                        complete blocks from a potentially incomplete trailing block  */
+                    const boundary = /\r?\n\r?\n/g
+                    let lastBoundaryEnd = -1
+                    let match: RegExpExecArray | null
+                    while ((match = boundary.exec(buffer)) !== null)
+                        lastBoundaryEnd = match.index + match[0].length
+                    /*  if no complete block boundary found, wait for more data  */
+                    if (lastBoundaryEnd < 0) {
+                        callback()
+                        return
+                    }
+                    /*  split buffer into complete portion and remainder  */
+                    const complete  = buffer.substring(0, lastBoundaryEnd)
+                    const remainder = buffer.substring(lastBoundaryEnd)
+                    /*  parse only the complete portion  */
                     try {
                         /*  parse entries  */
-                        const entries = (self.params.format === "srt" ? parseSRT(buffer) : parseVTT(buffer))
+                        const entries = (self.params.format === "srt" ? parseSRT(complete) : parseVTT(complete))
                         /*  emit parsed entries as individual chunks  */
                         for (const entry of entries) {
                             const chunkNew = new SpeechFlowChunk(entry.start, entry.end, "final", "text", entry.text)
                             this.push(chunkNew)
                         }
-                        /*  clear buffer after successful parse  */
-                        buffer = ""
-                        callback()
                     }
                     catch (error: unknown) {
-                        buffer = ""
-                        callback(util.ensureError(error))
+                        self.log("warning", `subtitle parse error: ${util.ensureError(error).message}`)
                     }
+                    /*  keep only the unparsed remainder in the buffer  */
+                    buffer = remainder
+                    callback()
                 },
                 final (callback) {
                     /*  process any remaining buffer content  */
@@ -402,7 +422,11 @@ export default class SpeechFlowNodeT2TSubtitle extends SpeechFlowNode {
             const emit = (chunk: SpeechFlowChunk) => {
                 const data = JSON.stringify(chunk)
                 for (const info of wsPeers.values())
-                    info.ws.send(data)
+                    if (info.ws.readyState === WebSocket.OPEN)
+                        info.ws.send(data, (err) => {
+                            if (err)
+                                this.log("warning", `HAPI: WebSocket: subtitle send failed: ${err.message}`)
+                        })
             }
             /*  establish writable stream  */

package/speechflow-cli/src/speechflow-node-t2t-summary.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -103,7 +103,7 @@ export default class SpeechFlowNodeT2TSummary extends SpeechFlowNode {
     /*  count sentences in text  */
     private countSentences (text: string): number {
-        const matches = text.match(/[.;?!]/g)
+        const matches = text.match(/[.;?!]+(?:\s|$)/g)
         return matches ? matches.length : 0
     }
@@ -186,7 +186,7 @@ export default class SpeechFlowNodeT2TSummary extends SpeechFlowNode {
             },
             final (callback) {
                 /*  generate final summary if there is accumulated text  */
-                if (self.accumulatedText.length > 0 && self.sentencesSinceLastSummary > 0) {
+                if (self.accumulatedText.length > 0) {
                     self.sentencesSinceLastSummary = 0
                     self.log("info", "generating final summary of accumulated text")
                     const textToSummarize = self.accumulatedText

package/speechflow-cli/src/speechflow-node-t2t-translate.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-x2x-filter.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -47,6 +47,7 @@ export default class SpeechFlowNodeX2XFilter extends SpeechFlowNode {
         /*  helper function for comparing two values  */
         const comparison = (val1: any, op: string, val2: any) => {
+            val1 ??= ""
             if (op === "==" || op === "!=") {
                 /*  equal comparison  */
                 const str1 = (typeof val1 === "string" ? val1 : val1.toString())
@@ -73,8 +74,8 @@ export default class SpeechFlowNodeX2XFilter extends SpeechFlowNode {
                 /*  non-equal comparison  */
                 const coerceNum = (val: any) =>
                     typeof val === "number" ? val : (
-                        typeof val === "string" && val.match(/^[\d+-]+$/) ? Number.parseInt(val, 10) : (
-                            typeof val === "string" && val.match(/^[\d.+-]+$/) ?
+                        typeof val === "string" && val.match(/^[+-]?\d+$/) ? Number.parseInt(val, 10) : (
+                            typeof val === "string" && val.match(/^[+-]?(\d+\.?\d*|\d*\.?\d+)$/) ?
                                 Number.parseFloat(val) :
                                 Number(val)
                         )

package/speechflow-cli/src/speechflow-node-x2x-trace.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-xio-device.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -116,7 +116,8 @@ export default class SpeechFlowNodeXIODevice extends SpeechFlowNode {
         /*  convert regular stream into object-mode stream  */
         const wrapper1 = util.createTransformStreamForWritableSide("audio", 1)
-        const wrapper2 = util.createTransformStreamForReadableSide("audio", () => this.timeZero, highwaterMark)
+        const wrapper2 = util.createTransformStreamForReadableSide("audio", () => this.timeZero, highwaterMark,
+            this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
         this.stream = Stream.compose(wrapper1, this.stream, wrapper2)
     }
@@ -137,7 +138,8 @@ export default class SpeechFlowNodeXIODevice extends SpeechFlowNode {
         this.stream = this.io as unknown as Stream.Readable
         /*  convert regular stream into object-mode stream  */
-        const wrapper = util.createTransformStreamForReadableSide("audio", () => this.timeZero, highwaterMark)
+        const wrapper = util.createTransformStreamForReadableSide("audio", () => this.timeZero, highwaterMark,
+            this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
         this.stream = Stream.compose(this.stream, wrapper)
     }
@@ -207,24 +209,36 @@ export default class SpeechFlowNodeXIODevice extends SpeechFlowNode {
                 if (!error.message.match(/AudioIO Quit expects 1 argument/))
                     throw error
             }
+            const ac1 = new AbortController()
             await Promise.race([
-                util.timeout(2 * 1000, "PortAudio abort timeout"),
+                util.timeout(2 * 1000, "PortAudio abort timeout", ac1.signal),
                 new Promise<void>((resolve) => {
                     this.io!.abort(() => {
                         resolve()
                     })
                 }).catch(catchHandler)
-            ])
+            ]).finally(() => {
+                ac1.abort()
+            })
+            const ac2 = new AbortController()
             await Promise.race([
-                util.timeout(2 * 1000, "PortAudio quit timeout"),
+                util.timeout(2 * 1000, "PortAudio quit timeout", ac2.signal),
                 new Promise<void>((resolve) => {
                     this.io!.quit(() => {
                         resolve()
                     })
                 }).catch(catchHandler)
-            ])
+            ]).finally(() => {
+                ac2.abort()
+            })
             this.io = null
         }
+        /*  shutdown stream  */
+        if (this.stream !== null) {
+            await util.destroyStream(this.stream)
+            this.stream = null
+        }
     }
 }

package/speechflow-cli/src/speechflow-node-xio-exec.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -129,13 +129,15 @@ export default class SpeechFlowNodeXIOExec extends SpeechFlowNode {
             })
             const wrapper1 = util.createTransformStreamForWritableSide(this.params.type, highWaterMark)
             const wrapper2 = util.createTransformStreamForReadableSide(
-                this.params.type, () => this.timeZero, highWaterMark)
+                this.params.type, () => this.timeZero, highWaterMark,
+                this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
             this.stream = Stream.compose(wrapper1, this.stream, wrapper2)
         }
         else if (this.params.mode === "r") {
             /*  read-only mode: stdout only  */
             const wrapper = util.createTransformStreamForReadableSide(
-                this.params.type, () => this.timeZero, highWaterMark)
+                this.params.type, () => this.timeZero, highWaterMark,
+                this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
             this.stream = Stream.compose(this.subprocess.stdout!, wrapper)
         }
         else if (this.params.mode === "w") {
@@ -153,6 +155,7 @@ export default class SpeechFlowNodeXIOExec extends SpeechFlowNode {
             /*  gracefully end stdin if in write or read/write mode  */
             if ((this.params.mode === "w" || this.params.mode === "rw") && this.subprocess.stdin
                 && !this.subprocess.stdin.destroyed && !this.subprocess.stdin.writableEnded) {
+                const ac1 = new AbortController()
                 await Promise.race([
                     new Promise<void>((resolve, reject) => {
                         this.subprocess!.stdin!.end((err?: Error) => {
@@ -160,36 +163,47 @@ export default class SpeechFlowNodeXIOExec extends SpeechFlowNode {
                             else     resolve()
                         })
                     }),
-                    util.timeout(2000)
-                ]).catch((err: unknown) => {
+                    util.timeout(2000, "timeout", ac1.signal)
+                ]).finally(() => {
+                    ac1.abort()
+                }).catch((err: unknown) => {
                     const error = util.ensureError(err)
                     this.log("warning", `failed to gracefully close stdin: ${error.message}`)
                 })
             }
             /*  wait for subprocess to exit gracefully  */
+            const ac2 = new AbortController()
             await Promise.race([
                 this.subprocess,
-                util.timeout(5000, "subprocess exit timeout")
-            ]).catch(async (err: unknown) => {
+                util.timeout(5000, "subprocess exit timeout", ac2.signal)
+            ]).finally(() => {
+                ac2.abort()
+            }).catch(async (err: unknown) => {
                 /*  force kill with SIGTERM  */
                 const error = util.ensureError(err)
                 if (error.message.includes("timeout")) {
                     this.log("warning", "subprocess did not exit gracefully, forcing termination")
                     this.subprocess!.kill("SIGTERM")
+                    const ac3 = new AbortController()
                     return Promise.race([
                         this.subprocess,
-                        util.timeout(2000)
-                    ])
+                        util.timeout(2000, "timeout", ac3.signal)
+                    ]).finally(() => {
+                        ac3.abort()
+                    })
                 }
             }).catch(async () => {
                 /*  force kill with SIGKILL  */
                 this.log("warning", "subprocess did not respond to SIGTERM, forcing SIGKILL")
                 this.subprocess!.kill("SIGKILL")
+                const ac4 = new AbortController()
                 return Promise.race([
                     this.subprocess,
-                    util.timeout(1000)
-                ])
+                    util.timeout(1000, "timeout", ac4.signal)
+                ]).finally(() => {
+                    ac4.abort()
+                })
             }).catch(() => {
                 this.log("error", "subprocess did not terminate even after SIGKILL")
             })