npm - speechflow - Versions diffs - 2.2.1 → 2.3.1 - Mend

speechflow 2.2.1 → 2.3.1

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (242) hide show

package/speechflow-cli/src/speechflow-node-a2a-expander-wt.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -39,24 +39,23 @@ class ExpanderProcessor extends AudioWorkletProcessor {
         if (ratio <= 1.0)
             return 0
-        /*  determine thresholds  */
+        /*  determine knee boundaries (symmetric around threshold)  */
         const halfKnee  = kneeDB * 0.5
         const belowKnee = levelDB < (thresholdDB - halfKnee)
-        const aboveThr  = levelDB >= thresholdDB
+        const aboveKnee = levelDB > (thresholdDB + halfKnee)
-        /*  short-circuit for no expansion (above threshold)  */
-        if (aboveThr)
+        /*  short-circuit for no expansion (above knee)  */
+        if (aboveKnee)
             return 0
-        /*  apply soft-knee  */
+        /*  apply soft-knee (standard textbook quadratic)  */
         if (kneeDB > 0 && !belowKnee) {
-            const x = (levelDB - (thresholdDB - halfKnee)) / kneeDB
-            const idealGainDB = (thresholdDB + (levelDB - thresholdDB) * ratio) - levelDB
-            return idealGainDB * x * x
+            const d = thresholdDB + halfKnee - levelDB
+            return (1.0 - ratio) * d * d / (2.0 * kneeDB)
         }
         /*  determine target level  */
-        const targetOut = thresholdDB + (levelDB - thresholdDB) / ratio
+        const targetOut = thresholdDB + (levelDB - thresholdDB) * ratio
         /*  return gain difference  */
         return targetOut - levelDB
@@ -97,16 +96,17 @@ class ExpanderProcessor extends AudioWorkletProcessor {
         const releaseS    = Math.max(parameters["release"][0], 1 / this.sampleRate)
         const makeupDB    = parameters["makeup"][0]
-        /*  update envelope per channel  */
+        /*  update envelope per channel and collect RMS values  */
+        const rms = Array.from<number>({ length: nCh })
         for (let ch = 0; ch < nCh; ch++)
-            this.env[ch] = util.updateEnvelopeForChannel(this.env, this.sampleRate, ch, input[ch], attackS, releaseS)
+            rms[ch] = util.updateEnvelopeForChannel(this.env, this.sampleRate, ch, input[ch], attackS, releaseS)
         /*  determine linear value from decibel makeup value */
         const makeUpLin = util.dB2lin(makeupDB)
         /*  iterate over all channels  */
         for (let ch = 0; ch < nCh; ch++) {
-            const levelDB = util.lin2dB(this.env[ch])
+            const levelDB = util.lin2dB(rms[ch])
             const gainDB  = this.gainDBFor(levelDB, thresholdDB, ratio, kneeDB)
             let gainLin = util.dB2lin(gainDB) * makeUpLin
@@ -117,6 +117,10 @@ class ExpanderProcessor extends AudioWorkletProcessor {
                 gainLin *= util.dB2lin(neededLiftDB)
             }
+            /*  guard against IEEE 754 edge case (0 * Infinity = NaN on silence)  */
+            if (!Number.isFinite(gainLin))
+                gainLin = 0
             /*  apply gain change to channel  */
             const inp = input[ch]
             const out = output[ch]

package/speechflow-cli/src/speechflow-node-a2a-expander.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -168,7 +168,7 @@ export default class SpeechFlowNodeA2AExpander extends SpeechFlowNode {
                     callback(new Error("expander not initialized"))
                 else {
                     /*  expand chunk  */
-                    const payload = util.convertBufToI16(chunk.payload)
+                    const payload = util.convertBufToI16(chunk.payload, self.config.audioLittleEndian)
                     self.expander.process(payload).then((result) => {
                         if (self.closing) {
                             callback(new Error("stream already destroyed"))
@@ -176,9 +176,10 @@ export default class SpeechFlowNodeA2AExpander extends SpeechFlowNode {
                         }
                         /*  take over expanded data  */
-                        const payload = util.convertI16ToBuf(result)
-                        chunk.payload = payload
-                        this.push(chunk)
+                        const payload = util.convertI16ToBuf(result, self.config.audioLittleEndian)
+                        const chunkNew = chunk.clone()
+                        chunkNew.payload = payload
+                        this.push(chunkNew)
                         callback()
                     }).catch((error: unknown) => {
                         if (self.closing)

package/speechflow-cli/src/speechflow-node-a2a-ffmpeg.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -100,18 +100,13 @@ export default class SpeechFlowNodeA2AFFMPEG extends SpeechFlowNode {
         /*  wrap streams with conversions for chunk vs plain audio  */
         const wrapper1 = util.createTransformStreamForWritableSide("audio", 1)
-        const wrapper2 = util.createTransformStreamForReadableSide("audio", () => this.timeZero)
+        const wrapper2 = util.createTransformStreamForReadableSide("audio", () => this.timeZero, undefined,
+            this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
         this.stream = Stream.compose(wrapper1, ffmpegStream, wrapper2)
     }
     /*  close node  */
     async close () {
-        /*  shutdown stream  */
-        if (this.stream !== null) {
-            await util.destroyStream(this.stream)
-            this.stream = null
-        }
         /*  shutdown FFmpeg  */
         if (this.ffmpeg !== null) {
             util.run("stopping FFmpeg process",
@@ -119,6 +114,12 @@ export default class SpeechFlowNodeA2AFFMPEG extends SpeechFlowNode {
                 () => {})
             this.ffmpeg = null
         }
+        /*  shutdown stream  */
+        if (this.stream !== null) {
+            await util.destroyStream(this.stream)
+            this.stream = null
+        }
     }
 }

package/speechflow-cli/src/speechflow-node-a2a-filler.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -196,6 +196,12 @@ export default class SpeechFlowNodeA2AFiller extends SpeechFlowNode {
                     self.filler.done()
                     await util.sleep(10)
+                    /*  re-check after await (close() may have run during sleep)  */
+                    if (self.closing || self.sendQueue === null) {
+                        callback()
+                        return
+                    }
                     /*  signal end of stream  */
                     self.sendQueue.write(null)
                 }
@@ -221,10 +227,8 @@ export default class SpeechFlowNodeA2AFiller extends SpeechFlowNode {
                         self.log("info", "received EOF signal")
                         this.push(null)
                     }
-                    else if (!(chunk.payload instanceof Buffer)) {
+                    else if (!Buffer.isBuffer(chunk.payload))
                         self.log("warning", "invalid chunk (expected audio buffer)")
-                        this.push(null)
-                    }
                     else {
                         self.log("debug", `received data (${chunk.payload.byteLength} bytes)`)
                         this.push(chunk)

package/speechflow-cli/src/speechflow-node-a2a-gain.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-a2a-gender.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -105,10 +105,13 @@ export default class SpeechFlowNodeA2AGender extends SpeechFlowNode {
                 device:    "auto",
                 progress_callback: progressCallback
             })
+            const ac = new AbortController()
             this.classifier = await Promise.race([
                 pipelinePromise,
-                util.timeout(30 * 1000, "model initialization timeout")
-            ]) as Transformers.AudioClassificationPipeline
+                util.timeout(30 * 1000, "model initialization timeout", ac.signal)
+            ]).finally(() => {
+                ac.abort()
+            }) as Transformers.AudioClassificationPipeline
         }
         catch (error) {
             if (this.progressInterval) {
@@ -147,13 +150,13 @@ export default class SpeechFlowNodeA2AGender extends SpeechFlowNode {
                 return genderLast
             /*  classify audio  */
-            const result = await Promise.race([
-                this.classifier(data),
-                util.timeout(30 * 1000, "classification timeout")
-            ]) as Transformers.AudioClassificationOutput | Transformers.AudioClassificationOutput[]
-            const classified = Array.isArray(result) ?
-                result as Transformers.AudioClassificationOutput :
-                [ result ]
+            const ac = new AbortController()
+            const classified = await Promise.race([
+                this.classifier(data) as Promise<Transformers.AudioClassificationOutput>,
+                util.timeout(30 * 1000, "classification timeout", ac.signal)
+            ]).finally(() => {
+                ac.abort()
+            })
             const c1     = classified.find((c) => c.label === "male")
             const c2     = classified.find((c) => c.label === "female")
             const male   = c1 ? c1.score : 0.0
@@ -199,7 +202,7 @@ export default class SpeechFlowNodeA2AGender extends SpeechFlowNode {
                     const element = this.queueAC.peek(pos)
                     if (element === undefined || element.type !== "audio-frame")
                         break
-                    if ((samples + element.data.length) < frameWindowSamples) {
+                    if ((samples + element.data.length) <= frameWindowSamples) {
                         data.set(element.data, samples)
                         samples += element.data.length
                     }
@@ -224,12 +227,13 @@ export default class SpeechFlowNodeA2AGender extends SpeechFlowNode {
             catch (error) {
                 this.log("error", `gender classification error: ${error}`)
             }
-            /*  re-initiate working off round  */
-            workingOff = false
-            if (!this.closing) {
-                this.workingOffTimer = setTimeout(workOffQueue, 100)
-                this.queue.once("write", workOffQueue)
+            finally {
+                /*  re-initiate working off round  */
+                workingOff = false
+                if (!this.closing) {
+                    this.workingOffTimer = setTimeout(workOffQueue, 100)
+                    this.queue.once("write", workOffQueue)
+                }
             }
         }
         this.queue.once("write", workOffQueue)
@@ -313,7 +317,7 @@ export default class SpeechFlowNodeA2AGender extends SpeechFlowNode {
                             else if (element.type === "audio-frame"
                                 && element.gender === undefined)
                                 break
-                            const duration = util.audioArrayDuration(element.data)
+                            const duration = util.audioArrayDuration(element.data, sampleRateTarget)
                             const fmtTime = (t: Duration) => t.toFormat("hh:mm:ss.SSS")
                             const times = `start: ${fmtTime(element.chunk.timestampStart)}, ` +
                                 `end: ${fmtTime(element.chunk.timestampEnd)}`

package/speechflow-cli/src/speechflow-node-a2a-gtcrn-wt.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-a2a-gtcrn.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -114,17 +114,27 @@ export default class SpeechFlowNodeA2AGTCRN extends SpeechFlowNode {
             })
         })
-        /*  receive message from worker  */
-        const pending = new Map<string, (arr: Float32Array<ArrayBuffer>) => void>()
+        /*  track pending promises  */
+        const pending = new Map<string, {
+            resolve: (arr: Float32Array<ArrayBuffer>) => void,
+            reject:  (err: Error)                     => void
+        }>()
+        /*  reject all pending promises on worker exit  */
         this.worker.on("exit", () => {
+            const err = new Error("worker terminated")
+            for (const cb of pending.values())
+                cb.reject(err)
             pending.clear()
         })
+        /*  receive message from worker  */
         this.worker.on("message", (msg: any) => {
             if (typeof msg === "object" && msg !== null && msg.type === "process-done") {
                 const cb = pending.get(msg.id)
                 pending.delete(msg.id)
                 if (cb)
-                    cb(msg.data)
+                    cb.resolve(msg.data)
                 else
                     this.log("warning", `GTCRN worker thread sent back unexpected id: ${msg.id}`)
             }
@@ -140,8 +150,8 @@ export default class SpeechFlowNodeA2AGTCRN extends SpeechFlowNode {
             if (this.closing)
                 return samples
             const id = `${seq++}`
-            return new Promise<Float32Array<ArrayBuffer>>((resolve) => {
-                pending.set(id, (result) => { resolve(result) })
+            return new Promise<Float32Array<ArrayBuffer>>((resolve, reject) => {
+                pending.set(id, { resolve, reject })
                 this.worker!.postMessage({ type: "process", id, samples }, [ samples.buffer ])
             })
         }
@@ -161,24 +171,37 @@ export default class SpeechFlowNodeA2AGTCRN extends SpeechFlowNode {
                     callback(new Error("invalid chunk payload type"))
                 else {
                     /*  resample Buffer from 48KHz (SpeechFlow) to 16KHz (GTCRN)  */
-                    const resampledDown = self.resamplerDown!.processChunk(chunk.payload)
+                    if (self.resamplerDown === null) {
+                        callback(new Error("resamplerDown already destroyed"))
+                        return
+                    }
+                    const resampledDown = self.resamplerDown.processChunk(chunk.payload)
                     /*  convert Buffer into Float32Array  */
                     const payload = util.convertBufToF32(resampledDown)
                     /*  process with GTCRN  */
                     workerProcess(payload).then((result: Float32Array<ArrayBuffer>) => {
+                        /*  short-circuit if already closing  */
+                        if (self.closing) {
+                            callback()
+                            return
+                        }
                         /*  convert Float32Array into Buffer  */
                         const buf = util.convertF32ToBuf(result)
                         /*  resample Buffer from 16KHz (GTCRN) back to 48KHz (SpeechFlow)  */
-                        const resampledUp = self.resamplerUp!.processChunk(buf)
-                        /*  update chunk  */
-                        chunk.payload = resampledUp
-                        /*  forward updated chunk  */
-                        this.push(chunk)
+                        if (self.resamplerUp === null) {
+                            callback(new Error("resamplerUp already destroyed"))
+                            return
+                        }
+                        const resampledUp = self.resamplerUp.processChunk(buf)
+                        /*  forward cloned chunk with updated payload  */
+                        const chunkNew = chunk.clone()
+                        chunkNew.payload = resampledUp
+                        this.push(chunkNew)
                         callback()
                     }).catch((err: unknown) => {
                         const error = util.ensureError(err)
@@ -211,9 +234,13 @@ export default class SpeechFlowNodeA2AGTCRN extends SpeechFlowNode {
         }
         /*  destroy resamplers  */
-        if (this.resamplerDown !== null)
+        if (this.resamplerDown !== null) {
+            this.resamplerDown.destroy()
             this.resamplerDown = null
-        if (this.resamplerUp !== null)
+        }
+        if (this.resamplerUp !== null) {
+            this.resamplerUp.destroy()
             this.resamplerUp = null
+        }
     }
 }

package/speechflow-cli/src/speechflow-node-a2a-meter.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -81,7 +81,7 @@ export default class SpeechFlowNodeA2AMeter extends SpeechFlowNode {
             /*  grab the accumulated chunk data  */
             const chunkData = this.chunkBuffer
-            this.chunkBuffer = chunkData.subarray(samplesPerChunk)
+            this.chunkBuffer = chunkData.slice(samplesPerChunk)
             /*  update internal audio sample sliding window for LUFS-M  */
             if (chunkData.length > sampleWindow.length)

package/speechflow-cli/src/speechflow-node-a2a-mute.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */

package/speechflow-cli/src/speechflow-node-a2a-pitch.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -185,8 +185,9 @@ export default class SpeechFlowNodeA2APitch extends SpeechFlowNode {
                         /*  take over pitch-shifted data  */
                         const payload = util.convertI16ToBuf(result, self.config.audioLittleEndian)
-                        chunk.payload = payload
-                        this.push(chunk)
+                        const chunkNew = chunk.clone()
+                        chunkNew.payload = payload
+                        this.push(chunkNew)
                         callback()
                     }).catch((error: unknown) => {
                         if (self.closing)

package/speechflow-cli/src/speechflow-node-a2a-rnnoise-wt.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -46,7 +46,7 @@ parentPort!.on("message", (msg) => {
         /*  convert back Float32Array to Int16Array  */
         const i16 = new Int16Array(data.length)
         for (let i = 0; i < data.length; i++)
-            i16[i] = Math.round(f32a[i])
+            i16[i] = Math.max(-32768, Math.min(32767, Math.round(f32a[i])))
         /*  send processed frame back to parent  */
         parentPort!.postMessage({ type: "process-done", id, data: i16 }, [ i16.buffer ])

package/speechflow-cli/src/speechflow-node-a2a-rnnoise.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -71,14 +71,27 @@ export default class SpeechFlowNodeA2ARNNoise extends SpeechFlowNode {
             })
         })
+        /*  track pending promises  */
+        const pending = new Map<string, {
+            resolve: (arr: Int16Array<ArrayBuffer>) => void,
+            reject:  (err: Error)                   => void
+        }>()
+        /*  reject all pending promises on worker exit  */
+        this.worker.on("exit", () => {
+            const err = new Error("worker terminated")
+            for (const cb of pending.values())
+                cb.reject(err)
+            pending.clear()
+        })
         /*  receive message from worker  */
-        const pending = new Map<string, (arr: Int16Array<ArrayBuffer>) => void>()
         this.worker.on("message", (msg: any) => {
             if (typeof msg === "object" && msg !== null && msg.type === "process-done") {
                 const cb = pending.get(msg.id)
                 pending.delete(msg.id)
                 if (cb)
-                    cb(msg.data)
+                    cb.resolve(msg.data)
                 else
                     this.log("warning", `RNNoise worker thread sent back unexpected id: ${msg.id}`)
             }
@@ -92,8 +105,8 @@ export default class SpeechFlowNodeA2ARNNoise extends SpeechFlowNode {
             if (this.closing)
                 return segment
             const id = `${seq++}`
-            return new Promise<Int16Array<ArrayBuffer>>((resolve) => {
-                pending.set(id, (segment) => { resolve(segment) })
+            return new Promise<Int16Array<ArrayBuffer>>((resolve, reject) => {
+                pending.set(id, { resolve, reject })
                 this.worker!.postMessage({ type: "process", id, data: segment }, [ segment.buffer ])
             })
         }
@@ -113,20 +126,19 @@ export default class SpeechFlowNodeA2ARNNoise extends SpeechFlowNode {
                     callback(new Error("invalid chunk payload type"))
                 else {
                     /*  convert Buffer into Int16Array  */
-                    const payload = util.convertBufToI16(chunk.payload)
+                    const payload = util.convertBufToI16(chunk.payload, self.config.audioLittleEndian)
                     /*  process Int16Array in necessary segments  */
                     util.processInt16ArrayInSegments(payload, self.sampleSize, (segment) =>
                         workerProcessSegment(segment)
                     ).then((payload: Int16Array<ArrayBuffer>) => {
                         /*  convert Int16Array into Buffer  */
-                        const buf = util.convertI16ToBuf(payload)
-                        /*  update chunk  */
-                        chunk.payload = buf
+                        const buf = util.convertI16ToBuf(payload, self.config.audioLittleEndian)
-                        /*  forward updated chunk  */
-                        this.push(chunk)
+                        /*  forward cloned chunk with updated payload  */
+                        const chunkNew = chunk.clone()
+                        chunkNew.payload = buf
+                        this.push(chunkNew)
                         callback()
                     }).catch((err: unknown) => {
                         const error = util.ensureError(err)

package/speechflow-cli/src/speechflow-node-a2a-speex.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -53,7 +53,9 @@ export default class SpeechFlowNodeA2ASpeex extends SpeechFlowNode {
         const wasmBinary = await fs.promises.readFile(
             path.join(__dirname, "../node_modules/@sapphi-red/speex-preprocess-wasm/dist/speex.wasm"))
         const speexModule = await loadSpeexModule({
-            wasmBinary: wasmBinary.buffer
+            wasmBinary: wasmBinary.buffer.slice(
+                wasmBinary.byteOffset,
+                wasmBinary.byteOffset + wasmBinary.byteLength)
         })
         this.speexProcessor = new SpeexPreprocessor(
             speexModule, this.sampleSize, this.config.audioSampleRate)
@@ -79,7 +81,7 @@ export default class SpeechFlowNodeA2ASpeex extends SpeechFlowNode {
                     callback(new Error("invalid chunk payload type"))
                 else {
                     /*  convert Buffer into Int16Array  */
-                    const payload = util.convertBufToI16(chunk.payload)
+                    const payload = util.convertBufToI16(chunk.payload, self.config.audioLittleEndian)
                     /*  process Int16Array in necessary fixed-size segments  */
                     util.processInt16ArrayInSegments(payload, self.sampleSize, (segment) => {
@@ -94,13 +96,12 @@ export default class SpeechFlowNodeA2ASpeex extends SpeechFlowNode {
                             throw new Error("stream already destroyed")
                         /*  convert Int16Array back into Buffer  */
-                        const buf = util.convertI16ToBuf(payload)
+                        const buf = util.convertI16ToBuf(payload, self.config.audioLittleEndian)
-                        /*  update chunk  */
-                        chunk.payload = buf
-                        /*  forward updated chunk  */
-                        this.push(chunk)
+                        /*  forward cloned chunk with updated payload  */
+                        const chunkNew = chunk.clone()
+                        chunkNew.payload = buf
+                        this.push(chunkNew)
                         callback()
                     }).catch((err: unknown) => {
                         const error = util.ensureError(err)