speechflow 1.3.1 → 1.4.0
This diff represents the content of publicly available package versions as released to their respective public registries, and is provided for informational purposes only.
- package/CHANGELOG.md +23 -0
- package/etc/stx.conf +54 -58
- package/package.json +25 -106
- package/{etc → speechflow-cli/etc}/eslint.mjs +1 -2
- package/speechflow-cli/etc/stx.conf +77 -0
- package/speechflow-cli/package.json +116 -0
- package/{src → speechflow-cli/src}/speechflow-node-a2a-gender.ts +148 -64
- package/speechflow-cli/src/speechflow-node-a2a-meter.ts +217 -0
- package/{src → speechflow-cli/src}/speechflow-node-a2a-mute.ts +39 -11
- package/speechflow-cli/src/speechflow-node-a2a-vad.ts +384 -0
- package/{src → speechflow-cli/src}/speechflow-node-a2a-wav.ts +27 -11
- package/speechflow-cli/src/speechflow-node-a2t-deepgram.ts +313 -0
- package/{src → speechflow-cli/src}/speechflow-node-t2a-elevenlabs.ts +59 -12
- package/{src → speechflow-cli/src}/speechflow-node-t2a-kokoro.ts +11 -4
- package/{src → speechflow-cli/src}/speechflow-node-t2t-deepl.ts +9 -4
- package/{src → speechflow-cli/src}/speechflow-node-t2t-format.ts +2 -2
- package/{src → speechflow-cli/src}/speechflow-node-t2t-ollama.ts +1 -1
- package/{src → speechflow-cli/src}/speechflow-node-t2t-openai.ts +1 -1
- package/{src → speechflow-cli/src}/speechflow-node-t2t-sentence.ts +37 -20
- package/speechflow-cli/src/speechflow-node-t2t-subtitle.ts +276 -0
- package/{src → speechflow-cli/src}/speechflow-node-t2t-transformers.ts +4 -3
- package/{src → speechflow-cli/src}/speechflow-node-x2x-filter.ts +9 -5
- package/{src → speechflow-cli/src}/speechflow-node-x2x-trace.ts +16 -8
- package/{src → speechflow-cli/src}/speechflow-node-xio-device.ts +12 -8
- package/{src → speechflow-cli/src}/speechflow-node-xio-file.ts +9 -3
- package/{src → speechflow-cli/src}/speechflow-node-xio-mqtt.ts +5 -2
- package/{src → speechflow-cli/src}/speechflow-node-xio-websocket.ts +12 -12
- package/{src → speechflow-cli/src}/speechflow-node.ts +7 -0
- package/{src → speechflow-cli/src}/speechflow-utils.ts +78 -44
- package/{src → speechflow-cli/src}/speechflow.ts +188 -53
- package/speechflow-ui-db/etc/eslint.mjs +106 -0
- package/speechflow-ui-db/etc/htmllint.json +55 -0
- package/speechflow-ui-db/etc/stx.conf +79 -0
- package/speechflow-ui-db/etc/stylelint.js +46 -0
- package/speechflow-ui-db/etc/stylelint.yaml +33 -0
- package/speechflow-ui-db/etc/tsc-client.json +30 -0
- package/speechflow-ui-db/etc/tsc.node.json +9 -0
- package/speechflow-ui-db/etc/vite-client.mts +63 -0
- package/speechflow-ui-db/package.d/htmllint-cli+0.0.7.patch +20 -0
- package/speechflow-ui-db/package.json +75 -0
- package/speechflow-ui-db/src/app-icon.ai +1989 -4
- package/speechflow-ui-db/src/app-icon.svg +26 -0
- package/speechflow-ui-db/src/app.styl +64 -0
- package/speechflow-ui-db/src/app.vue +221 -0
- package/speechflow-ui-db/src/index.html +23 -0
- package/speechflow-ui-db/src/index.ts +26 -0
- package/{dst/speechflow.d.ts → speechflow-ui-db/src/lib.d.ts} +5 -3
- package/speechflow-ui-db/src/tsconfig.json +3 -0
- package/speechflow-ui-st/etc/eslint.mjs +106 -0
- package/speechflow-ui-st/etc/htmllint.json +55 -0
- package/speechflow-ui-st/etc/stx.conf +79 -0
- package/speechflow-ui-st/etc/stylelint.js +46 -0
- package/speechflow-ui-st/etc/stylelint.yaml +33 -0
- package/speechflow-ui-st/etc/tsc-client.json +30 -0
- package/speechflow-ui-st/etc/tsc.node.json +9 -0
- package/speechflow-ui-st/etc/vite-client.mts +63 -0
- package/speechflow-ui-st/package.d/htmllint-cli+0.0.7.patch +20 -0
- package/speechflow-ui-st/package.json +79 -0
- package/speechflow-ui-st/src/app-icon.ai +1989 -4
- package/speechflow-ui-st/src/app-icon.svg +26 -0
- package/speechflow-ui-st/src/app.styl +64 -0
- package/speechflow-ui-st/src/app.vue +142 -0
- package/speechflow-ui-st/src/index.html +23 -0
- package/speechflow-ui-st/src/index.ts +26 -0
- package/speechflow-ui-st/src/lib.d.ts +9 -0
- package/speechflow-ui-st/src/tsconfig.json +3 -0
- package/dst/speechflow-node-a2a-ffmpeg.d.ts +0 -13
- package/dst/speechflow-node-a2a-ffmpeg.js +0 -153
- package/dst/speechflow-node-a2a-ffmpeg.js.map +0 -1
- package/dst/speechflow-node-a2a-gender.d.ts +0 -18
- package/dst/speechflow-node-a2a-gender.js +0 -271
- package/dst/speechflow-node-a2a-gender.js.map +0 -1
- package/dst/speechflow-node-a2a-meter.d.ts +0 -12
- package/dst/speechflow-node-a2a-meter.js +0 -155
- package/dst/speechflow-node-a2a-meter.js.map +0 -1
- package/dst/speechflow-node-a2a-mute.d.ts +0 -16
- package/dst/speechflow-node-a2a-mute.js +0 -91
- package/dst/speechflow-node-a2a-mute.js.map +0 -1
- package/dst/speechflow-node-a2a-vad.d.ts +0 -16
- package/dst/speechflow-node-a2a-vad.js +0 -285
- package/dst/speechflow-node-a2a-vad.js.map +0 -1
- package/dst/speechflow-node-a2a-wav.d.ts +0 -11
- package/dst/speechflow-node-a2a-wav.js +0 -195
- package/dst/speechflow-node-a2a-wav.js.map +0 -1
- package/dst/speechflow-node-a2t-deepgram.d.ts +0 -15
- package/dst/speechflow-node-a2t-deepgram.js +0 -255
- package/dst/speechflow-node-a2t-deepgram.js.map +0 -1
- package/dst/speechflow-node-t2a-elevenlabs.d.ts +0 -16
- package/dst/speechflow-node-t2a-elevenlabs.js +0 -195
- package/dst/speechflow-node-t2a-elevenlabs.js.map +0 -1
- package/dst/speechflow-node-t2a-kokoro.d.ts +0 -13
- package/dst/speechflow-node-t2a-kokoro.js +0 -149
- package/dst/speechflow-node-t2a-kokoro.js.map +0 -1
- package/dst/speechflow-node-t2t-deepl.d.ts +0 -15
- package/dst/speechflow-node-t2t-deepl.js +0 -142
- package/dst/speechflow-node-t2t-deepl.js.map +0 -1
- package/dst/speechflow-node-t2t-format.d.ts +0 -11
- package/dst/speechflow-node-t2t-format.js +0 -82
- package/dst/speechflow-node-t2t-format.js.map +0 -1
- package/dst/speechflow-node-t2t-ollama.d.ts +0 -13
- package/dst/speechflow-node-t2t-ollama.js +0 -247
- package/dst/speechflow-node-t2t-ollama.js.map +0 -1
- package/dst/speechflow-node-t2t-openai.d.ts +0 -13
- package/dst/speechflow-node-t2t-openai.js +0 -227
- package/dst/speechflow-node-t2t-openai.js.map +0 -1
- package/dst/speechflow-node-t2t-sentence.d.ts +0 -17
- package/dst/speechflow-node-t2t-sentence.js +0 -234
- package/dst/speechflow-node-t2t-sentence.js.map +0 -1
- package/dst/speechflow-node-t2t-subtitle.d.ts +0 -13
- package/dst/speechflow-node-t2t-subtitle.js +0 -278
- package/dst/speechflow-node-t2t-subtitle.js.map +0 -1
- package/dst/speechflow-node-t2t-transformers.d.ts +0 -14
- package/dst/speechflow-node-t2t-transformers.js +0 -265
- package/dst/speechflow-node-t2t-transformers.js.map +0 -1
- package/dst/speechflow-node-x2x-filter.d.ts +0 -11
- package/dst/speechflow-node-x2x-filter.js +0 -117
- package/dst/speechflow-node-x2x-filter.js.map +0 -1
- package/dst/speechflow-node-x2x-trace.d.ts +0 -11
- package/dst/speechflow-node-x2x-trace.js +0 -111
- package/dst/speechflow-node-x2x-trace.js.map +0 -1
- package/dst/speechflow-node-xio-device.d.ts +0 -13
- package/dst/speechflow-node-xio-device.js +0 -226
- package/dst/speechflow-node-xio-device.js.map +0 -1
- package/dst/speechflow-node-xio-file.d.ts +0 -11
- package/dst/speechflow-node-xio-file.js +0 -210
- package/dst/speechflow-node-xio-file.js.map +0 -1
- package/dst/speechflow-node-xio-mqtt.d.ts +0 -13
- package/dst/speechflow-node-xio-mqtt.js +0 -185
- package/dst/speechflow-node-xio-mqtt.js.map +0 -1
- package/dst/speechflow-node-xio-websocket.d.ts +0 -13
- package/dst/speechflow-node-xio-websocket.js +0 -278
- package/dst/speechflow-node-xio-websocket.js.map +0 -1
- package/dst/speechflow-node.d.ts +0 -65
- package/dst/speechflow-node.js +0 -180
- package/dst/speechflow-node.js.map +0 -1
- package/dst/speechflow-utils.d.ts +0 -69
- package/dst/speechflow-utils.js +0 -486
- package/dst/speechflow-utils.js.map +0 -1
- package/dst/speechflow.js +0 -768
- package/dst/speechflow.js.map +0 -1
- package/src/speechflow-node-a2a-meter.ts +0 -130
- package/src/speechflow-node-a2a-vad.ts +0 -285
- package/src/speechflow-node-a2t-deepgram.ts +0 -234
- package/src/speechflow-node-t2t-subtitle.ts +0 -149
- /package/{etc → speechflow-cli/etc}/biome.jsonc +0 -0
- /package/{etc → speechflow-cli/etc}/oxlint.jsonc +0 -0
- /package/{etc → speechflow-cli/etc}/speechflow.bat +0 -0
- /package/{etc → speechflow-cli/etc}/speechflow.sh +0 -0
- /package/{etc → speechflow-cli/etc}/speechflow.yaml +0 -0
- /package/{etc → speechflow-cli/etc}/tsconfig.json +0 -0
- /package/{package.d → speechflow-cli/package.d}/@ericedouard+vad-node-realtime+0.2.0.patch +0 -0
- /package/{src → speechflow-cli/src}/lib.d.ts +0 -0
- /package/{src → speechflow-cli/src}/speechflow-logo.ai +0 -0
- /package/{src → speechflow-cli/src}/speechflow-logo.svg +0 -0
- /package/{src → speechflow-cli/src}/speechflow-node-a2a-ffmpeg.ts +0 -0
- /package/{tsconfig.json → speechflow-cli/tsconfig.json} +0 -0
package/speechflow-cli/src/speechflow-node-a2a-vad.ts (new file)

@@ -0,0 +1,384 @@
+/*
+** SpeechFlow - Speech Processing Flow Graph
+** Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+** Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+
+/* standard dependencies */
+import Stream from "node:stream"
+
+/* external dependencies */
+import { RealTimeVAD } from "@ericedouard/vad-node-realtime"
+
+/* internal dependencies */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+import * as utils from "./speechflow-utils"
+
+/* audio stream queue element */
+type AudioQueueElementSegment = {
+    data: Float32Array,
+    isSpeech?: boolean
+}
+type AudioQueueElement = {
+    type: "audio-frame",
+    chunk: SpeechFlowChunk,
+    segmentIdx: number,
+    segmentData: AudioQueueElementSegment[],
+    isSpeech?: boolean
+} | {
+    type: "audio-eof"
+}
+
+/* SpeechFlow node for VAD speech-to-speech processing */
+export default class SpeechFlowNodeVAD extends SpeechFlowNode {
+    /* declare official node name */
+    public static name = "vad"
+
+    /* internal state */
+    private vad: RealTimeVAD | null = null
+    private queue = new utils.Queue<AudioQueueElement>()
+    private queueRecv = this.queue.pointerUse("recv")
+    private queueVAD = this.queue.pointerUse("vad")
+    private queueSend = this.queue.pointerUse("send")
+    private destroyed = false
+    private tailTimer: ReturnType<typeof setTimeout> | null = null
+    private activeEventListeners = new Set<() => void>()
+
+    /* construct node */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+
+        /* declare node configuration parameters */
+        this.configure({
+            mode: { type: "string", val: "silenced", match: /^(?:silenced|unplugged)$/ },
+            posSpeechThreshold: { type: "number", val: 0.50 },
+            negSpeechThreshold: { type: "number", val: 0.35 },
+            minSpeechFrames: { type: "number", val: 2 },
+            redemptionFrames: { type: "number", val: 12 },
+            preSpeechPadFrames: { type: "number", val: 1 },
+            postSpeechTail: { type: "number", val: 1500 }
+        })
+
+        /* declare node input/output format */
+        this.input = "audio"
+        this.output = "audio"
+    }
+
+    /* open node */
+    async open () {
+        /* sanity check situation */
+        if (this.config.audioBitDepth !== 16 || !this.config.audioLittleEndian)
+            throw new Error("VAD node currently supports PCM-S16LE audio only")
+
+        /* clear destruction flag */
+        this.destroyed = false
+
+        /* internal processing constants */
+        const vadSampleRateTarget = 16000 /* internal target of VAD */
+        const vadSamplesPerFrame = 512 /* required for VAD v5 */
+
+        /* helper function for timer cleanup */
+        const clearTailTimer = () => {
+            if (this.tailTimer !== null) {
+                clearTimeout(this.tailTimer)
+                this.tailTimer = null
+            }
+        }
+
+        /* establish Voice Activity Detection (VAD) facility */
+        let tail = false
+        try {
+            this.vad = await RealTimeVAD.new({
+                model: "v5",
+                sampleRate: this.config.audioSampleRate, /* before resampling to 16KHz */
+                frameSamples: vadSamplesPerFrame, /* after resampling to 16KHz */
+                positiveSpeechThreshold: this.params.posSpeechThreshold,
+                negativeSpeechThreshold: this.params.negSpeechThreshold,
+                minSpeechFrames: this.params.minSpeechFrames,
+                redemptionFrames: this.params.redemptionFrames,
+                preSpeechPadFrames: this.params.preSpeechPadFrames,
+                onSpeechStart: () => {
+                    if (this.destroyed)
+                        return
+                    this.log("info", "VAD: speech start")
+                    if (this.params.mode === "unplugged") {
+                        tail = false
+                        clearTailTimer()
+                    }
+                },
+                onSpeechEnd: (audio) => {
+                    if (this.destroyed)
+                        return
+                    const duration = utils.audioArrayDuration(audio, vadSampleRateTarget)
+                    this.log("info", `VAD: speech end (duration: ${duration.toFixed(2)}s)`)
+                    if (this.params.mode === "unplugged") {
+                        tail = true
+                        clearTailTimer()
+                        this.tailTimer = setTimeout(() => {
+                            if (this.destroyed || this.tailTimer === null)
+                                return
+                            tail = false
+                            this.tailTimer = null
+                        }, this.params.postSpeechTail)
+                    }
+                },
+                onVADMisfire: () => {
+                    if (this.destroyed)
+                        return
+                    this.log("info", "VAD: speech end (segment too short)")
+                    if (this.params.mode === "unplugged") {
+                        tail = true
+                        clearTailTimer()
+                        this.tailTimer = setTimeout(() => {
+                            if (this.destroyed || this.tailTimer === null)
+                                return
+                            tail = false
+                            this.tailTimer = null
+                        }, this.params.postSpeechTail)
+                    }
+                },
+                onFrameProcessed: (audio) => {
+                    if (this.destroyed)
+                        return
+                    try {
+                        /* annotate the current audio segment */
+                        const element = this.queueVAD.peek()
+                        if (element === undefined || element.type !== "audio-frame")
+                            throw new Error("internal error which cannot happen: no more queued element")
+                        if (element.segmentIdx >= element.segmentData.length)
+                            throw new Error("segment index out of bounds")
+                        const segment = element.segmentData[element.segmentIdx++]
+                        segment.isSpeech = (audio.isSpeech > audio.notSpeech) || tail
+
+                        /* annotate the entire audio chunk */
+                        if (element.segmentIdx >= element.segmentData.length) {
+                            element.isSpeech = element.segmentData.some(segment => segment.isSpeech)
+                            this.queueVAD.touch()
+                            this.queueVAD.walk(+1)
+                        }
+                    }
+                    catch (error) {
+                        this.log("error", `VAD frame processing error: ${error}`)
+                    }
+                }
+            })
+            this.vad.start()
+        }
+        catch (error) {
+            throw new Error(`failed to initialize VAD: ${error}`)
+        }
+
+        /* provide Duplex stream and internally attach to VAD */
+        const self = this
+        this.stream = new Stream.Duplex({
+            writableObjectMode: true,
+            readableObjectMode: true,
+            decodeStrings: false,
+            highWaterMark: 1,
+
+            /* receive audio chunk (writable side of stream) */
+            write (chunk: SpeechFlowChunk, encoding, callback) {
+                if (self.destroyed) {
+                    callback(new Error("stream already destroyed"))
+                    return
+                }
+                if (!Buffer.isBuffer(chunk.payload))
+                    callback(new Error("expected audio input as Buffer chunks"))
+                else if (chunk.payload.byteLength === 0)
+                    callback()
+                else {
+                    try {
+                        /* convert audio samples from PCM/I16 to PCM/F32 */
+                        const data = utils.convertBufToF32(chunk.payload,
+                            self.config.audioLittleEndian)
+
+                        /* segment audio samples as individual VAD-sized frames */
+                        const segmentData: AudioQueueElementSegment[] = []
+                        const chunkSize = vadSamplesPerFrame *
+                            (self.config.audioSampleRate / vadSampleRateTarget)
+                        const chunks = Math.trunc(data.length / chunkSize)
+                        for (let i = 0; i < chunks; i++) {
+                            const frame = data.slice(i * chunkSize, (i + 1) * chunkSize)
+                            const segment: AudioQueueElementSegment = { data: frame }
+                            segmentData.push(segment)
+                        }
+                        if ((chunks * chunkSize) < data.length) {
+                            const frame = new Float32Array(chunkSize)
+                            frame.fill(0)
+                            frame.set(data.slice(chunks * chunkSize, data.length))
+                            const segment: AudioQueueElementSegment = { data: frame }
+                            segmentData.push(segment)
+                        }
+
+                        /* queue the results */
+                        self.queueRecv.append({
+                            type: "audio-frame", chunk,
+                            segmentIdx: 0, segmentData
+                        })
+
+                        /* push segments through Voice Activity Detection (VAD) */
+                        if (self.vad && !self.destroyed) {
+                            try {
+                                for (const segment of segmentData)
+                                    self.vad.processAudio(segment.data)
+                            }
+                            catch (error) {
+                                self.log("error", `VAD processAudio error: ${error}`)
+                            }
+                        }
+
+                        callback()
+                    }
+                    catch (error) {
+                        callback(error instanceof Error ? error : new Error("VAD processing failed"))
+                    }
+                }
+            },
+
+            /* receive no more audio chunks (writable side of stream) */
+            final (callback) {
+                if (self.destroyed) {
+                    callback()
+                    return
+                }
+
+                /* signal end of file */
+                self.queueRecv.append({ type: "audio-eof" })
+                callback()
+            },
+
+            /* send audio chunk(s) (readable side of stream) */
+            read (_size) {
+                if (self.destroyed) {
+                    this.push(null)
+                    return
+                }
+
+                /* try to perform read operation from scratch */
+                const tryToRead = () => {
+                    if (self.destroyed) {
+                        this.push(null)
+                        return
+                    }
+
+                    /* flush pending audio chunks */
+                    const flushPendingChunks = () => {
+                        let pushed = 0
+                        while (true) {
+                            if (self.destroyed) {
+                                this.push(null)
+                                return
+                            }
+                            const element = self.queueSend.peek()
+                            if (element === undefined)
+                                break
+                            else if (element.type === "audio-eof") {
+                                this.push(null)
+                                break
+                            }
+                            else if (element.type === "audio-frame"
+                                && element.isSpeech === undefined)
+                                break
+                            self.queueSend.walk(+1)
+                            self.queue.trim()
+                            if (element.isSpeech) {
+                                this.push(element.chunk)
+                                pushed++
+                            }
+                            else if (self.params.mode === "silenced") {
+                                const chunk = element.chunk.clone()
+                                const buffer = chunk.payload as Buffer
+                                buffer.fill(0)
+                                this.push(chunk)
+                                pushed++
+                            }
+                            else if (self.params.mode === "unplugged" && pushed === 0) {
+                                /* we have to await chunks now, as in unplugged
+                                   mode we would otherwise never be called again
+                                   until we push at least one new chunk as the result */
+                                setTimeout(() => {
+                                    if (self.destroyed)
+                                        return
+                                    tryToRead()
+                                }, 0)
+                                return
+                            }
+                        }
+                    }
+
+                    /* await forthcoming audio chunks */
+                    const awaitForthcomingChunks = () => {
+                        if (self.destroyed)
+                            return
+                        const element = self.queueSend.peek()
+                        if (element !== undefined
+                            && element.type === "audio-frame"
+                            && element.isSpeech !== undefined)
+                            flushPendingChunks()
+                        else if (!self.destroyed) {
+                            self.queue.once("write", awaitForthcomingChunks)
+                            self.activeEventListeners.add(awaitForthcomingChunks)
+                        }
+                    }
+
+                    const element = self.queueSend.peek()
+                    if (element !== undefined && element.type === "audio-eof")
+                        this.push(null)
+                    else if (element !== undefined
+                        && element.type === "audio-frame"
+                        && element.isSpeech !== undefined)
+                        flushPendingChunks()
+                    else if (!self.destroyed) {
+                        self.queue.once("write", awaitForthcomingChunks)
+                        self.activeEventListeners.add(awaitForthcomingChunks)
+                    }
+                }
+                tryToRead()
+            }
+        })
+    }
+
+    /* close node */
+    async close () {
+        /* indicate destruction */
+        this.destroyed = true
+
+        /* cleanup tail timer */
+        if (this.tailTimer !== null) {
+            clearTimeout(this.tailTimer)
+            this.tailTimer = null
+        }
+
+        /* remove all event listeners */
+        this.activeEventListeners.forEach((listener) => {
+            this.queue.removeListener("write", listener)
+        })
+        this.activeEventListeners.clear()
+
+        /* close stream */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+
+        /* cleanup queue pointers before closing VAD to prevent callback access */
+        this.queue.pointerDelete("recv")
+        this.queue.pointerDelete("vad")
+        this.queue.pointerDelete("send")
+
+        /* close VAD */
+        if (this.vad !== null) {
+            try {
+                const flushPromise = this.vad.flush()
+                const timeoutPromise = new Promise((resolve) =>
+                    setTimeout(resolve, 5000))
+                await Promise.race([ flushPromise, timeoutPromise ])
+            }
+            catch (error) {
+                this.log("warning", `VAD flush error during close: ${error}`)
+            }
+            this.vad.destroy()
+            this.vad = null
+        }
+    }
+}
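The new VAD node decouples its three concerns through one shared queue with three named pointers: `recv` appends incoming frames, `vad` walks behind it annotating each frame with a speech flag from the asynchronous VAD callbacks, and `send` drains fully annotated frames to the readable side (at a 48 kHz input, each VAD frame covers 512 × 48000/16000 = 1536 samples). The following is a minimal sketch of the multi-pointer queue contract this code assumes of `utils.Queue`; the names and all implementation details here are illustrative, not the actual speechflow-utils.ts implementation:

/* Illustrative sketch only: the multi-pointer queue semantics assumed
   by the VAD node above. The real utils.Queue in speechflow-utils.ts
   may differ in detail. */
import { EventEmitter } from "node:events"

class QueuePointer<T> {
    constructor (private queue: MultiPointerQueue<T>, public pos = 0) {}
    peek () { return this.queue.at(this.pos) }          /* read without consuming */
    walk (delta: number) { this.pos += delta }          /* move this cursor only */
    touch () { this.queue.emit("write") }               /* signal an in-place mutation */
    append (element: T) { this.queue.push(element) }    /* enqueue at the tail */
}

class MultiPointerQueue<T> extends EventEmitter {
    private elements: T[] = []
    private pointers = new Map<string, QueuePointer<T>>()
    pointerUse (name: string) {
        let pointer = this.pointers.get(name)
        if (pointer === undefined) {
            pointer = new QueuePointer(this)
            this.pointers.set(name, pointer)
        }
        return pointer
    }
    pointerDelete (name: string) { this.pointers.delete(name) }
    at (pos: number): T | undefined { return this.elements[pos] }
    push (element: T) {
        this.elements.push(element)
        this.emit("write")  /* wakes readers registered via queue.once("write", ...) */
    }
    trim () {
        /* drop elements every pointer has already walked past */
        const min = Math.min(...[ ...this.pointers.values() ].map((p) => p.pos))
        if (Number.isFinite(min) && min > 0) {
            this.elements.splice(0, min)
            for (const pointer of this.pointers.values())
                pointer.pos -= min
        }
    }
}

Under such a contract, `queue.trim()` keeps memory bounded to the window between the fastest and slowest pointer, which is why the read side calls it right after walking `send` forward.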
package/{src → speechflow-cli/src}/speechflow-node-a2a-wav.ts

@@ -103,8 +103,10 @@ export default class SpeechFlowNodeWAV extends SpeechFlowNode
             decodeStrings: false,
             highWaterMark: 1,
             transform (chunk: SpeechFlowChunk, encoding, callback) {
-                if (!Buffer.isBuffer(chunk.payload))
+                if (!Buffer.isBuffer(chunk.payload)) {
                     callback(new Error("invalid chunk payload type"))
+                    return
+                }
                 else if (firstChunk) {
                     if (self.params.mode === "encode") {
                         /* convert raw/PCM to WAV/PCM

@@ -127,6 +129,10 @@ export default class SpeechFlowNodeWAV extends SpeechFlowNode
                     }
                     else if (self.params.mode === "decode") {
                         /* convert WAV/PCM to raw/PCM */
+                        if (chunk.payload.length < 44) {
+                            callback(new Error("WAV header too short, expected at least 44 bytes"))
+                            return
+                        }
                         const header = readWavHeader(chunk.payload)
                         self.log("info", "WAV audio stream: " +
                             `audioFormat=${header.audioFormat === 0x0001 ? "PCM" :

@@ -134,20 +140,30 @@ export default class SpeechFlowNodeWAV extends SpeechFlowNode
                             `channels=${header.channels} ` +
                             `sampleRate=${header.sampleRate} ` +
                             `bitDepth=${header.bitDepth}`)
-                        if (header.audioFormat !== 0x0001 /* PCM */)
-                            callback(new Error("WAV not based on PCM format"))
-                        if (header.bitDepth !== self.config.audioBitDepth)
-                            callback(new Error(`WAV not based on ${self.config.audioBitDepth} bit samples`))
-                        if (header.sampleRate !== self.config.audioSampleRate)
-                            callback(new Error(`WAV not based on ${self.config.audioSampleRate}Hz sample rate`))
-                        if (header.channels !== self.config.audioChannels)
-                            callback(new Error(`WAV not based on ${self.config.audioChannels} channel(s)`))
+                        if (header.audioFormat !== 0x0001 /* PCM */) {
+                            callback(new Error("WAV not based on PCM format"))
+                            return
+                        }
+                        if (header.bitDepth !== self.config.audioBitDepth) {
+                            callback(new Error(`WAV not based on ${self.config.audioBitDepth} bit samples`))
+                            return
+                        }
+                        if (header.sampleRate !== self.config.audioSampleRate) {
+                            callback(new Error(`WAV not based on ${self.config.audioSampleRate}Hz sample rate`))
+                            return
+                        }
+                        if (header.channels !== self.config.audioChannels) {
+                            callback(new Error(`WAV not based on ${self.config.audioChannels} channel(s)`))
+                            return
+                        }
                         chunk.payload = chunk.payload.subarray(44)
                         this.push(chunk)
                         callback()
                     }
-                    else
-                        callback(new Error(`invalid operation mode "${self.params.mode}"`))
+                    else {
+                        callback(new Error(`invalid operation mode "${self.params.mode}"`))
+                        return
+                    }
                 }
                 else {
                     /* pass-through original chunk */