speechflow 1.4.4 → 1.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +37 -0
- package/README.md +273 -7
- package/etc/claude.md +70 -0
- package/etc/speechflow.png +0 -0
- package/etc/speechflow.yaml +29 -11
- package/etc/stx.conf +7 -0
- package/package.json +7 -6
- package/speechflow-cli/dst/speechflow-node-a2a-compressor-wt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-compressor-wt.js +155 -0
- package/speechflow-cli/dst/speechflow-node-a2a-compressor-wt.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-compressor.d.ts +15 -0
- package/speechflow-cli/dst/speechflow-node-a2a-compressor.js +287 -0
- package/speechflow-cli/dst/speechflow-node-a2a-compressor.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics-wt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics-wt.js +208 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics-wt.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics.d.ts +15 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics.js +312 -0
- package/speechflow-cli/dst/speechflow-node-a2a-dynamics.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander-wt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander-wt.js +161 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander-wt.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander.d.ts +13 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander.js +208 -0
- package/speechflow-cli/dst/speechflow-node-a2a-expander.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-ffmpeg.js +13 -3
- package/speechflow-cli/dst/speechflow-node-a2a-ffmpeg.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-filler.d.ts +14 -0
- package/speechflow-cli/dst/speechflow-node-a2a-filler.js +233 -0
- package/speechflow-cli/dst/speechflow-node-a2a-filler.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-gain.d.ts +12 -0
- package/speechflow-cli/dst/speechflow-node-a2a-gain.js +125 -0
- package/speechflow-cli/dst/speechflow-node-a2a-gain.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-gender.d.ts +0 -1
- package/speechflow-cli/dst/speechflow-node-a2a-gender.js +28 -12
- package/speechflow-cli/dst/speechflow-node-a2a-gender.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-meter.d.ts +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-meter.js +35 -53
- package/speechflow-cli/dst/speechflow-node-a2a-meter.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-mute.js +2 -1
- package/speechflow-cli/dst/speechflow-node-a2a-mute.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise-wt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise-wt.js +55 -0
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise-wt.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise.d.ts +14 -0
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise.js +184 -0
- package/speechflow-cli/dst/speechflow-node-a2a-rnnoise.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-speex.d.ts +14 -0
- package/speechflow-cli/dst/speechflow-node-a2a-speex.js +156 -0
- package/speechflow-cli/dst/speechflow-node-a2a-speex.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2a-vad.js +3 -3
- package/speechflow-cli/dst/speechflow-node-a2a-vad.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2a-wav.js +22 -17
- package/speechflow-cli/dst/speechflow-node-a2a-wav.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2t-awstranscribe.d.ts +18 -0
- package/speechflow-cli/dst/speechflow-node-a2t-awstranscribe.js +317 -0
- package/speechflow-cli/dst/speechflow-node-a2t-awstranscribe.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-a2t-deepgram.js +16 -33
- package/speechflow-cli/dst/speechflow-node-a2t-deepgram.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-a2t-openaitranscribe.d.ts +19 -0
- package/speechflow-cli/dst/speechflow-node-a2t-openaitranscribe.js +351 -0
- package/speechflow-cli/dst/speechflow-node-a2t-openaitranscribe.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-t2a-awspolly.d.ts +16 -0
- package/speechflow-cli/dst/speechflow-node-t2a-awspolly.js +171 -0
- package/speechflow-cli/dst/speechflow-node-t2a-awspolly.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-t2a-elevenlabs.js +19 -14
- package/speechflow-cli/dst/speechflow-node-t2a-elevenlabs.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2a-kokoro.js +11 -6
- package/speechflow-cli/dst/speechflow-node-t2a-kokoro.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-awstranslate.d.ts +13 -0
- package/speechflow-cli/dst/speechflow-node-t2t-awstranslate.js +141 -0
- package/speechflow-cli/dst/speechflow-node-t2t-awstranslate.js.map +1 -0
- package/speechflow-cli/dst/speechflow-node-t2t-deepl.js +13 -15
- package/speechflow-cli/dst/speechflow-node-t2t-deepl.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-format.js +10 -15
- package/speechflow-cli/dst/speechflow-node-t2t-format.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-ollama.js +44 -31
- package/speechflow-cli/dst/speechflow-node-t2t-ollama.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-openai.js +44 -45
- package/speechflow-cli/dst/speechflow-node-t2t-openai.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-sentence.js +8 -8
- package/speechflow-cli/dst/speechflow-node-t2t-sentence.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-subtitle.js +10 -12
- package/speechflow-cli/dst/speechflow-node-t2t-subtitle.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-t2t-transformers.js +22 -27
- package/speechflow-cli/dst/speechflow-node-t2t-transformers.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-x2x-filter.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-x2x-filter.js +50 -15
- package/speechflow-cli/dst/speechflow-node-x2x-filter.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-x2x-trace.js +17 -18
- package/speechflow-cli/dst/speechflow-node-x2x-trace.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-xio-device.js +13 -21
- package/speechflow-cli/dst/speechflow-node-xio-device.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-xio-mqtt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-node-xio-mqtt.js +22 -16
- package/speechflow-cli/dst/speechflow-node-xio-mqtt.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node-xio-websocket.js +19 -19
- package/speechflow-cli/dst/speechflow-node-xio-websocket.js.map +1 -1
- package/speechflow-cli/dst/speechflow-node.d.ts +6 -3
- package/speechflow-cli/dst/speechflow-node.js +13 -2
- package/speechflow-cli/dst/speechflow-node.js.map +1 -1
- package/speechflow-cli/dst/speechflow-utils-audio-wt.d.ts +1 -0
- package/speechflow-cli/dst/speechflow-utils-audio-wt.js +124 -0
- package/speechflow-cli/dst/speechflow-utils-audio-wt.js.map +1 -0
- package/speechflow-cli/dst/speechflow-utils-audio.d.ts +13 -0
- package/speechflow-cli/dst/speechflow-utils-audio.js +137 -0
- package/speechflow-cli/dst/speechflow-utils-audio.js.map +1 -0
- package/speechflow-cli/dst/speechflow-utils.d.ts +18 -0
- package/speechflow-cli/dst/speechflow-utils.js +123 -35
- package/speechflow-cli/dst/speechflow-utils.js.map +1 -1
- package/speechflow-cli/dst/speechflow.js +114 -27
- package/speechflow-cli/dst/speechflow.js.map +1 -1
- package/speechflow-cli/etc/oxlint.jsonc +112 -11
- package/speechflow-cli/etc/stx.conf +2 -2
- package/speechflow-cli/etc/tsconfig.json +1 -1
- package/speechflow-cli/package.d/@shiguredo+rnnoise-wasm+2025.1.5.patch +25 -0
- package/speechflow-cli/package.json +102 -94
- package/speechflow-cli/src/lib.d.ts +24 -0
- package/speechflow-cli/src/speechflow-node-a2a-compressor-wt.ts +151 -0
- package/speechflow-cli/src/speechflow-node-a2a-compressor.ts +303 -0
- package/speechflow-cli/src/speechflow-node-a2a-expander-wt.ts +158 -0
- package/speechflow-cli/src/speechflow-node-a2a-expander.ts +212 -0
- package/speechflow-cli/src/speechflow-node-a2a-ffmpeg.ts +13 -3
- package/speechflow-cli/src/speechflow-node-a2a-filler.ts +223 -0
- package/speechflow-cli/src/speechflow-node-a2a-gain.ts +98 -0
- package/speechflow-cli/src/speechflow-node-a2a-gender.ts +31 -17
- package/speechflow-cli/src/speechflow-node-a2a-meter.ts +37 -56
- package/speechflow-cli/src/speechflow-node-a2a-mute.ts +3 -2
- package/speechflow-cli/src/speechflow-node-a2a-rnnoise-wt.ts +62 -0
- package/speechflow-cli/src/speechflow-node-a2a-rnnoise.ts +164 -0
- package/speechflow-cli/src/speechflow-node-a2a-speex.ts +137 -0
- package/speechflow-cli/src/speechflow-node-a2a-vad.ts +3 -3
- package/speechflow-cli/src/speechflow-node-a2a-wav.ts +20 -13
- package/speechflow-cli/src/speechflow-node-a2t-awstranscribe.ts +308 -0
- package/speechflow-cli/src/speechflow-node-a2t-deepgram.ts +16 -33
- package/speechflow-cli/src/speechflow-node-a2t-openaitranscribe.ts +337 -0
- package/speechflow-cli/src/speechflow-node-t2a-awspolly.ts +187 -0
- package/speechflow-cli/src/speechflow-node-t2a-elevenlabs.ts +19 -14
- package/speechflow-cli/src/speechflow-node-t2a-kokoro.ts +12 -7
- package/speechflow-cli/src/speechflow-node-t2t-awstranslate.ts +152 -0
- package/speechflow-cli/src/speechflow-node-t2t-deepl.ts +13 -15
- package/speechflow-cli/src/speechflow-node-t2t-format.ts +10 -15
- package/speechflow-cli/src/speechflow-node-t2t-ollama.ts +55 -42
- package/speechflow-cli/src/speechflow-node-t2t-openai.ts +58 -58
- package/speechflow-cli/src/speechflow-node-t2t-sentence.ts +10 -10
- package/speechflow-cli/src/speechflow-node-t2t-subtitle.ts +15 -16
- package/speechflow-cli/src/speechflow-node-t2t-transformers.ts +27 -32
- package/speechflow-cli/src/speechflow-node-x2x-filter.ts +20 -16
- package/speechflow-cli/src/speechflow-node-x2x-trace.ts +20 -19
- package/speechflow-cli/src/speechflow-node-xio-device.ts +15 -23
- package/speechflow-cli/src/speechflow-node-xio-mqtt.ts +23 -16
- package/speechflow-cli/src/speechflow-node-xio-websocket.ts +19 -19
- package/speechflow-cli/src/speechflow-node.ts +21 -8
- package/speechflow-cli/src/speechflow-utils-audio-wt.ts +172 -0
- package/speechflow-cli/src/speechflow-utils-audio.ts +147 -0
- package/speechflow-cli/src/speechflow-utils.ts +125 -32
- package/speechflow-cli/src/speechflow.ts +118 -30
- package/speechflow-ui-db/dst/index.css +1 -1
- package/speechflow-ui-db/dst/index.js +31 -31
- package/speechflow-ui-db/etc/eslint.mjs +0 -1
- package/speechflow-ui-db/etc/tsc-client.json +3 -3
- package/speechflow-ui-db/package.json +11 -10
- package/speechflow-ui-db/src/app.vue +96 -78
- package/speechflow-ui-st/dst/index.js +26 -26
- package/speechflow-ui-st/etc/eslint.mjs +0 -1
- package/speechflow-ui-st/etc/tsc-client.json +3 -3
- package/speechflow-ui-st/package.json +11 -10
- package/speechflow-ui-st/src/app.vue +5 -12

package/speechflow-cli/src/speechflow-node-a2a-expander.ts (new file):

```diff
@@ -0,0 +1,212 @@
+/*
+** SpeechFlow - Speech Processing Flow Graph
+** Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+** Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+
+/* standard dependencies */
+import path from "node:path"
+import Stream from "node:stream"
+
+/* external dependencies */
+import { AudioWorkletNode } from "node-web-audio-api"
+
+/* internal dependencies */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+import * as utils from "./speechflow-utils"
+import { WebAudio } from "./speechflow-utils-audio"
+
+/* internal types */
+interface AudioExpanderConfig {
+    thresholdDb?: number
+    floorDb?: number
+    ratio?: number
+    attackMs?: number
+    releaseMs?: number
+    kneeDb?: number
+    makeupDb?: number
+}
+
+/* audio noise expander class */
+class AudioExpander extends WebAudio {
+    /* internal state */
+    private config: Required<AudioExpanderConfig>
+    private expanderNode: AudioWorkletNode | null = null
+
+    /* construct object */
+    constructor(
+        sampleRate: number,
+        channels: number,
+        config: AudioExpanderConfig = {}
+    ) {
+        super(sampleRate, channels)
+
+        /* store configuration */
+        this.config = {
+            thresholdDb: config.thresholdDb ?? -45,
+            floorDb: config.floorDb ?? -64,
+            ratio: config.ratio ?? 4.0,
+            attackMs: config.attackMs ?? 10,
+            releaseMs: config.releaseMs ?? 50,
+            kneeDb: config.kneeDb ?? 6.0,
+            makeupDb: config.makeupDb ?? 0
+        }
+    }
+
+    /* initialize object */
+    public async setup (): Promise<void> {
+        await super.setup()
+
+        /* add audio worklet module */
+        const url = path.resolve(__dirname, "speechflow-node-a2a-expander-wt.js")
+        await this.audioContext.audioWorklet.addModule(url)
+
+        /* create expander node */
+        this.expanderNode = new AudioWorkletNode(this.audioContext, "expander", {
+            numberOfInputs: 1,
+            numberOfOutputs: 1,
+            processorOptions: {
+                sampleRate: this.audioContext.sampleRate
+            }
+        })
+
+        /* configure expander node */
+        const currentTime = this.audioContext.currentTime
+        const node = this.expanderNode!
+        const params = node.parameters as Map<string, AudioParam>
+        params.get("threshold")!.setValueAtTime(this.config.thresholdDb, currentTime)
+        params.get("floor")!.setValueAtTime(this.config.floorDb, currentTime)
+        params.get("ratio")!.setValueAtTime(this.config.ratio, currentTime)
+        params.get("attack")!.setValueAtTime(this.config.attackMs / 1000, currentTime)
+        params.get("release")!.setValueAtTime(this.config.releaseMs / 1000, currentTime)
+        params.get("knee")!.setValueAtTime(this.config.kneeDb, currentTime)
+        params.get("makeup")!.setValueAtTime(this.config.makeupDb, currentTime)
+
+        /* connect nodes */
+        this.sourceNode!.connect(this.expanderNode)
+        this.expanderNode.connect(this.captureNode!)
+    }
+
+    public async destroy (): Promise<void> {
+        await super.destroy()
+
+        /* destroy expander node */
+        if (this.expanderNode !== null) {
+            this.expanderNode.disconnect()
+            this.expanderNode = null
+        }
+    }
+}
+
+/* SpeechFlow node for noise expander in audio-to-audio passing */
+export default class SpeechFlowNodeExpander extends SpeechFlowNode {
+    /* declare official node name */
+    public static name = "expander"
+
+    /* internal state */
+    private destroyed = false
+    private expander: AudioExpander | null = null
+
+    /* construct node */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+
+        /* declare node configuration parameters */
+        this.configure({
+            thresholdDb: { type: "number", val: -45, match: (n: number) => n <= 0 && n >= -100 },
+            floorDb: { type: "number", val: -64, match: (n: number) => n <= 0 && n >= -100 },
+            ratio: { type: "number", val: 4.0, match: (n: number) => n >= 1 && n <= 20 },
+            attackMs: { type: "number", val: 10, match: (n: number) => n >= 0 && n <= 1000 },
+            releaseMs: { type: "number", val: 50, match: (n: number) => n >= 0 && n <= 1000 },
+            kneeDb: { type: "number", val: 6.0, match: (n: number) => n >= 0 && n <= 40 },
+            makeupDb: { type: "number", val: 0, match: (n: number) => n >= -24 && n <= 24 }
+        })
+
+        /* sanity check floor vs threshold */
+        if (this.params.floorDb >= this.params.thresholdDb)
+            throw new Error("floor dB must be less than threshold dB for proper expansion")
+
+        /* declare node input/output format */
+        this.input = "audio"
+        this.output = "audio"
+    }
+
+    /* open node */
+    async open () {
+        /* clear destruction flag */
+        this.destroyed = false
+
+        /* setup expander */
+        this.expander = new AudioExpander(
+            this.config.audioSampleRate,
+            this.config.audioChannels, {
+                thresholdDb: this.params.thresholdDb,
+                floorDb: this.params.floorDb,
+                ratio: this.params.ratio,
+                attackMs: this.params.attackMs,
+                releaseMs: this.params.releaseMs,
+                kneeDb: this.params.kneeDb,
+                makeupDb: this.params.makeupDb
+            }
+        )
+        await this.expander.setup()
+
+        /* establish a transform stream */
+        const self = this
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings: false,
+            transform (chunk: SpeechFlowChunk & { payload: Buffer }, encoding, callback) {
+                if (self.destroyed) {
+                    callback(new Error("stream already destroyed"))
+                    return
+                }
+                if (!Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else {
+                    /* expand chunk */
+                    const payload = utils.convertBufToI16(chunk.payload)
+                    self.expander?.process(payload).then((result) => {
+                        if (self.destroyed)
+                            throw new Error("stream already destroyed")
+
+                        /* take over expanded data */
+                        const payload = utils.convertI16ToBuf(result)
+                        chunk.payload = payload
+                        this.push(chunk)
+                        callback()
+                    }).catch((error) => {
+                        callback(new Error(`expansion failed: ${error}`))
+                    })
+                }
+            },
+            final (callback) {
+                if (self.destroyed) {
+                    callback()
+                    return
+                }
+                this.push(null)
+                callback()
+            }
+        })
+    }
+
+    /* close node */
+    async close () {
+        /* indicate destruction */
+        this.destroyed = true
+
+        /* destroy expander */
+        if (this.expander !== null) {
+            await this.expander.destroy()
+            this.expander = null
+        }
+
+        /* close stream */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+    }
+}
```
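The per-sample processing itself lives in the accompanying worklet (speechflow-node-a2a-expander-wt.ts, also new in this release), which this excerpt does not reproduce. For orientation only, the static gain curve of a hard-knee downward expander, under one common reading of the threshold/floor/ratio parameters, looks roughly like the sketch below; the function is illustrative, not the package's code, and knee, attack, and release shaping are omitted:

```ts
/* illustrative sketch only, not SpeechFlow code: static gain curve of a
   hard-knee downward expander, assuming "floor" is the absolute level
   below which the output is never pushed */
function expanderGainDb (inputDb: number, thresholdDb: number,
                         floorDb: number, ratio: number): number {
    if (inputDb >= thresholdDb)
        return 0                                          /* unity gain above threshold */
    if (inputDb <= floorDb)
        return 0                                          /* already below floor: leave untouched */
    const gainDb = (inputDb - thresholdDb) * (ratio - 1)  /* expand downward */
    return Math.max(gainDb, floorDb - inputDb)            /* cap so output stays >= floor */
}

/* with the node defaults (threshold -45 dB, floor -64 dB, ratio 4),
   a -50 dB input is attenuated by 14 dB, landing exactly on the floor */
```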

package/speechflow-cli/src/speechflow-node-a2a-ffmpeg.ts:

```diff
@@ -75,7 +75,7 @@ export default class SpeechFlowNodeFFmpeg extends SpeechFlowNode
             "c:a": "pcm_s16le",
             "ar": this.config.audioSampleRate,
             "ac": this.config.audioChannels,
-            "f": "s16le"
+            "f": "s16le"
         } : {}),
         ...(this.params.dst === "wav" ? {
             "f": "wav"
@@ -90,7 +90,12 @@ export default class SpeechFlowNodeFFmpeg extends SpeechFlowNode
             "f": "opus"
         } : {})
     })
-    this.ffmpeg.run()
+    try {
+        this.ffmpeg.run()
+    }
+    catch (err) {
+        throw new Error(`failed to start FFmpeg process: ${err}`)
+    }

     /* establish a duplex stream and connect it to FFmpeg */
     this.stream = Stream.Duplex.from({
@@ -120,7 +125,12 @@ export default class SpeechFlowNodeFFmpeg extends SpeechFlowNode

     /* shutdown FFmpeg */
     if (this.ffmpeg !== null) {
-        this.ffmpeg.kill()
+        try {
+            this.ffmpeg.kill()
+        }
+        catch {
+            /* ignore kill errors during cleanup */
+        }
         this.ffmpeg = null
     }
 }
```

package/speechflow-cli/src/speechflow-node-a2a-filler.ts (new file):

```diff
@@ -0,0 +1,223 @@
+/*
+** SpeechFlow - Speech Processing Flow Graph
+** Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+** Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+
+/* standard dependencies */
+import Stream from "node:stream"
+import { EventEmitter } from "node:events"
+import { Duration } from "luxon"
+
+/* internal dependencies */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+import * as utils from "./speechflow-utils"
+
+class AudioFiller extends EventEmitter {
+    private emittedEndSamples = 0 /* stream position in samples already emitted */
+    private readonly bytesPerSample = 2 /* PCM I16 */
+    private readonly bytesPerFrame: number
+    private readonly sampleTolerance = 0.5 /* tolerance for floating-point sample comparisons */
+
+    constructor (private sampleRate = 48000, private channels = 1) {
+        super()
+        this.bytesPerFrame = this.channels * this.bytesPerSample
+    }
+
+    /* optional helper to allow subscribing with strong typing */
+    public on(event: "chunk", listener: (chunk: SpeechFlowChunk) => void): this
+    public on(event: string, listener: (...args: any[]) => void): this {
+        return super.on(event, listener)
+    }
+
+    /* convert duration to fractional samples */
+    private samplesFromDuration(duration: Duration): number {
+        const seconds = duration.as("seconds")
+        const samples = seconds * this.sampleRate
+        return samples
+    }
+
+    /* convert fractional samples to duration */
+    private durationFromSamples(samples: number): Duration {
+        const seconds = samples / this.sampleRate
+        return Duration.fromObject({ seconds })
+    }
+
+    /* emit a chunk of silence */
+    private emitSilence (fromSamples: number, toSamples: number) {
+        const frames = Math.max(0, Math.floor(toSamples - fromSamples))
+        if (frames <= 0)
+            return
+        const payload = Buffer.alloc(frames * this.bytesPerFrame) /* already zeroed */
+        const timestampStart = this.durationFromSamples(fromSamples)
+        const timestampEnd = this.durationFromSamples(toSamples)
+        const chunk = new SpeechFlowChunk(timestampStart, timestampEnd, "final", "audio", payload)
+        this.emit("chunk", chunk)
+    }
+
+    /* add a chunk of audio for processing */
+    public add (chunk: SpeechFlowChunk & { type: "audio", payload: Buffer }): void {
+        const startSamp = this.samplesFromDuration(chunk.timestampStart)
+        const endSamp = this.samplesFromDuration(chunk.timestampEnd)
+        if (endSamp < startSamp)
+            throw new Error("invalid timestamps")
+
+        /* if chunk starts beyond what we've emitted, insert silence for the gap */
+        if (startSamp > this.emittedEndSamples + this.sampleTolerance) {
+            this.emitSilence(this.emittedEndSamples, startSamp)
+            this.emittedEndSamples = startSamp
+        }
+
+        /* if chunk ends before or at emitted end, we have it fully covered, so drop it */
+        if (endSamp <= this.emittedEndSamples + this.sampleTolerance)
+            return
+
+        /* trim any overlap at the head */
+        const trimHead = Math.max(0, Math.floor(this.emittedEndSamples - startSamp))
+        const availableFrames = Math.floor((endSamp - startSamp) - trimHead)
+        if (availableFrames <= 0)
+            return
+
+        /* determine how many frames the buffer actually has; trust timestamps primarily */
+        const bufFrames = Math.floor(chunk.payload.length / this.bytesPerFrame)
+        const startFrame = Math.min(trimHead, bufFrames)
+        const endFrame = Math.min(startFrame + availableFrames, bufFrames)
+        if (endFrame <= startFrame)
+            return
+
+        /* determine trimmed/normalized chunk */
+        const payload = chunk.payload.subarray(
+            startFrame * this.bytesPerFrame,
+            endFrame * this.bytesPerFrame)
+
+        /* emit trimmed/normalized chunk */
+        const outStartSamples = startSamp + startFrame
+        const outEndSamples = outStartSamples + Math.floor(payload.length / this.bytesPerFrame)
+        const timestampStart = this.durationFromSamples(outStartSamples)
+        const timestampEnd = this.durationFromSamples(outEndSamples)
+        const c = new SpeechFlowChunk(timestampStart, timestampEnd, "final", "audio", payload)
+        this.emit("chunk", c)
+
+        /* advance emitted cursor */
+        this.emittedEndSamples = Math.max(this.emittedEndSamples, outEndSamples)
+    }
+}
+
+/* SpeechFlow node for filling audio gaps */
+export default class SpeechFlowNodeFiller extends SpeechFlowNode {
+    /* declare official node name */
+    public static name = "filler"
+
+    /* internal state */
+    private destroyed = false
+    private filler: AudioFiller | null = null
+    private sendQueue: utils.AsyncQueue<SpeechFlowChunk | null> | null = null
+
+    /* construct node */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+
+        /* declare node configuration parameters */
+        this.configure({
+            segment: { type: "number", val: 50, pos: 0, match: (n: number) => n >= 10 && n <= 1000 }
+        })
+
+        /* declare node input/output format */
+        this.input = "audio"
+        this.output = "audio"
+    }
+
+    /* open node */
+    async open () {
+        /* clear destruction flag */
+        this.destroyed = false
+
+        /* establish queues */
+        this.filler = new AudioFiller(this.config.audioSampleRate, this.config.audioChannels)
+        this.sendQueue = new utils.AsyncQueue<SpeechFlowChunk | null>()
+
+        /* shift chunks from filler to send queue */
+        this.filler.on("chunk", (chunk) => {
+            this.sendQueue?.write(chunk)
+        })
+
+        /* establish a duplex stream */
+        const self = this
+        this.stream = new Stream.Duplex({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings: false,
+            write (chunk: SpeechFlowChunk & { type: "audio", payload: Buffer }, encoding, callback) {
+                if (self.destroyed || self.filler === null)
+                    callback(new Error("stream already destroyed"))
+                else if (!Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else {
+                    try {
+                        self.filler.add(chunk)
+                        callback()
+                    }
+                    catch (error: any) {
+                        callback(error)
+                    }
+                }
+            },
+            read (size) {
+                if (self.destroyed || self.sendQueue === null) {
+                    this.push(null)
+                    return
+                }
+                self.sendQueue.read().then((chunk) => {
+                    if (self.destroyed) {
+                        this.push(null)
+                        return
+                    }
+                    if (chunk === null) {
+                        self.log("info", "received EOF signal")
+                        this.push(null)
+                    }
+                    else {
+                        self.log("debug", `received data (${chunk.payload.length} bytes)`)
+                        this.push(chunk)
+                    }
+                }).catch((error) => {
+                    if (!self.destroyed)
+                        self.log("error", `queue read error: ${error.message}`)
+                })
+            },
+            final (callback) {
+                if (self.destroyed) {
+                    callback()
+                    return
+                }
+                this.push(null)
+                callback()
+            }
+        })
+    }
+
+    /* close node */
+    async close () {
+        /* indicate destruction */
+        this.destroyed = true
+
+        /* destroy queues */
+        if (this.sendQueue !== null) {
+            this.sendQueue.destroy()
+            this.sendQueue = null
+        }
+
+        /* destroy filler */
+        if (this.filler !== null) {
+            this.filler.removeAllListeners()
+            this.filler = null
+        }
+
+        /* close stream */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+    }
+}
+
```
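The sample arithmetic above is easiest to follow with concrete numbers. A usage sketch, assuming the AudioFiller class and the SpeechFlowChunk constructor signature exactly as they appear in this diff: at 48 kHz mono PCM-I16 (2 bytes per frame), a first chunk starting at 100 ms forces a zeroed 4800-frame (9600-byte) silence chunk for the 0-100 ms gap before the chunk itself passes through.

```ts
import { Duration } from "luxon"

/* AudioFiller and SpeechFlowChunk as defined in the diff above */
const filler = new AudioFiller(48000, 1)   /* 48 kHz, mono */
filler.on("chunk", (chunk) => {
    const startMs = chunk.timestampStart.as("seconds") * 1000
    console.log(`chunk @ ${startMs} ms: ${(chunk.payload as Buffer).length} bytes`)
})

/* a chunk covering 100-200 ms while nothing was emitted yet */
filler.add(new SpeechFlowChunk(
    Duration.fromObject({ seconds: 0.1 }),
    Duration.fromObject({ seconds: 0.2 }),
    "final", "audio",
    Buffer.alloc(4800 * 2) /* 100 ms of PCM-I16 payload */
) as SpeechFlowChunk & { type: "audio", payload: Buffer })

/* prints:
   chunk @ 0 ms: 9600 bytes     (silence inserted for the 0-100 ms gap)
   chunk @ 100 ms: 9600 bytes   (the original chunk, passed through)   */
```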

package/speechflow-cli/src/speechflow-node-a2a-gain.ts (new file):

```diff
@@ -0,0 +1,98 @@
+/*
+** SpeechFlow - Speech Processing Flow Graph
+** Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+** Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+
+/* standard dependencies */
+import Stream from "node:stream"
+
+/* internal dependencies */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+import * as utils from "./speechflow-utils"
+
+/* SpeechFlow node for gain adjustment in audio-to-audio passing */
+export default class SpeechFlowNodeGain extends SpeechFlowNode {
+    /* declare official node name */
+    public static name = "gain"
+
+    /* internal state */
+    private destroyed = false
+
+    /* construct node */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+
+        /* declare node configuration parameters */
+        this.configure({
+            db: { type: "number", val: 0, pos: 0, match: (n: number) => n >= -60 && n <= 60 }
+        })
+
+        /* declare node input/output format */
+        this.input = "audio"
+        this.output = "audio"
+    }
+
+    /* open node */
+    async open () {
+        /* clear destruction flag */
+        this.destroyed = false
+
+        /* adjust gain */
+        const adjustGain = (chunk: SpeechFlowChunk & { payload: Buffer }, db: number) => {
+            const dv = new DataView(chunk.payload.buffer, chunk.payload.byteOffset, chunk.payload.byteLength)
+            const gainFactor = utils.dB2lin(db)
+            for (let i = 0; i < dv.byteLength; i += 2) {
+                let sample = dv.getInt16(i, true)
+                sample *= gainFactor
+                sample = Math.max(Math.min(sample, 32767), -32768)
+                dv.setInt16(i, sample, true)
+            }
+        }
+
+        /* establish a transform stream */
+        const self = this
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings: false,
+            transform (chunk: SpeechFlowChunk & { payload: Buffer }, encoding, callback) {
+                if (self.destroyed) {
+                    callback(new Error("stream already destroyed"))
+                    return
+                }
+                if (!Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else if (chunk.payload.byteLength % 2 !== 0)
+                    callback(new Error("invalid audio buffer size (not 16-bit aligned)"))
+                else {
+                    /* adjust chunk */
+                    adjustGain(chunk, self.params.db)
+                    this.push(chunk)
+                    callback()
+                }
+            },
+            final (callback) {
+                if (self.destroyed) {
+                    callback()
+                    return
+                }
+                this.push(null)
+                callback()
+            }
+        })
+    }
+
+    /* close node */
+    async close () {
+        /* indicate destruction */
+        this.destroyed = true
+
+        /* close stream */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+    }
+}
+
```
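The node multiplies each raw Int16 sample by a linear factor derived from the dB parameter. utils.dB2lin itself is not shown in this diff; assuming the usual amplitude convention (a factor of 10^(dB/20)), it behaves like this minimal sketch:

```ts
/* assumed behavior of utils.dB2lin (not part of this diff):
   standard amplitude decibel-to-linear conversion */
const dB2lin = (db: number): number => Math.pow(10, db / 20)

dB2lin(0)    /* = 1.0   : unity gain      */
dB2lin(6)    /* ~ 1.995 : roughly doubles */
dB2lin(-6)   /* ~ 0.501 : roughly halves  */

/* hence the clamp in adjustGain() above: a near-full-scale sample
   multiplied by ~2 would overflow the Int16 range [-32768, 32767] */
```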

package/speechflow-cli/src/speechflow-node-a2a-gender.ts:

```diff
@@ -21,7 +21,7 @@ type AudioQueueElement = {
     type: "audio-frame",
     chunk: SpeechFlowChunk,
     data: Float32Array,
-    gender?: "male" | "female"
+    gender?: "male" | "female" | "unknown"
 } | {
     type: "audio-eof"
 }
@@ -32,7 +32,6 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
     public static name = "gender"

     /* internal state */
-    private static speexInitialized = false
     private classifier: Transformers.AudioClassificationPipeline | null = null
     private queue = new utils.Queue<AudioQueueElement>()
     private queueRecv = this.queue.pointerUse("recv")
@@ -66,7 +65,7 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
         this.shutdown = false

         /* pass-through logging */
-        const log =
+        const log = this.log.bind(this)

         /* the used model */
         const model = "Xenova/wav2vec2-large-xlsr-53-gender-recognition-librispeech"
@@ -81,7 +80,7 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
             artifact += `:${progress.file}`
             let percent = 0
             if (typeof progress.loaded === "number" && typeof progress.total === "number")
-                percent = (progress.loaded
+                percent = (progress.loaded / progress.total) * 100
             else if (typeof progress.progress === "number")
                 percent = progress.progress
             if (percent > 0)
@@ -92,7 +91,7 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
                 return
             for (const [ artifact, percent ] of progressState) {
                 this.log("info", `downloaded ${percent.toFixed(2)}% of artifact "${artifact}"`)
-                if (percent >=
+                if (percent >= 100.0)
                     progressState.delete(artifact)
             }
         }, 1000)
@@ -103,11 +102,17 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
                 device: "auto",
                 progress_callback: progressCallback
             })
-
-
+            let timeoutId: ReturnType<typeof setTimeout> | null = null
+            const timeoutPromise = new Promise((resolve, reject) => {
+                timeoutId = setTimeout(() =>
+                    reject(new Error("model initialization timeout")), 30 * 1000)
+            })
             this.classifier = await Promise.race([
                 pipelinePromise, timeoutPromise
-            ])
+            ]).finally(() => {
+                if (timeoutId !== null)
+                    clearTimeout(timeoutId)
+            }) as Transformers.AudioClassificationPipeline
         }
         catch (error) {
             if (this.progressInterval) {
@@ -128,10 +133,15 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
             if (this.shutdown || this.classifier === null)
                 throw new Error("classifier shutdown during operation")
             const classifyPromise = this.classifier(data)
-
-
-
-
+            let timeoutId: ReturnType<typeof setTimeout> | null = null
+            const timeoutPromise = new Promise((resolve, reject) => {
+                timeoutId = setTimeout(() =>
+                    reject(new Error("classification timeout")), 30 * 1000)
+            })
+            const result = await Promise.race([ classifyPromise, timeoutPromise ]).finally(() => {
+                if (timeoutId !== null)
+                    clearTimeout(timeoutId)
+            }) as Transformers.AudioClassificationOutput | Transformers.AudioClassificationOutput[]
             const classified = Array.isArray(result) ?
                 result as Transformers.AudioClassificationOutput :
                 [ result ]
@@ -139,15 +149,20 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
             const c2 = classified.find((c: any) => c.label === "female")
             const male = c1 ? c1.score : 0.0
             const female = c2 ? c2.score : 0.0
-
+            if (male > female)
+                return "male"
+            else if (male < female)
+                return "female"
+            else
+                return "unknown"
         }

         /* define sample rate required by model */
         const sampleRateTarget = 16000

         /* work off queued audio frames */
-        const frameWindowDuration =
-        const frameWindowSamples = frameWindowDuration * sampleRateTarget
+        const frameWindowDuration = this.params.window / 1000
+        const frameWindowSamples = Math.floor(frameWindowDuration * sampleRateTarget)
         let lastGender = ""
         let workingOff = false
         const workOffQueue = async () => {
@@ -236,8 +251,7 @@ export default class SpeechFlowNodeGender extends SpeechFlowNode
                 const wav = new WaveFile()
                 wav.fromScratch(self.config.audioChannels, self.config.audioSampleRate, "32f", data)
                 wav.toSampleRate(sampleRateTarget, { method: "cubic" })
-                data = wav.getSamples(false, Float32Array<ArrayBuffer>
-                    any as Float32Array<ArrayBuffer>
+                data = wav.getSamples(false, Float32Array) as any as Float32Array<ArrayBuffer>

                 /* queue chunk and converted data */
                 self.queueRecv.append({ type: "audio-frame", chunk, data })
```