npm - speechflow - Versions diffs - 2.2.1 → 2.3.0 - Mend

speechflow 2.2.1 → 2.3.0

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (235) hide show

package/speechflow-cli/src/speechflow-node-xio-file.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -96,7 +96,8 @@ export default class SpeechFlowNodeXIOFile extends SpeechFlowNode {
                     chunker = new Stream.PassThrough({ highWaterMark: highWaterMarkText })
                 }
                 const wrapper = util.createTransformStreamForReadableSide(
-                    this.params.type, () => this.timeZero)
+                    this.params.type, () => this.timeZero, undefined,
+                    this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
                 this.stream = Stream.compose(process.stdin, chunker, wrapper)
             }
             else {
@@ -109,7 +110,8 @@ export default class SpeechFlowNodeXIOFile extends SpeechFlowNode {
                     readable = fs.createReadStream(this.params.path,
                         { highWaterMark: highWaterMarkText, encoding: this.config.textEncoding })
                 const wrapper = util.createTransformStreamForReadableSide(
-                    this.params.type, () => this.timeZero)
+                    this.params.type, () => this.timeZero, undefined,
+                    this.config.audioSampleRate, this.config.audioBitDepth, this.config.audioChannels)
                 this.stream = Stream.compose(readable, wrapper)
             }
         }
@@ -158,8 +160,9 @@ export default class SpeechFlowNodeXIOFile extends SpeechFlowNode {
                         },
                         destroy (err, callback) {
                             if (self.fd !== null) {
-                                fs.close(self.fd, () => {
-                                    self.fd = null
+                                const fd = self.fd
+                                self.fd = null
+                                fs.close(fd, () => {
                                     callback(err)
                                 })
                             }
@@ -199,6 +202,7 @@ export default class SpeechFlowNodeXIOFile extends SpeechFlowNode {
                 const stream = this.stream
                 if ((stream instanceof Stream.Writable || stream instanceof Stream.Duplex)
                     && (!stream.writableEnded && !stream.destroyed)) {
+                    const ac = new AbortController()
                     await Promise.race([
                         new Promise<void>((resolve, reject) => {
                             stream.end((err?: Error) => {
@@ -208,8 +212,12 @@ export default class SpeechFlowNodeXIOFile extends SpeechFlowNode {
                                     resolve()
                             })
                         }),
-                        util.timeout(5000)
-                    ])
+                        util.timeout(5000, "timeout", ac.signal)
+                    ]).finally(() => {
+                        ac.abort()
+                    }).catch(() => {
+                        /*  ignore timeout -- stdio stream cannot be destroyed  */
+                    })
                 }
             }
             this.stream = null

package/speechflow-cli/src/speechflow-node-xio-mqtt.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -23,7 +23,7 @@ export default class SpeechFlowNodeXIOMQTT extends SpeechFlowNode {
     /*  internal state  */
     private broker:     MQTT.MqttClient | null                   = null
     private clientId:   string                                   = (new UUID(1)).format()
-    private chunkQueue: util.SingleQueue<SpeechFlowChunk> | null = null
+    private chunkQueue: util.AsyncQueue<SpeechFlowChunk> | null = null
     /*  construct node  */
     constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
@@ -100,13 +100,15 @@ export default class SpeechFlowNodeXIOMQTT extends SpeechFlowNode {
             const reasonCode = packet.reasonCode ?? 0
             this.log("info", `connection closed to MQTT ${this.params.url} (reason code: ${reasonCode})`)
         })
-        this.chunkQueue = new util.SingleQueue<SpeechFlowChunk>()
+        this.chunkQueue = new util.AsyncQueue<SpeechFlowChunk>()
         this.broker.on("message", (topic: string, payload: Buffer, packet: MQTT.IPublishPacket) => {
             if (topic !== this.params.topicRead || this.params.mode === "w")
                 return
+            if (this.chunkQueue === null)
+                return
             try {
                 const chunk = util.streamChunkDecode(payload)
-                this.chunkQueue!.write(chunk)
+                this.chunkQueue.write(chunk)
             }
             catch (_err: unknown) {
                 this.log("warning", `received invalid CBOR chunk from MQTT ${this.params.url}`)
@@ -141,12 +143,20 @@ export default class SpeechFlowNodeXIOMQTT extends SpeechFlowNode {
                 callback()
             },
             read (size: number) {
-                if (self.params.mode === "w")
-                    throw new Error("read operation on write-only node")
-                reads.add(self.chunkQueue!.read().then((chunk) => {
+                if (self.params.mode === "w") {
+                    self.log("error", "read operation on write-only node")
+                    this.push(null)
+                    return
+                }
+                if (self.chunkQueue === null)
+                    return
+                const queue = self.chunkQueue
+                reads.add(queue.read().then((chunk) => {
                     this.push(chunk, "binary")
                 }).catch((err: Error) => {
                     self.log("warning", `read on chunk queue operation failed: ${err}`)
+                    if (queue.destroyed)
+                        this.push(null)
                 }))
             }
         })
@@ -154,14 +164,10 @@ export default class SpeechFlowNodeXIOMQTT extends SpeechFlowNode {
     /*  close node  */
     async close () {
-        /*  clear chunk queue reference  */
-        this.chunkQueue = null
-        /*  close MQTT broker  */
-        if (this.broker !== null) {
-            if (this.broker.connected)
-                this.broker.end()
-            this.broker = null
+        /*  drain and clear chunk queue reference  */
+        if (this.chunkQueue !== null) {
+            this.chunkQueue.destroy()
+            this.chunkQueue = null
         }
         /*  shutdown stream  */
@@ -169,5 +175,12 @@ export default class SpeechFlowNodeXIOMQTT extends SpeechFlowNode {
             await util.destroyStream(this.stream)
             this.stream = null
         }
+        /*  close MQTT broker  */
+        if (this.broker !== null) {
+            if (this.broker.connected)
+                this.broker.end()
+            this.broker = null
+        }
     }
 }

package/speechflow-cli/src/speechflow-node-xio-vban.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -32,7 +32,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
     /*  internal state  */
     private server:        VBANServer                        | null = null
-    private chunkQueue:    util.SingleQueue<SpeechFlowChunk> | null = null
+    private chunkQueue:    util.AsyncQueue<SpeechFlowChunk> | null = null
     private frameCounter                                            = 0
     private targetAddress                                           = ""
     private targetPort                                              = 0
@@ -99,7 +99,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
         })
         /*  setup chunk queue for incoming audio  */
-        this.chunkQueue = new util.SingleQueue<SpeechFlowChunk>()
+        this.chunkQueue = new util.AsyncQueue<SpeechFlowChunk>()
         /*  determine target for sending  */
         if (this.params.connect !== "") {
@@ -128,6 +128,12 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
             }
             const data = packet.data
+            /*  check sample rate compatibility  */
+            if (packet.sr !== this.config.audioSampleRate) {
+                this.log("warning", `incompatible VBAN sample rate: packet=${packet.sr}Hz, configured=${this.config.audioSampleRate}Hz`)
+                return
+            }
             /*  convert audio format if necessary  */
             let audioBuffer: Buffer
             const bitResolution = packet.bitResolution
@@ -139,7 +145,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                 /*  8-bit unsigned to 16-bit signed  */
                 audioBuffer = Buffer.alloc(data.length * 2)
                 for (let i = 0; i < data.length; i++) {
-                    const sample = ((data[i] - 128) / 128) * 32767
+                    const sample = ((data[i] - 128) / 128) * 32768
                     audioBuffer.writeInt16LE(Math.round(sample), i * 2)
                 }
             }
@@ -153,7 +159,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                     const b2 = data[i * 3 + 2]
                     const value = ((b2 << 16) | (b1 << 8) | b0) & 0xFFFFFF
                     const signed = value > 0x7FFFFF ? value - 0x1000000 : value
-                    const sample = (signed / 0x800000) * 32767
+                    const sample = (signed / 0x800000) * 32768
                     audioBuffer.writeInt16LE(Math.round(sample), i * 2)
                 }
             }
@@ -163,7 +169,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                 audioBuffer = Buffer.alloc(samples * 2)
                 for (let i = 0; i < samples; i++) {
                     const value = data.readInt32LE(i * 4)
-                    const sample = (value / 0x80000000) * 32767
+                    const sample = (value / 0x80000000) * 32768
                     audioBuffer.writeInt16LE(Math.round(sample), i * 2)
                 }
             }
@@ -173,7 +179,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                 audioBuffer = Buffer.alloc(samples * 2)
                 for (let i = 0; i < samples; i++) {
                     const value = data.readFloatLE(i * 4)
-                    const sample = Math.max(-32768, Math.min(32767, Math.round(value * 32767)))
+                    const sample = Math.max(-32768, Math.min(32767, Math.round(value * 32768)))
                     audioBuffer.writeInt16LE(sample, i * 2)
                 }
             }
@@ -183,7 +189,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                 audioBuffer = Buffer.alloc(samples * 2)
                 for (let i = 0; i < samples; i++) {
                     const value = data.readDoubleLE(i * 8)
-                    const sample = Math.max(-32768, Math.min(32767, Math.round(value * 32767)))
+                    const sample = Math.max(-32768, Math.min(32767, Math.round(value * 32768)))
                     audioBuffer.writeInt16LE(sample, i * 2)
                 }
             }
@@ -227,11 +233,11 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
         /*  bind to listen port  */
         if (this.params.listen !== "") {
             const listen = this.parseAddress(this.params.listen, 6980)
-            this.server.bind(listen.port, listen.host)
+            await this.server.bind(listen.port, listen.host)
         }
         else
             /*  still need to bind for sending  */
-            this.server.bind(0)
+            await this.server.bind(0)
         /*  create duplex stream  */
         const self = this
@@ -279,7 +285,7 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                     nbChannel:     self.config.audioChannels - 1,
                     bitResolution: EBitsResolutions.VBAN_DATATYPE_INT16,
                     codec:         ECodecs.VBAN_CODEC_PCM,
-                    frameCounter:  self.frameCounter++
+                    frameCounter:  self.frameCounter++ & 0xFFFFFFFF
                 }, audioBuffer)
                 /*  send packet  */
@@ -292,13 +298,20 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
                 callback()
             },
             read (size: number) {
-                if (self.params.mode === "w")
-                    throw new Error("read operation on write-only node")
-                reads.add(self.chunkQueue!.read().then((chunk) => {
+                if (self.params.mode === "w") {
+                    self.log("error", "read operation on write-only node")
+                    this.push(null)
+                    return
+                }
+                if (self.chunkQueue === null)
+                    return
+                const queue = self.chunkQueue
+                reads.add(queue.read().then((chunk) => {
                     this.push(chunk, "binary")
                 }).catch((err: Error) => {
                     self.log("warning", `read on chunk queue operation failed: ${err}`)
-                    this.push(null)
+                    if (queue.destroyed)
+                        this.push(null)
                 }))
             }
         })
@@ -308,20 +321,20 @@ export default class SpeechFlowNodeXIOVBAN extends SpeechFlowNode {
     async close () {
         /*  drain and clear chunk queue reference  */
         if (this.chunkQueue !== null) {
-            this.chunkQueue.drain()
+            this.chunkQueue.destroy()
             this.chunkQueue = null
         }
-        /*  close VBAN server  */
-        if (this.server !== null) {
-            this.server.close()
-            this.server = null
-        }
         /*  shutdown stream  */
         if (this.stream !== null) {
             await util.destroyStream(this.stream)
             this.stream = null
         }
+        /*  close VBAN server  */
+        if (this.server !== null) {
+            await this.server.close()
+            this.server = null
+        }
     }
 }

package/speechflow-cli/src/speechflow-node-xio-webrtc.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 /*
 **  SpeechFlow - Speech Processing Flow Graph
-**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Copyright (c) 2024-2026 Dr. Ralf S. Engelschall <rse@engelschall.com>
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
@@ -39,7 +39,7 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
     /*  internal state  */
     private peerConnections                                       = new Map<string, WebRTCConnection>()
     private httpServer:  http.Server                       | null = null
-    private chunkQueue:  util.SingleQueue<SpeechFlowChunk> | null = null
+    private chunkQueue:  util.AsyncQueue<SpeechFlowChunk> | null = null
     private opusEncoder: OpusEncoder                       | null = null
     private opusDecoder: OpusEncoder                       | null = null
     private pcmBuffer                                             = Buffer.alloc(0)
@@ -265,11 +265,11 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
         const resourceId = crypto.randomUUID()
         const { pc, subscription } = this.createPeerConnection(resourceId)
-        /*  protocol-specific setup  */
-        const track = setupFn(pc, resourceId)
         /*  complete SDP offer/answer exchange and establish connection  */
         try {
+            /*  protocol-specific setup  */
+            const track = setupFn(pc, resourceId)
             /*  set remote description (offer from client)  */
             await pc.setRemoteDescription({ type: "offer", sdp: offer })
@@ -367,7 +367,7 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
         this.rtpSSRC      = Math.floor(Math.random() * 0x100000000) >>> 0
         /*  setup chunk queue for incoming audio  */
-        this.chunkQueue = new util.SingleQueue<SpeechFlowChunk>()
+        this.chunkQueue = new util.AsyncQueue<SpeechFlowChunk>()
         /*  parse listen address  */
         const listen = this.parseAddress(this.params.listen, 8085)
@@ -375,77 +375,89 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
         /*  setup HTTP server for WHIP/WHEP signaling  */
         const self = this
         this.httpServer = http.createServer(async (req, res) => {
-            /*  determine URL  */
-            if (req.url === undefined) {
-                res.writeHead(400, { "Content-Type": "text/plain" })
-                res.end("Bad Request")
-                return
-            }
-            const host = req.headers.host?.replace(/[^a-zA-Z0-9:.\-_]/g, "") ?? "localhost"
-            const url = new URL(req.url, `http://${host}`)
-            const pathMatch = url.pathname === self.params.path
-            const resourceMatch = url.pathname.startsWith(self.params.path + "/")
-            /*  CORS headers for browser clients  */
-            res.setHeader("Access-Control-Allow-Origin",   "*")
-            res.setHeader("Access-Control-Allow-Methods",  "POST, DELETE, OPTIONS")
-            res.setHeader("Access-Control-Allow-Headers",  "Content-Type")
-            res.setHeader("Access-Control-Expose-Headers", "Location")
-            /*  handle CORS preflight  */
-            if (req.method === "OPTIONS") {
-                res.writeHead(204)
-                res.end()
-                return
-            }
-            /*  handle requests...  */
-            if (req.method === "POST" && pathMatch) {
-                /*  handle WHIP/WHEP POST  */
-                const body = await self.readRequestBody(req)
-                /*  sanity check content type  */
-                const contentType = req.headers["content-type"]
-                if (contentType !== "application/sdp") {
-                    res.writeHead(415, { "Content-Type": "text/plain" })
-                    res.end("Unsupported Media Type")
+            try {
+                /*  determine URL  */
+                if (req.url === undefined) {
+                    res.writeHead(400, { "Content-Type": "text/plain" })
+                    res.end("Bad Request")
+                    return
+                }
+                const host = req.headers.host?.replace(/[^a-zA-Z0-9:.\-_]/g, "") ?? "localhost"
+                const url = new URL(req.url, `http://${host}`)
+                const pathMatch = url.pathname === self.params.path
+                const resourceMatch = url.pathname.startsWith(self.params.path + "/")
+                /*  CORS headers for browser clients  */
+                res.setHeader("Access-Control-Allow-Origin",   "*")
+                res.setHeader("Access-Control-Allow-Methods",  "POST, DELETE, OPTIONS")
+                res.setHeader("Access-Control-Allow-Headers",  "Content-Type")
+                res.setHeader("Access-Control-Expose-Headers", "Location")
+                /*  handle CORS preflight  */
+                if (req.method === "OPTIONS") {
+                    res.writeHead(204)
+                    res.end()
                     return
                 }
-                /*  determine if WHIP (receiving) or WHEP (sending) based on SDP content  */
-                const hasSendonly  = /\ba=sendonly\b/m.test(body)
-                const hasSendrecv  = /\ba=sendrecv\b/m.test(body)
-                const hasRecvonly  = /\ba=recvonly\b/m.test(body)
-                const isPublisher  = hasSendonly || hasSendrecv
-                const isViewer     = hasRecvonly
-                /*  handle protocol based on mode  */
-                if (self.params.mode === "r" && isPublisher)
-                    /*  in read mode, accept WHIP publishers  */
-                    await self.handleWHIP(res, body)
-                else if (self.params.mode === "w" && isViewer)
-                    /*  in write mode, accept WHEP viewers  */
-                    await self.handleWHEP(res, body)
+                /*  handle requests...  */
+                if (req.method === "POST" && pathMatch) {
+                    /*  handle WHIP/WHEP POST  */
+                    const body = await self.readRequestBody(req)
+                    /*  sanity check content type  */
+                    const contentType = req.headers["content-type"]
+                    if (contentType !== "application/sdp") {
+                        res.writeHead(415, { "Content-Type": "text/plain" })
+                        res.end("Unsupported Media Type")
+                        return
+                    }
+                    /*  determine if WHIP (receiving) or WHEP (sending) based on SDP content  */
+                    const hasSendonly  = /\ba=sendonly\b/m.test(body)
+                    const hasSendrecv  = /\ba=sendrecv\b/m.test(body)
+                    const hasRecvonly  = /\ba=recvonly\b/m.test(body)
+                    const isPublisher  = hasSendonly || hasSendrecv
+                    const isViewer     = hasRecvonly
+                    /*  handle protocol based on mode  */
+                    if (self.params.mode === "r" && isPublisher)
+                        /*  in read mode, accept WHIP publishers  */
+                        await self.handleWHIP(res, body)
+                    else if (self.params.mode === "w" && isViewer)
+                        /*  in write mode, accept WHEP viewers  */
+                        await self.handleWHEP(res, body)
+                    else {
+                        res.writeHead(403, { "Content-Type": "text/plain" })
+                        res.end("Forbidden")
+                    }
+                }
+                else if (req.method === "DELETE" && resourceMatch) {
+                    /*  handle DELETE for connection teardown  */
+                    const resourceId = url.pathname.substring(self.params.path.length + 1)
+                    self.handleDELETE(res, resourceId)
+                }
                 else {
-                    res.writeHead(403, { "Content-Type": "text/plain" })
-                    res.end("Forbidden")
+                    /*  handle unknown requests  */
+                    res.writeHead(404, { "Content-Type": "text/plain" })
+                    res.end("Not Found")
                 }
             }
-            else if (req.method === "DELETE" && resourceMatch) {
-                /*  handle DELETE for connection teardown  */
-                const resourceId = url.pathname.substring(self.params.path.length + 1)
-                self.handleDELETE(res, resourceId)
-            }
-            else {
-                /*  handle unknown requests  */
-                res.writeHead(404, { "Content-Type": "text/plain" })
-                res.end("Not Found")
+            catch (err: unknown) {
+                self.log("error", `HTTP request handler failed: ${util.ensureError(err).message}`)
+                if (!res.headersSent) {
+                    res.writeHead(500, { "Content-Type": "text/plain" })
+                    res.end("Internal Server Error")
+                }
             }
         })
         /*  start HTTP server  */
-        await new Promise<void>((resolve) => {
+        await new Promise<void>((resolve, reject) => {
+            const onError = (err: Error) => { reject(err) }
+            this.httpServer!.once("error", onError)
             this.httpServer!.listen(listen.port, listen.host, () => {
+                this.httpServer!.removeListener("error", onError)
                 const mode = this.params.mode === "r" ? "WHIP" : "WHEP"
                 this.log("info", `WebRTC ${mode} server listening on http://${listen.host}:${listen.port}${this.params.path}`)
                 resolve()
@@ -486,11 +498,15 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
                     this.push(null)
                     return
                 }
-                reads.add(self.chunkQueue!.read().then((chunk) => {
+                if (self.chunkQueue === null)
+                    return
+                const queue = self.chunkQueue
+                reads.add(queue.read().then((chunk) => {
                     this.push(chunk, "binary")
                 }).catch((err: Error) => {
                     self.log("warning", `read on chunk queue operation failed: ${err}`)
-                    this.push(null)
+                    if (queue.destroyed)
+                        this.push(null)
                 }))
             }
         })
@@ -517,7 +533,7 @@ export default class SpeechFlowNodeXIOWebRTC extends SpeechFlowNode {
         /*  drain and clear chunk queue  */
         if (this.chunkQueue !== null) {
-            this.chunkQueue.drain()
+            this.chunkQueue.destroy()
             this.chunkQueue = null
         }