npm - speechflow - Versions diffs - 1.1.0 → 1.2.1 - Mend

speechflow 1.1.0 → 1.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (67)

package/CHANGELOG.md +18 -0
package/README.md +37 -3
package/dst/speechflow-node-a2a-gender.d.ts +17 -0
package/dst/speechflow-node-a2a-gender.js +272 -0
package/dst/speechflow-node-a2a-gender.js.map +1 -0
package/dst/speechflow-node-a2a-meter.js +2 -2
package/dst/speechflow-node-a2a-meter.js.map +1 -1
package/dst/speechflow-node-a2a-mute.js +1 -0
package/dst/speechflow-node-a2a-mute.js.map +1 -1
package/dst/speechflow-node-a2a-vad.js +47 -63
package/dst/speechflow-node-a2a-vad.js.map +1 -1
package/dst/speechflow-node-a2a-wav.js +145 -122
package/dst/speechflow-node-a2a-wav.js.map +1 -1
package/dst/speechflow-node-a2t-deepgram.js +13 -3
package/dst/speechflow-node-a2t-deepgram.js.map +1 -1
package/dst/speechflow-node-t2a-elevenlabs.js +10 -5
package/dst/speechflow-node-t2a-elevenlabs.js.map +1 -1
package/dst/speechflow-node-t2a-kokoro.js.map +1 -1
package/dst/speechflow-node-t2t-deepl.js.map +1 -1
package/dst/speechflow-node-t2t-format.js.map +1 -1
package/dst/speechflow-node-t2t-ollama.js.map +1 -1
package/dst/speechflow-node-t2t-openai.js.map +1 -1
package/dst/speechflow-node-t2t-subtitle.js.map +1 -1
package/dst/speechflow-node-t2t-transformers.js.map +1 -1
package/dst/speechflow-node-x2x-filter.d.ts +11 -0
package/dst/speechflow-node-x2x-filter.js +113 -0
package/dst/speechflow-node-x2x-filter.js.map +1 -0
package/dst/speechflow-node-x2x-trace.js +24 -10
package/dst/speechflow-node-x2x-trace.js.map +1 -1
package/dst/speechflow-node-xio-device.js +14 -5
package/dst/speechflow-node-xio-device.js.map +1 -1
package/dst/speechflow-node-xio-file.js +58 -27
package/dst/speechflow-node-xio-file.js.map +1 -1
package/dst/speechflow-node-xio-mqtt.js.map +1 -1
package/dst/speechflow-node-xio-websocket.js.map +1 -1
package/dst/speechflow-node.js +1 -0
package/dst/speechflow-node.js.map +1 -1
package/dst/speechflow-utils.d.ts +14 -1
package/dst/speechflow-utils.js +110 -2
package/dst/speechflow-utils.js.map +1 -1
package/dst/speechflow.js +56 -53
package/dst/speechflow.js.map +1 -1
package/etc/speechflow.yaml +51 -24
package/package.json +6 -5
package/src/speechflow-node-a2a-gender.ts +272 -0
package/src/speechflow-node-a2a-meter.ts +3 -3
package/src/speechflow-node-a2a-mute.ts +1 -0
package/src/speechflow-node-a2a-vad.ts +58 -68
package/src/speechflow-node-a2a-wav.ts +128 -91
package/src/speechflow-node-a2t-deepgram.ts +15 -4
package/src/speechflow-node-t2a-elevenlabs.ts +13 -8
package/src/speechflow-node-t2a-kokoro.ts +3 -3
package/src/speechflow-node-t2t-deepl.ts +2 -2
package/src/speechflow-node-t2t-format.ts +2 -2
package/src/speechflow-node-t2t-ollama.ts +2 -2
package/src/speechflow-node-t2t-openai.ts +2 -2
package/src/speechflow-node-t2t-subtitle.ts +1 -1
package/src/speechflow-node-t2t-transformers.ts +2 -2
package/src/speechflow-node-x2x-filter.ts +122 -0
package/src/speechflow-node-x2x-trace.ts +28 -11
package/src/speechflow-node-xio-device.ts +20 -8
package/src/speechflow-node-xio-file.ts +74 -36
package/src/speechflow-node-xio-mqtt.ts +3 -3
package/src/speechflow-node-xio-websocket.ts +1 -1
package/src/speechflow-node.ts +2 -0
package/src/speechflow-utils.ts +81 -2
package/src/speechflow.ts +84 -81

package/src/speechflow-node-xio-device.ts CHANGED

@@ -32,7 +32,8 @@ export default class SpeechFlowNodeDevice extends SpeechFlowNode {
         /*  declare node configuration parameters  */
         this.configure({
             device: { type: "string", pos: 0, val: "",   match: /^(.+?):(.+)$/ },
-            mode:   { type: "string", pos: 1, val: "rw", match: /^(?:r|w|rw)$/ }
+            mode:   { type: "string", pos: 1, val: "rw", match: /^(?:r|w|rw)$/ },
+            chunk:  { type: "number", pos: 2, val: 200,  match: (n: number) => n >= 10 && n <= 1000 }
         })
         /*  declare node input/output format  */
@@ -98,6 +99,13 @@ export default class SpeechFlowNodeDevice extends SpeechFlowNode {
             throw new Error(`audio device sample rate ${device.defaultSampleRate} is ` +
                 `incompatible with required sample rate ${this.config.audioSampleRate}`)
+        /*  determine how many bytes we need per chunk when
+            the chunk should be the requested duration  */
+        const highwaterMark = (
+            this.config.audioSampleRate *
+            (this.config.audioBitDepth / 8)
+        ) / (1000 / this.params.chunk)
         /*  establish device connection
             Notice: "naudion" actually implements Stream.{Readable,Writable,Duplex}, but
             declares just its sub-interface NodeJS.{Readable,Writable,Duplex}Stream,
@@ -115,13 +123,15 @@ export default class SpeechFlowNodeDevice extends SpeechFlowNode {
                     deviceId:     device.id,
                     channelCount: this.config.audioChannels,
                     sampleRate:   this.config.audioSampleRate,
-                    sampleFormat: this.config.audioBitDepth
+                    sampleFormat: this.config.audioBitDepth,
+                    highwaterMark
                 },
                 outOptions: {
                     deviceId:     device.id,
                     channelCount: this.config.audioChannels,
                     sampleRate:   this.config.audioSampleRate,
-                    sampleFormat: this.config.audioBitDepth
+                    sampleFormat: this.config.audioBitDepth,
+                    highwaterMark
                 }
             })
             this.stream = this.io as unknown as Stream.Duplex
@@ -138,10 +148,11 @@ export default class SpeechFlowNodeDevice extends SpeechFlowNode {
             this.log("info", `resolved "${this.params.device}" to input device "${device.id}"`)
             this.io = PortAudio.AudioIO({
                 inOptions: {
-                    deviceId:     device.id,
-                    channelCount: this.config.audioChannels,
-                    sampleRate:   this.config.audioSampleRate,
-                    sampleFormat: this.config.audioBitDepth
+                    deviceId:      device.id,
+                    channelCount:  this.config.audioChannels,
+                    sampleRate:    this.config.audioSampleRate,
+                    sampleFormat:  this.config.audioBitDepth,
+                    highwaterMark
                 }
             })
             this.stream = this.io as unknown as Stream.Readable
@@ -161,7 +172,8 @@ export default class SpeechFlowNodeDevice extends SpeechFlowNode {
                     deviceId:     device.id,
                     channelCount: this.config.audioChannels,
                     sampleRate:   this.config.audioSampleRate,
-                    sampleFormat: this.config.audioBitDepth
+                    sampleFormat: this.config.audioBitDepth,
+                    highwaterMark
                 }
             })
             this.stream = this.io as unknown as Stream.Writable

package/src/speechflow-node-xio-file.ts CHANGED

@@ -23,9 +23,11 @@ export default class SpeechFlowNodeFile extends SpeechFlowNode {
         /*  declare node configuration parameters  */
         this.configure({
-            path: { type: "string", pos: 0, val: "" },
-            mode: { type: "string", pos: 1, val: "r",     match: /^(?:r|w|rw)$/ },
-            type: { type: "string", pos: 2, val: "audio", match: /^(?:audio|text)$/ }
+            path:   { type: "string", pos: 0, val: "" },
+            mode:   { type: "string", pos: 1, val: "r",     match: /^(?:r|w|rw)$/ },
+            type:   { type: "string", pos: 2, val: "audio", match: /^(?:audio|text)$/ },
+            chunka: { type: "number",         val: 200,     match: (n: number) => n >= 10 && n <= 1000 },
+            chunkt: { type: "number",         val: 65536,   match: (n: number) => n >= 1024 && n <= 131072 }
         })
         /*  declare node input/output format  */
@@ -45,92 +47,128 @@ export default class SpeechFlowNodeFile extends SpeechFlowNode {
     /*  open node  */
     async open () {
+        /*  determine how many bytes we need per chunk when
+            the chunk should be of the required duration/size */
+        const highWaterMarkAudio = (
+            this.config.audioSampleRate *
+            (this.config.audioBitDepth / 8)
+        ) / (1000 / this.params.chunka)
+        const highWaterMarkText = this.params.chunkt
+        /*  sanity check  */
         if (this.params.path === "")
             throw new Error("required parameter \"path\" has to be given")
+        /*  dispatch according to mode and path  */
         if (this.params.mode === "rw") {
             if (this.params.path === "-") {
                 /*  standard I/O  */
                 if (this.params.type === "audio") {
                     process.stdin.setEncoding()
                     process.stdout.setEncoding()
+                    const streamR = new Stream.PassThrough({ highWaterMark: highWaterMarkAudio })
+                    process.stdin.pipe(streamR)
+                    const streamW = new Stream.PassThrough({ highWaterMark: highWaterMarkAudio })
+                    streamW.pipe(process.stdout)
+                    this.stream = Stream.Duplex.from({ readable: streamR, writable: streamW })
                 }
                 else {
                     process.stdin.setEncoding(this.config.textEncoding)
                     process.stdout.setEncoding(this.config.textEncoding)
+                    const streamR = new Stream.PassThrough({ highWaterMark: highWaterMarkText })
+                    process.stdin.pipe(streamR)
+                    const streamW = new Stream.PassThrough({ highWaterMark: highWaterMarkText })
+                    streamW.pipe(process.stdout)
+                    this.stream = Stream.Duplex.from({ readable: streamR, writable: streamW })
                 }
-                this.stream = Stream.Duplex.from({
-                    readable: process.stdin,
-                    writable: process.stdout
-                })
             }
             else {
                 /*  file I/O  */
                 if (this.params.type === "audio") {
                     this.stream = Stream.Duplex.from({
-                        readable: fs.createReadStream(this.params.path),
-                        writable: fs.createWriteStream(this.params.path)
+                        readable: fs.createReadStream(this.params.path,
+                            { highWaterMark: highWaterMarkAudio }),
+                        writable: fs.createWriteStream(this.params.path,
+                            { highWaterMark: highWaterMarkAudio })
                     })
                 }
                 else {
                     this.stream = Stream.Duplex.from({
-                        readable: fs.createReadStream(this.params.path,
-                            { encoding: this.config.textEncoding }),
-                        writable: fs.createWriteStream(this.params.path,
-                            { encoding: this.config.textEncoding })
+                        readable: fs.createReadStream(this.params.path, {
+                            highWaterMark: highWaterMarkText,
+                            encoding: this.config.textEncoding
+                        }),
+                        writable: fs.createWriteStream(this.params.path, {
+                            highWaterMark: highWaterMarkText,
+                            encoding: this.config.textEncoding
+                        })
                     })
                 }
             }
             /*  convert regular stream into object-mode stream  */
             const wrapper1 = utils.createTransformStreamForWritableSide()
-            const wrapper2 = utils.createTransformStreamForReadableSide(this.params.type, () => this.timeZero)
+            const wrapper2 = utils.createTransformStreamForReadableSide(
+                this.params.type, () => this.timeZero)
             this.stream = Stream.compose(wrapper1, this.stream, wrapper2)
         }
         else if (this.params.mode === "r") {
             if (this.params.path === "-") {
                 /*  standard I/O  */
-                if (this.params.type === "audio")
+                let chunker: Stream.PassThrough
+                if (this.params.type === "audio") {
                     process.stdin.setEncoding()
-                else
+                    chunker = new Stream.PassThrough({ highWaterMark: highWaterMarkAudio })
+                }
+                else {
                     process.stdin.setEncoding(this.config.textEncoding)
-                this.stream = process.stdin
+                    chunker = new Stream.PassThrough({ highWaterMark: highWaterMarkText })
+                }
+                const wrapper = utils.createTransformStreamForReadableSide(
+                    this.params.type, () => this.timeZero)
+                this.stream = Stream.compose(process.stdin, chunker, wrapper)
             }
             else {
                 /*  file I/O  */
+                let readable: Stream.Readable
                 if (this.params.type === "audio")
-                    this.stream = fs.createReadStream(this.params.path)
+                    readable = fs.createReadStream(this.params.path,
+                        { highWaterMark: highWaterMarkAudio })
                 else
-                    this.stream = fs.createReadStream(this.params.path,
-                        { encoding: this.config.textEncoding })
+                    readable = fs.createReadStream(this.params.path,
+                        { highWaterMark: highWaterMarkText, encoding: this.config.textEncoding })
+                const wrapper = utils.createTransformStreamForReadableSide(
+                    this.params.type, () => this.timeZero)
+                this.stream = Stream.compose(readable, wrapper)
             }
-            /*  convert regular stream into object-mode stream  */
-            const wrapper = utils.createTransformStreamForReadableSide(this.params.type, () => this.timeZero)
-            this.stream.pipe(wrapper)
-            this.stream = wrapper
         }
         else if (this.params.mode === "w") {
             if (this.params.path === "-") {
                 /*  standard I/O  */
-                if (this.params.type === "audio")
+                let chunker: Stream.PassThrough
+                if (this.params.type === "audio") {
                     process.stdout.setEncoding()
-                else
+                    chunker = new Stream.PassThrough({ highWaterMark: highWaterMarkAudio })
+                }
+                else {
                     process.stdout.setEncoding(this.config.textEncoding)
-                this.stream = process.stdout
+                    chunker = new Stream.PassThrough({ highWaterMark: highWaterMarkText })
+                }
+                const wrapper = utils.createTransformStreamForWritableSide()
+                this.stream = Stream.compose(wrapper, chunker, process.stdout)
             }
             else {
                 /*  file I/O  */
+                let writable: Stream.Writable
                 if (this.params.type === "audio")
-                    this.stream = fs.createWriteStream(this.params.path)
+                    writable = fs.createWriteStream(this.params.path,
+                        { highWaterMark: highWaterMarkAudio })
                 else
-                    this.stream = fs.createWriteStream(this.params.path,
-                        { encoding: this.config.textEncoding })
+                    writable = fs.createWriteStream(this.params.path,
+                        { highWaterMark: highWaterMarkText, encoding: this.config.textEncoding })
+                const wrapper = utils.createTransformStreamForWritableSide()
+                this.stream = Stream.compose(wrapper, writable)
             }
-            /*  convert regular stream into object-mode stream  */
-            const wrapper = utils.createTransformStreamForWritableSide()
-            wrapper.pipe(this.stream as Stream.Writable)
-            this.stream = wrapper
         }
         else
             throw new Error(`invalid file mode "${this.params.mode}"`)

package/src/speechflow-node-xio-mqtt.ts CHANGED

@@ -5,11 +5,11 @@
 */
 /*  standard dependencies  */
-import Stream                          from "node:stream"
+import Stream from "node:stream"
 /*  external dependencies  */
-import MQTT                            from "mqtt"
-import UUID                            from "pure-uuid"
+import MQTT   from "mqtt"
+import UUID   from "pure-uuid"
 /*  internal dependencies  */
 import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"

package/src/speechflow-node-xio-websocket.ts CHANGED

@@ -5,7 +5,7 @@
 */
 /*  standard dependencies  */
-import Stream                          from "node:stream"
+import Stream from "node:stream"
 /*  external dependencies  */
 import ws                              from "ws"

package/src/speechflow-node.ts CHANGED

@@ -7,6 +7,8 @@
 /*  standard dependencies  */
 import Events from "node:events"
 import Stream from "node:stream"
+/*  external dependencies  */
 import { DateTime, Duration } from "luxon"
 /*  the definition of a single payload chunk passed through the SpeechFlow nodes  */

package/src/speechflow-utils.ts CHANGED

@@ -4,14 +4,17 @@
 **  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
 */
-/*  external dependencies  */
+/*  standard dependencies  */
 import Stream                 from "node:stream"
 import { EventEmitter }       from "node:events"
+/*  external dependencies  */
 import { DateTime, Duration } from "luxon"
 import CBOR                   from "cbor2"
+import * as IntervalTree      from "node-interval-tree"
 /*  internal dependencies  */
-import { SpeechFlowChunk } from "./speechflow-node"
+import { SpeechFlowChunk }    from "./speechflow-node"
 /*  calculate duration of an audio buffer  */
 export function audioBufferDuration (
@@ -68,6 +71,10 @@ export function createTransformStreamForWritableSide () {
         transform (chunk: SpeechFlowChunk, encoding, callback) {
             this.push(chunk.payload)
             callback()
+        },
+        final (callback) {
+            this.push(null)
+            callback()
         }
     })
 }
@@ -90,6 +97,10 @@ export function createTransformStreamForReadableSide (type: "text" | "audio", ge
             const obj = new SpeechFlowChunk(start, end, "final", type, chunk)
             this.push(obj)
             callback()
+        },
+        final (callback) {
+            this.push(null)
+            callback()
         }
     })
 }
@@ -252,6 +263,7 @@ export class QueuePointer<T extends QueueElement> extends EventEmitter {
         private queue: Queue<T>
     ) {
         super()
+        this.setMaxListeners(100)
     }
     /*  positioning operations  */
@@ -379,6 +391,10 @@ export class QueuePointer<T extends QueueElement> extends EventEmitter {
 export class Queue<T extends QueueElement> extends EventEmitter {
     public elements: T[] = []
     private pointers = new Map<string, QueuePointer<T>>()
+    constructor () {
+        super()
+        this.setMaxListeners(100)
+    }
     pointerUse (name: string): QueuePointer<T> {
         if (!this.pointers.has(name))
             this.pointers.set(name, new QueuePointer<T>(name, this))
@@ -405,3 +421,66 @@ export class Queue<T extends QueueElement> extends EventEmitter {
     }
 }
+/*  utility class for wrapping a custom stream into a regular Transform stream  */
+export class StreamWrapper extends Stream.Transform {
+    private foreignStream: any
+    constructor (foreignStream: any, options: Stream.TransformOptions = {}) {
+        options.readableObjectMode = true
+        options.writableObjectMode = true
+        super(options)
+        this.foreignStream = foreignStream
+        this.foreignStream.on("data", (chunk: any) => {
+            this.push(chunk)
+        })
+        this.foreignStream.on("error", (err: Error) => {
+            this.emit("error", err)
+        })
+        this.foreignStream.on("end", () => {
+            this.push(null)
+        })
+    }
+    _transform (chunk: any, encoding: BufferEncoding, callback: Stream.TransformCallback): void {
+        try {
+            const canContinue = this.foreignStream.write(chunk)
+            if (canContinue)
+                callback()
+            else
+                this.foreignStream.once("drain", callback)
+        }
+        catch (err) {
+            callback(err as Error)
+        }
+    }
+    _flush (callback: Stream.TransformCallback): void {
+        try {
+            if (typeof this.foreignStream.end === "function")
+                this.foreignStream.end()
+            callback()
+        }
+        catch (err) {
+            callback(err as Error)
+        }
+    }
+}
+/*  meta store  */
+interface TimeStoreInterval<T> extends IntervalTree.Interval {
+    item: T
+}
+export class TimeStore<T> extends EventEmitter {
+    private tree = new IntervalTree.IntervalTree<TimeStoreInterval<T>>()
+    store (start: Duration, end: Duration, item: T): void {
+        this.tree.insert({ low: start.toMillis(), high: end.toMillis(), item })
+    }
+    fetch (start: Duration, end: Duration): T[] {
+        const intervals = this.tree.search(start.toMillis(), end.toMillis())
+        return intervals.map((interval) => interval.item)
+    }
+    prune (_before: Duration): void {
+        const before = _before.toMillis()
+        const intervals = this.tree.search(0, before - 1)
+        for (const interval of intervals)
+            if (interval.low < before && interval.high < before)
+                this.tree.remove(interval)
+    }
+}