npm - speechflow - Versions diffs - 0.9.5 → 0.9.8 - Mend

speechflow 0.9.5 → 0.9.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (109) hide show

package/CHANGELOG.md +24 -0
package/README.md +220 -53
package/dst/speechflow-node-a2a-ffmpeg.d.ts +13 -0
package/dst/speechflow-node-a2a-ffmpeg.js +152 -0
package/dst/speechflow-node-a2a-wav.d.ts +11 -0
package/dst/speechflow-node-a2a-wav.js +170 -0
package/dst/speechflow-node-a2t-deepgram.d.ts +12 -0
package/dst/speechflow-node-a2t-deepgram.js +220 -0
package/dst/speechflow-node-deepgram.d.ts +3 -1
package/dst/speechflow-node-deepgram.js +86 -22
package/dst/speechflow-node-deepl.d.ts +3 -1
package/dst/speechflow-node-deepl.js +25 -20
package/dst/speechflow-node-device.d.ts +3 -1
package/dst/speechflow-node-device.js +53 -2
package/dst/speechflow-node-elevenlabs.d.ts +3 -1
package/dst/speechflow-node-elevenlabs.js +37 -42
package/dst/speechflow-node-ffmpeg.d.ts +3 -1
package/dst/speechflow-node-ffmpeg.js +42 -4
package/dst/speechflow-node-file.d.ts +3 -1
package/dst/speechflow-node-file.js +84 -13
package/dst/speechflow-node-format.d.ts +11 -0
package/dst/speechflow-node-format.js +80 -0
package/dst/speechflow-node-gemma.d.ts +3 -1
package/dst/speechflow-node-gemma.js +84 -23
package/dst/speechflow-node-mqtt.d.ts +13 -0
package/dst/speechflow-node-mqtt.js +181 -0
package/dst/speechflow-node-opus.d.ts +12 -0
package/dst/speechflow-node-opus.js +135 -0
package/dst/speechflow-node-subtitle.d.ts +12 -0
package/dst/speechflow-node-subtitle.js +96 -0
package/dst/speechflow-node-t2a-elevenlabs.d.ts +13 -0
package/dst/speechflow-node-t2a-elevenlabs.js +182 -0
package/dst/speechflow-node-t2t-deepl.d.ts +12 -0
package/dst/speechflow-node-t2t-deepl.js +133 -0
package/dst/speechflow-node-t2t-format.d.ts +11 -0
package/dst/speechflow-node-t2t-format.js +80 -0
package/dst/speechflow-node-t2t-gemma.d.ts +13 -0
package/dst/speechflow-node-t2t-gemma.js +213 -0
package/dst/speechflow-node-t2t-opus.d.ts +12 -0
package/dst/speechflow-node-t2t-opus.js +135 -0
package/dst/speechflow-node-t2t-subtitle.d.ts +12 -0
package/dst/speechflow-node-t2t-subtitle.js +96 -0
package/dst/speechflow-node-trace.d.ts +11 -0
package/dst/speechflow-node-trace.js +88 -0
package/dst/speechflow-node-wav.d.ts +11 -0
package/dst/speechflow-node-wav.js +170 -0
package/dst/speechflow-node-websocket.d.ts +3 -1
package/dst/speechflow-node-websocket.js +149 -49
package/dst/speechflow-node-whisper-common.d.ts +34 -0
package/dst/speechflow-node-whisper-common.js +7 -0
package/dst/speechflow-node-whisper-ggml.d.ts +1 -0
package/dst/speechflow-node-whisper-ggml.js +97 -0
package/dst/speechflow-node-whisper-onnx.d.ts +1 -0
package/dst/speechflow-node-whisper-onnx.js +131 -0
package/dst/speechflow-node-whisper-worker-ggml.d.ts +1 -0
package/dst/speechflow-node-whisper-worker-ggml.js +97 -0
package/dst/speechflow-node-whisper-worker-onnx.d.ts +1 -0
package/dst/speechflow-node-whisper-worker-onnx.js +131 -0
package/dst/speechflow-node-whisper-worker.d.ts +1 -0
package/dst/speechflow-node-whisper-worker.js +116 -0
package/dst/speechflow-node-whisper-worker2.d.ts +1 -0
package/dst/speechflow-node-whisper-worker2.js +82 -0
package/dst/speechflow-node-whisper.d.ts +19 -0
package/dst/speechflow-node-whisper.js +604 -0
package/dst/speechflow-node-x2x-trace.d.ts +11 -0
package/dst/speechflow-node-x2x-trace.js +88 -0
package/dst/speechflow-node-xio-device.d.ts +13 -0
package/dst/speechflow-node-xio-device.js +205 -0
package/dst/speechflow-node-xio-file.d.ts +11 -0
package/dst/speechflow-node-xio-file.js +176 -0
package/dst/speechflow-node-xio-mqtt.d.ts +13 -0
package/dst/speechflow-node-xio-mqtt.js +181 -0
package/dst/speechflow-node-xio-websocket.d.ts +13 -0
package/dst/speechflow-node-xio-websocket.js +275 -0
package/dst/speechflow-node.d.ts +24 -6
package/dst/speechflow-node.js +63 -6
package/dst/speechflow-utils.d.ts +23 -0
package/dst/speechflow-utils.js +194 -0
package/dst/speechflow.js +146 -43
package/etc/biome.jsonc +12 -4
package/etc/speechflow.bat +6 -0
package/etc/speechflow.sh +5 -0
package/etc/speechflow.yaml +71 -0
package/etc/stx.conf +65 -0
package/package.d/@ericedouard+vad-node-realtime+0.2.0.patch +18 -0
package/package.json +49 -31
package/src/lib.d.ts +6 -1
package/src/{speechflow-node-ffmpeg.ts → speechflow-node-a2a-ffmpeg.ts} +10 -4
package/src/speechflow-node-a2a-wav.ts +143 -0
package/src/speechflow-node-a2t-deepgram.ts +199 -0
package/src/{speechflow-node-elevenlabs.ts → speechflow-node-t2a-elevenlabs.ts} +38 -45
package/src/{speechflow-node-deepl.ts → speechflow-node-t2t-deepl.ts} +36 -25
package/src/speechflow-node-t2t-format.ts +85 -0
package/src/{speechflow-node-gemma.ts → speechflow-node-t2t-gemma.ts} +89 -25
package/src/speechflow-node-t2t-opus.ts +111 -0
package/src/speechflow-node-t2t-subtitle.ts +101 -0
package/src/speechflow-node-x2x-trace.ts +92 -0
package/src/{speechflow-node-device.ts → speechflow-node-xio-device.ts} +25 -3
package/src/speechflow-node-xio-file.ts +153 -0
package/src/speechflow-node-xio-mqtt.ts +154 -0
package/src/speechflow-node-xio-websocket.ts +248 -0
package/src/speechflow-node.ts +63 -6
package/src/speechflow-utils.ts +212 -0
package/src/speechflow.ts +150 -43
package/etc/nps.yaml +0 -40
package/sample.yaml +0 -39
package/src/speechflow-node-deepgram.ts +0 -133
package/src/speechflow-node-file.ts +0 -108
package/src/speechflow-node-websocket.ts +0 -179

package/src/{speechflow-node-elevenlabs.ts → speechflow-node-t2a-elevenlabs.ts} RENAMED Viewed

@@ -6,31 +6,16 @@
 /*  standard dependencies  */
 import Stream                from "node:stream"
-import { EventEmitter }      from "node:events"
 /*  external dependencies  */
-import * as ElevenLabs       from "elevenlabs"
+import * as ElevenLabs       from "@elevenlabs/elevenlabs-js"
 import { getStreamAsBuffer } from "get-stream"
 import SpeexResampler        from "speex-resampler"
 /*  internal dependencies  */
-import SpeechFlowNode        from "./speechflow-node"
-/*
-const elevenlabsVoices = {
-    "drew":    { name: "Drew",    model: "eleven_multilingual_v2", lang: [ "en", "de" ] },
-    "george":  { name: "George",  model: "eleven_multilingual_v2", lang: [ "en", "de" ] },
-    "bill":    { name: "Bill",    model: "eleven_multilingual_v2", lang: [ "en", "de" ] },
-    "daniel":  { name: "Daniel",  model: "eleven_multilingual_v1", lang: [ "en", "de" ] },
-    "brian":   { name: "Brian",   model: "eleven_turbo_v2",        lang: [ "en"       ] },
-    "sarah":   { name: "Sarah",   model: "eleven_multilingual_v2", lang: [ "en", "de" ] },
-    "racel":   { name: "Racel",   model: "eleven_multilingual_v2", lang: [ "en", "de" ] },
-    "grace":   { name: "Grace",   model: "eleven_multilingual_v1", lang: [ "en", "de" ] },
-    "matilda": { name: "Matilda", model: "eleven_multilingual_v1", lang: [ "en", "de" ] },
-    "alice":   { name: "Alice",   model: "eleven_turbo_v2",        lang: [ "en"       ] }
-}
-*/
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+/*  SpeechFlow node for Elevenlabs text-to-speech conversion  */
 export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
     /*  declare official node name  */
     public static name = "elevenlabs"
@@ -40,8 +25,8 @@ export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
     private static speexInitialized = false
     /*  construct node  */
-    constructor (id: string, opts: { [ id: string ]: any }, args: any[]) {
-        super(id, opts, args)
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
         /*  declare node configuration parameters  */
         this.configure({
@@ -73,7 +58,7 @@ export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
             "growing_business":      44100,
             "enterprise":            44100
         }
-        const sub = await this.elevenlabs.user.getSubscription()
+        const sub = await this.elevenlabs.user.subscription.get()
         const tier = (sub.tier ?? "free") as keyof typeof maxSampleRates
         this.log("info", `determined ElevenLabs tier: "${tier}"`)
         let maxSampleRate = 16000
@@ -100,13 +85,14 @@ export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
             "eleven_multilingual_v2" :
             "eleven_flash_v2_5"
         const speechStream = (text: string) => {
-            return this.elevenlabs!.textToSpeech.convert(voice.voice_id, {
+            this.log("info", `ElevenLabs: send text "${text}"`)
+            return this.elevenlabs!.textToSpeech.convert(voice.voiceId, {
                 text,
-                model_id:         model,
-                language_code:    this.params.language,
-                output_format:    `pcm_${maxSampleRate}` as ElevenLabs.ElevenLabs.OutputFormat,
+                modelId:          model,
+                languageCode:     this.params.language,
+                outputFormat:     `pcm_${maxSampleRate}` as ElevenLabs.ElevenLabs.OutputFormat,
                 seed:             815, /* arbitrary, but fixated by us */
-                voice_settings: {
+                voiceSettings: {
                     speed:        this.params.speed
                 }
             }, {
@@ -115,9 +101,6 @@ export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
             })
         }
-        /*  internal queue of results  */
-        const queue = new EventEmitter()
         /*  establish resampler from ElevenLabs's maximum 24Khz
             output to our standard audio sample rate (48KHz)  */
         if (!SpeechFlowNodeElevenlabs.speexInitialized) {
@@ -127,26 +110,36 @@ export default class SpeechFlowNodeElevenlabs extends SpeechFlowNode {
         }
         const resampler = new SpeexResampler(1, maxSampleRate, this.config.audioSampleRate, 7)
-        /*  create duplex stream and connect it to the ElevenLabs API  */
-        this.stream = new Stream.Duplex({
-            write (chunk: Buffer, encoding, callback) {
-                const data = chunk.toString()
-                speechStream(data).then((stream) => {
-                    getStreamAsBuffer(stream).then((buffer) => {
-                        const bufferResampled = resampler.processChunk(buffer)
-                        queue.emit("audio", bufferResampled)
-                        callback()
+        /*  create transform stream and connect it to the ElevenLabs API  */
+        const log = (level: string, msg: string) => { this.log(level, msg) }
+        this.stream = new Stream.Transform({
+            writableObjectMode: true,
+            readableObjectMode: true,
+            decodeStrings:      false,
+            transform (chunk: SpeechFlowChunk, encoding, callback) {
+                if (Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else {
+                    speechStream(chunk.payload).then((stream) => {
+                        getStreamAsBuffer(stream).then((buffer) => {
+                            const bufferResampled = resampler.processChunk(buffer)
+                            log("info", `ElevenLabs: received audio (buffer length: ${buffer.byteLength})`)
+                            const chunkNew = chunk.clone()
+                            chunkNew.type = "audio"
+                            chunkNew.payload = bufferResampled
+                            this.push(chunkNew)
+                            callback()
+                        }).catch((error) => {
+                            callback(error)
+                        })
                     }).catch((error) => {
                         callback(error)
                     })
-                }).catch((error) => {
-                    callback(error)
-                })
+                }
             },
-            read (size) {
-                queue.once("audio", (buffer: Buffer) => {
-                    this.push(buffer, "binary")
-                })
+            final (callback) {
+                this.push(null)
+                callback()
             }
         })
     }

package/src/{speechflow-node-deepl.ts → speechflow-node-t2t-deepl.ts} RENAMED Viewed

@@ -6,13 +6,12 @@
 /*  standard dependencies  */
 import Stream           from "node:stream"
-import { EventEmitter } from "node:events"
 /*  external dependencies  */
 import * as DeepL       from "deepl-node"
 /*  internal dependencies  */
-import SpeechFlowNode   from "./speechflow-node"
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
 /*  SpeechFlow node for DeepL text-to-text translations  */
 export default class SpeechFlowNodeDeepL extends SpeechFlowNode {
@@ -23,17 +22,21 @@ export default class SpeechFlowNodeDeepL extends SpeechFlowNode {
     private deepl: DeepL.Translator | null = null
     /*  construct node  */
-    constructor (id: string, opts: { [ id: string ]: any }, args: any[]) {
-        super(id, opts, args)
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
         /*  declare node configuration parameters  */
         this.configure({
             key:      { type: "string", val: process.env.SPEECHFLOW_KEY_DEEPL },
-            src:      { type: "string", pos: 0, val: "de",      match: /^(?:de|en-US)$/ },
-            dst:      { type: "string", pos: 1, val: "en-US",   match: /^(?:de|en-US)$/ },
+            src:      { type: "string", pos: 0, val: "de",      match: /^(?:de|en)$/ },
+            dst:      { type: "string", pos: 1, val: "en",      match: /^(?:de|en)$/ },
             optimize: { type: "string", pos: 2, val: "latency", match: /^(?:latency|quality)$/ }
         })
+        /*  sanity check situation  */
+        if (this.params.src === this.params.dst)
+            throw new Error("source and destination languages cannot be the same")
         /*  declare node input/output format  */
         this.input  = "text"
         this.output = "text"
@@ -46,7 +49,9 @@ export default class SpeechFlowNodeDeepL extends SpeechFlowNode {
         /*  provide text-to-text translation  */
         const translate = async (text: string) => {
-            const result = await this.deepl!.translateText(text, this.params.src, this.params.dst, {
+            const src = this.params.src === "en" ? "en-US" : this.params.src
+            const dst = this.params.dst === "en" ? "en-US" : this.params.dst
+            const result = await this.deepl!.translateText(text, src, dst, {
                 splitSentences: "off",
                 modelType: this.params.optimize === "latency" ?
                     "latency_optimized" : "prefer_quality_optimized",
@@ -57,32 +62,38 @@ export default class SpeechFlowNodeDeepL extends SpeechFlowNode {
         }
         /*  establish a duplex stream and connect it to DeepL translation  */
-        const queue = new EventEmitter()
-        this.stream = new Stream.Duplex({
-            write (chunk: Buffer, encoding, callback) {
-                const data = chunk.toString()
-                if (data === "") {
-                    queue.emit("result", "")
-                    callback()
-                }
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings:      false,
+            transform (chunk: SpeechFlowChunk, encoding, callback) {
+                if (Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
                 else {
-                    translate(data).then((result) => {
-                        queue.emit("result", result)
+                    if (chunk.payload === "") {
+                        this.push(chunk)
                         callback()
-                    }).catch((err) => {
-                        callback(err)
-                    })
+                    }
+                    else {
+                        translate(chunk.payload).then((payload) => {
+                            const chunkNew = chunk.clone()
+                            chunkNew.payload = payload
+                            this.push(chunkNew)
+                            callback()
+                        }).catch((err) => {
+                            callback(err)
+                        })
+                    }
                 }
             },
-            read (size: number) {
-                queue.once("result", (result: string) => {
-                    this.push(result)
-                })
+            final (callback) {
+                this.push(null)
+                callback()
             }
         })
     }
-    /*  open node  */
+    /*  close node  */
     async close () {
         /*  close stream  */
         if (this.stream !== null) {

package/src/speechflow-node-t2t-format.ts ADDED Viewed

@@ -0,0 +1,85 @@
+/*
+**  SpeechFlow - Speech Processing Flow Graph
+**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+/*  standard dependencies  */
+import Stream           from "node:stream"
+/*  external dependencies  */
+import wrapText         from "wrap-text"
+/*  internal dependencies  */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+/*  SpeechFlow node for text-to-text formatting:
+    passes each non-empty text payload through wrapText() with the
+    configured "width" and appends a newline to a non-empty result
+    which does not already end with one  */
+export default class SpeechFlowNodeFormat extends SpeechFlowNode {
+    /*  declare official node name  */
+    public static name = "format"
+    /*  construct node (all arguments are handed unchanged to the SpeechFlowNode base class)  */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+        /*  declare node configuration parameters
+            ("width": type "number", val 80; read later as this.params.width)  */
+        this.configure({
+            width: { type: "number", val: 80 }
+        })
+        /*  declare node input/output format (text in, text out)  */
+        this.input  = "text"
+        this.output = "text"
+    }
+    /*  open node: set up the formatter and the object-mode transform stream  */
+    async open () {
+        /*  provide text-to-text formatter:
+            1. hand the text and this.params.width to wrapText()
+            2. if the last character of the result is not a newline, append one
+               (the regular expression has no "m" flag, so "$" is end-of-input only)  */
+        const format = async (text: string) => {
+            text = wrapText(text, this.params.width)
+            text = text.replace(/([^\n])$/, "$1\n")
+            return text
+        }
+        /*  establish a transform stream and connect it to the text formatter:
+            - a chunk with a Buffer payload is rejected with an error
+            - a chunk with an empty-string payload is pushed through as-is
+            - any other chunk is cloned, the clone receives the formatted
+              payload and is pushed downstream; formatter failures are
+              reported through the transform callback
+            - on final, null is pushed to signal the end of the readable side  */
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings:      false,
+            transform (chunk: SpeechFlowChunk, encoding, callback) {
+                if (Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else {
+                    if (chunk.payload === "") {
+                        this.push(chunk)
+                        callback()
+                    }
+                    else {
+                        format(chunk.payload).then((payload) => {
+                            const chunkNew = chunk.clone()
+                            chunkNew.payload = payload
+                            this.push(chunkNew)
+                            callback()
+                        }).catch((err) => {
+                            callback(err)
+                        })
+                    }
+                }
+            },
+            final (callback) {
+                this.push(null)
+                callback()
+            }
+        })
+    }
+    /*  close node  */
+    async close () {
+        /*  close stream: destroy it (if one exists) and reset the reference to null  */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+    }
+}

package/src/{speechflow-node-gemma.ts → speechflow-node-t2t-gemma.ts} RENAMED Viewed

@@ -6,13 +6,12 @@
 /*  standard dependencies  */
 import Stream           from "node:stream"
-import { EventEmitter } from "node:events"
 /*  external dependencies  */
 import { Ollama }       from "ollama"
 /*  internal dependencies  */
-import SpeechFlowNode   from "./speechflow-node"
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
 /*  internal utility types  */
 type ConfigEntry = { systemPrompt: string, chat: Array<{ role: string, content: string }> }
@@ -28,6 +27,69 @@ export default class SpeechFlowNodeGemma extends SpeechFlowNode {
     /*  internal LLM setup  */
     private setup: Config = {
+        /*  English (EN) spellchecking only  */
+        "en-en": {
+            systemPrompt:
+                "You are a proofreader and spellchecker for English.\n" +
+                "Output only the corrected text.\n" +
+                "Do NOT use markdown.\n" +
+                "Do NOT give any explanations.\n" +
+                "Do NOT give any introduction.\n" +
+                "Do NOT give any comments.\n" +
+                "Do NOT give any preamble.\n" +
+                "Do NOT give any prolog.\n" +
+                "Do NOT give any epilog.\n" +
+                "Do NOT change the gammar.\n" +
+                "Do NOT use synonyms for words.\n" +
+                "Keep all words.\n" +
+                "Fill in missing commas.\n" +
+                "Fill in missing points.\n" +
+                "Fill in missing question marks.\n" +
+                "Fill in missing hyphens.\n" +
+                "Focus ONLY on the word spelling.\n" +
+                "The text you have to correct is:\n",
+            chat: [
+                { role: "user",   content: "I luve my wyfe" },
+                { role: "system", content: "I love my wife." },
+                { role: "user",   content: "The weether is wunderfull!" },
+                { role: "system", content: "The weather is wonderful!" },
+                { role: "user",   content: "The live awesome but I'm hungry." },
+                { role: "system", content: "The live is awesome, but I'm hungry." }
+            ]
+        },
+        /*  German (DE) spellchecking only  */
+        "de-de": {
+            systemPrompt:
+                "Du bist ein Korrekturleser und Rechtschreibprüfer für Deutsch.\n" +
+                "Gib nur den korrigierten Text aus.\n" +
+                "Benutze KEIN Markdown.\n" +
+                "Gib KEINE Erklärungen.\n" +
+                "Gib KEINE Einleitung.\n" +
+                "Gib KEINE Kommentare.\n" +
+                "Gib KEINE Preamble.\n" +
+                "Gib KEINEN Prolog.\n" +
+                "Gib KEINEN Epilog.\n" +
+                "Ändere NICHT die Grammatik.\n" +
+                "Verwende KEINE Synonyme für Wörter.\n" +
+                "Behalte alle Wörter bei.\n" +
+                "Füge fehlende Kommas ein.\n" +
+                "Füge fehlende Punkte ein.\n" +
+                "Füge fehlende Fragezeichen ein.\n" +
+                "Füge fehlende Bindestriche ein.\n" +
+                "Füge fehlende Gedankenstriche ein.\n" +
+                "Fokussiere dich NUR auf die Rechtschreibung der Wörter.\n" +
+                "Der von dir zu korrigierende Text ist:\n",
+            chat: [
+                { role: "user",   content: "Ich ljebe meine Frao" },
+                { role: "system", content: "Ich liebe meine Frau." },
+                { role: "user",   content: "Die Wedter ist wunderschoen." },
+                { role: "system", content: "Das Wetter ist wunderschön." },
+                { role: "user",   content: "Das Leben einfach großartig aber ich bin hungrig." },
+                { role: "system", content: "Das Leben ist einfach großartig, aber ich bin hungrig." }
+            ]
+        },
         /*  English (EN) to German (DE) translation  */
         "en-de": {
             systemPrompt:
@@ -78,8 +140,8 @@ export default class SpeechFlowNodeGemma extends SpeechFlowNode {
     }
     /*  construct node  */
-    constructor (id: string, opts: { [ id: string ]: any }, args: any[]) {
-        super(id, opts, args)
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
         /*  declare node configuration parameters  */
         this.configure({
@@ -88,10 +150,6 @@ export default class SpeechFlowNodeGemma extends SpeechFlowNode {
             dst: { type: "string", pos: 1, val: "en", match: /^(?:de|en)$/ }
         })
-        /*  sanity check situation  */
-        if (this.params.src === this.params.dst)
-            throw new Error("source and destination languages cannot be the same")
         /*  declare node input/output format  */
         this.input  = "text"
         this.output = "text"
@@ -126,27 +184,33 @@ export default class SpeechFlowNodeGemma extends SpeechFlowNode {
         }
         /*  establish a duplex stream and connect it to Ollama  */
-        const queue = new EventEmitter()
-        this.stream = new Stream.Duplex({
-            write (chunk: Buffer, encoding, callback) {
-                const data = chunk.toString()
-                if (data === "") {
-                    queue.emit("result", "")
-                    callback()
-                }
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings:      false,
+            transform (chunk: SpeechFlowChunk, encoding, callback) {
+                if (Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
                 else {
-                    translate(data).then((result) => {
-                        queue.emit("result", result)
+                    if (chunk.payload === "") {
+                        this.push(chunk)
                         callback()
-                    }).catch((err) => {
-                        callback(err)
-                    })
+                    }
+                    else {
+                        translate(chunk.payload).then((payload) => {
+                            const chunkNew = chunk.clone()
+                            chunkNew.payload = payload
+                            this.push(chunkNew)
+                            callback()
+                        }).catch((err) => {
+                            callback(err)
+                        })
+                    }
                 }
             },
-            read (size) {
-                queue.once("result", (result: string) => {
-                    this.push(result)
-                })
+            final (callback) {
+                this.push(null)
+                callback()
             }
         })
     }

package/src/speechflow-node-t2t-opus.ts ADDED Viewed

@@ -0,0 +1,111 @@
+/*
+**  SpeechFlow - Speech Processing Flow Graph
+**  Copyright (c) 2024-2025 Dr. Ralf S. Engelschall <rse@engelschall.com>
+**  Licensed under GPL 3.0 <https://spdx.org/licenses/GPL-3.0-only>
+*/
+/*  standard dependencies  */
+import path             from "node:path"
+import Stream           from "node:stream"
+/*  external dependencies  */
+import * as Transformers from "@huggingface/transformers"
+/*  internal dependencies  */
+import SpeechFlowNode, { SpeechFlowChunk } from "./speechflow-node"
+/*  SpeechFlow node for OPUS text-to-text translation:
+    translates each non-empty text payload with a Transformers
+    "translation" pipeline using the model
+    "onnx-community/opus-mt-<src>-<dst>"  */
+export default class SpeechFlowNodeOPUS extends SpeechFlowNode {
+    /*  declare official node name  */
+    public static name = "opus"
+    /*  internal state: the translation pipeline (null until open() and again after close())  */
+    private translator: Transformers.TranslationPipeline | null = null
+    /*  construct node (all arguments are handed unchanged to the SpeechFlowNode base class)  */
+    constructor (id: string, cfg: { [ id: string ]: any }, opts: { [ id: string ]: any }, args: any[]) {
+        super(id, cfg, opts, args)
+        /*  declare node configuration parameters
+            ("src" at pos 0 with val "de", "dst" at pos 1 with val "en";
+            both have to match "de" or "en")  */
+        this.configure({
+            src: { type: "string", pos: 0, val: "de", match: /^(?:de|en)$/ },
+            dst: { type: "string", pos: 1, val: "en", match: /^(?:de|en)$/ }
+        })
+        /*  sanity check situation: an identical source and destination
+            language is rejected with an error at construction time  */
+        if (this.params.src === this.params.dst)
+            throw new Error("source and destination languages cannot be the same")
+        /*  declare node input/output format (text in, text out)  */
+        this.input  = "text"
+        this.output = "text"
+    }
+    /*  open node: create the translation pipeline and the object-mode transform stream  */
+    async open () {
+        /*  instantiate OPUS: the model name is derived from the src/dst
+            parameters and the "opus" sub-directory of this.config.cacheDir
+            is passed as the cache directory  */
+        const model = `onnx-community/opus-mt-${this.params.src}-${this.params.dst}`
+        this.translator = await Transformers.pipeline("translation", model, {
+            cache_dir: path.join(this.config.cacheDir, "opus"),
+            dtype:     "q4",
+            device:    "gpu"
+        })
+        if (this.translator === null)
+            throw new Error("failed to instantiate translator pipeline")
+        /*  provide text-to-text translation: call the pipeline and return
+            the translation_text of the first entry (if the result is an
+            array) or of the result itself (otherwise)  */
+        const translate = async (text: string) => {
+            const result = await this.translator!(text)
+            return Array.isArray(result) ?
+                (result[0] as Transformers.TranslationSingle).translation_text :
+                (result as Transformers.TranslationSingle).translation_text
+        }
+        /*  establish a transform stream and connect it to the OPUS translation pipeline:
+            - a chunk with a Buffer payload is rejected with an error
+            - a chunk with an empty-string payload is pushed through as-is
+            - any other chunk is cloned, the clone receives the translated
+              payload and is pushed downstream; translation failures are
+              reported through the transform callback
+            - on final, null is pushed to signal the end of the readable side  */
+        this.stream = new Stream.Transform({
+            readableObjectMode: true,
+            writableObjectMode: true,
+            decodeStrings:      false,
+            transform (chunk: SpeechFlowChunk, encoding, callback) {
+                if (Buffer.isBuffer(chunk.payload))
+                    callback(new Error("invalid chunk payload type"))
+                else {
+                    if (chunk.payload === "") {
+                        this.push(chunk)
+                        callback()
+                    }
+                    else {
+                        translate(chunk.payload).then((payload) => {
+                            const chunkNew = chunk.clone()
+                            chunkNew.payload = payload
+                            this.push(chunkNew)
+                            callback()
+                        }).catch((err) => {
+                            callback(err)
+                        })
+                    }
+                }
+            },
+            final (callback) {
+                this.push(null)
+                callback()
+            }
+        })
+    }
+    /*  close node  */
+    async close () {
+        /*  close stream: destroy it (if one exists) and reset the reference to null  */
+        if (this.stream !== null) {
+            this.stream.destroy()
+            this.stream = null
+        }
+        /*  shutdown OPUS: dispose the pipeline and reset the reference to null
+            (NOTE(review): the return value of dispose() is not awaited here --
+            confirm whether it is a Promise which should be awaited)  */
+        if (this.translator !== null) {
+            this.translator.dispose()
+            this.translator = null
+        }
+    }
+}