npm - @tensamin/audio - Versions diffs - 0.1.4 → 0.1.6 - Mend

@tensamin/audio 0.1.4 → 0.1.6

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (17)

package/dist/{chunk-AHBRT4RD.mjs → chunk-DF4AYGHJ.mjs} +6 -2
package/dist/{chunk-NMHKX64G.mjs → chunk-TLPO52HV.mjs} +34 -8
package/dist/{chunk-ERJVV5JR.mjs → chunk-TWQJGBBU.mjs} +1 -1
package/dist/{chunk-YOSTLLCS.mjs → chunk-ZCC7ID7L.mjs} +1 -1
package/dist/extensibility/plugins.js +34 -8
package/dist/extensibility/plugins.mjs +2 -2
package/dist/index.js +39 -9
package/dist/index.mjs +4 -4
package/dist/livekit/integration.js +39 -9
package/dist/livekit/integration.mjs +4 -4
package/dist/pipeline/audio-pipeline.js +39 -9
package/dist/pipeline/audio-pipeline.mjs +3 -3
package/dist/vad/vad-node.d.mts +2 -0
package/dist/vad/vad-node.d.ts +2 -0
package/dist/vad/vad-node.js +34 -8
package/dist/vad/vad-node.mjs +1 -1
package/package.json +1 -1

package/dist/{chunk-AHBRT4RD.mjs → chunk-DF4AYGHJ.mjs} RENAMED Viewed

@@ -9,7 +9,7 @@ import {
 import {
   getNoiseSuppressionPlugin,
   getVADPlugin
-} from "./chunk-YOSTLLCS.mjs";
+} from "./chunk-ZCC7ID7L.mjs";
 // src/pipeline/audio-pipeline.ts
 import mitt from "mitt";
@@ -93,12 +93,16 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     throw err;
   }
   const vadStateMachine = new VADStateMachine(fullConfig.vad);
+  let vadPlugin;
   try {
-    const vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
+    vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
     vadNode = await vadPlugin.createNode(context, fullConfig.vad, (prob) => {
       try {
         const timestamp = context.currentTime * 1e3;
         const newState = vadStateMachine.processFrame(prob, timestamp);
+        if (vadPlugin && typeof vadPlugin.updateSpeakingState === "function") {
+          vadPlugin.updateSpeakingState(newState.isSpeaking);
+        }
         if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
           emitter.emit("vadChange", newState);
           lastVadState = newState;

package/dist/{chunk-NMHKX64G.mjs → chunk-TLPO52HV.mjs} RENAMED Viewed

@@ -4,7 +4,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -18,6 +18,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -32,14 +39,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -60,6 +79,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -86,6 +106,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -111,6 +132,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 export {

package/dist/{chunk-ERJVV5JR.mjs → chunk-TWQJGBBU.mjs} RENAMED Viewed

@@ -1,6 +1,6 @@
 import {
   createAudioPipeline
-} from "./chunk-AHBRT4RD.mjs";
+} from "./chunk-DF4AYGHJ.mjs";
 // src/livekit/integration.ts
 async function attachProcessingToTrack(track, config = {}) {

package/dist/{chunk-YOSTLLCS.mjs → chunk-ZCC7ID7L.mjs} RENAMED Viewed

@@ -3,7 +3,7 @@ import {
 } from "./chunk-XO6B3D4A.mjs";
 import {
   EnergyVADPlugin
-} from "./chunk-NMHKX64G.mjs";
+} from "./chunk-TLPO52HV.mjs";
 // src/extensibility/plugins.ts
 var nsPlugins = /* @__PURE__ */ new Map();

package/dist/extensibility/plugins.js CHANGED Viewed

@@ -107,7 +107,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -121,6 +121,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -135,14 +142,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -163,6 +182,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -189,6 +209,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -214,6 +235,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 // src/extensibility/plugins.ts

package/dist/extensibility/plugins.mjs CHANGED Viewed

@@ -3,9 +3,9 @@ import {
   getVADPlugin,
   registerNoiseSuppressionPlugin,
   registerVADPlugin
-} from "../chunk-YOSTLLCS.mjs";
+} from "../chunk-ZCC7ID7L.mjs";
 import "../chunk-XO6B3D4A.mjs";
-import "../chunk-NMHKX64G.mjs";
+import "../chunk-TLPO52HV.mjs";
 export {
   getNoiseSuppressionPlugin,
   getVADPlugin,

package/dist/index.js CHANGED Viewed

@@ -159,7 +159,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -173,6 +173,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -187,14 +194,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -215,6 +234,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -241,6 +261,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -266,6 +287,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 // src/extensibility/plugins.ts
@@ -473,12 +499,16 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     throw err;
   }
   const vadStateMachine = new VADStateMachine(fullConfig.vad);
+  let vadPlugin;
   try {
-    const vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
+    vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
     vadNode = await vadPlugin.createNode(context, fullConfig.vad, (prob) => {
       try {
         const timestamp = context.currentTime * 1e3;
         const newState = vadStateMachine.processFrame(prob, timestamp);
+        if (vadPlugin && typeof vadPlugin.updateSpeakingState === "function") {
+          vadPlugin.updateSpeakingState(newState.isSpeaking);
+        }
         if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
           emitter.emit("vadChange", newState);
           lastVadState = newState;

package/dist/index.mjs CHANGED Viewed

@@ -1,10 +1,10 @@
 import "./chunk-WBQAMGXK.mjs";
 import {
   attachProcessingToTrack
-} from "./chunk-ERJVV5JR.mjs";
+} from "./chunk-TWQJGBBU.mjs";
 import {
   createAudioPipeline
-} from "./chunk-AHBRT4RD.mjs";
+} from "./chunk-DF4AYGHJ.mjs";
 import {
   VADStateMachine
 } from "./chunk-N553RHTI.mjs";
@@ -21,13 +21,13 @@ import {
   getVADPlugin,
   registerNoiseSuppressionPlugin,
   registerVADPlugin
-} from "./chunk-YOSTLLCS.mjs";
+} from "./chunk-ZCC7ID7L.mjs";
 import {
   RNNoisePlugin
 } from "./chunk-XO6B3D4A.mjs";
 import {
   EnergyVADPlugin
-} from "./chunk-NMHKX64G.mjs";
+} from "./chunk-TLPO52HV.mjs";
 export {
   EnergyVADPlugin,
   RNNoisePlugin,

package/dist/livekit/integration.js CHANGED Viewed

@@ -128,7 +128,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -142,6 +142,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -156,14 +163,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -184,6 +203,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -210,6 +230,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -235,6 +256,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 // src/extensibility/plugins.ts
@@ -436,12 +462,16 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     throw err;
   }
   const vadStateMachine = new VADStateMachine(fullConfig.vad);
+  let vadPlugin;
   try {
-    const vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
+    vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
     vadNode = await vadPlugin.createNode(context, fullConfig.vad, (prob) => {
       try {
         const timestamp = context.currentTime * 1e3;
         const newState = vadStateMachine.processFrame(prob, timestamp);
+        if (vadPlugin && typeof vadPlugin.updateSpeakingState === "function") {
+          vadPlugin.updateSpeakingState(newState.isSpeaking);
+        }
         if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
           emitter.emit("vadChange", newState);
           lastVadState = newState;

package/dist/livekit/integration.mjs CHANGED Viewed

@@ -1,12 +1,12 @@
 import {
   attachProcessingToTrack
-} from "../chunk-ERJVV5JR.mjs";
-import "../chunk-AHBRT4RD.mjs";
+} from "../chunk-TWQJGBBU.mjs";
+import "../chunk-DF4AYGHJ.mjs";
 import "../chunk-N553RHTI.mjs";
 import "../chunk-OZ7KMC4S.mjs";
-import "../chunk-YOSTLLCS.mjs";
+import "../chunk-ZCC7ID7L.mjs";
 import "../chunk-XO6B3D4A.mjs";
-import "../chunk-NMHKX64G.mjs";
+import "../chunk-TLPO52HV.mjs";
 export {
   attachProcessingToTrack
 };

package/dist/pipeline/audio-pipeline.js CHANGED Viewed

@@ -126,7 +126,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -140,6 +140,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -154,14 +161,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -182,6 +201,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -208,6 +228,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -233,6 +254,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 // src/extensibility/plugins.ts
@@ -434,12 +460,16 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     throw err;
   }
   const vadStateMachine = new VADStateMachine(fullConfig.vad);
+  let vadPlugin;
   try {
-    const vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
+    vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
     vadNode = await vadPlugin.createNode(context, fullConfig.vad, (prob) => {
       try {
         const timestamp = context.currentTime * 1e3;
         const newState = vadStateMachine.processFrame(prob, timestamp);
+        if (vadPlugin && typeof vadPlugin.updateSpeakingState === "function") {
+          vadPlugin.updateSpeakingState(newState.isSpeaking);
+        }
         if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
           emitter.emit("vadChange", newState);
           lastVadState = newState;

package/dist/pipeline/audio-pipeline.mjs CHANGED Viewed

@@ -1,11 +1,11 @@
 import {
   createAudioPipeline
-} from "../chunk-AHBRT4RD.mjs";
+} from "../chunk-DF4AYGHJ.mjs";
 import "../chunk-N553RHTI.mjs";
 import "../chunk-OZ7KMC4S.mjs";
-import "../chunk-YOSTLLCS.mjs";
+import "../chunk-ZCC7ID7L.mjs";
 import "../chunk-XO6B3D4A.mjs";
-import "../chunk-NMHKX64G.mjs";
+import "../chunk-TLPO52HV.mjs";
 export {
   createAudioPipeline
 };

package/dist/vad/vad-node.d.mts CHANGED Viewed

@@ -3,7 +3,9 @@ import 'mitt';
 declare class EnergyVADPlugin implements VADPlugin {
     name: string;
+    private workletNode;
     createNode(context: AudioContext, config: AudioProcessingConfig["vad"], onDecision: (probability: number) => void): Promise<AudioNode>;
+    updateSpeakingState(isSpeaking: boolean): void;
 }
 export { EnergyVADPlugin };

package/dist/vad/vad-node.d.ts CHANGED Viewed

@@ -3,7 +3,9 @@ import 'mitt';
 declare class EnergyVADPlugin implements VADPlugin {
     name: string;
+    private workletNode;
     createNode(context: AudioContext, config: AudioProcessingConfig["vad"], onDecision: (probability: number) => void): Promise<AudioNode>;
+    updateSpeakingState(isSpeaking: boolean): void;
 }
 export { EnergyVADPlugin };

package/dist/vad/vad-node.js CHANGED Viewed

@@ -28,7 +28,7 @@ var createEnergyVadWorkletCode = (vadConfig) => {
   const smoothing = energyParams.smoothing ?? 0.95;
   const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
   const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
-  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-4;
   const minSNR = energyParams.minSNR ?? 2;
   const snrRange = energyParams.snrRange ?? 8;
   return `
@@ -42,6 +42,13 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
     this.minSNR = ${minSNR};
     this.snrRange = ${snrRange};
+    this.isSpeaking = false;
+    this.port.onmessage = (event) => {
+      if (event.data && event.data.isSpeaking !== undefined) {
+        this.isSpeaking = event.data.isSpeaking;
+      }
+    };
   }
   process(inputs, outputs, parameters) {
@@ -56,14 +63,26 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Adaptive noise floor estimation
-    // When signal is quiet, adapt quickly to find new noise floor
-    // When signal is loud (speech), adapt slowly to avoid raising noise floor
-    if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
-    } else {
-      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+    // Adaptive noise floor estimation - ONLY during silence
+    // This prevents the noise floor from rising during speech
+    if (!this.isSpeaking) {
+      if (rms < this.noiseFloor) {
+        this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
+      } else {
+        // Even during silence, if we detect a loud signal, adapt very slowly
+        // This could be brief noise we haven't classified as speech yet
+        // SAFEGUARD: If the signal is significantly louder than the noise floor (e.g. > 3x),
+        // assume it's unclassified speech or a sudden loud noise and DO NOT adapt.
+        // This prevents the noise floor from "chasing" the speech level during brief pauses or onsets.
+        const instantSnr = rms / (this.noiseFloor + 1e-6);
+        if (instantSnr < 3.0) {
+          this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
+        }
+      }
     }
+    // During speech, freeze the noise floor to maintain consistent detection
     // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
@@ -84,6 +103,7 @@ registerProcessor('energy-vad-processor', EnergyVadProcessor);
 };
 var EnergyVADPlugin = class {
   name = "energy-vad";
+  workletNode = null;
   async createNode(context, config, onDecision) {
     if (!config?.enabled) {
       console.log("VAD disabled, using passthrough node");
@@ -110,6 +130,7 @@ var EnergyVADPlugin = class {
     let node;
     try {
       node = new AudioWorkletNode(context, "energy-vad-processor");
+      this.workletNode = node;
       console.log("Energy VAD node created successfully");
     } catch (e) {
       const error = new Error(
@@ -135,6 +156,11 @@ var EnergyVADPlugin = class {
     };
     return node;
   }
+  updateSpeakingState(isSpeaking) {
+    if (this.workletNode) {
+      this.workletNode.port.postMessage({ isSpeaking });
+    }
+  }
 };
 // Annotate the CommonJS export names for ESM import in node:
 0 && (module.exports = {

package/dist/vad/vad-node.mjs CHANGED Viewed

@@ -1,6 +1,6 @@
 import {
   EnergyVADPlugin
-} from "../chunk-NMHKX64G.mjs";
+} from "../chunk-TLPO52HV.mjs";
 export {
   EnergyVADPlugin
 };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@tensamin/audio",
-  "version": "0.1.4",
+  "version": "0.1.6",
   "main": "dist/index.js",
   "module": "dist/index.mjs",
   "types": "dist/index.d.ts",