npm - @tensamin/audio - Versions diffs - 0.1.3 → 0.1.4 - Mend

@tensamin/audio 0.1.3 → 0.1.4

This diff shows the changes between publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (24)

package/README.md +217 -54
package/dist/{chunk-EXH2PNUE.mjs → chunk-AHBRT4RD.mjs} +128 -33
package/dist/{chunk-XMTQPMQ6.mjs → chunk-ERJVV5JR.mjs} +1 -1
package/dist/chunk-N553RHTI.mjs +93 -0
package/dist/{chunk-R5JVHKWA.mjs → chunk-NMHKX64G.mjs} +32 -12
package/dist/{chunk-6P2RDBW5.mjs → chunk-YOSTLLCS.mjs} +1 -1
package/dist/extensibility/plugins.js +32 -12
package/dist/extensibility/plugins.mjs +2 -2
package/dist/index.js +200 -51
package/dist/index.mjs +5 -5
package/dist/livekit/integration.js +200 -51
package/dist/livekit/integration.mjs +5 -5
package/dist/pipeline/audio-pipeline.js +200 -51
package/dist/pipeline/audio-pipeline.mjs +4 -4
package/dist/types.d.mts +118 -10
package/dist/types.d.ts +118 -10
package/dist/vad/vad-node.js +32 -12
package/dist/vad/vad-node.mjs +1 -1
package/dist/vad/vad-state.d.mts +1 -0
package/dist/vad/vad-state.d.ts +1 -0
package/dist/vad/vad-state.js +42 -8
package/dist/vad/vad-state.mjs +1 -1
package/package.json +1 -1
package/dist/chunk-JJASCVEW.mjs +0 -59

package/dist/{chunk-R5JVHKWA.mjs → chunk-NMHKX64G.mjs} RENAMED Viewed

@@ -1,11 +1,23 @@
 // src/vad/vad-node.ts
-var energyVadWorkletCode = `
+var createEnergyVadWorkletCode = (vadConfig) => {
+  const energyParams = vadConfig?.energyVad || {};
+  const smoothing = energyParams.smoothing ?? 0.95;
+  const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
+  const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const minSNR = energyParams.minSNR ?? 2;
+  const snrRange = energyParams.snrRange ?? 8;
+  return `
 class EnergyVadProcessor extends AudioWorkletProcessor {
   constructor() {
     super();
-    this.smoothing = 0.95;
+    this.smoothing = ${smoothing};
     this.energy = 0;
-    this.noiseFloor = 0.001;
+    this.noiseFloor = ${initialNoiseFloor};
+    this.noiseFloorAdaptRateQuiet = ${noiseFloorAdaptRateQuiet};
+    this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
+    this.minSNR = ${minSNR};
+    this.snrRange = ${snrRange};
   }
   process(inputs, outputs, parameters) {
@@ -13,32 +25,39 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     if (!input || !input.length) return true;
     const channel = input[0];
-    // Calculate RMS
+    // Calculate RMS (Root Mean Square) energy
     let sum = 0;
     for (let i = 0; i < channel.length; i++) {
       sum += channel[i] * channel[i];
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Simple adaptive noise floor (very basic)
+    // Adaptive noise floor estimation
+    // When signal is quiet, adapt quickly to find new noise floor
+    // When signal is loud (speech), adapt slowly to avoid raising noise floor
     if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * 0.99 + rms * 0.01;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
     } else {
-      this.noiseFloor = this.noiseFloor * 0.999 + rms * 0.001;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
     }
-    // Calculate "probability" based on SNR
-    // This is a heuristic mapping from energy to 0-1
+    // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
-    const probability = Math.min(1, Math.max(0, (snr - 1.5) / 10)); // Arbitrary scaling
+    // Map SNR to probability (0-1)
+    // Probability is 0 when SNR <= minSNR
+    // Probability scales linearly from 0 to 1 between minSNR and (minSNR + snrRange)
+    // Probability is 1 when SNR >= (minSNR + snrRange)
+    const probability = Math.min(1, Math.max(0, (snr - this.minSNR) / this.snrRange));
-    this.port.postMessage({ probability });
+    this.port.postMessage({ probability, snr, noiseFloor: this.noiseFloor, rms });
     return true;
   }
 }
 registerProcessor('energy-vad-processor', EnergyVadProcessor);
 `;
+};
 var EnergyVADPlugin = class {
   name = "energy-vad";
   async createNode(context, config, onDecision) {
@@ -47,7 +66,8 @@ var EnergyVADPlugin = class {
       const pass = context.createGain();
       return pass;
     }
-    const blob = new Blob([energyVadWorkletCode], {
+    const workletCode = createEnergyVadWorkletCode(config);
+    const blob = new Blob([workletCode], {
       type: "application/javascript"
     });
     const url = URL.createObjectURL(blob);

package/dist/{chunk-6P2RDBW5.mjs → chunk-YOSTLLCS.mjs} RENAMED Viewed

@@ -3,7 +3,7 @@ import {
 } from "./chunk-XO6B3D4A.mjs";
 import {
   EnergyVADPlugin
-} from "./chunk-R5JVHKWA.mjs";
+} from "./chunk-NMHKX64G.mjs";
 // src/extensibility/plugins.ts
 var nsPlugins = /* @__PURE__ */ new Map();

package/dist/extensibility/plugins.js CHANGED Viewed

@@ -102,13 +102,25 @@ To disable noise suppression, set noiseSuppression.enabled to false.`
 };
 // src/vad/vad-node.ts
-var energyVadWorkletCode = `
+var createEnergyVadWorkletCode = (vadConfig) => {
+  const energyParams = vadConfig?.energyVad || {};
+  const smoothing = energyParams.smoothing ?? 0.95;
+  const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
+  const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const minSNR = energyParams.minSNR ?? 2;
+  const snrRange = energyParams.snrRange ?? 8;
+  return `
 class EnergyVadProcessor extends AudioWorkletProcessor {
   constructor() {
     super();
-    this.smoothing = 0.95;
+    this.smoothing = ${smoothing};
     this.energy = 0;
-    this.noiseFloor = 0.001;
+    this.noiseFloor = ${initialNoiseFloor};
+    this.noiseFloorAdaptRateQuiet = ${noiseFloorAdaptRateQuiet};
+    this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
+    this.minSNR = ${minSNR};
+    this.snrRange = ${snrRange};
   }
   process(inputs, outputs, parameters) {
@@ -116,32 +128,39 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     if (!input || !input.length) return true;
     const channel = input[0];
-    // Calculate RMS
+    // Calculate RMS (Root Mean Square) energy
     let sum = 0;
     for (let i = 0; i < channel.length; i++) {
       sum += channel[i] * channel[i];
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Simple adaptive noise floor (very basic)
+    // Adaptive noise floor estimation
+    // When signal is quiet, adapt quickly to find new noise floor
+    // When signal is loud (speech), adapt slowly to avoid raising noise floor
     if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * 0.99 + rms * 0.01;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
     } else {
-      this.noiseFloor = this.noiseFloor * 0.999 + rms * 0.001;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
     }
-    // Calculate "probability" based on SNR
-    // This is a heuristic mapping from energy to 0-1
+    // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
-    const probability = Math.min(1, Math.max(0, (snr - 1.5) / 10)); // Arbitrary scaling
+    // Map SNR to probability (0-1)
+    // Probability is 0 when SNR <= minSNR
+    // Probability scales linearly from 0 to 1 between minSNR and (minSNR + snrRange)
+    // Probability is 1 when SNR >= (minSNR + snrRange)
+    const probability = Math.min(1, Math.max(0, (snr - this.minSNR) / this.snrRange));
-    this.port.postMessage({ probability });
+    this.port.postMessage({ probability, snr, noiseFloor: this.noiseFloor, rms });
     return true;
   }
 }
 registerProcessor('energy-vad-processor', EnergyVadProcessor);
 `;
+};
 var EnergyVADPlugin = class {
   name = "energy-vad";
   async createNode(context, config, onDecision) {
@@ -150,7 +169,8 @@ var EnergyVADPlugin = class {
       const pass = context.createGain();
       return pass;
     }
-    const blob = new Blob([energyVadWorkletCode], {
+    const workletCode = createEnergyVadWorkletCode(config);
+    const blob = new Blob([workletCode], {
       type: "application/javascript"
     });
     const url = URL.createObjectURL(blob);

package/dist/extensibility/plugins.mjs CHANGED Viewed

@@ -3,9 +3,9 @@ import {
   getVADPlugin,
   registerNoiseSuppressionPlugin,
   registerVADPlugin
-} from "../chunk-6P2RDBW5.mjs";
+} from "../chunk-YOSTLLCS.mjs";
 import "../chunk-XO6B3D4A.mjs";
-import "../chunk-R5JVHKWA.mjs";
+import "../chunk-NMHKX64G.mjs";
 export {
   getNoiseSuppressionPlugin,
   getVADPlugin,

package/dist/index.js CHANGED Viewed

@@ -154,13 +154,25 @@ To disable noise suppression, set noiseSuppression.enabled to false.`
 };
 // src/vad/vad-node.ts
-var energyVadWorkletCode = `
+var createEnergyVadWorkletCode = (vadConfig) => {
+  const energyParams = vadConfig?.energyVad || {};
+  const smoothing = energyParams.smoothing ?? 0.95;
+  const initialNoiseFloor = energyParams.initialNoiseFloor ?? 1e-3;
+  const noiseFloorAdaptRateQuiet = energyParams.noiseFloorAdaptRateQuiet ?? 0.01;
+  const noiseFloorAdaptRateLoud = energyParams.noiseFloorAdaptRateLoud ?? 1e-3;
+  const minSNR = energyParams.minSNR ?? 2;
+  const snrRange = energyParams.snrRange ?? 8;
+  return `
 class EnergyVadProcessor extends AudioWorkletProcessor {
   constructor() {
     super();
-    this.smoothing = 0.95;
+    this.smoothing = ${smoothing};
     this.energy = 0;
-    this.noiseFloor = 0.001;
+    this.noiseFloor = ${initialNoiseFloor};
+    this.noiseFloorAdaptRateQuiet = ${noiseFloorAdaptRateQuiet};
+    this.noiseFloorAdaptRateLoud = ${noiseFloorAdaptRateLoud};
+    this.minSNR = ${minSNR};
+    this.snrRange = ${snrRange};
   }
   process(inputs, outputs, parameters) {
@@ -168,32 +180,39 @@ class EnergyVadProcessor extends AudioWorkletProcessor {
     if (!input || !input.length) return true;
     const channel = input[0];
-    // Calculate RMS
+    // Calculate RMS (Root Mean Square) energy
     let sum = 0;
     for (let i = 0; i < channel.length; i++) {
       sum += channel[i] * channel[i];
     }
     const rms = Math.sqrt(sum / channel.length);
-    // Simple adaptive noise floor (very basic)
+    // Adaptive noise floor estimation
+    // When signal is quiet, adapt quickly to find new noise floor
+    // When signal is loud (speech), adapt slowly to avoid raising noise floor
     if (rms < this.noiseFloor) {
-      this.noiseFloor = this.noiseFloor * 0.99 + rms * 0.01;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateQuiet) + rms * this.noiseFloorAdaptRateQuiet;
     } else {
-      this.noiseFloor = this.noiseFloor * 0.999 + rms * 0.001;
+      this.noiseFloor = this.noiseFloor * (1 - this.noiseFloorAdaptRateLoud) + rms * this.noiseFloorAdaptRateLoud;
     }
-    // Calculate "probability" based on SNR
-    // This is a heuristic mapping from energy to 0-1
+    // Calculate Signal-to-Noise Ratio (SNR)
     const snr = rms / (this.noiseFloor + 1e-6);
-    const probability = Math.min(1, Math.max(0, (snr - 1.5) / 10)); // Arbitrary scaling
+    // Map SNR to probability (0-1)
+    // Probability is 0 when SNR <= minSNR
+    // Probability scales linearly from 0 to 1 between minSNR and (minSNR + snrRange)
+    // Probability is 1 when SNR >= (minSNR + snrRange)
+    const probability = Math.min(1, Math.max(0, (snr - this.minSNR) / this.snrRange));
-    this.port.postMessage({ probability });
+    this.port.postMessage({ probability, snr, noiseFloor: this.noiseFloor, rms });
     return true;
   }
 }
 registerProcessor('energy-vad-processor', EnergyVadProcessor);
 `;
+};
 var EnergyVADPlugin = class {
   name = "energy-vad";
   async createNode(context, config, onDecision) {
@@ -202,7 +221,8 @@ var EnergyVADPlugin = class {
       const pass = context.createGain();
       return pass;
     }
-    const blob = new Blob([energyVadWorkletCode], {
+    const workletCode = createEnergyVadWorkletCode(config);
+    const blob = new Blob([workletCode], {
       type: "application/javascript"
     });
     const url = URL.createObjectURL(blob);
@@ -288,31 +308,60 @@ var VADStateMachine = class {
   currentState = "silent";
   lastSpeechTime = 0;
   speechStartTime = 0;
+  lastSilenceTime = 0;
   frameDurationMs = 20;
   // Assumed frame duration, updated by calls
   constructor(config) {
     this.config = {
       enabled: config?.enabled ?? true,
       pluginName: config?.pluginName ?? "energy-vad",
-      startThreshold: config?.startThreshold ?? 0.5,
-      stopThreshold: config?.stopThreshold ?? 0.4,
-      hangoverMs: config?.hangoverMs ?? 300,
-      preRollMs: config?.preRollMs ?? 200
+      // Voice-optimized defaults
+      startThreshold: config?.startThreshold ?? 0.6,
+      // Higher threshold to avoid noise
+      stopThreshold: config?.stopThreshold ?? 0.45,
+      // Balanced for voice
+      hangoverMs: config?.hangoverMs ?? 400,
+      // Smooth for natural speech
+      preRollMs: config?.preRollMs ?? 250,
+      // Generous pre-roll
+      minSpeechDurationMs: config?.minSpeechDurationMs ?? 100,
+      minSilenceDurationMs: config?.minSilenceDurationMs ?? 150,
+      energyVad: {
+        smoothing: config?.energyVad?.smoothing ?? 0.95,
+        initialNoiseFloor: config?.energyVad?.initialNoiseFloor ?? 1e-3,
+        noiseFloorAdaptRateQuiet: config?.energyVad?.noiseFloorAdaptRateQuiet ?? 0.01,
+        noiseFloorAdaptRateLoud: config?.energyVad?.noiseFloorAdaptRateLoud ?? 1e-3,
+        minSNR: config?.energyVad?.minSNR ?? 2,
+        snrRange: config?.energyVad?.snrRange ?? 8
+      }
     };
+    this.lastSilenceTime = Date.now();
   }
   updateConfig(config) {
     this.config = { ...this.config, ...config };
   }
   processFrame(probability, timestamp) {
-    const { startThreshold, stopThreshold, hangoverMs } = this.config;
+    const {
+      startThreshold,
+      stopThreshold,
+      hangoverMs,
+      minSpeechDurationMs,
+      minSilenceDurationMs
+    } = this.config;
     let newState = this.currentState;
     if (this.currentState === "silent" || this.currentState === "speech_ending") {
       if (probability >= startThreshold) {
-        newState = "speech_starting";
-        this.speechStartTime = timestamp;
-        this.lastSpeechTime = timestamp;
+        const silenceDuration = timestamp - this.lastSilenceTime;
+        if (silenceDuration >= minSilenceDurationMs) {
+          newState = "speech_starting";
+          this.speechStartTime = timestamp;
+          this.lastSpeechTime = timestamp;
+        } else {
+          newState = "silent";
+        }
       } else {
         newState = "silent";
+        this.lastSilenceTime = timestamp;
       }
     } else if (this.currentState === "speech_starting" || this.currentState === "speaking") {
       if (probability >= stopThreshold) {
@@ -320,10 +369,15 @@ var VADStateMachine = class {
         this.lastSpeechTime = timestamp;
       } else {
         const timeSinceSpeech = timestamp - this.lastSpeechTime;
+        const speechDuration = timestamp - this.speechStartTime;
         if (timeSinceSpeech < hangoverMs) {
           newState = "speaking";
+        } else if (speechDuration < minSpeechDurationMs) {
+          newState = "silent";
+          this.lastSilenceTime = timestamp;
         } else {
           newState = "speech_ending";
+          this.lastSilenceTime = timestamp;
         }
       }
     }
@@ -342,7 +396,9 @@ var VADStateMachine = class {
 async function createAudioPipeline(sourceTrack, config = {}) {
   const context = getAudioContext();
   registerPipeline();
-  const nsEnabled = config.noiseSuppression?.enabled !== false && Boolean(config.noiseSuppression?.wasmUrl && config.noiseSuppression?.simdUrl && config.noiseSuppression?.workletUrl);
+  const nsEnabled = config.noiseSuppression?.enabled !== false && Boolean(
+    config.noiseSuppression?.wasmUrl && config.noiseSuppression?.simdUrl && config.noiseSuppression?.workletUrl
+  );
   const vadEnabled = config.vad?.enabled !== false;
   const fullConfig = {
     noiseSuppression: {
@@ -351,13 +407,38 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     },
     vad: {
       enabled: vadEnabled,
+      // Voice-optimized defaults (will be overridden by config)
+      startThreshold: 0.6,
+      stopThreshold: 0.45,
+      hangoverMs: 400,
+      preRollMs: 250,
+      minSpeechDurationMs: 100,
+      minSilenceDurationMs: 150,
+      energyVad: {
+        smoothing: 0.95,
+        initialNoiseFloor: 1e-3,
+        noiseFloorAdaptRateQuiet: 0.01,
+        noiseFloorAdaptRateLoud: 1e-3,
+        minSNR: 2,
+        snrRange: 8
+      },
       ...config.vad
     },
     output: {
       speechGain: 1,
-      silenceGain: vadEnabled ? 0 : 1,
-      // If no VAD, always output audio
-      gainRampTime: 0.02,
+      silenceGain: 0,
+      // Full mute for voice-only
+      gainRampTime: 0.015,
+      // Fast but smooth transitions
+      smoothTransitions: true,
+      maxGainDb: 6,
+      enableCompression: false,
+      compression: {
+        threshold: -24,
+        ratio: 3,
+        attack: 3e-3,
+        release: 0.05
+      },
       ...config.output
     },
     livekit: { manageTrackMute: false, ...config.livekit }
@@ -368,7 +449,9 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     output: fullConfig.output
   });
   if (!sourceTrack || sourceTrack.kind !== "audio") {
-    throw new Error("createAudioPipeline requires a valid audio MediaStreamTrack");
+    throw new Error(
+      "createAudioPipeline requires a valid audio MediaStreamTrack"
+    );
   }
   if (sourceTrack.readyState === "ended") {
     throw new Error("Cannot create pipeline from an ended MediaStreamTrack");
@@ -382,10 +465,7 @@ async function createAudioPipeline(sourceTrack, config = {}) {
     const nsPlugin = getNoiseSuppressionPlugin(
       fullConfig.noiseSuppression?.pluginName
     );
-    nsNode = await nsPlugin.createNode(
-      context,
-      fullConfig.noiseSuppression
-    );
+    nsNode = await nsPlugin.createNode(context, fullConfig.noiseSuppression);
   } catch (error) {
     const err = error instanceof Error ? error : new Error(String(error));
     console.error("Failed to create noise suppression node:", err);
@@ -395,25 +475,21 @@ async function createAudioPipeline(sourceTrack, config = {}) {
   const vadStateMachine = new VADStateMachine(fullConfig.vad);
   try {
     const vadPlugin = getVADPlugin(fullConfig.vad?.pluginName);
-    vadNode = await vadPlugin.createNode(
-      context,
-      fullConfig.vad,
-      (prob) => {
-        try {
-          const timestamp = context.currentTime * 1e3;
-          const newState = vadStateMachine.processFrame(prob, timestamp);
-          if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
-            emitter.emit("vadChange", newState);
-            lastVadState = newState;
-            updateGain(newState);
-          }
-        } catch (vadError) {
-          const err = vadError instanceof Error ? vadError : new Error(String(vadError));
-          console.error("Error in VAD callback:", err);
-          emitter.emit("error", err);
+    vadNode = await vadPlugin.createNode(context, fullConfig.vad, (prob) => {
+      try {
+        const timestamp = context.currentTime * 1e3;
+        const newState = vadStateMachine.processFrame(prob, timestamp);
+        if (newState.state !== lastVadState.state || Math.abs(newState.probability - lastVadState.probability) > 0.1) {
+          emitter.emit("vadChange", newState);
+          lastVadState = newState;
+          updateGain(newState);
         }
+      } catch (vadError) {
+        const err = vadError instanceof Error ? vadError : new Error(String(vadError));
+        console.error("Error in VAD callback:", err);
+        emitter.emit("error", err);
       }
-    );
+    });
   } catch (error) {
     const err = error instanceof Error ? error : new Error(String(error));
     console.error("Failed to create VAD node:", err);
@@ -430,15 +506,31 @@ async function createAudioPipeline(sourceTrack, config = {}) {
   nsNode.connect(splitter);
   splitter.connect(vadNode);
   const delayNode = context.createDelay(1);
-  const preRollSeconds = (fullConfig.vad?.preRollMs ?? 200) / 1e3;
+  const preRollSeconds = (fullConfig.vad?.preRollMs ?? 250) / 1e3;
   delayNode.delayTime.value = preRollSeconds;
   const gainNode = context.createGain();
   gainNode.gain.value = fullConfig.output?.silenceGain ?? 0;
+  let compressor = null;
+  if (fullConfig.output?.enableCompression) {
+    compressor = context.createDynamicsCompressor();
+    const comp = fullConfig.output.compression;
+    compressor.threshold.value = comp.threshold ?? -24;
+    compressor.ratio.value = comp.ratio ?? 3;
+    compressor.attack.value = comp.attack ?? 3e-3;
+    compressor.release.value = comp.release ?? 0.05;
+    compressor.knee.value = 10;
+  }
   const destination = context.createMediaStreamDestination();
   try {
     splitter.connect(delayNode);
     delayNode.connect(gainNode);
-    gainNode.connect(destination);
+    if (compressor) {
+      gainNode.connect(compressor);
+      compressor.connect(destination);
+      console.log("Compression enabled:", fullConfig.output?.compression);
+    } else {
+      gainNode.connect(destination);
+    }
   } catch (error) {
     const err = error instanceof Error ? error : new Error(String(error));
     console.error("Failed to wire audio pipeline:", err);
@@ -447,10 +539,24 @@ async function createAudioPipeline(sourceTrack, config = {}) {
   }
   function updateGain(state) {
     try {
-      const { speechGain, silenceGain, gainRampTime } = fullConfig.output;
-      const targetGain = state.isSpeaking ? speechGain ?? 1 : silenceGain ?? 0;
+      const {
+        speechGain = 1,
+        silenceGain = 0,
+        gainRampTime = 0.015,
+        smoothTransitions = true,
+        maxGainDb = 6
+      } = fullConfig.output;
+      const maxGainLinear = Math.pow(10, maxGainDb / 20);
+      const limitedSpeechGain = Math.min(speechGain, maxGainLinear);
+      const targetGain = state.isSpeaking ? limitedSpeechGain : silenceGain;
       const now = context.currentTime;
-      gainNode.gain.setTargetAtTime(targetGain, now, gainRampTime ?? 0.02);
+      if (smoothTransitions) {
+        gainNode.gain.cancelScheduledValues(now);
+        gainNode.gain.setValueAtTime(gainNode.gain.value, now);
+        gainNode.gain.setTargetAtTime(targetGain, now, gainRampTime / 3);
+      } else {
+        gainNode.gain.setValueAtTime(targetGain, now);
+      }
     } catch (error) {
       const err = error instanceof Error ? error : new Error(String(error));
       console.error("Failed to update gain:", err);
@@ -506,6 +612,9 @@ async function createAudioPipeline(sourceTrack, config = {}) {
       vadNode.disconnect();
       delayNode.disconnect();
       gainNode.disconnect();
+      if (compressor) {
+        compressor.disconnect();
+      }
       destination.stream.getTracks().forEach((t) => t.stop());
       unregisterPipeline();
     } catch (error) {
@@ -522,7 +631,47 @@ async function createAudioPipeline(sourceTrack, config = {}) {
       try {
         if (newConfig.vad) {
           vadStateMachine.updateConfig(newConfig.vad);
+          Object.assign(fullConfig.vad, newConfig.vad);
+          if (newConfig.vad.preRollMs !== void 0) {
+            const preRollSeconds2 = newConfig.vad.preRollMs / 1e3;
+            delayNode.delayTime.setValueAtTime(
+              preRollSeconds2,
+              context.currentTime
+            );
+          }
+        }
+        if (newConfig.output) {
+          Object.assign(fullConfig.output, newConfig.output);
+          updateGain(lastVadState);
+          if (compressor && newConfig.output.compression) {
+            const comp = newConfig.output.compression;
+            if (comp.threshold !== void 0) {
+              compressor.threshold.setValueAtTime(
+                comp.threshold,
+                context.currentTime
+              );
+            }
+            if (comp.ratio !== void 0) {
+              compressor.ratio.setValueAtTime(comp.ratio, context.currentTime);
+            }
+            if (comp.attack !== void 0) {
+              compressor.attack.setValueAtTime(
+                comp.attack,
+                context.currentTime
+              );
+            }
+            if (comp.release !== void 0) {
+              compressor.release.setValueAtTime(
+                comp.release,
+                context.currentTime
+              );
+            }
+          }
+        }
+        if (newConfig.livekit) {
+          Object.assign(fullConfig.livekit, newConfig.livekit);
         }
+        console.log("Pipeline config updated:", newConfig);
       } catch (error) {
         const err = error instanceof Error ? error : new Error(String(error));
         console.error("Failed to update config:", err);

package/dist/index.mjs CHANGED Viewed

@@ -1,13 +1,13 @@
 import "./chunk-WBQAMGXK.mjs";
 import {
   attachProcessingToTrack
-} from "./chunk-XMTQPMQ6.mjs";
+} from "./chunk-ERJVV5JR.mjs";
 import {
   createAudioPipeline
-} from "./chunk-EXH2PNUE.mjs";
+} from "./chunk-AHBRT4RD.mjs";
 import {
   VADStateMachine
-} from "./chunk-JJASCVEW.mjs";
+} from "./chunk-N553RHTI.mjs";
 import {
   closeAudioContext,
   getAudioContext,
@@ -21,13 +21,13 @@ import {
   getVADPlugin,
   registerNoiseSuppressionPlugin,
   registerVADPlugin
-} from "./chunk-6P2RDBW5.mjs";
+} from "./chunk-YOSTLLCS.mjs";
 import {
   RNNoisePlugin
 } from "./chunk-XO6B3D4A.mjs";
 import {
   EnergyVADPlugin
-} from "./chunk-R5JVHKWA.mjs";
+} from "./chunk-NMHKX64G.mjs";
 export {
   EnergyVADPlugin,
   RNNoisePlugin,