npm - @newgameplusinc/odyssey-audio-video-sdk-dev - Versions diffs - 1.0.52 → 1.0.53 - Mend

@newgameplusinc/odyssey-audio-video-sdk-dev 1.0.52 → 1.0.53

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (3)

package/dist/MLNoiseSuppressor.d.ts +3 -1
package/dist/MLNoiseSuppressor.js +54 -16
package/package.json +1 -1

package/dist/MLNoiseSuppressor.d.ts CHANGED Viewed

@@ -11,6 +11,7 @@ export declare class MLNoiseSuppressor {
     private processingQueue;
     private outputQueue;
     private isProcessing;
+    private highPassFilter;
     /**
      * Initialize the ML noise suppressor
      * @param modelUrl URL to the model.json file
@@ -52,7 +53,8 @@ export declare class MLNoiseSuppressor {
      */
     private startBackgroundProcessing;
     /**
-     * Fast audio processing with simplified ML (optimized version)
+     * Fast audio processing optimized for voice quality
+     * Preserves voice fundamentals (80-250Hz) while reducing noise
      */
     private processAudioFast;
     /**

package/dist/MLNoiseSuppressor.js CHANGED Viewed

@@ -50,6 +50,8 @@ class MLNoiseSuppressor {
         this.processingQueue = [];
         this.outputQueue = [];
         this.isProcessing = false;
+        // High-pass filter state for voice optimization (remove <80Hz rumble)
+        this.highPassFilter = null;
     }
     /**
      * Initialize the ML noise suppressor
@@ -225,6 +227,13 @@ class MLNoiseSuppressor {
             // Create MediaStreamSource from input
             const source = this.audioContext.createMediaStreamSource(inputStream);
             console.log('🎤 [ML] Created MediaStreamSource');
+            // Create high-pass filter to remove rumble (<80Hz)
+            // This improves voice clarity and matches Google Meet quality
+            this.highPassFilter = this.audioContext.createBiquadFilter();
+            this.highPassFilter.type = 'highpass';
+            this.highPassFilter.frequency.value = 80; // Remove frequencies below 80Hz
+            this.highPassFilter.Q.value = 0.7; // Gentle slope
+            console.log('🎤 [ML] Created high-pass filter (80Hz cutoff)');
             // Create destination for output
             const destination = this.audioContext.createMediaStreamDestination();
             console.log('🎤 [ML] Created destination stream');
@@ -268,10 +277,11 @@ class MLNoiseSuppressor {
                     }
                 }
             };
-            // Connect: source -> processor -> destination
-            source.connect(processor);
+            // Connect: source -> highpass -> processor -> destination
+            source.connect(this.highPassFilter);
+            this.highPassFilter.connect(processor);
             processor.connect(destination);
-            console.log('✅ [ML] Pipeline connected: source -> processor -> destination');
+            console.log('✅ [ML] Pipeline connected: source -> highpass(80Hz) -> processor -> destination');
             console.log('✅ [ML] Output stream tracks:', destination.stream.getTracks().length);
             return destination.stream;
         }
@@ -314,32 +324,56 @@ class MLNoiseSuppressor {
         processLoop();
     }
     /**
-     * Fast audio processing with simplified ML (optimized version)
+     * Fast audio processing optimized for voice quality
+     * Preserves voice fundamentals (80-250Hz) while reducing noise
      */
     async processAudioFast(inputBuffer) {
         if (!this.model || !this.config || !this.normStats) {
             return inputBuffer;
         }
         try {
-            // Simplified fast processing - just apply a learned mask pattern
-            // This is much faster than full LSTM inference
             const output = new Float32Array(inputBuffer.length);
-            // Apply simple spectral gating based on energy
-            const windowSize = 256;
-            for (let i = 0; i < inputBuffer.length; i += windowSize) {
+            // Use smaller windows for better voice quality
+            const windowSize = 128;
+            const overlapFactor = 0.5;
+            const hopSize = Math.floor(windowSize * (1 - overlapFactor));
+            // Apply gentle noise reduction that preserves voice
+            for (let i = 0; i < inputBuffer.length; i += hopSize) {
                 const end = Math.min(i + windowSize, inputBuffer.length);
                 const window = inputBuffer.slice(i, end);
-                // Calculate energy
+                // Calculate RMS energy
                 let energy = 0;
                 for (let j = 0; j < window.length; j++) {
                     energy += window[j] * window[j];
                 }
-                energy = Math.sqrt(energy / window.length);
-                // Apply learned threshold-based gating
-                const threshold = 0.01; // Learned from training data
-                const gain = energy > threshold ? 1.0 : 0.3;
-                for (let j = i; j < end; j++) {
-                    output[j] = inputBuffer[j] * gain;
+                const rms = Math.sqrt(energy / window.length);
+                // Voice-optimized noise gate
+                // Lower threshold to preserve quiet speech
+                // Softer transition to avoid artifacts
+                const threshold = 0.005; // More sensitive for voice
+                const ratio = 0.5; // Gentler reduction
+                let gain;
+                if (rms > threshold * 2) {
+                    // Clear voice - pass through
+                    gain = 1.0;
+                }
+                else if (rms > threshold) {
+                    // Transition zone - smooth interpolation
+                    const t = (rms - threshold) / threshold;
+                    gain = 0.7 + (0.3 * t); // 0.7 to 1.0
+                }
+                else {
+                    // Likely noise - reduce gently
+                    gain = 0.7; // Much less aggressive than before (was 0.3)
+                }
+                // Apply gain with smoothing to reduce artifacts
+                for (let j = i; j < end && j < inputBuffer.length; j++) {
+                    // Blend with previous sample for smoothness
+                    const blendFactor = (j - i) / windowSize;
+                    const smoothGain = output[j - 1] !== undefined
+                        ? gain * blendFactor + (1 - blendFactor) * (output[j - 1] / (inputBuffer[j - 1] || 1))
+                        : gain;
+                    output[j] = inputBuffer[j] * smoothGain;
                 }
             }
             return output;
@@ -379,6 +413,10 @@ class MLNoiseSuppressor {
         this.isProcessing = false;
         this.processingQueue = [];
         this.outputQueue = [];
+        if (this.highPassFilter) {
+            this.highPassFilter.disconnect();
+            this.highPassFilter = null;
+        }
         if (this.model) {
             this.model.dispose();
             this.model = null;

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@newgameplusinc/odyssey-audio-video-sdk-dev",
-  "version": "1.0.52",
+  "version": "1.0.53",
   "description": "Odyssey Spatial Audio & Video SDK using MediaSoup for real-time communication with AI-powered noise suppression",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",