npm - @stream-io/video-client - Versions diffs - 1.47.0 → 1.48.0 - Mend

@stream-io/video-client 1.47.0 → 1.48.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

package/CHANGELOG.md +6 -0
package/dist/index.browser.es.js +9 -192
package/dist/index.browser.es.js.map +1 -1
package/dist/index.cjs.js +8 -192
package/dist/index.cjs.js.map +1 -1
package/dist/index.d.ts +0 -1
package/dist/index.es.js +9 -192
package/dist/index.es.js.map +1 -1
package/dist/src/devices/MicrophoneManager.d.ts +0 -1
package/dist/src/types.d.ts +11 -0
package/index.ts +0 -1
package/package.json +1 -1
package/src/devices/MicrophoneManager.ts +9 -5
package/src/devices/__tests__/MicrophoneManagerRN.test.ts +28 -29
package/src/types.ts +9 -0
package/dist/src/helpers/RNSpeechDetector.d.ts +0 -23
package/src/helpers/RNSpeechDetector.ts +0 -224
package/src/helpers/__tests__/RNSpeechDetector.test.ts +0 -52

package/dist/src/devices/MicrophoneManager.d.ts CHANGED Viewed

@@ -13,7 +13,6 @@ export declare class MicrophoneManager extends AudioDeviceManager<MicrophoneMana
     private soundDetectorCleanup?;
     private soundDetectorDeviceId?;
     private noAudioDetectorCleanup?;
-    private rnSpeechDetector;
     private noiseCancellation;
     private noiseCancellationChangeUnsubscribe;
     private noiseCancellationRegistration?;

package/dist/src/types.d.ts CHANGED Viewed

@@ -371,6 +371,17 @@ export type StreamRNVideoSDKGlobals = {
          */
         check(permission: 'microphone' | 'camera'): Promise<boolean>;
     };
+    nativeEvents: {
+        speechActivity: {
+            /**
+             * Subscribes to native speech activity events.
+             * Returns an unsubscribe function.
+             */
+            subscribe(cb: (state: {
+                isSoundDetected: boolean;
+            }) => void): () => void;
+        };
+    };
 };
 declare global {
     var streamRNVideoSDK: StreamRNVideoSDKGlobals | undefined;

package/index.ts CHANGED Viewed

@@ -23,7 +23,6 @@ export * from './src/helpers/DynascaleManager';
 export * from './src/helpers/ViewportTracker';
 export * from './src/helpers/sound-detector';
 export * from './src/helpers/participantUtils';
-export * from './src/helpers/RNSpeechDetector';
 export * as Browsers from './src/helpers/browsers';
 export * from './src/logger';

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@stream-io/video-client",
-  "version": "1.47.0",
+  "version": "1.48.0",
   "main": "dist/index.cjs.js",
   "module": "dist/index.es.js",
   "browser": "dist/index.browser.es.js",

package/src/devices/MicrophoneManager.ts CHANGED Viewed

@@ -24,7 +24,6 @@ import {
   createSafeAsyncSubscription,
   createSubscription,
 } from '../store/rxUtils';
-import { RNSpeechDetector } from '../helpers/RNSpeechDetector';
 import { withoutConcurrency } from '../helpers/concurrency';
 import { disposeOfMediaStream } from './utils';
 import { promiseWithResolvers } from '../helpers/promise';
@@ -36,7 +35,6 @@ export class MicrophoneManager extends AudioDeviceManager<MicrophoneManagerState
   private soundDetectorCleanup?: () => Promise<void>;
   private soundDetectorDeviceId?: string;
   private noAudioDetectorCleanup?: () => Promise<void>;
-  private rnSpeechDetector: RNSpeechDetector | undefined;
   private noiseCancellation: INoiseCancellation | undefined;
   private noiseCancellationChangeUnsubscribe: (() => void) | undefined;
   private noiseCancellationRegistration?: Promise<void>;
@@ -422,13 +420,19 @@ export class MicrophoneManager extends AudioDeviceManager<MicrophoneManagerState
       await this.teardownSpeakingWhileMutedDetection();
       if (isReactNative()) {
-        this.rnSpeechDetector = new RNSpeechDetector();
-        const unsubscribe = await this.rnSpeechDetector.start((event) => {
+        const speechActivity =
+          globalThis.streamRNVideoSDK?.nativeEvents?.speechActivity;
+        if (!speechActivity) {
+          this.logger.warn(
+            'Native speech activity not available, make sure the "@stream-io/react-native-webrtc" peer dependency version is satisfied',
+          );
+          return;
+        }
+        const unsubscribe = speechActivity.subscribe((event) => {
           this.state.setSpeakingWhileMuted(event.isSoundDetected);
         });
         this.soundDetectorCleanup = async () => {
           unsubscribe();
-          this.rnSpeechDetector = undefined;
         };
       } else {
         // Need to start a new stream that's not connected to publisher

package/src/devices/__tests__/MicrophoneManagerRN.test.ts CHANGED Viewed

@@ -12,11 +12,12 @@ import {
 import { of } from 'rxjs';
 import '../../rtc/__tests__/mocks/webrtc.mocks';
 import { OwnCapability } from '../../gen/coordinator';
-import { SoundStateChangeHandler } from '../../helpers/sound-detector';
 import { settled, withoutConcurrency } from '../../helpers/concurrency';
-let handler: SoundStateChangeHandler = () => {};
-let unsubscribeHandlers: ReturnType<typeof vi.fn>[] = [];
+let speechActivityCallback:
+  | ((state: { isSoundDetected: boolean }) => void)
+  | null = null;
+let unsubscribeMocks: ReturnType<typeof vi.fn>[] = [];
 vi.mock('../../helpers/platforms.ts', () => {
   return {
@@ -46,28 +47,21 @@ vi.mock('../../Call.ts', () => {
   };
 });
-vi.mock('../../helpers/RNSpeechDetector.ts', () => {
-  console.log('MOCKING RNSpeechDetector');
-  return {
-    RNSpeechDetector: vi.fn().mockImplementation(() => ({
-      start: vi.fn((callback) => {
-        handler = callback;
-        const unsubscribe = vi.fn();
-        unsubscribeHandlers.push(unsubscribe);
-        return unsubscribe;
-      }),
-      stop: vi.fn(),
-      onSpeakingDetectedStateChange: vi.fn(),
-    })),
-  };
-});
 describe('MicrophoneManager React Native', () => {
   let manager: MicrophoneManager;
   let checkPermissionMock: ReturnType<typeof vi.fn>;
+  let subscribeMock: ReturnType<typeof vi.fn>;
   beforeEach(() => {
-    unsubscribeHandlers = [];
+    speechActivityCallback = null;
+    unsubscribeMocks = [];
     checkPermissionMock = vi.fn(async () => true);
+    subscribeMock = vi.fn((cb) => {
+      speechActivityCallback = cb;
+      const unsub = vi.fn();
+      unsubscribeMocks.push(unsub);
+      return unsub;
+    });
     globalThis.streamRNVideoSDK = {
       callManager: {
@@ -78,6 +72,11 @@ describe('MicrophoneManager React Native', () => {
       permissions: {
         check: checkPermissionMock,
       },
+      nativeEvents: {
+        speechActivity: {
+          subscribe: subscribeMock,
+        },
+      },
     };
     const devicePersistence = { enabled: false, storageKey: '' };
@@ -100,7 +99,7 @@ describe('MicrophoneManager React Native', () => {
     await vi.waitUntil(() => fn.mock.calls.length > 0, { timeout: 100 });
     expect(fn).toHaveBeenCalled();
-    expect(manager['rnSpeechDetector']?.start).toHaveBeenCalled();
+    expect(subscribeMock).toHaveBeenCalled();
   });
   it('should check native microphone permission before starting detection', async () => {
@@ -146,15 +145,15 @@ describe('MicrophoneManager React Native', () => {
   it('should update speaking while muted state', async () => {
     await manager['startSpeakingWhileMutedDetection']();
-    expect(manager['rnSpeechDetector']?.start).toHaveBeenCalled();
+    expect(subscribeMock).toHaveBeenCalled();
     expect(manager.state.speakingWhileMuted).toBe(false);
-    handler!({ isSoundDetected: true, audioLevel: 2 });
+    speechActivityCallback!({ isSoundDetected: true });
     expect(manager.state.speakingWhileMuted).toBe(true);
-    handler!({ isSoundDetected: false, audioLevel: 0 });
+    speechActivityCallback!({ isSoundDetected: false });
     expect(manager.state.speakingWhileMuted).toBe(false);
   });
@@ -163,21 +162,21 @@ describe('MicrophoneManager React Native', () => {
     await manager['startSpeakingWhileMutedDetection']('device-1');
     await manager['startSpeakingWhileMutedDetection']('device-1');
-    expect(unsubscribeHandlers).toHaveLength(1);
+    expect(unsubscribeMocks).toHaveLength(1);
     await manager['stopSpeakingWhileMutedDetection']();
-    expect(unsubscribeHandlers[0]).toHaveBeenCalledTimes(1);
+    expect(unsubscribeMocks[0]).toHaveBeenCalledTimes(1);
   });
   it('should cleanup previous speech detector before starting a new one', async () => {
     await manager['startSpeakingWhileMutedDetection']('device-1');
     await manager['startSpeakingWhileMutedDetection']('device-2');
-    expect(unsubscribeHandlers).toHaveLength(2);
-    expect(unsubscribeHandlers[0]).toHaveBeenCalledTimes(1);
+    expect(unsubscribeMocks).toHaveLength(2);
+    expect(unsubscribeMocks[0]).toHaveBeenCalledTimes(1);
     await manager['stopSpeakingWhileMutedDetection']();
-    expect(unsubscribeHandlers[1]).toHaveBeenCalledTimes(1);
+    expect(unsubscribeMocks[1]).toHaveBeenCalledTimes(1);
   });
   it('should stop speaking while muted notifications if user loses permission to send audio', async () => {

package/src/types.ts CHANGED Viewed

@@ -462,6 +462,15 @@ export type StreamRNVideoSDKGlobals = {
      */
     check(permission: 'microphone' | 'camera'): Promise<boolean>;
   };
+  nativeEvents: {
+    speechActivity: {
+      /**
+       * Subscribes to native speech activity events.
+       * Returns an unsubscribe function.
+       */
+      subscribe(cb: (state: { isSoundDetected: boolean }) => void): () => void;
+    };
+  };
 };
 declare global {

package/dist/src/helpers/RNSpeechDetector.d.ts DELETED Viewed

@@ -1,23 +0,0 @@
-import { SoundStateChangeHandler } from './sound-detector';
-export declare class RNSpeechDetector {
-    private readonly pc1;
-    private readonly pc2;
-    private audioStream;
-    private externalAudioStream;
-    private isStopped;
-    constructor(externalAudioStream?: MediaStream);
-    /**
-     * Starts the speech detection.
-     */
-    start(onSoundDetectedStateChanged: SoundStateChangeHandler): Promise<() => void>;
-    /**
-     * Stops the speech detection and releases all allocated resources.
-     */
-    private stop;
-    /**
-     * Public method that detects the audio levels and returns the status.
-     */
-    private onSpeakingDetectedStateChange;
-    private cleanupAudioStream;
-    private forwardIceCandidate;
-}

package/src/helpers/RNSpeechDetector.ts DELETED Viewed

@@ -1,224 +0,0 @@
-import { BaseStats, flatten } from '../stats';
-import { SoundStateChangeHandler } from './sound-detector';
-import { videoLoggerSystem } from '../logger';
-export class RNSpeechDetector {
-  private readonly pc1 = new RTCPeerConnection({});
-  private readonly pc2 = new RTCPeerConnection({});
-  private audioStream: MediaStream | undefined;
-  private externalAudioStream: MediaStream | undefined;
-  private isStopped = false;
-  constructor(externalAudioStream?: MediaStream) {
-    this.externalAudioStream = externalAudioStream;
-  }
-  /**
-   * Starts the speech detection.
-   */
-  public async start(onSoundDetectedStateChanged: SoundStateChangeHandler) {
-    let detachListeners: (() => void) | undefined;
-    let unsubscribe: (() => void) | undefined;
-    try {
-      this.isStopped = false;
-      const audioStream =
-        this.externalAudioStream != null
-          ? this.externalAudioStream
-          : await navigator.mediaDevices.getUserMedia({ audio: true });
-      this.audioStream = audioStream;
-      const onPc1IceCandidate = (e: RTCPeerConnectionIceEvent) => {
-        this.forwardIceCandidate(this.pc2, e.candidate);
-      };
-      const onPc2IceCandidate = (e: RTCPeerConnectionIceEvent) => {
-        this.forwardIceCandidate(this.pc1, e.candidate);
-      };
-      const onTrackPc2 = (e: RTCTrackEvent) => {
-        e.streams[0].getTracks().forEach((track) => {
-          // In RN, the remote track is automatically added to the audio output device
-          // so we need to mute it to avoid hearing the audio back
-          // @ts-expect-error _setVolume is a private method in react-native-webrtc
-          track._setVolume(0);
-        });
-      };
-      this.pc1.addEventListener('icecandidate', onPc1IceCandidate);
-      this.pc2.addEventListener('icecandidate', onPc2IceCandidate);
-      this.pc2.addEventListener('track', onTrackPc2);
-      detachListeners = () => {
-        this.pc1.removeEventListener('icecandidate', onPc1IceCandidate);
-        this.pc2.removeEventListener('icecandidate', onPc2IceCandidate);
-        this.pc2.removeEventListener('track', onTrackPc2);
-      };
-      audioStream
-        .getTracks()
-        .forEach((track) => this.pc1.addTrack(track, audioStream));
-      const offer = await this.pc1.createOffer({});
-      await this.pc2.setRemoteDescription(offer);
-      await this.pc1.setLocalDescription(offer);
-      const answer = await this.pc2.createAnswer();
-      await this.pc1.setRemoteDescription(answer);
-      await this.pc2.setLocalDescription(answer);
-      unsubscribe = this.onSpeakingDetectedStateChange(
-        onSoundDetectedStateChanged,
-      );
-      return () => {
-        detachListeners?.();
-        unsubscribe?.();
-        this.stop();
-      };
-    } catch (error) {
-      detachListeners?.();
-      unsubscribe?.();
-      this.stop();
-      const logger = videoLoggerSystem.getLogger('RNSpeechDetector');
-      logger.error('error handling permissions: ', error);
-      return () => {};
-    }
-  }
-  /**
-   * Stops the speech detection and releases all allocated resources.
-   */
-  private stop() {
-    if (this.isStopped) return;
-    this.isStopped = true;
-    this.pc1.close();
-    this.pc2.close();
-    if (this.externalAudioStream != null) {
-      this.externalAudioStream = undefined;
-    } else {
-      this.cleanupAudioStream();
-    }
-  }
-  /**
-   * Public method that detects the audio levels and returns the status.
-   */
-  private onSpeakingDetectedStateChange(
-    onSoundDetectedStateChanged: SoundStateChangeHandler,
-  ) {
-    const initialBaselineNoiseLevel = 0.13;
-    let baselineNoiseLevel = initialBaselineNoiseLevel;
-    let speechDetected = false;
-    let speechTimer: NodeJS.Timeout | undefined;
-    let silenceTimer: NodeJS.Timeout | undefined;
-    const audioLevelHistory: number[] = []; // Store recent audio levels for smoother detection
-    const historyLength = 10;
-    const silenceThreshold = 1.1;
-    const resetThreshold = 0.9;
-    const speechTimeout = 500; // Speech is set to true after 500ms of audio detection
-    const silenceTimeout = 5000; // Reset baseline after 5 seconds of silence
-    const checkAudioLevel = async () => {
-      try {
-        const stats = await this.pc1.getStats();
-        const report = flatten(stats);
-        // Audio levels are present inside stats of type `media-source` and of kind `audio`
-        const audioMediaSourceStats = report.find(
-          (stat) =>
-            stat.type === 'media-source' &&
-            (stat as RTCRtpStreamStats).kind === 'audio',
-        ) as BaseStats;
-        if (audioMediaSourceStats) {
-          const { audioLevel } = audioMediaSourceStats;
-          if (audioLevel) {
-            // Update audio level history (with max historyLength sized array)
-            audioLevelHistory.push(audioLevel);
-            if (audioLevelHistory.length > historyLength) {
-              audioLevelHistory.shift();
-            }
-            // Calculate average audio level
-            const avgAudioLevel =
-              audioLevelHistory.reduce((a, b) => a + b, 0) /
-              audioLevelHistory.length;
-            // Update baseline (if necessary) based on silence detection
-            if (avgAudioLevel < baselineNoiseLevel * silenceThreshold) {
-              if (!silenceTimer) {
-                silenceTimer = setTimeout(() => {
-                  baselineNoiseLevel = Math.min(
-                    avgAudioLevel * resetThreshold,
-                    initialBaselineNoiseLevel,
-                  );
-                }, silenceTimeout);
-              }
-            } else {
-              clearTimeout(silenceTimer);
-              silenceTimer = undefined;
-            }
-            // Speech detection with hysteresis
-            if (avgAudioLevel > baselineNoiseLevel * 1.5) {
-              if (!speechDetected) {
-                speechDetected = true;
-                onSoundDetectedStateChanged({
-                  isSoundDetected: true,
-                  audioLevel,
-                });
-              }
-              clearTimeout(speechTimer);
-              speechTimer = setTimeout(() => {
-                speechDetected = false;
-                onSoundDetectedStateChanged({
-                  isSoundDetected: false,
-                  audioLevel: 0,
-                });
-              }, speechTimeout);
-            }
-          }
-        }
-      } catch (error) {
-        const logger = videoLoggerSystem.getLogger('RNSpeechDetector');
-        logger.error('error checking audio level from stats', error);
-      }
-    };
-    const intervalId = setInterval(checkAudioLevel, 250);
-    return () => {
-      clearInterval(intervalId);
-      clearTimeout(speechTimer);
-      clearTimeout(silenceTimer);
-    };
-  }
-  private cleanupAudioStream() {
-    if (!this.audioStream) {
-      return;
-    }
-    this.audioStream.getTracks().forEach((track) => track.stop());
-    if (
-      // @ts-expect-error release() is present in react-native-webrtc
-      typeof this.audioStream.release === 'function'
-    ) {
-      // @ts-expect-error called to dispose the stream in RN
-      this.audioStream.release();
-    }
-  }
-  private forwardIceCandidate(
-    destination: RTCPeerConnection,
-    candidate: RTCIceCandidate | null,
-  ) {
-    if (
-      this.isStopped ||
-      !candidate ||
-      destination.signalingState === 'closed'
-    ) {
-      return;
-    }
-    destination.addIceCandidate(candidate).catch(() => {
-      // silently ignore the error
-      const logger = videoLoggerSystem.getLogger('RNSpeechDetector');
-      logger.info('cannot add ice candidate - ignoring');
-    });
-  }
-}

package/src/helpers/__tests__/RNSpeechDetector.test.ts DELETED Viewed

@@ -1,52 +0,0 @@
-import '../../rtc/__tests__/mocks/webrtc.mocks';
-import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
-import { RNSpeechDetector } from '../RNSpeechDetector';
-describe('RNSpeechDetector', () => {
-  // Shared test setup stubs RTCPeerConnection with a vi.fn constructor.
-  // We keep a typed handle to that constructor to inspect created instances.
-  let rtcPeerConnectionMockCtor: ReturnType<typeof vi.fn>;
-  beforeEach(() => {
-    rtcPeerConnectionMockCtor =
-      globalThis.RTCPeerConnection as unknown as ReturnType<typeof vi.fn>;
-    rtcPeerConnectionMockCtor.mockClear();
-  });
-  afterEach(() => {
-    vi.restoreAllMocks();
-  });
-  it('ignores late ICE candidates after cleanup', async () => {
-    const stream = {
-      getTracks: () => [],
-    } as unknown as MediaStream;
-    const detector = new RNSpeechDetector(stream);
-    const cleanup = await detector.start(() => {});
-    cleanup();
-    // start() creates two peer connections (pc1 and pc2). We pull them from
-    // constructor call results to inspect listener wiring and ICE forwarding.
-    const [pc1, pc2] = rtcPeerConnectionMockCtor.mock.results.map(
-      (result) => result.value,
-    );
-    // Find the registered ICE callback and invoke it manually after cleanup to
-    // simulate a late ICE event arriving during teardown.
-    const onIceCandidate = pc1.addEventListener.mock.calls.find(
-      ([eventName]: [string]) => eventName === 'icecandidate',
-    )?.[1] as ((e: RTCPeerConnectionIceEvent) => void) | undefined;
-    expect(onIceCandidate).toBeDefined();
-    onIceCandidate?.({
-      candidate: { candidate: 'candidate:1 1 UDP 0 127.0.0.1 11111 typ host' },
-    } as unknown as RTCPeerConnectionIceEvent);
-    expect(pc1.removeEventListener).toHaveBeenCalledWith(
-      'icecandidate',
-      onIceCandidate,
-    );
-    expect(pc2.addIceCandidate).not.toHaveBeenCalled();
-  });
-});