react-native-davoice 1.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (67) hide show
  1. package/README.md +319 -0
  2. package/TTSRNBridge.podspec +38 -0
  3. package/android/.gradle/8.9/checksums/checksums.lock +0 -0
  4. package/android/.gradle/8.9/dependencies-accessors/gc.properties +0 -0
  5. package/android/.gradle/8.9/fileChanges/last-build.bin +0 -0
  6. package/android/.gradle/8.9/fileHashes/fileHashes.lock +0 -0
  7. package/android/.gradle/8.9/gc.properties +0 -0
  8. package/android/.gradle/buildOutputCleanup/buildOutputCleanup.lock +0 -0
  9. package/android/.gradle/buildOutputCleanup/cache.properties +2 -0
  10. package/android/.gradle/vcs-1/gc.properties +0 -0
  11. package/android/build.gradle +47 -0
  12. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.aar +0 -0
  13. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.aar.md5 +1 -0
  14. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.aar.sha1 +1 -0
  15. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.pom +38 -0
  16. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.pom.md5 +1 -0
  17. package/android/libs/com/davoice/tts/1.0.0/tts-1.0.0.pom.sha1 +1 -0
  18. package/android/settings.gradle +2 -0
  19. package/android/src/main/AndroidManifest.xml +14 -0
  20. package/android/src/main/java/com/davoice/rn/DaVoicePackage.java +29 -0
  21. package/android/src/main/java/com/davoice/stt/rn/STTModule.kt +208 -0
  22. package/android/src/main/java/com/davoice/tts/rn/DaVoiceTTSBridge.java +733 -0
  23. package/android/src/main/libs/MyLibrary-release.aar +0 -0
  24. package/app.plugin.js +60 -0
  25. package/ios/STTRNBridge/STTBridge.h +7 -0
  26. package/ios/STTRNBridge/STTBridge.m +130 -0
  27. package/ios/SpeechBridge/SpeechBridge.h +7 -0
  28. package/ios/SpeechBridge/SpeechBridge.m +761 -0
  29. package/ios/TTSRNBridge/DaVoiceTTSBridge.h +7 -0
  30. package/ios/TTSRNBridge/DaVoiceTTSBridge.m +177 -0
  31. package/ios/TTSRNBridge/DavoiceTTS.xcframework/Info.plist +44 -0
  32. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/DavoiceTTS +0 -0
  33. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Headers/DavoiceTTS-Swift.h +424 -0
  34. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Info.plist +0 -0
  35. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios.abi.json +13253 -0
  36. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios.private.swiftinterface +213 -0
  37. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios.swiftdoc +0 -0
  38. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios.swiftinterface +213 -0
  39. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64/DavoiceTTS.framework/Modules/module.modulemap +4 -0
  40. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/DavoiceTTS +0 -0
  41. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Headers/DavoiceTTS-Swift.h +844 -0
  42. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Info.plist +0 -0
  43. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios-simulator.abi.json +13253 -0
  44. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios-simulator.private.swiftinterface +213 -0
  45. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios-simulator.swiftdoc +0 -0
  46. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/arm64-apple-ios-simulator.swiftinterface +213 -0
  47. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/x86_64-apple-ios-simulator.abi.json +13253 -0
  48. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/x86_64-apple-ios-simulator.private.swiftinterface +213 -0
  49. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/x86_64-apple-ios-simulator.swiftdoc +0 -0
  50. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/DavoiceTTS.swiftmodule/x86_64-apple-ios-simulator.swiftinterface +213 -0
  51. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/Modules/module.modulemap +4 -0
  52. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/_CodeSignature/CodeDirectory +0 -0
  53. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/_CodeSignature/CodeRequirements +0 -0
  54. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/_CodeSignature/CodeRequirements-1 +0 -0
  55. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/_CodeSignature/CodeResources +282 -0
  56. package/ios/TTSRNBridge/DavoiceTTS.xcframework/ios-arm64_x86_64-simulator/DavoiceTTS.framework/_CodeSignature/CodeSignature +0 -0
  57. package/ios/TTSRNBridge/libphonemes.a +0 -0
  58. package/ios/TTSRNBridge/libucd.a +0 -0
  59. package/package.json +46 -0
  60. package/react-native.config.js +10 -0
  61. package/speech/index.ts +1055 -0
  62. package/stt/index.d.ts +54 -0
  63. package/stt/index.ts +222 -0
  64. package/tts/DaVoiceTTSBridge.d.ts +18 -0
  65. package/tts/DaVoiceTTSBridge.js +71 -0
  66. package/tts/index.d.ts +3 -0
  67. package/tts/index.js +4 -0
@@ -0,0 +1,1055 @@
1
+ // speech/index.ts
2
+ import { NativeModules, NativeEventEmitter, DeviceEventEmitter, Platform } from 'react-native';
3
+ import resolveAssetSource from 'react-native/Libraries/Image/resolveAssetSource';
4
+ // ✅ Needed to get original extension ("dm") from require() assets in release.
5
+ // eslint-disable-next-line @typescript-eslint/no-var-requires
6
+ const AssetRegistry = require('react-native/Libraries/Image/AssetRegistry');
7
+
8
+ // -------------------- VERBOSE LOGGING --------------------
9
+ const VERBOSE = true;
10
+ const PFX = '[SpeechJS]';
11
+ function ts() {
12
+ const d = new Date();
13
+ return `${d.toISOString()}`;
14
+ }
15
+ function dbg(...args: any[]) {
16
+ if (!VERBOSE) return;
17
+ // eslint-disable-next-line no-console
18
+ console.log(ts(), PFX, ...args);
19
+ }
20
+ function dbgErr(...args: any[]) {
21
+ // eslint-disable-next-line no-console
22
+ console.log(ts(), PFX, '❌', ...args);
23
+ }
24
+
25
+ function safeJson(x: any) {
26
+ try {
27
+ return JSON.stringify(x);
28
+ } catch {
29
+ return String(x);
30
+ }
31
+ }
32
+
33
+ function sleep(ms: number) {
34
+ return new Promise<void>((r) => setTimeout(r, ms));
35
+ }
36
+
37
+ // If you use typed-array -> base64, Buffer is convenient (works in RN)
38
+ let toBase64: (u8: Uint8Array) => string;
39
+ try {
40
+ // eslint-disable-next-line @typescript-eslint/no-var-requires
41
+ const { Buffer } = require('buffer');
42
+ toBase64 = (u8) => Buffer.from(u8.buffer, u8.byteOffset, u8.byteLength).toString('base64');
43
+ } catch {
44
+ // very rare fallback
45
+ toBase64 = (u8) => globalThis.btoa(String.fromCharCode(...u8));
46
+ }
47
+
48
// Native handles
// iOS ships a unified SpeechBridge (STT + TTS in one module); Android exposes
// separate STT and TTS modules. All lookups are optional: a missing module is
// simply `undefined` and call sites guard for that.
const NativeSpeech = NativeModules.SpeechBridge; // iOS unified (if present)
// The STT module has been registered under several names historically; take
// the first one that exists.
const NativeSTT =
  NativeModules.STT ||
  NativeModules.RCTSTT ||
  NativeModules.Voice ||
  NativeModules.RCTVoice;
const NativeTTS = NativeModules.DaVoiceTTSBridge;

// Print what we actually have at module load
dbg('Platform=', Platform.OS);
dbg('NativeSpeech (SpeechBridge) exists?', !!NativeSpeech, 'keys=', NativeSpeech ? Object.keys(NativeSpeech) : null);
dbg('NativeSTT exists?', !!NativeSTT, 'keys=', NativeSTT ? Object.keys(NativeSTT) : null);
dbg('NativeTTS (DaVoiceTTSBridge) exists?', !!NativeTTS, 'keys=', NativeTTS ? Object.keys(NativeTTS) : null);
62
+
63
// ---- Types ----
/** Payload for onSpeechStart (no fields). */
export type SpeechStartEvent = {};
/** Payload for onSpeechEnd (no fields). */
export type SpeechEndEvent = {};
/** Recognition status update; `isFinal` marks a terminal result. */
export type SpeechRecognizedEvent = { isFinal: boolean };
/** STT error payload; code/message originate from the native layer. */
export type SpeechErrorEvent = { error: { code?: string; message?: string } };
/** Recognition hypotheses (best-first, per native convention — confirm). */
export type SpeechResultsEvent = { value: string[] };
/** Microphone volume level update. */
export type SpeechVolumeChangeEvent = { value: number };
/** Android-only: absolute path of a freshly saved utterance WAV. */
export type NewSpeechWAVEvent = { path: string };

// Allow passing require() asset, uri string, etc.
export type RNAssetLike = any; // keep permissive (Metro asset numbers/objects vary)
/** A model reference: a path/URI string or a Metro require() asset. */
export type ModelRef = string | RNAssetLike;

/** Optional app callbacks for STT + TTS events; all are optional. */
export type UnifiedEvents = {
  // STT
  onSpeechStart?: (e: SpeechStartEvent) => void;
  onSpeechRecognized?: (e: SpeechRecognizedEvent) => void;
  onSpeechEnd?: (e: SpeechEndEvent) => void;
  onSpeechError?: (e: SpeechErrorEvent) => void;
  onSpeechResults?: (e: SpeechResultsEvent) => void;
  onSpeechPartialResults?: (e: SpeechResultsEvent) => void;
  onSpeechVolumeChanged?: (e: SpeechVolumeChangeEvent) => void;
  /** Android-only: emitted when native MIC+VAD saves a full utterance WAV */
  onNewSpeechWAV?: (e: NewSpeechWAVEvent) => void;
  // TTS
  onFinishedSpeaking?: () => void;
};

// Names of the native-emitted events we subscribe to (must match native side).
type NativeEventName =
  | 'onSpeechStart'
  | 'onSpeechRecognized'
  | 'onSpeechEnd'
  | 'onSpeechError'
  | 'onSpeechResults'
  | 'onSpeechPartialResults'
  | 'onSpeechVolumeChanged'
  | 'onNewSpeechWAV'
  | 'onFinishedSpeaking';

// --- NEW: descriptor for external PCM payloads ---
export type ExternalPCM = {
  /** base64 of raw PCM payload */
  base64: string;
  /** sample rate of payload (e.g., 16000, 22050, 24000, 44100, 48000) */
  sampleRate: number;
  /** number of channels in payload (default 1) */
  channels?: number;
  /** whether payload is interleaved (default true) */
  interleaved?: boolean;
  /** 'i16' for 16-bit signed integer, 'f32' for 32-bit float */
  format: 'i16' | 'f32';
  /** whether this item should trigger onFinishedSpeaking when done (default true) */
  markAsLast?: boolean;
};
117
+
118
/**
 * Unified speech facade over the platform-specific native bridges:
 * speech-to-text, text-to-speech and event wiring for both.
 */
class Speech {
  // ---- MIN: serialize TTS + wait-for-finished ----
  // Serialization chain: each queued utterance is appended here so only one
  // plays at a time.
  private ttsChain: Promise<void> = Promise.resolve();
  // Resolver for the in-flight speak(); fired by the native onFinishedSpeaking.
  private ttsPendingResolve: (() => void) | null = null;
  // Safety timer that releases the wait if the native event never arrives.
  private ttsPendingTimeout: any = null;
123
+
124
+ private dbgAsset(label: string, x: any) {
125
+ try {
126
+ const a = resolveAssetSource(x);
127
+ dbg(`[ASSETDBG ${label}] inputType=${typeof x} input=`, x);
128
+ dbg(`[ASSETDBG ${label}] resolved keys=`, a ? Object.keys(a) : null);
129
+ dbg(`[ASSETDBG ${label}] resolved=`, a);
130
+ dbg(`[ASSETDBG ${label}] resolved.uri=`, a?.uri);
131
+ // These often exist in dev:
132
+ dbg(`[ASSETDBG ${label}] httpServerLocation=`, (a as any)?.httpServerLocation);
133
+ dbg(`[ASSETDBG ${label}] fileSystemLocation=`, (a as any)?.fileSystemLocation);
134
+ } catch (e) {
135
+ dbgErr(`[ASSETDBG ${label}] resolveAssetSource threw`, String(e));
136
+ }
137
+ }
138
+
139
+
140
+ private _onNativeFinishedSpeaking() {
141
+ dbg('[EVENT onFinishedSpeaking]');
142
+ // 1) let app callback run
143
+ try { this.handlers.onFinishedSpeaking(); } catch (e) { dbgErr('onFinishedSpeaking handler error', String(e)); }
144
+
145
+ // 2) resolve the internal await (if any)
146
+ if (this.ttsPendingTimeout) { clearTimeout(this.ttsPendingTimeout); this.ttsPendingTimeout = null; }
147
+ const r = this.ttsPendingResolve;
148
+ this.ttsPendingResolve = null;
149
+ if (r) r();
150
+ }
151
+
152
+ private _nativeSpeak(text: string, speakerId: number, s: number) {
153
+ if (Platform.OS === 'ios' && NativeSpeech?.speak) return (NativeSpeech as any).speak(text, speakerId, s);
154
+ if (!NativeTTS?.speak) throw new Error('TTS speak not available');
155
+ return (NativeTTS as any).speak(text, speakerId, s);
156
+ }
157
+
158
+ private _speakAndWait(text: string, speakerId: number, s: number, timeoutMs = 600000) {
159
+ return new Promise<void>((resolve, reject) => {
160
+ this.ttsPendingResolve = resolve;
161
+ // safety: never hang forever
162
+ this.ttsPendingTimeout = setTimeout(() => {
163
+ dbg('Timeout waiting for onFinishedSpeaking — releasing wait');
164
+ if (this.ttsPendingTimeout) { clearTimeout(this.ttsPendingTimeout); this.ttsPendingTimeout = null; }
165
+ const r = this.ttsPendingResolve;
166
+ this.ttsPendingResolve = null;
167
+ if (r) r(); // ✅ accept after timeout
168
+ }, timeoutMs);
169
+ try {
170
+ this._nativeSpeak(text, speakerId, s);
171
+ } catch (e) {
172
+ if (this.ttsPendingTimeout) { clearTimeout(this.ttsPendingTimeout); this.ttsPendingTimeout = null; }
173
+ this.ttsPendingResolve = null;
174
+ reject(e as any);
175
+ }
176
+ });
177
+ }
178
+
179
  // Event emitters; which are non-null depends on platform and mode.
  private sttEmitter: NativeEventEmitter | null = null;
  private ttsEmitter: NativeEventEmitter | typeof DeviceEventEmitter | null = null;
  private unifiedEmitter: NativeEventEmitter | null = null;
  // Live event subscriptions; removed on teardown.
  private subs: Array<{ remove: () => void }> = [];
  // App callbacks; defaulted to no-ops in the constructor so dispatch never
  // needs null checks.
  private handlers: Required<UnifiedEvents>;
  // top of file (new state)
  // Last locale/model passed to initAll (kept for possible re-init).
  private lastLocale: string | null = null;
  private lastModel: string | null = null;
  private iosTtsOnly = false; // when true, use NativeTTS directly on iOS
188
+
189
+
190
+ private logCall(name: string, payload?: any) {
191
+ dbg(`[CALL ${name}]`, payload !== undefined ? safeJson(payload) : '');
192
+ }
193
+
194
+
195
+ // ✅ NEW: best-effort extract extension for require() assets (e.g. ".dm")
196
+ private resolveModelExt(model: ModelRef): string | undefined {
197
+ try {
198
+ // Metro assets are usually numeric IDs on native platforms
199
+ if (typeof model === 'number' && AssetRegistry?.getAssetByID) {
200
+ const a = AssetRegistry.getAssetByID(model);
201
+ const t = a?.type;
202
+ if (typeof t === 'string' && t.length) return t;
203
+ }
204
+ } catch {}
205
+ try {
206
+ const uri = resolveAssetSource(model as any)?.uri;
207
+ if (typeof uri === 'string') {
208
+ const m = uri.match(/\.([a-zA-Z0-9]+)(?:\?|#|$)/);
209
+ if (m && m[1]) return m[1].toLowerCase();
210
+ }
211
+ } catch {}
212
+ if (typeof model === 'string') {
213
+ const m = model.match(/\.([a-zA-Z0-9]+)(?:\?|#|$)/);
214
+ if (m && m[1]) return m[1].toLowerCase();
215
+ }
216
+ return undefined;
217
+ }
218
+
219
+ // ✅ NEW: resolve require() assets to a usable URI/path string
220
+ private resolveModelToPath(model: ModelRef): string {
221
+ // ✅ Backward compatible: plain strings are passed through unchanged
222
+ if (typeof model === 'string') return model;
223
+
224
+ try {
225
+ const asset = resolveAssetSource(model);
226
+ dbg('[resolveModelToPath] resolveAssetSource ->', asset);
227
+
228
+ const uri = asset?.uri;
229
+ if (uri) return String(uri);
230
+ } catch {
231
+ // ignore and fall through
232
+ }
233
+ return typeof model === 'string' ? model : String(model);
234
+ }
235
+
236
  /**
   * Installs no-op default handlers (so event dispatch never needs null
   * checks) and creates the platform-appropriate event emitter(s).
   */
  constructor() {
    // Defaults; setters elsewhere in the class overwrite these.
    this.handlers = {
      onSpeechStart: () => {},
      onSpeechRecognized: () => {},
      onSpeechEnd: () => {},
      onSpeechError: () => {},
      onSpeechResults: () => {},
      onSpeechPartialResults: () => {},
      onSpeechVolumeChanged: () => {},
      onNewSpeechWAV: () => {},
      onFinishedSpeaking: () => {},
    };

    // Emitters per-platform
    if (Platform.OS !== 'web') {
      if (Platform.OS === 'ios' && NativeSpeech) {
        // iOS with the unified bridge: one emitter carries both STT and TTS.
        this.unifiedEmitter = new NativeEventEmitter(NativeSpeech);
        dbg('[constructor] iOS unifiedEmitter created');
      } else {
        // Android (and iOS fallback): separate modules
        if (NativeSTT) {
          this.sttEmitter = new NativeEventEmitter(NativeSTT);
          dbg('[constructor] sttEmitter created');
        }
        // ANDROID: Native module emits through DeviceEventEmitter
        if (Platform.OS === 'android') {
          this.ttsEmitter = DeviceEventEmitter;
          dbg('[constructor] android ttsEmitter=DeviceEventEmitter');
        } else {
          // non-unified iOS fallback (if ever used)
          if (NativeTTS) {
            this.ttsEmitter = new NativeEventEmitter(NativeTTS);
            dbg('[constructor] iOS fallback ttsEmitter created');
          }
        }
      }
    }
  }
274
+
275
+ // NEW: tiny helper to (re)wire listeners depending on mode
276
+ private rewireListenersForMode() {
277
+ this.teardownListeners();
278
+ // if iOS unified + NOT tts-only -> use unified emitter
279
+ if (Platform.OS === 'ios' && NativeSpeech && !this.iosTtsOnly) {
280
+ this.unifiedEmitter = new NativeEventEmitter(NativeSpeech);
281
+ // unified handles both STT + TTS events
282
+ } else {
283
+ // fallback: separate emitters
284
+ if (NativeSTT) this.sttEmitter = new NativeEventEmitter(NativeSTT);
285
+ if (Platform.OS === 'android') this.ttsEmitter = DeviceEventEmitter;
286
+ else if (NativeTTS) this.ttsEmitter = new NativeEventEmitter(NativeTTS);
287
+ }
288
+ this.ensureListeners();
289
+ }
290
+
291
+ // ---------- Init / Destroy ----------
292
+ /**
293
+ * ANDROID ONLY: Initialize remote capture (MIC + VAD) that saves utterances to WAV
294
+ * and emits 'onNewSpeechWAV' with { path }. No-op on iOS (throws).
295
+ */
296
+ async initAllRemoteSTT(modelOrOpts: ModelRef | { model: ModelRef; onboardingJsonPath?: string }): Promise<void> {
297
+ if (Platform.OS !== 'android') {
298
+ throw new Error('initAllRemoteSTT is Android-only.');
299
+ }
300
+ if (!NativeSTT?.startRemoteSpeech) {
301
+ throw new Error('Native STT module missing startRemoteSpeech()');
302
+ }
303
+ this.ensureListeners();
304
+ const cfg =
305
+ modelOrOpts && typeof modelOrOpts === 'object' && 'model' in (modelOrOpts as any)
306
+ ? (modelOrOpts as any)
307
+ : { model: modelOrOpts as ModelRef };
308
+ const modelPath = this.resolveModelToPath(cfg.model);
309
+
310
+ await new Promise<void>((resolve, reject) => {
311
+ try {
312
+ NativeSTT.startRemoteSpeech((err: string) => (err ? reject(new Error(err)) : resolve()));
313
+ } catch (e) {
314
+ reject(e as any);
315
+ }
316
+ });
317
+ if (!NativeSTT || !NativeTTS) {
318
+ throw new Error('Missing native bridges (STT/TTS).');
319
+ }
320
+ // Init TTS
321
+ const modelExt = this.resolveModelExt(cfg.model);
322
+ console.log('[MODELDBG] initAllRemoteSTT.modelPath (resolved)=', modelPath);
323
+ console.log('[MODELDBG] initAllRemoteSTT.modelExt (resolved)=', modelExt);
324
+ await NativeTTS.initTTS({ model: modelPath, modelExt });
325
+ await sleep(500);
326
+ }
327
+
328
+ /**
329
+ * ANDROID ONLY: Start remote STT and initialize TTS in playback-only mode (no model/ONNX init).
330
+ * Accepts the same argument shape as initAllRemoteSTT() for API compatibility.
331
+ * model/onboardingJsonPath are intentionally ignored on Android for now.
332
+ */
333
+ async initAllRemoteSTTAndTTS(
334
+ _modelOrOpts?: ModelRef | { model: ModelRef; onboardingJsonPath?: string },
335
+ ): Promise<void> {
336
+ if (Platform.OS !== 'android') {
337
+ throw new Error('initAllRemoteSTTAndTTS is Android-only.');
338
+ }
339
+ if (!NativeSTT?.startRemoteSpeech) {
340
+ throw new Error('Native STT module missing startRemoteSpeech()');
341
+ }
342
+ this.ensureListeners();
343
+
344
+ await new Promise<void>((resolve, reject) => {
345
+ try {
346
+ NativeSTT.startRemoteSpeech((err: string) => (err ? reject(new Error(err)) : resolve()));
347
+ } catch (e) {
348
+ reject(e as any);
349
+ }
350
+ });
351
+
352
+ if (!NativeTTS?.initTTSPlaybackOnly) {
353
+ throw new Error('Native TTS module missing initTTSPlaybackOnly()');
354
+ }
355
+ await NativeTTS.initTTSPlaybackOnly();
356
+ await sleep(500);
357
+ }
358
+
359
+ dbgModel(label: string, model: any) {
360
+ try {
361
+ console.log(`[MODELDBG] ${label} typeof=`, typeof model, ' value=', model);
362
+ try {
363
+ const asset = resolveAssetSource(model);
364
+ console.log(`[MODELDBG] ${label} resolveAssetSource=`, asset);
365
+ if (asset?.uri) console.log(`[MODELDBG] ${label} asset.uri=`, asset.uri);
366
+ } catch (e) {
367
+ console.log(`[MODELDBG] ${label} resolveAssetSource threw:`, String(e));
368
+ }
369
+ } catch {}
370
+ }
371
+
372
  // ---------- Init / Destroy ----------
  /**
   * iOS: initialize STT then TTS via native SpeechBridge if available.
   * Android: no special init needed; optionally preload TTS (if you want).
   */
  async initAll(opts: { locale: string; model: ModelRef; timeoutMs?: number; onboardingJsonPath?: string }) {
    this.dbgModel('initAll.opts.model (raw)', opts.model);
    this.dbgAsset('initAll.model', opts.model);
    // Reset the in-flight TTS wait and the serialization chains.
    // NOTE(review): `wavChain` is not declared in this portion of the file —
    // presumably defined further down; confirm it exists.
    this._cancelTtsWait('initAll');
    this.ttsChain = Promise.resolve();
    this.wavChain = Promise.resolve();

    const modelPath = this.resolveModelToPath(opts.model);
    console.log('[MODELDBG] initAll.modelPath (resolved)=', modelPath);

    // Remember last-used locale/model for possible later re-init.
    this.lastLocale = opts.locale;
    this.lastModel = modelPath;

    // Preferred path: the iOS unified bridge does STT + TTS init natively.
    if (Platform.OS === 'ios' && NativeSpeech?.initAll) {
      this.iosTtsOnly = false; // full unified mode
      this.teardownListeners(); // re-wire listeners for unified
      const r = await NativeSpeech.initAll({ ...opts, model: modelPath });
      this.ensureListeners();
      return r;
    }

    // Fallback (Android or iOS w/o SpeechBridge):
    // 1) Start STT (engine hot will happen internally); 2) init TTS.
    if (!NativeSTT || !NativeTTS) {
      throw new Error('Missing native bridges (STT/TTS).');
    }

    // Start STT (best-effort; no-op if already running)
    await new Promise<void>((resolve, reject) => {
      try {
        // iOS fallback signature: (locale, cb)
        // Android signature: (locale, extras, cb)
        if (Platform.OS === 'android') {
          // Always try Android 3-arg signature first, then fall back
          // NOTE: this inner catch only traps a SYNCHRONOUS throw from the
          // 3-arg call; asynchronous errors arrive via the callback instead.
          try {
            NativeSTT.startSpeech(
              opts.locale,
              {
                EXTRA_LANGUAGE_MODEL: 'LANGUAGE_MODEL_FREE_FORM',
                EXTRA_MAX_RESULTS: 5,
                EXTRA_PARTIAL_RESULTS: true,
                REQUEST_PERMISSIONS_AUTO: true,
                onboardingJsonPath: opts.onboardingJsonPath ?? null,
              },
              (err: string) => (err ? reject(new Error(err)) : resolve())
            );
          } catch {
            // Fallback to 2-arg (some RN voice bridges use this)
            NativeSTT.startSpeech(opts.locale, (err: string) =>
              err ? reject(new Error(err)) : resolve()
            );
          }
        } else {
          NativeSTT.startSpeech(opts.locale, (err: string) =>
            err ? reject(new Error(err)) : resolve(),
          );
        }
      } catch (e) {
        reject(e as any);
      }
    });

    // Init TTS
    const modelExt = this.resolveModelExt(opts.model);
    console.log('[MODELDBG] initAll.modelExt (resolved)=', modelExt);
    await NativeTTS.initTTS({ model: modelPath, modelExt });
  }
444
+
445
  /** Tear down TTS and STT and remove all listeners. */
  async destroyAll() {
    this._cancelTtsWait('destroyAll');
    this.ttsChain = Promise.resolve();
    this.wavChain = Promise.resolve();

    // iOS unified
    if (Platform.OS === 'ios' && NativeSpeech?.destroyAll) {
      const r = await NativeSpeech.destroyAll();
      this.iosTtsOnly = false;
      // NOTE(review): this assignment is a no-op (`x = x ?? null` keeps the
      // current value). Was the intent to CLEAR lastLocale? Confirm.
      this.lastLocale = this.lastLocale ?? null;
      this.teardownListeners();
      return r;
    }
    // Fallback: destroy TTS -> STT. Each step is best-effort: errors are
    // swallowed deliberately so teardown always completes.
    try { await NativeTTS?.destroy?.(); } catch {}
    try {
      await new Promise<void>((res) => {
        if (!NativeSTT?.destroySpeech) return res();
        NativeSTT.destroySpeech(() => res());
      });
    } catch {}
    this.teardownListeners();
    return 'Destroyed';
  }
469
+
470
  // ---------- STT ----------
  /**
   * Start speech recognition for `locale`. Android `options` are merged over
   * the default recognizer extras; ignored on the iOS unified path.
   */
  async start(locale: string, options: Record<string, any> = {}) {
    this.ensureListeners();
    // Prefer unified on iOS
    if (Platform.OS === 'ios' && NativeSpeech?.startSpeech) {
      return new Promise<void>((resolve) => NativeSpeech.startSpeech(locale, () => resolve()));
    }

    // Android + iOS fallback
    return new Promise<void>((resolve, reject) => {
      if (!NativeSTT?.startSpeech) return reject(new Error('startSpeech not available'));

      if (Platform.OS === 'android') {
        // NOTE: this catch only traps a SYNCHRONOUS throw from the 3-arg
        // call; asynchronous errors arrive via the callback instead.
        try {
          NativeSTT.startSpeech(
            locale,
            {
              EXTRA_LANGUAGE_MODEL: 'LANGUAGE_MODEL_FREE_FORM',
              EXTRA_MAX_RESULTS: 5,
              EXTRA_PARTIAL_RESULTS: true,
              REQUEST_PERMISSIONS_AUTO: true,
              ...options,
            },
            (err: string) => (err ? reject(new Error(err)) : resolve())
          );
        } catch {
          // Fallback to 2-arg
          NativeSTT.startSpeech(locale, (err: string) =>
            err ? reject(new Error(err)) : resolve()
          );
        }
      } else {
        NativeSTT.startSpeech(locale, (err: string) =>
          err ? reject(new Error(err)) : resolve(),
        );
      }
    });
  }
508
+
509
+ async startWithSVOnboardingJson(locale: string, onboardingJsonPath: string): Promise<void> {
510
+ this.ensureListeners();
511
+ if (Platform.OS === 'ios' && NativeSpeech?.startSpeechWithSVOnboardingJson) {
512
+ return new Promise<void>((resolve) =>
513
+ NativeSpeech.startSpeechWithSVOnboardingJson(locale, onboardingJsonPath, () => resolve()),
514
+ );
515
+ }
516
+ return this.start(locale);
517
+ }
518
+
519
+ pauseSpeechRecognition(): Promise<void> {
520
+ this.logCall('pauseSpeechRecognitionLite');
521
+
522
+ const mod: any = Platform.OS === 'ios' ? NativeSpeech : NativeSTT;
523
+ const fn = mod?.pauseSpeechRecognitionLite;
524
+
525
+ if (!fn) {
526
+ dbg(`pauseSpeechRecognitionLite not available on ${Platform.OS === 'ios' ? 'NativeSpeech' : 'NativeSTT'}`);
527
+ return Promise.resolve();
528
+ }
529
+ if (Platform.OS === 'ios') {
530
+ return new Promise((resolve, reject) => {
531
+ try {
532
+ fn.call(mod, (ok: boolean) => {
533
+ if (!ok) dbgErr('pauseSpeechRecognitionLite returned false');
534
+ resolve();
535
+ });
536
+ } catch (e) {
537
+ reject(e as any);
538
+ }
539
+ });
540
+ }
541
+
542
+ return new Promise<void>((resolve, reject) => {
543
+ try {
544
+ fn.call(mod, async (ok: boolean) => {
545
+ if (!ok) dbgErr('pauseSpeechRecognitionLite returned false');
546
+ // ✅ ANDROID: small delay before resolving
547
+ if (Platform.OS === 'android') await sleep(500);
548
+ resolve();
549
+ });
550
+ } catch (e) {
551
+ reject(e as any);
552
+ }
553
+ });
554
+ }
555
+
556
+ unPauseSpeechRecognition(times: number): Promise<void> {
557
+ this.logCall('unPauseSpeechRecognitionLite', { times });
558
+
559
+ const mod: any = Platform.OS === 'ios' ? NativeSpeech : NativeSTT;
560
+ const fn = mod?.unPauseSpeechRecognitionLite;
561
+
562
+ if (!fn) {
563
+ dbg(`unPauseSpeechRecognitionLite(times) not available on ${Platform.OS === 'ios' ? 'NativeSpeech' : 'NativeSTT'}`);
564
+ return Promise.resolve();
565
+ }
566
+
567
+ if (Platform.OS === 'ios') {
568
+ return new Promise((resolve, reject) => {
569
+ try {
570
+ fn.call(mod, times, (ok: boolean) => {
571
+ if (!ok) dbgErr('unPauseSpeechRecognitionLite(times) returned false');
572
+ resolve();
573
+ });
574
+ } catch (e) {
575
+ reject(e as any);
576
+ }
577
+ });
578
+ }
579
+ return new Promise<void>((resolve, reject) => {
580
+ try {
581
+ fn.call(mod, times, async (ok: boolean) => {
582
+ if (!ok) dbgErr('unPauseSpeechRecognitionLite(times) returned false');
583
+ // ✅ ANDROID: small delay before resolving
584
+ if (Platform.OS === 'android') await sleep(500);
585
+ resolve();
586
+ });
587
+ } catch (e) {
588
+ reject(e as any);
589
+ }
590
+ });
591
+ }
592
  /** Pause mic/STT (Android native; iOS unified if present) */
  async pauseMicrophone(): Promise<void> {
    console.log('[pauseMicrophone] called');
    this.logCall('pauseMicrophone');
    // iOS: prefer async first, fallback to callback if missing
    if (Platform.OS === 'ios' && (NativeSpeech as any)?.pauseMicrophoneAsync) {
      dbg('IOS [pauseMicrophone] using NativeSpeech.pauseMicrophoneAsync()');
      try {
        // 1000 is passed straight through to native; presumably a timeout in
        // milliseconds — confirm against the native signature.
        const r = await (NativeSpeech as any).pauseMicrophoneAsync(1000);
        dbg('pauseMicrophoneAsync result', r);
        if (r?.ok === false) dbgErr('pauseMicrophoneAsync failed', r?.reason);
        return;
      } catch (e) {
        dbgErr('IOS [pauseMicrophone] NativeSpeech.pauseMicrophoneAsync() ERROR:', String(e));
        throw e;
      }
    }
    // iOS callback-style fallback.
    if (Platform.OS === 'ios' && NativeSpeech?.pauseMicrophone) {
      console.log('IOS [pauseMicrophone] called');
      return new Promise((resolve, reject) => {
        try { (NativeSpeech as any).pauseMicrophone(() => resolve()); }
        catch (e) { reject(e as any); }
      });
    }
    // Android (or iOS without any native support): best-effort, resolves
    // immediately when the method is absent.
    if (!(NativeSTT as any)?.pauseMicrophone) return Promise.resolve();
    return new Promise((resolve, reject) => {
      try { (NativeSTT as any).pauseMicrophone(() => resolve()); }
      catch (e) { reject(e as any); }
    });
  }
622
+
623
  /** Resume mic/STT (Android native; iOS unified if present) */
  async unPauseMicrophone(): Promise<void> {
    this.logCall('unPauseMicrophone');
    // iOS: prefer async first, fallback to callback if missing
    if (Platform.OS === 'ios' && (NativeSpeech as any)?.unPauseMicrophoneAsync) {
      dbg('IOS [unPauseMicrophone] using NativeSpeech.unPauseMicrophoneAsync()');
      try {
        // 1000 is passed straight through to native; presumably a timeout in
        // milliseconds — confirm against the native signature.
        const r = await (NativeSpeech as any).unPauseMicrophoneAsync(1000);
        if (r?.ok === false) dbgErr('unPauseMicrophone failed', r?.reason);
        dbg('IOS [unPauseMicrophone] NativeSpeech.unPauseMicrophoneAsync() DONE');
        return;
      } catch (e) {
        dbgErr('IOS [unPauseMicrophone] NativeSpeech.unPauseMicrophoneAsync() ERROR:', String(e));
        throw e;
      }
    }

    // iOS callback-style fallback.
    if (Platform.OS === 'ios' && NativeSpeech?.unPauseMicrophone) {
      console.log('IOS [unPauseMicrophone] called');
      return new Promise((resolve, reject) => {
        try { (NativeSpeech as any).unPauseMicrophone(() => resolve()); }
        catch (e) { reject(e as any); }
      });
    }
    if (Platform.OS === 'ios')
      console.log('IOS [unPauseMicrophone] called without native support');
    // Android (or no native support at all): best-effort, resolves
    // immediately when the method is absent.
    if (!(NativeSTT as any)?.unPauseMicrophone) return Promise.resolve();
    return new Promise((resolve, reject) => {
      try { (NativeSTT as any).unPauseMicrophone(() => resolve()); }
      catch (e) { reject(e as any); }
    });
  }
655
+
656
+ stop(): Promise<void> {
657
+ if (Platform.OS === 'ios' && NativeSpeech?.stopSpeech) {
658
+ return new Promise((res) => NativeSpeech.stopSpeech(() => res()));
659
+ }
660
+ if (!NativeSTT?.stopSpeech) return Promise.resolve();
661
+ return new Promise((res) => NativeSTT.stopSpeech(() => res()));
662
+ }
663
+
664
+ cancel(): Promise<void> {
665
+ if (Platform.OS === 'ios' && NativeSpeech?.cancelSpeech) {
666
+ return new Promise((res) => NativeSpeech.cancelSpeech(() => res()));
667
+ }
668
+ if (!NativeSTT?.cancelSpeech) return Promise.resolve();
669
+ return new Promise((res) => NativeSTT.cancelSpeech(() => res()));
670
+ }
671
+
672
+ isAvailable(): Promise<0 | 1> {
673
+ // Prefer unified
674
+ if (Platform.OS === 'ios' && NativeSpeech?.isSpeechAvailable) {
675
+ return new Promise((resolve, reject) =>
676
+ NativeSpeech.isSpeechAvailable((ok: 0 | 1, err: string) =>
677
+ err ? reject(new Error(err)) : resolve(ok),
678
+ ),
679
+ );
680
+ }
681
+ if (NativeSTT?.isSpeechAvailable) {
682
+ return new Promise((resolve) =>
683
+ NativeSTT.isSpeechAvailable((ok: 0 | 1) => resolve(ok)),
684
+ );
685
+ }
686
+ return Promise.resolve(1);
687
+ }
688
+
689
+ isRecognizing(): Promise<0 | 1> {
690
+ if (Platform.OS === 'ios' && NativeSpeech?.isRecognizing) {
691
+ return new Promise((resolve) =>
692
+ NativeSpeech.isRecognizing((v: 0 | 1) => resolve(v)),
693
+ );
694
+ }
695
+ if (NativeSTT?.isRecognizing) {
696
+ return new Promise((resolve) =>
697
+ NativeSTT.isRecognizing((v: 0 | 1) => resolve(v)),
698
+ );
699
+ }
700
+ return Promise.resolve(0);
701
+ }
702
+
703
+ async hasIOSMicPermissions(): Promise<boolean> {
704
+ if (Platform.OS !== 'ios') return false;
705
+ if (!NativeSpeech?.hasMicPermissions) return false;
706
+ return !!(await NativeSpeech.hasMicPermissions());
707
+ }
708
+
709
+ async requestIOSMicPermissions(wait_timeout: number): Promise<boolean> {
710
+ if (Platform.OS !== 'ios') return false;
711
+ if (!NativeSpeech?.requestMicPermissions) return false;
712
+ return !!(await NativeSpeech.requestMicPermissions(wait_timeout));
713
+ }
714
+
715
+ async hasIOSSpeechRecognitionPermissions(): Promise<boolean> {
716
+ if (Platform.OS !== 'ios') return false;
717
+ if (!NativeSpeech?.hasSpeechRecognitionPermissions) return false;
718
+ return !!(await NativeSpeech.hasSpeechRecognitionPermissions());
719
+ }
720
+
721
+ async requestIOSSpeechRecognitionPermissions(wait_timeout: number): Promise<boolean> {
722
+ if (Platform.OS !== 'ios') return false;
723
+ if (!NativeSpeech?.requestSpeechRecognitionPermissions) return false;
724
+ return !!(await NativeSpeech.requestSpeechRecognitionPermissions(wait_timeout));
725
+ }
726
+
727
+ async setLicense(licenseKey: string): Promise<boolean> {
728
+ if (!licenseKey) throw new Error('setLicense: missing licenseKey');
729
+
730
+ if (Platform.OS === 'ios' && NativeSpeech?.setLicense) {
731
+ return !!(await NativeSpeech.setLicense(licenseKey));
732
+ }
733
+
734
+ const results = await Promise.all([
735
+ NativeTTS?.setLicense ? NativeTTS.setLicense(licenseKey) : Promise.resolve(false),
736
+ NativeSTT?.setLicense ? NativeSTT.setLicense(licenseKey) : Promise.resolve(false),
737
+ ]);
738
+ return results.every(Boolean);
739
+ }
740
+
741
+ async isLicenseValid(licenseKey: string): Promise<boolean> {
742
+ if (!licenseKey) throw new Error('isLicenseValid: missing licenseKey');
743
+
744
+ if (Platform.OS === 'ios' && NativeSpeech?.isLicenseValid) {
745
+ return !!(await NativeSpeech.isLicenseValid(licenseKey));
746
+ }
747
+
748
+ const results = await Promise.all([
749
+ NativeTTS?.isLicenseValid ? NativeTTS.isLicenseValid(licenseKey) : Promise.resolve(false),
750
+ NativeSTT?.isLicenseValid ? NativeSTT.isLicenseValid(licenseKey) : Promise.resolve(false),
751
+ ]);
752
+ return results.every(Boolean);
753
+ }
754
+
755
+ // ---------- TTS ----------
756
+ async initTTS(modelOrConfig: ModelRef | { model: ModelRef }) {
757
+ const cfg =
758
+ modelOrConfig && typeof modelOrConfig === 'object' && 'model' in (modelOrConfig as any)
759
+ ? (modelOrConfig as any)
760
+ : { model: modelOrConfig as any };
761
+ // // iOS unified asks you to use initAll
762
+ // if (Platform.OS === 'ios' && NativeSpeech?.initAll) {
763
+ // throw new Error('Use initAll() on iOS unified bridge.');
764
+ // }
765
+ if (!cfg?.model) throw new Error("initTTS: missing 'model'");
766
+ const modelPath = this.resolveModelToPath(cfg.model);
767
+ this.lastModel = modelPath;
768
+ return NativeTTS.initTTS({ model: modelPath });
769
+ }
770
+
771
+ async speak(text: string, speakerId = 0, speed = 1.0) {
772
+ // sanitize and invert (avoid NaN/undefined/null)
773
+ // Reverse speed to length.
774
+ const s = Number.isFinite(speed as number) && speed !== 0 ? 1.0 / (speed as number) : 1.0;
775
+ this.ensureListeners();
776
+ // MIN: serialize + await actual completion (event-driven)
777
+ this.ttsChain = this.ttsChain.then(() => this._speakAndWait(text, speakerId, s));
778
+ return this.ttsChain;
779
+ }
780
+
781
  /**
   * Release the JS-side "wait for onFinishedSpeaking" state without emitting a
   * finished event: clears the watchdog timer and resolves the pending waiter.
   * Called by stopSpeaking() so queued speak()/playWav() promises unblock immediately.
   */
  private _cancelTtsWait(reason = 'stopSpeaking') {
    dbg(`[TTS cancel wait] reason=${reason}`);

    // Stop the watchdog timer (default 600 000 ms / 10 min in _playWavAndWait).
    if (this.ttsPendingTimeout) {
      clearTimeout(this.ttsPendingTimeout);
      this.ttsPendingTimeout = null;
    }

    // Release the promise waiter (if any). The field is cleared *before*
    // resolving so a re-entrant call cannot resolve the same waiter twice.
    const r = this.ttsPendingResolve;
    this.ttsPendingResolve = null;
    if (r) r();

    // IMPORTANT: do NOT call app callback here (stopSpeaking should not emit "finished")
    // this.handlers.onFinishedSpeaking() <-- DO NOT
  }
799
+
800
  /**
   * Abort in-progress and queued TTS playback.
   * JS-side state (pending waiter + serialized queues) is cleared FIRST so
   * callers are unblocked even if the subsequent native call fails.
   */
  async stopSpeaking() {
    // 1) JS MUST stop waiting + clear queues immediately
    this._cancelTtsWait('stopSpeaking');

    // clear serialized chains so future speak/playWav starts fresh
    this.ttsChain = Promise.resolve();
    this.wavChain = Promise.resolve();

    // 2) tell native to stop (unified iOS bridge first, then direct TTS bridge)
    try {
      if (Platform.OS === 'ios' && NativeSpeech?.stopSpeaking) {
        return await NativeSpeech.stopSpeaking();
      }
      if (NativeTTS?.stopSpeaking) {
        return await NativeTTS.stopSpeaking();
      }
    } catch (e) {
      // even if native throws, JS state is already unblocked
      dbgErr('stopSpeaking native error', String(e));
    }
  }
821
+
822
  // Serialized queue for waitable playWav() calls — kept separate from the
  // speak() ttsChain so WAV playback and synthesis do not block each other.
  private wavChain: Promise<void> = Promise.resolve();
824
+
825
  /**
   * Start WAV playback and return a promise that settles when native fires
   * onFinishedSpeaking (reuses the shared ttsPendingResolve/event machinery).
   * A watchdog timeout (default 600 000 ms = 10 min) resolves the wait if the
   * event never arrives, so a serialized chain can never hang forever.
   */
  private _playWavAndWait(realPath: string, markAsLast: boolean, timeoutMs = 600000) {
    return new Promise<void>((resolve, reject) => {
      this.ttsPendingResolve = resolve; // reuse existing resolver + event
      this.ttsPendingTimeout = setTimeout(() => {
        dbg('Timeout waiting for onFinishedSpeaking — releasing wait');
        if (this.ttsPendingTimeout) { clearTimeout(this.ttsPendingTimeout); this.ttsPendingTimeout = null; }
        const r = this.ttsPendingResolve;
        this.ttsPendingResolve = null;
        if (r) r(); // timeout resolves (not rejects): treat as best-effort completion
      }, timeoutMs);

      try {
        // Prefer unified iOS bridge if present
        if (Platform.OS === 'ios' && NativeSpeech?.playWav) {
          (NativeSpeech as any).playWav(realPath, markAsLast);
          return;
        }
        if (!NativeTTS?.playWav) throw new Error('playWav not available on this platform.');
        (NativeTTS as any).playWav(realPath, markAsLast);
      } catch (e) {
        // Synchronous native failure: tear down waiter state and reject this call.
        if (this.ttsPendingTimeout) { clearTimeout(this.ttsPendingTimeout); this.ttsPendingTimeout = null; }
        this.ttsPendingResolve = null;
        reject(e as any);
      }
    });
  }
852
+
853
  /**
   * Play a WAV file (local path, file:// URL, or bundled asset via require()).
   * markAsLast=true  → waitable: serialized on wavChain, resolves on onFinishedSpeaking.
   * markAsLast=false → fire-and-forget: native emits no completion event, so the
   *                    returned value cannot be awaited for playback completion.
   */
  async playWav(pathOrURL: any, markAsLast = true) {
    console.log('[Speech.playWav] called with:', pathOrURL, '| type:', typeof pathOrURL);
    this.dbgAsset('playWav.arg', pathOrURL);

    // Resolve bundled assets (e.g. require('./x.wav')) to a concrete URI.
    const asset = resolveAssetSource(pathOrURL);
    console.log('[Speech.playWav] resolveAssetSource ->', asset);

    let realPath = asset?.uri ?? pathOrURL;
    if (Platform.OS === 'android' && typeof asset?.uri === 'string') {
      // Pass raw resource entry name through (native will resolve via res/raw)
      realPath = asset.uri;
    }

    console.log('[Speech.playWav] resolved realPath:', realPath);

    // Native bridge expects a string; coerce defensively.
    if (typeof realPath !== 'string') {
      realPath = String(realPath);
      console.log('[Speech.playWav] converted ?? realPath:', realPath);
    }

    console.log('[Speech.playWav] before checking ios realPath:', realPath);

    // Separate logic per platform; only markAsLast=true goes through the queue.
    this.ensureListeners();

    if (markAsLast) {
      // Waitable: serialize on its own queue (separate from speak)
      this.wavChain = this.wavChain.then(() => this._playWavAndWait(realPath, true));
      return this.wavChain;
    }

    // Fire-and-forget (cannot await because native will not emit completion)
    if (Platform.OS === 'ios' && NativeSpeech?.playWav) {
      return (NativeSpeech as any).playWav(realPath, false);
    }

    console.log('[Speech.playWav] after checking ios realPath:', realPath);
    console.log('[Speech.playWav] after checking ios realPath:', typeof realPath);

    if (!NativeTTS?.playWav) {
      console.log('[Speech.playWav] NativeTTS:', NativeTTS);
      if (NativeTTS) console.log('[Speech.playWav] NativeTTS.playWav :', NativeTTS.playWav);
      throw new Error('playWav not available on this platform.');
    }
    console.log('[Speech.playWav] calling NativeTTS.playWav with type of realPath:', typeof realPath);
    return (NativeTTS as any).playWav(realPath, false);
  }
901
+
902
+
903
+ // /** Queue a WAV file (local path or file:// URL). Routed via AEC path, queued with speak(). */
904
+ // async playWav(pathOrURL: string, markAsLast = true) {
905
+ // // Prefer unified iOS bridge if present
906
+ // if (Platform.OS === 'ios' && NativeSpeech?.playWav) {
907
+ // return NativeSpeech.playWav(pathOrURL, markAsLast);
908
+ // }
909
+ // // Fallback: direct TTS bridge (Android + iOS fallback)
910
+ // if (!NativeTTS?.playWav) throw new Error('playWav not available on this platform.');
911
+ // return NativeTTS.playWav(pathOrURL, markAsLast);
912
+ // }
913
+
914
+ /**
915
+ * Convenience: queue a typed array (Int16Array | Float32Array | ArrayBuffer) as PCM.
916
+ * We’ll base64 it and pass through to native with the right metadata.
917
+ */
918
+ async playPCM(
919
+ data: ArrayBuffer | Int16Array | Float32Array,
920
+ opts: {
921
+ sampleRate: number;
922
+ channels?: number;
923
+ interleaved?: boolean;
924
+ /** If data is Int16Array → 'i16' (default); if Float32Array → 'f32' (default) */
925
+ format?: 'i16' | 'f32';
926
+ markAsLast?: boolean;
927
+ }
928
+ ) {
929
+ let u8: Uint8Array;
930
+ let format: 'i16' | 'f32' = opts.format ?? 'i16';
931
+
932
+ if (data instanceof ArrayBuffer) {
933
+ // assume Int16 unless caller specified
934
+ u8 = new Uint8Array(data);
935
+ } else if (data instanceof Int16Array) {
936
+ u8 = new Uint8Array(data.buffer, data.byteOffset, data.byteLength);
937
+ format = opts.format ?? 'i16';
938
+ } else if (data instanceof Float32Array) {
939
+ u8 = new Uint8Array(data.buffer, data.byteOffset, data.byteLength);
940
+ format = opts.format ?? 'f32';
941
+ } else {
942
+ throw new Error('Unsupported PCM container');
943
+ }
944
+
945
+ const base64 = toBase64(u8);
946
+ return this.playBuffer({
947
+ base64,
948
+ sampleRate: opts.sampleRate,
949
+ channels: opts.channels ?? 1,
950
+ interleaved: opts.interleaved ?? true,
951
+ format,
952
+ markAsLast: opts.markAsLast ?? true,
953
+ });
954
+ }
955
+
956
+
957
+
958
+ /**
959
+ * Queue raw PCM buffer from other TTS providers (base64 payload).
960
+ * Use ExternalPCM for full control of metadata.
961
+ */
962
+ async playBuffer(desc: ExternalPCM) {
963
+ const payload = {
964
+ base64: desc.base64,
965
+ sampleRate: desc.sampleRate,
966
+ channels: desc.channels ?? 1,
967
+ interleaved: desc.interleaved ?? true,
968
+ format: desc.format,
969
+ markAsLast: desc.markAsLast ?? true,
970
+ };
971
+ if (Platform.OS === 'ios' && NativeSpeech?.playBuffer) {
972
+ return NativeSpeech.playBuffer(payload);
973
+ }
974
+ if (!NativeTTS?.playBuffer) throw new Error('playBuffer not available on this platform.');
975
+ return NativeTTS.playBuffer(payload);
976
+ }
977
+
978
+
979
  // ---------- Events ----------
  /**
   * Subscribe to native events exactly once (idempotent: returns early when
   * subscriptions already exist).
   * iOS unified bridge: one emitter carries both STT and TTS events.
   * Android / iOS fallback: the STT and TTS emitters are wired separately.
   */
  private ensureListeners() {
    if (this.subs.length) return;

    // iOS unified: subscribe once on the unified emitter
    if (Platform.OS === 'ios' && this.unifiedEmitter) {
      // Event name → dispatcher; handlers are read at dispatch time so
      // setters assigned later still take effect.
      const map: Partial<Record<NativeEventName, (...args: any[]) => void>> = {
        onSpeechStart: (e) => this.handlers.onSpeechStart(e),
        onSpeechRecognized: (e) => this.handlers.onSpeechRecognized(e),
        onSpeechEnd: (e) => this.handlers.onSpeechEnd(e),
        onSpeechError: (e) => this.handlers.onSpeechError(e),
        onSpeechResults: (e) => this.handlers.onSpeechResults(e),
        onSpeechPartialResults: (e) => this.handlers.onSpeechPartialResults(e),
        onSpeechVolumeChanged: (e) => this.handlers.onSpeechVolumeChanged(e),
        onFinishedSpeaking: () => this._onNativeFinishedSpeaking(),
      };
      (Object.keys(map) as NativeEventName[]).forEach((name) => {
        try {
          const handler = map[name];
          if (!handler) return;
          const sub = this.unifiedEmitter!.addListener(name, handler);
          this.subs.push(sub);
        } catch {}
      });
      return;
    }

    // Android (and iOS fallback): subscribe to both STT and TTS emitters
    if (this.sttEmitter) {
      const sttMap = {
        onSpeechStart: (e: any) => this.handlers.onSpeechStart(e),
        onSpeechRecognized: (e: any) => this.handlers.onSpeechRecognized(e),
        onSpeechEnd: (e: any) => this.handlers.onSpeechEnd(e),
        onSpeechError: (e: any) => this.handlers.onSpeechError(e),
        onSpeechResults: (e: any) => this.handlers.onSpeechResults(e),
        onSpeechPartialResults: (e: any) => this.handlers.onSpeechPartialResults(e),
        onSpeechVolumeChanged: (e: any) => this.handlers.onSpeechVolumeChanged(e),
        onNewSpeechWAV: (e: any) => this.handlers.onNewSpeechWAV(e),
      };
      (Object.keys(sttMap) as (keyof typeof sttMap)[]).forEach((name) => {
        try {
          const sub = this.sttEmitter!.addListener(name, sttMap[name]);
          this.subs.push(sub);
        } catch {}
      });
    }
    if (this.ttsEmitter) {
      try {
        // Prevent duplicate listeners across Fast Refresh / reload: the previous
        // subscription survives module re-evaluation only via this global slot.
        const g: any = globalThis as any;
        try { g.__SpeechJS_finishedSub?.remove?.(); } catch {}
        const sub = this.ttsEmitter.addListener('onFinishedSpeaking', () => this._onNativeFinishedSpeaking());
        g.__SpeechJS_finishedSub = sub;
        this.subs.push(sub);
      } catch {}
    }
  }
1036
+
1037
+ private teardownListeners() {
1038
+ this.subs.forEach(s => { try { s.remove(); } catch {} });
1039
+ this.subs = [];
1040
+ }
1041
+
1042
  // ---------- Friendly setters ----------
  // Assigning a handler stores it and lazily wires the native event listeners
  // (ensureListeners is idempotent, so repeated assignment is cheap).
  set onSpeechStart(fn: (e: SpeechStartEvent) => void) { this.handlers.onSpeechStart = fn; this.ensureListeners(); }
  set onSpeechRecognized(fn: (e: SpeechRecognizedEvent) => void) { this.handlers.onSpeechRecognized = fn; this.ensureListeners(); }
  set onSpeechEnd(fn: (e: SpeechEndEvent) => void) { this.handlers.onSpeechEnd = fn; this.ensureListeners(); }
  set onSpeechError(fn: (e: SpeechErrorEvent) => void) { this.handlers.onSpeechError = fn; this.ensureListeners(); }
  set onSpeechResults(fn: (e: SpeechResultsEvent) => void) { this.handlers.onSpeechResults = fn; this.ensureListeners(); }
  set onSpeechPartialResults(fn: (e: SpeechResultsEvent) => void) { this.handlers.onSpeechPartialResults = fn; this.ensureListeners(); }
  set onSpeechVolumeChanged(fn: (e: SpeechVolumeChangeEvent) => void) { this.handlers.onSpeechVolumeChanged = fn; this.ensureListeners(); }
  set onNewSpeechWAV(fn: (e: NewSpeechWAVEvent) => void) { this.handlers.onNewSpeechWAV = fn; this.ensureListeners(); }
  set onFinishedSpeaking(fn: () => void) { this.handlers.onFinishedSpeaking = fn; this.ensureListeners(); }
1052
+ }
1053
+
1054
// Module-level singleton: all importers share one Speech instance (and therefore
// its native event subscriptions and serialized TTS/WAV queues).
const SpeechInstance = new Speech();
export default SpeechInstance;