@omote/core 0.9.1 → 0.9.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ErrorCodes-AX3ADZri.d.mts +266 -0
- package/dist/ErrorCodes-AX3ADZri.d.ts +266 -0
- package/dist/chunk-CYBTTLG7.mjs +927 -0
- package/dist/chunk-CYBTTLG7.mjs.map +1 -0
- package/dist/chunk-X5OTUOE6.mjs +927 -0
- package/dist/chunk-X5OTUOE6.mjs.map +1 -0
- package/dist/chunk-Y3DTP5P3.mjs +927 -0
- package/dist/chunk-Y3DTP5P3.mjs.map +1 -0
- package/dist/index.d.mts +214 -3
- package/dist/index.d.ts +214 -3
- package/dist/index.js +713 -233
- package/dist/index.js.map +1 -1
- package/dist/index.mjs +638 -225
- package/dist/index.mjs.map +1 -1
- package/dist/logging/index.d.mts +2 -2
- package/dist/logging/index.d.ts +2 -2
- package/dist/logging/index.js +75 -1
- package/dist/logging/index.js.map +1 -1
- package/dist/logging/index.mjs +9 -1
- package/package.json +3 -1
package/dist/index.js
CHANGED
|
@@ -52,10 +52,12 @@ __export(index_exports, {
|
|
|
52
52
|
EMOTION_TO_AU: () => EMOTION_TO_AU,
|
|
53
53
|
EMOTION_VECTOR_SIZE: () => EMOTION_VECTOR_SIZE,
|
|
54
54
|
EXPLICIT_EMOTION_COUNT: () => EXPLICIT_EMOTION_COUNT,
|
|
55
|
+
ElevenLabsTTSBackend: () => ElevenLabsTTSBackend,
|
|
55
56
|
EmotionController: () => EmotionController,
|
|
56
57
|
EmotionPresets: () => EmotionPresets,
|
|
57
58
|
EmotionResolver: () => EmotionResolver,
|
|
58
59
|
EmphasisDetector: () => EmphasisDetector,
|
|
60
|
+
ErrorCodes: () => ErrorCodes,
|
|
59
61
|
ErrorTypes: () => ErrorTypes,
|
|
60
62
|
EventEmitter: () => EventEmitter,
|
|
61
63
|
FaceCompositor: () => FaceCompositor,
|
|
@@ -79,6 +81,7 @@ __export(index_exports, {
|
|
|
79
81
|
PRESERVE_POSITION_BONES: () => PRESERVE_POSITION_BONES,
|
|
80
82
|
PROTOCOL_VERSION: () => PROTOCOL_VERSION,
|
|
81
83
|
PlaybackPipeline: () => PlaybackPipeline,
|
|
84
|
+
PollyTTSBackend: () => PollyTTSBackend,
|
|
82
85
|
ProceduralLifeLayer: () => ProceduralLifeLayer,
|
|
83
86
|
RingBuffer: () => RingBuffer,
|
|
84
87
|
SafariSpeechRecognition: () => SafariSpeechRecognition,
|
|
@@ -102,6 +105,7 @@ __export(index_exports, {
|
|
|
102
105
|
calculatePeak: () => calculatePeak,
|
|
103
106
|
calculateRMS: () => calculateRMS,
|
|
104
107
|
configureCacheLimit: () => configureCacheLimit,
|
|
108
|
+
configureClock: () => configureClock,
|
|
105
109
|
configureLogging: () => configureLogging,
|
|
106
110
|
configureModelUrls: () => configureModelUrls,
|
|
107
111
|
configureOrtCdn: () => configureOrtCdn,
|
|
@@ -118,6 +122,7 @@ __export(index_exports, {
|
|
|
118
122
|
formatBytes: () => formatBytes,
|
|
119
123
|
getCacheConfig: () => getCacheConfig,
|
|
120
124
|
getCacheKey: () => getCacheKey,
|
|
125
|
+
getClock: () => getClock,
|
|
121
126
|
getEmotionPreset: () => getEmotionPreset,
|
|
122
127
|
getLoggingConfig: () => getLoggingConfig,
|
|
123
128
|
getModelCache: () => getModelCache,
|
|
@@ -654,6 +659,19 @@ var OTLPExporter = class {
|
|
|
654
659
|
}
|
|
655
660
|
};
|
|
656
661
|
|
|
662
|
+
// src/logging/Clock.ts
|
|
663
|
+
var defaultClock = {
|
|
664
|
+
now: () => performance.now(),
|
|
665
|
+
timestamp: () => Date.now()
|
|
666
|
+
};
|
|
667
|
+
var activeClock = defaultClock;
|
|
668
|
+
function configureClock(clock) {
|
|
669
|
+
activeClock = clock;
|
|
670
|
+
}
|
|
671
|
+
function getClock() {
|
|
672
|
+
return activeClock;
|
|
673
|
+
}
|
|
674
|
+
|
|
657
675
|
// src/telemetry/OmoteTelemetry.ts
|
|
658
676
|
function generateId(length = 16) {
|
|
659
677
|
const bytes = new Uint8Array(length);
|
|
@@ -762,7 +780,7 @@ var OmoteTelemetry = class {
|
|
|
762
780
|
const traceId = parentContext?.traceId ?? this.activeTraceId ?? generateId(16);
|
|
763
781
|
const spanId = generateId(8);
|
|
764
782
|
const parentSpanId = parentContext?.spanId;
|
|
765
|
-
const startTime =
|
|
783
|
+
const startTime = getClock().now();
|
|
766
784
|
if (!parentContext && !this.activeTraceId) {
|
|
767
785
|
this.activeTraceId = traceId;
|
|
768
786
|
}
|
|
@@ -776,7 +794,7 @@ var OmoteTelemetry = class {
|
|
|
776
794
|
ended = true;
|
|
777
795
|
const idx = this.spanStack.findIndex((s) => s.spanId === spanId);
|
|
778
796
|
if (idx !== -1) this.spanStack.splice(idx, 1);
|
|
779
|
-
const endTime =
|
|
797
|
+
const endTime = getClock().now();
|
|
780
798
|
const durationMs = endTime - startTime;
|
|
781
799
|
if (status === "error" && !sampled) {
|
|
782
800
|
sampled = this.shouldSample(true);
|
|
@@ -891,7 +909,7 @@ var OmoteTelemetry = class {
|
|
|
891
909
|
*/
|
|
892
910
|
flushMetrics() {
|
|
893
911
|
if (!this.exporter) return;
|
|
894
|
-
const timestamp =
|
|
912
|
+
const timestamp = getClock().now();
|
|
895
913
|
for (const [key, data] of this.counters) {
|
|
896
914
|
if (data.value === 0) continue;
|
|
897
915
|
const name = key.split("|")[0];
|
|
@@ -1012,7 +1030,7 @@ var Logger = class _Logger {
|
|
|
1012
1030
|
log(level, message, data) {
|
|
1013
1031
|
if (!shouldLog(level)) return;
|
|
1014
1032
|
const entry = {
|
|
1015
|
-
timestamp:
|
|
1033
|
+
timestamp: getClock().timestamp(),
|
|
1016
1034
|
level,
|
|
1017
1035
|
module: this.module,
|
|
1018
1036
|
message,
|
|
@@ -1054,12 +1072,12 @@ var Logger = class _Logger {
|
|
|
1054
1072
|
};
|
|
1055
1073
|
var loggerCache = /* @__PURE__ */ new Map();
|
|
1056
1074
|
function createLogger(module2) {
|
|
1057
|
-
let
|
|
1058
|
-
if (!
|
|
1059
|
-
|
|
1060
|
-
loggerCache.set(module2,
|
|
1075
|
+
let logger45 = loggerCache.get(module2);
|
|
1076
|
+
if (!logger45) {
|
|
1077
|
+
logger45 = new Logger(module2);
|
|
1078
|
+
loggerCache.set(module2, logger45);
|
|
1061
1079
|
}
|
|
1062
|
-
return
|
|
1080
|
+
return logger45;
|
|
1063
1081
|
}
|
|
1064
1082
|
var noopLogger = {
|
|
1065
1083
|
module: "noop",
|
|
@@ -1078,6 +1096,63 @@ var noopLogger = {
|
|
|
1078
1096
|
child: () => noopLogger
|
|
1079
1097
|
};
|
|
1080
1098
|
|
|
1099
|
+
// src/logging/ErrorCodes.ts
|
|
1100
|
+
var ErrorCodes = {
|
|
1101
|
+
// ── Inference ──────────────────────────────────────────────────────────
|
|
1102
|
+
/** Model failed to load (file not found, corrupted, unsupported format) */
|
|
1103
|
+
INF_LOAD_FAILED: "OMOTE_INF_001",
|
|
1104
|
+
/** ORT session poisoned after WebGPU device loss — must reload tab */
|
|
1105
|
+
INF_SESSION_POISON: "OMOTE_INF_002",
|
|
1106
|
+
/** Inference exceeded timeout threshold */
|
|
1107
|
+
INF_TIMEOUT: "OMOTE_INF_003",
|
|
1108
|
+
/** Out-of-memory during inference or model loading */
|
|
1109
|
+
INF_OOM: "OMOTE_INF_004",
|
|
1110
|
+
/** WebGPU unavailable, fell back to WASM */
|
|
1111
|
+
INF_WEBGPU_FALLBACK: "OMOTE_INF_005",
|
|
1112
|
+
/** Input tensor shape does not match model expectations */
|
|
1113
|
+
INF_SHAPE_MISMATCH: "OMOTE_INF_006",
|
|
1114
|
+
// ── Audio ──────────────────────────────────────────────────────────────
|
|
1115
|
+
/** AudioContext creation or resume failed */
|
|
1116
|
+
AUD_CONTEXT_FAILED: "OMOTE_AUD_001",
|
|
1117
|
+
/** Gap detected in audio scheduling (buffer underrun) */
|
|
1118
|
+
AUD_SCHEDULE_GAP: "OMOTE_AUD_002",
|
|
1119
|
+
/** Audio buffer decoding failed */
|
|
1120
|
+
AUD_DECODE_FAILED: "OMOTE_AUD_003",
|
|
1121
|
+
// ── Speech ─────────────────────────────────────────────────────────────
|
|
1122
|
+
/** Voice activity detection error */
|
|
1123
|
+
SPH_VAD_ERROR: "OMOTE_SPH_001",
|
|
1124
|
+
/** Automatic speech recognition error */
|
|
1125
|
+
SPH_ASR_ERROR: "OMOTE_SPH_002",
|
|
1126
|
+
/** Microphone access denied or unavailable */
|
|
1127
|
+
SPH_MIC_DENIED: "OMOTE_SPH_003",
|
|
1128
|
+
// ── TTS ────────────────────────────────────────────────────────────────
|
|
1129
|
+
/** TTS synthesis failed */
|
|
1130
|
+
TTS_SYNTH_FAILED: "OMOTE_TTS_001",
|
|
1131
|
+
/** TTS streaming error (chunk delivery failure) */
|
|
1132
|
+
TTS_STREAM_ERROR: "OMOTE_TTS_002",
|
|
1133
|
+
/** Phonemizer (eSpeak-NG WASM) ran out of memory */
|
|
1134
|
+
TTS_PHONEMIZER_OOM: "OMOTE_TTS_003",
|
|
1135
|
+
// ── Pipeline ───────────────────────────────────────────────────────────
|
|
1136
|
+
/** Invalid state transition in pipeline state machine */
|
|
1137
|
+
PIP_STATE_ERROR: "OMOTE_PIP_001",
|
|
1138
|
+
/** Pipeline operation aborted (user interrupt or signal) */
|
|
1139
|
+
PIP_ABORT: "OMOTE_PIP_002",
|
|
1140
|
+
// ── Cache ──────────────────────────────────────────────────────────────
|
|
1141
|
+
/** IndexedDB storage quota exceeded */
|
|
1142
|
+
CAC_QUOTA_EXCEEDED: "OMOTE_CAC_001",
|
|
1143
|
+
/** Cache entry evicted (LRU or manual) */
|
|
1144
|
+
CAC_EVICTION: "OMOTE_CAC_002",
|
|
1145
|
+
/** Cached model is stale (version mismatch) */
|
|
1146
|
+
CAC_STALE: "OMOTE_CAC_003",
|
|
1147
|
+
// ── Network ────────────────────────────────────────────────────────────
|
|
1148
|
+
/** HTTP fetch failed (model download, CDN) */
|
|
1149
|
+
NET_FETCH_FAILED: "OMOTE_NET_001",
|
|
1150
|
+
/** Network request timed out */
|
|
1151
|
+
NET_TIMEOUT: "OMOTE_NET_002",
|
|
1152
|
+
/** WebSocket connection error */
|
|
1153
|
+
NET_WEBSOCKET_ERROR: "OMOTE_NET_003"
|
|
1154
|
+
};
|
|
1155
|
+
|
|
1081
1156
|
// src/audio/MicrophoneCapture.ts
|
|
1082
1157
|
var logger = createLogger("MicrophoneCapture");
|
|
1083
1158
|
var MicrophoneCapture = class {
|
|
@@ -1175,7 +1250,7 @@ var MicrophoneCapture = class {
|
|
|
1175
1250
|
const pcm = this.floatToPCM16(chunk);
|
|
1176
1251
|
this.events.emit("audio.chunk", {
|
|
1177
1252
|
pcm,
|
|
1178
|
-
timestamp:
|
|
1253
|
+
timestamp: getClock().now()
|
|
1179
1254
|
});
|
|
1180
1255
|
chunkCount++;
|
|
1181
1256
|
}
|
|
@@ -1406,11 +1481,23 @@ var AudioScheduler = class {
|
|
|
1406
1481
|
source.connect(gainNode);
|
|
1407
1482
|
const scheduleTime = this.nextPlayTime;
|
|
1408
1483
|
if (scheduleTime < ctx.currentTime) {
|
|
1409
|
-
|
|
1410
|
-
|
|
1411
|
-
|
|
1412
|
-
|
|
1413
|
-
|
|
1484
|
+
const gap = ctx.currentTime - scheduleTime;
|
|
1485
|
+
const gapMs = gap * 1e3;
|
|
1486
|
+
if (gap > 0.5) {
|
|
1487
|
+
logger2.error("Critical audio scheduling gap", {
|
|
1488
|
+
code: ErrorCodes.AUD_SCHEDULE_GAP,
|
|
1489
|
+
scheduleTime,
|
|
1490
|
+
currentTime: ctx.currentTime,
|
|
1491
|
+
gapMs: Math.round(gapMs)
|
|
1492
|
+
});
|
|
1493
|
+
this.options.onError?.(new Error(`Audio scheduling gap: ${gap.toFixed(3)}s`));
|
|
1494
|
+
} else {
|
|
1495
|
+
logger2.warn("Audio gap detected", {
|
|
1496
|
+
scheduleTime,
|
|
1497
|
+
currentTime: ctx.currentTime,
|
|
1498
|
+
gapMs: Math.round(gapMs)
|
|
1499
|
+
});
|
|
1500
|
+
}
|
|
1414
1501
|
}
|
|
1415
1502
|
source.start(scheduleTime);
|
|
1416
1503
|
const entry = { source, gainNode };
|
|
@@ -1604,8 +1691,8 @@ var AudioChunkCoalescer = class {
|
|
|
1604
1691
|
var logger4 = createLogger("A2EProcessor");
|
|
1605
1692
|
var FRAME_RATE = 30;
|
|
1606
1693
|
var DRIP_INTERVAL_MS = 33;
|
|
1607
|
-
var HOLD_DURATION_MS =
|
|
1608
|
-
var DECAY_DURATION_MS =
|
|
1694
|
+
var HOLD_DURATION_MS = 400;
|
|
1695
|
+
var DECAY_DURATION_MS = 300;
|
|
1609
1696
|
var _A2EProcessor = class _A2EProcessor {
|
|
1610
1697
|
constructor(config) {
|
|
1611
1698
|
this.writeOffset = 0;
|
|
@@ -1769,7 +1856,7 @@ var _A2EProcessor = class _A2EProcessor {
|
|
|
1769
1856
|
if (this.timestampedQueue.length > 0 && this.timestampedQueue[0].timestamp <= currentTime) {
|
|
1770
1857
|
const { frame } = this.timestampedQueue.shift();
|
|
1771
1858
|
this.lastPulledFrame = frame;
|
|
1772
|
-
this.lastDequeuedTime =
|
|
1859
|
+
this.lastDequeuedTime = getClock().now();
|
|
1773
1860
|
return frame;
|
|
1774
1861
|
}
|
|
1775
1862
|
if (this.timestampedQueue.length > 0 && this.getFrameCallCount % 60 === 0) {
|
|
@@ -1781,7 +1868,7 @@ var _A2EProcessor = class _A2EProcessor {
|
|
|
1781
1868
|
});
|
|
1782
1869
|
}
|
|
1783
1870
|
if (this.lastPulledFrame) {
|
|
1784
|
-
const elapsed =
|
|
1871
|
+
const elapsed = getClock().now() - this.lastDequeuedTime;
|
|
1785
1872
|
if (elapsed < HOLD_DURATION_MS) {
|
|
1786
1873
|
return this.lastPulledFrame;
|
|
1787
1874
|
}
|
|
@@ -1866,9 +1953,9 @@ var _A2EProcessor = class _A2EProcessor {
|
|
|
1866
1953
|
while (this.pendingChunks.length > 0 && !this.disposed) {
|
|
1867
1954
|
const { chunk, timestamp } = this.pendingChunks.shift();
|
|
1868
1955
|
try {
|
|
1869
|
-
const t0 =
|
|
1956
|
+
const t0 = getClock().now();
|
|
1870
1957
|
const result = await this.backend.infer(chunk, this.identityIndex);
|
|
1871
|
-
const inferMs = Math.round(
|
|
1958
|
+
const inferMs = Math.round(getClock().now() - t0);
|
|
1872
1959
|
const actualDuration = chunk.length / this.sampleRate;
|
|
1873
1960
|
const actualFrameCount = Math.ceil(actualDuration * FRAME_RATE);
|
|
1874
1961
|
const framesToQueue = Math.min(actualFrameCount, result.blendshapes.length);
|
|
@@ -1907,7 +1994,11 @@ var _A2EProcessor = class _A2EProcessor {
|
|
|
1907
1994
|
}
|
|
1908
1995
|
handleError(err) {
|
|
1909
1996
|
const error = err instanceof Error ? err : new Error(String(err));
|
|
1910
|
-
|
|
1997
|
+
const isOOM = typeof err === "number" || error.message && /out of memory|oom|alloc/i.test(error.message);
|
|
1998
|
+
logger4.warn("A2EProcessor inference error", {
|
|
1999
|
+
error: error.message,
|
|
2000
|
+
code: isOOM ? ErrorCodes.INF_OOM : ErrorCodes.INF_SESSION_POISON
|
|
2001
|
+
});
|
|
1911
2002
|
this.onError?.(error);
|
|
1912
2003
|
}
|
|
1913
2004
|
};
|
|
@@ -1929,6 +2020,12 @@ var MetricNames = {
|
|
|
1929
2020
|
CACHE_HITS: "omote.cache.hits",
|
|
1930
2021
|
/** Counter: Cache misses */
|
|
1931
2022
|
CACHE_MISSES: "omote.cache.misses",
|
|
2023
|
+
/** Counter: Cache stale (version/etag mismatch) */
|
|
2024
|
+
CACHE_STALE: "omote.cache.stale",
|
|
2025
|
+
/** Counter: Cache quota warning (>90% used) */
|
|
2026
|
+
CACHE_QUOTA_WARNING: "omote.cache.quota_warning",
|
|
2027
|
+
/** Counter: Cache eviction (LRU) */
|
|
2028
|
+
CACHE_EVICTION: "omote.cache.eviction",
|
|
1932
2029
|
// --- Pipeline ---
|
|
1933
2030
|
/** Histogram: VoicePipeline turn latency (speech end → transcript ready, excludes playback) */
|
|
1934
2031
|
VOICE_TURN_LATENCY: "omote.voice.turn.latency",
|
|
@@ -2228,14 +2325,14 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2228
2325
|
this._currentRawFrame = null;
|
|
2229
2326
|
this.cancelNeutralTransition();
|
|
2230
2327
|
this.scheduler.warmup();
|
|
2231
|
-
this.sessionStartTime =
|
|
2328
|
+
this.sessionStartTime = getClock().now();
|
|
2232
2329
|
this.startFrameLoop();
|
|
2233
2330
|
this.startMonitoring();
|
|
2234
2331
|
this.setState("playing");
|
|
2235
2332
|
}
|
|
2236
2333
|
/** Feed a streaming audio chunk (PCM16 Uint8Array) */
|
|
2237
2334
|
async onAudioChunk(chunk) {
|
|
2238
|
-
const chunkStart =
|
|
2335
|
+
const chunkStart = getClock().now();
|
|
2239
2336
|
const combined = this.coalescer.add(chunk);
|
|
2240
2337
|
if (!combined) return;
|
|
2241
2338
|
const float32 = pcm16ToFloat32(combined);
|
|
@@ -2245,7 +2342,7 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2245
2342
|
this.emit("playback:start", { time: scheduleTime });
|
|
2246
2343
|
}
|
|
2247
2344
|
this.processor.pushAudio(float32, scheduleTime);
|
|
2248
|
-
getTelemetry()?.recordHistogram(MetricNames.PLAYBACK_CHUNK_LATENCY,
|
|
2345
|
+
getTelemetry()?.recordHistogram(MetricNames.PLAYBACK_CHUNK_LATENCY, getClock().now() - chunkStart);
|
|
2249
2346
|
}
|
|
2250
2347
|
/** Signal end of audio stream (flushes remaining audio) */
|
|
2251
2348
|
async end() {
|
|
@@ -2348,15 +2445,15 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2348
2445
|
const currentTime = this.scheduler.getCurrentTime();
|
|
2349
2446
|
const lamFrame = this.processor.getFrameForTime(currentTime);
|
|
2350
2447
|
if (lamFrame && lamFrame !== this.lastKnownLamFrame) {
|
|
2351
|
-
this.lastNewFrameTime =
|
|
2448
|
+
this.lastNewFrameTime = getClock().now();
|
|
2352
2449
|
this.lastKnownLamFrame = lamFrame;
|
|
2353
2450
|
this.staleWarningEmitted = false;
|
|
2354
2451
|
}
|
|
2355
|
-
if (this.playbackStarted && this.lastNewFrameTime > 0 &&
|
|
2452
|
+
if (this.playbackStarted && this.lastNewFrameTime > 0 && getClock().now() - this.lastNewFrameTime > this.staleThresholdMs) {
|
|
2356
2453
|
if (!this.staleWarningEmitted) {
|
|
2357
2454
|
this.staleWarningEmitted = true;
|
|
2358
2455
|
logger5.warn("A2E stalled \u2014 no new inference frames", {
|
|
2359
|
-
staleDurationMs: Math.round(
|
|
2456
|
+
staleDurationMs: Math.round(getClock().now() - this.lastNewFrameTime),
|
|
2360
2457
|
queuedFrames: this.processor.queuedFrameCount
|
|
2361
2458
|
});
|
|
2362
2459
|
}
|
|
@@ -2396,7 +2493,7 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2396
2493
|
if (this.sessionStartTime > 0) {
|
|
2397
2494
|
getTelemetry()?.recordHistogram(
|
|
2398
2495
|
MetricNames.PLAYBACK_SESSION_DURATION,
|
|
2399
|
-
|
|
2496
|
+
getClock().now() - this.sessionStartTime
|
|
2400
2497
|
);
|
|
2401
2498
|
}
|
|
2402
2499
|
this.stopInternal();
|
|
@@ -2414,9 +2511,9 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2414
2511
|
// ---------------------------------------------------------------------------
|
|
2415
2512
|
startNeutralTransition(fromFrame) {
|
|
2416
2513
|
this.neutralTransitionFrame = new Float32Array(fromFrame);
|
|
2417
|
-
this.neutralTransitionStart =
|
|
2514
|
+
this.neutralTransitionStart = getClock().now();
|
|
2418
2515
|
const animate = () => {
|
|
2419
|
-
const elapsed =
|
|
2516
|
+
const elapsed = getClock().now() - this.neutralTransitionStart;
|
|
2420
2517
|
const t = Math.min(1, elapsed / this.neutralTransitionMs);
|
|
2421
2518
|
const eased = 1 - Math.pow(1 - t, 3);
|
|
2422
2519
|
logger5.trace("neutral transition", { t: Math.round(t * 1e3) / 1e3, eased: Math.round(eased * 1e3) / 1e3 });
|
|
@@ -2429,7 +2526,7 @@ var PlaybackPipeline = class extends EventEmitter {
|
|
|
2429
2526
|
blendshapes,
|
|
2430
2527
|
rawBlendshapes: blendshapes,
|
|
2431
2528
|
// raw = scaled during transition
|
|
2432
|
-
timestamp:
|
|
2529
|
+
timestamp: getClock().now() / 1e3,
|
|
2433
2530
|
emotion: this._emotion ?? void 0
|
|
2434
2531
|
};
|
|
2435
2532
|
this.emit("frame", frame);
|
|
@@ -2660,7 +2757,7 @@ var ModelCache = class {
|
|
|
2660
2757
|
logger7.warn("Failed to request persistent storage", { error: String(err) });
|
|
2661
2758
|
}
|
|
2662
2759
|
}
|
|
2663
|
-
const dbOpenStart =
|
|
2760
|
+
const dbOpenStart = getClock().now();
|
|
2664
2761
|
this.dbPromise = new Promise((resolve, reject) => {
|
|
2665
2762
|
const request = indexedDB.open(DB_NAME, DB_VERSION);
|
|
2666
2763
|
request.onerror = () => {
|
|
@@ -2669,7 +2766,7 @@ var ModelCache = class {
|
|
|
2669
2766
|
};
|
|
2670
2767
|
request.onsuccess = () => {
|
|
2671
2768
|
this.db = request.result;
|
|
2672
|
-
logger7.debug("IndexedDB opened", { durationMs: Math.round(
|
|
2769
|
+
logger7.debug("IndexedDB opened", { durationMs: Math.round(getClock().now() - dbOpenStart) });
|
|
2673
2770
|
resolve(this.db);
|
|
2674
2771
|
};
|
|
2675
2772
|
request.onupgradeneeded = (event) => {
|
|
@@ -2743,16 +2840,16 @@ var ModelCache = class {
|
|
|
2743
2840
|
}
|
|
2744
2841
|
span?.end();
|
|
2745
2842
|
if (hit) {
|
|
2746
|
-
telemetry?.incrementCounter(
|
|
2843
|
+
telemetry?.incrementCounter(MetricNames.CACHE_HITS, 1, {});
|
|
2747
2844
|
} else {
|
|
2748
|
-
telemetry?.incrementCounter(
|
|
2845
|
+
telemetry?.incrementCounter(MetricNames.CACHE_MISSES, 1, {});
|
|
2749
2846
|
}
|
|
2750
2847
|
resolve(cached?.data ?? null);
|
|
2751
2848
|
};
|
|
2752
2849
|
request.onerror = () => {
|
|
2753
2850
|
span?.setAttributes({ "cache.hit": false });
|
|
2754
2851
|
span?.end();
|
|
2755
|
-
telemetry?.incrementCounter(
|
|
2852
|
+
telemetry?.incrementCounter(MetricNames.CACHE_MISSES, 1, {});
|
|
2756
2853
|
resolve(null);
|
|
2757
2854
|
};
|
|
2758
2855
|
});
|
|
@@ -2796,14 +2893,14 @@ var ModelCache = class {
|
|
|
2796
2893
|
if (!cached?.data) {
|
|
2797
2894
|
span?.setAttributes({ "cache.hit": false });
|
|
2798
2895
|
span?.end();
|
|
2799
|
-
telemetry?.incrementCounter(
|
|
2896
|
+
telemetry?.incrementCounter(MetricNames.CACHE_MISSES, 1, {});
|
|
2800
2897
|
return { data: null, stale: false };
|
|
2801
2898
|
}
|
|
2802
2899
|
span?.setAttributes({ "cache.hit": true, "cache.size_bytes": cached.size });
|
|
2803
2900
|
if (!cached.etag) {
|
|
2804
2901
|
span?.setAttributes({ "cache.validated": false, "cache.stale": false });
|
|
2805
2902
|
span?.end();
|
|
2806
|
-
telemetry?.incrementCounter(
|
|
2903
|
+
telemetry?.incrementCounter(MetricNames.CACHE_HITS, 1, {});
|
|
2807
2904
|
return { data: cached.data, stale: false };
|
|
2808
2905
|
}
|
|
2809
2906
|
const fetchUrl = originalUrl || url;
|
|
@@ -2812,7 +2909,7 @@ var ModelCache = class {
|
|
|
2812
2909
|
if (!response.ok) {
|
|
2813
2910
|
span?.setAttributes({ "cache.validated": false, "cache.stale": false });
|
|
2814
2911
|
span?.end();
|
|
2815
|
-
telemetry?.incrementCounter(
|
|
2912
|
+
telemetry?.incrementCounter(MetricNames.CACHE_HITS, 1, {});
|
|
2816
2913
|
return { data: cached.data, stale: false };
|
|
2817
2914
|
}
|
|
2818
2915
|
const serverEtag = response.headers.get("etag");
|
|
@@ -2825,17 +2922,17 @@ var ModelCache = class {
|
|
|
2825
2922
|
});
|
|
2826
2923
|
span?.end();
|
|
2827
2924
|
if (isStale) {
|
|
2828
|
-
telemetry?.incrementCounter(
|
|
2925
|
+
telemetry?.incrementCounter(MetricNames.CACHE_STALE, 1, {});
|
|
2829
2926
|
logger7.debug("Stale cache detected", { url });
|
|
2830
2927
|
} else {
|
|
2831
|
-
telemetry?.incrementCounter(
|
|
2928
|
+
telemetry?.incrementCounter(MetricNames.CACHE_HITS, 1, {});
|
|
2832
2929
|
}
|
|
2833
2930
|
return { data: cached.data, stale: isStale };
|
|
2834
2931
|
} catch (fetchError) {
|
|
2835
2932
|
logger7.warn("HEAD validation failed, using cached data", { error: String(fetchError) });
|
|
2836
2933
|
span?.setAttributes({ "cache.validated": false, "cache.stale": false });
|
|
2837
2934
|
span?.end();
|
|
2838
|
-
telemetry?.incrementCounter(
|
|
2935
|
+
telemetry?.incrementCounter(MetricNames.CACHE_HITS, 1, {});
|
|
2839
2936
|
return { data: cached.data, stale: false };
|
|
2840
2937
|
}
|
|
2841
2938
|
} catch {
|
|
@@ -2916,7 +3013,7 @@ var ModelCache = class {
|
|
|
2916
3013
|
const telemetry = getTelemetry();
|
|
2917
3014
|
if (quota.percentUsed > 90) {
|
|
2918
3015
|
logger7.warn("Storage quota warning", { percentUsed: quota.percentUsed.toFixed(1), used: formatBytes(quota.usedBytes), quota: formatBytes(quota.quotaBytes) });
|
|
2919
|
-
telemetry?.incrementCounter(
|
|
3016
|
+
telemetry?.incrementCounter(MetricNames.CACHE_QUOTA_WARNING, 1, {
|
|
2920
3017
|
percent_used: String(Math.round(quota.percentUsed))
|
|
2921
3018
|
});
|
|
2922
3019
|
if (config.onQuotaWarning) {
|
|
@@ -3058,7 +3155,7 @@ var ModelCache = class {
|
|
|
3058
3155
|
});
|
|
3059
3156
|
span?.end();
|
|
3060
3157
|
if (freedBytes > 0) {
|
|
3061
|
-
telemetry?.incrementCounter(
|
|
3158
|
+
telemetry?.incrementCounter(MetricNames.CACHE_EVICTION, evictedUrls.length, {
|
|
3062
3159
|
bytes_freed: String(freedBytes)
|
|
3063
3160
|
});
|
|
3064
3161
|
}
|
|
@@ -3578,7 +3675,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3578
3675
|
throw new Error("Model already loaded. Call dispose() first.");
|
|
3579
3676
|
}
|
|
3580
3677
|
this.isLoading = true;
|
|
3581
|
-
const startTime =
|
|
3678
|
+
const startTime = getClock().now();
|
|
3582
3679
|
const telemetry = getTelemetry();
|
|
3583
3680
|
const span = telemetry?.startSpan("A2EInference.load", {
|
|
3584
3681
|
"model.url": this.config.modelUrl,
|
|
@@ -3674,7 +3771,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3674
3771
|
executionProvider: this._backend,
|
|
3675
3772
|
backend: this._backend
|
|
3676
3773
|
});
|
|
3677
|
-
const loadTimeMs =
|
|
3774
|
+
const loadTimeMs = getClock().now() - startTime;
|
|
3678
3775
|
logger10.info("Model loaded successfully", {
|
|
3679
3776
|
backend: this._backend,
|
|
3680
3777
|
loadTimeMs: Math.round(loadTimeMs),
|
|
@@ -3693,7 +3790,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3693
3790
|
});
|
|
3694
3791
|
await new Promise((r) => setTimeout(r, 0));
|
|
3695
3792
|
logger10.debug("Running warmup inference to initialize GPU context");
|
|
3696
|
-
const warmupStart =
|
|
3793
|
+
const warmupStart = getClock().now();
|
|
3697
3794
|
const warmupAudio = new Float32Array(this.chunkSize);
|
|
3698
3795
|
const warmupIdentity = new Float32Array(this.numIdentityClasses);
|
|
3699
3796
|
warmupIdentity[0] = 1;
|
|
@@ -3706,7 +3803,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3706
3803
|
this.session.run(warmupFeeds).then(() => "ok"),
|
|
3707
3804
|
new Promise((r) => setTimeout(() => r("timeout"), WARMUP_TIMEOUT_MS))
|
|
3708
3805
|
]);
|
|
3709
|
-
const warmupTimeMs =
|
|
3806
|
+
const warmupTimeMs = getClock().now() - warmupStart;
|
|
3710
3807
|
if (warmupResult === "timeout") {
|
|
3711
3808
|
logger10.warn("Warmup inference timed out \u2014 GPU may be unresponsive. Continuing without warmup.", {
|
|
3712
3809
|
timeoutMs: WARMUP_TIMEOUT_MS,
|
|
@@ -3786,7 +3883,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3786
3883
|
"inference.input_samples": this.chunkSize
|
|
3787
3884
|
});
|
|
3788
3885
|
try {
|
|
3789
|
-
const startTime =
|
|
3886
|
+
const startTime = getClock().now();
|
|
3790
3887
|
let timeoutId;
|
|
3791
3888
|
const results = await Promise.race([
|
|
3792
3889
|
this.session.run(feeds).then((r) => {
|
|
@@ -3800,7 +3897,7 @@ var _A2EInference = class _A2EInference {
|
|
|
3800
3897
|
);
|
|
3801
3898
|
})
|
|
3802
3899
|
]);
|
|
3803
|
-
const inferenceTimeMs =
|
|
3900
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
3804
3901
|
const blendshapeOutput = results["blendshapes"];
|
|
3805
3902
|
if (!blendshapeOutput) {
|
|
3806
3903
|
throw new Error("Missing blendshapes output from model");
|
|
@@ -4207,9 +4304,9 @@ var A2EUnifiedAdapter = class {
|
|
|
4207
4304
|
"inference.input_samples": audio.length
|
|
4208
4305
|
});
|
|
4209
4306
|
try {
|
|
4210
|
-
const startTime =
|
|
4307
|
+
const startTime = getClock().now();
|
|
4211
4308
|
const result = await this.worker.inferLAM(audio, identityIndex);
|
|
4212
|
-
const inferenceTimeMs =
|
|
4309
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
4213
4310
|
const flatBuffer = result.blendshapes;
|
|
4214
4311
|
const { numFrames, numBlendshapes } = result;
|
|
4215
4312
|
const blendshapes = [];
|
|
@@ -4860,7 +4957,7 @@ var KokoroTTSInference = class {
|
|
|
4860
4957
|
throw new Error("KokoroTTS is already loading");
|
|
4861
4958
|
}
|
|
4862
4959
|
this.isLoading = true;
|
|
4863
|
-
const startTime =
|
|
4960
|
+
const startTime = getClock().now();
|
|
4864
4961
|
try {
|
|
4865
4962
|
const backendPref = this.config.backend ?? "wasm";
|
|
4866
4963
|
const ortResult = await getOnnxRuntimeForPreference(backendPref);
|
|
@@ -4884,7 +4981,7 @@ var KokoroTTSInference = class {
|
|
|
4884
4981
|
"KokoroTTS InferenceSession.create"
|
|
4885
4982
|
);
|
|
4886
4983
|
}
|
|
4887
|
-
const loadTimeMs =
|
|
4984
|
+
const loadTimeMs = getClock().now() - startTime;
|
|
4888
4985
|
logger17.info("Kokoro TTS loaded", {
|
|
4889
4986
|
backend: this._backend,
|
|
4890
4987
|
loadTimeMs: Math.round(loadTimeMs),
|
|
@@ -4971,7 +5068,18 @@ var KokoroTTSInference = class {
|
|
|
4971
5068
|
logger17.debug("stream aborted");
|
|
4972
5069
|
return;
|
|
4973
5070
|
}
|
|
4974
|
-
|
|
5071
|
+
let phonemes;
|
|
5072
|
+
try {
|
|
5073
|
+
phonemes = await phonemize(sentence, language);
|
|
5074
|
+
} catch (phonErr) {
|
|
5075
|
+
logger17.error("Phonemizer failed (possible OOM)", {
|
|
5076
|
+
code: ErrorCodes.TTS_PHONEMIZER_OOM,
|
|
5077
|
+
error: String(phonErr),
|
|
5078
|
+
textLength: sentence.length
|
|
5079
|
+
});
|
|
5080
|
+
yield { audio: new Float32Array(0), text: sentence, phonemes: "", duration: 0 };
|
|
5081
|
+
continue;
|
|
5082
|
+
}
|
|
4975
5083
|
const tokens = tokenize(phonemes);
|
|
4976
5084
|
const voiceData = await this.ensureVoice(voiceName);
|
|
4977
5085
|
const style = getStyleForTokenCount(voiceData, tokens.length);
|
|
@@ -5031,16 +5139,27 @@ var KokoroTTSInference = class {
|
|
|
5031
5139
|
"tts.speed": speed
|
|
5032
5140
|
});
|
|
5033
5141
|
try {
|
|
5034
|
-
const startTime =
|
|
5142
|
+
const startTime = getClock().now();
|
|
5035
5143
|
const language = getVoiceLanguage(voiceName);
|
|
5036
|
-
|
|
5144
|
+
let phonemes;
|
|
5145
|
+
try {
|
|
5146
|
+
phonemes = await phonemize(text, language);
|
|
5147
|
+
} catch (phonErr) {
|
|
5148
|
+
logger17.error("Phonemizer failed (possible OOM)", {
|
|
5149
|
+
code: ErrorCodes.TTS_PHONEMIZER_OOM,
|
|
5150
|
+
error: String(phonErr),
|
|
5151
|
+
textLength: text.length
|
|
5152
|
+
});
|
|
5153
|
+
resolve({ audio: new Float32Array(0), duration: 0, inferenceTimeMs: 0 });
|
|
5154
|
+
return;
|
|
5155
|
+
}
|
|
5037
5156
|
logger17.trace("Phonemized", { text: text.substring(0, 50), phonemes: phonemes.substring(0, 50) });
|
|
5038
5157
|
const tokens = tokenize(phonemes);
|
|
5039
5158
|
logger17.trace("Tokenized", { numTokens: tokens.length });
|
|
5040
5159
|
const voiceData = await this.ensureVoice(voiceName);
|
|
5041
5160
|
const style = getStyleForTokenCount(voiceData, tokens.length);
|
|
5042
5161
|
const audio = await this.runInference(tokens, style, speed);
|
|
5043
|
-
const inferenceTimeMs =
|
|
5162
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
5044
5163
|
const duration = audio.length / SAMPLE_RATE;
|
|
5045
5164
|
logger17.trace("Synthesis complete", {
|
|
5046
5165
|
duration: `${duration.toFixed(2)}s`,
|
|
@@ -5159,11 +5278,11 @@ var KokoroTTSUnifiedAdapter = class {
|
|
|
5159
5278
|
"model.url": this.modelUrl
|
|
5160
5279
|
});
|
|
5161
5280
|
try {
|
|
5162
|
-
const startTime =
|
|
5281
|
+
const startTime = getClock().now();
|
|
5163
5282
|
await this.worker.loadKokoro({ modelUrl: this.modelUrl });
|
|
5164
5283
|
this._isLoaded = true;
|
|
5165
5284
|
this.loadedGeneration = this.worker.workerGeneration;
|
|
5166
|
-
const loadTimeMs =
|
|
5285
|
+
const loadTimeMs = getClock().now() - startTime;
|
|
5167
5286
|
logger18.info("Kokoro TTS loaded via unified worker", {
|
|
5168
5287
|
backend: "wasm",
|
|
5169
5288
|
loadTimeMs: Math.round(loadTimeMs),
|
|
@@ -5238,11 +5357,11 @@ var KokoroTTSUnifiedAdapter = class {
|
|
|
5238
5357
|
runWorkerInference(tokens, style, speed) {
|
|
5239
5358
|
return new Promise((resolve, reject) => {
|
|
5240
5359
|
this.inferenceQueue = this.inferenceQueue.then(async () => {
|
|
5241
|
-
const startTime =
|
|
5360
|
+
const startTime = getClock().now();
|
|
5242
5361
|
const telemetry = getTelemetry();
|
|
5243
5362
|
try {
|
|
5244
5363
|
const result = await this.worker.inferKokoro(tokens, style, speed);
|
|
5245
|
-
const latencyMs =
|
|
5364
|
+
const latencyMs = getClock().now() - startTime;
|
|
5246
5365
|
telemetry?.recordHistogram("omote.inference.latency", latencyMs, {
|
|
5247
5366
|
model: "kokoro-tts-unified",
|
|
5248
5367
|
backend: "wasm"
|
|
@@ -5357,11 +5476,11 @@ var SileroVADUnifiedAdapter = class {
|
|
|
5357
5476
|
return new Promise((resolve, reject) => {
|
|
5358
5477
|
this.inferenceQueue = this.inferenceQueue.then(async () => {
|
|
5359
5478
|
try {
|
|
5360
|
-
const startTime =
|
|
5479
|
+
const startTime = getClock().now();
|
|
5361
5480
|
const result = await this.worker.processVAD(audioChunkCopy, this.state, this.context);
|
|
5362
5481
|
this.state = result.state;
|
|
5363
5482
|
this.context = audioChunkCopy.slice(-this.contextSize);
|
|
5364
|
-
const inferenceTimeMs =
|
|
5483
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
5365
5484
|
const isSpeech = result.probability > this.config.threshold;
|
|
5366
5485
|
let preSpeechChunks;
|
|
5367
5486
|
if (isSpeech && !this.wasSpeaking) {
|
|
@@ -5419,17 +5538,20 @@ var SileroVADUnifiedAdapter = class {
|
|
|
5419
5538
|
var logger20 = createLogger("createA2E");
|
|
5420
5539
|
function createA2E(config = {}) {
|
|
5421
5540
|
const modelUrl = config.modelUrl ?? DEFAULT_MODEL_URLS.lam;
|
|
5541
|
+
const platformInfo = {
|
|
5542
|
+
modelUrl,
|
|
5543
|
+
isIOS: isIOS(),
|
|
5544
|
+
webgpu: typeof navigator !== "undefined" && "gpu" in navigator
|
|
5545
|
+
};
|
|
5422
5546
|
if (config.unifiedWorker) {
|
|
5423
|
-
logger20.info("Creating A2EUnifiedAdapter (via unified worker)",
|
|
5424
|
-
modelUrl
|
|
5425
|
-
});
|
|
5547
|
+
logger20.info("Creating A2EUnifiedAdapter (via unified worker)", platformInfo);
|
|
5426
5548
|
return new A2EUnifiedAdapter(config.unifiedWorker, {
|
|
5427
5549
|
modelUrl,
|
|
5428
5550
|
externalDataUrl: config.externalDataUrl,
|
|
5429
5551
|
numIdentityClasses: config.numIdentityClasses
|
|
5430
5552
|
});
|
|
5431
5553
|
}
|
|
5432
|
-
logger20.info("Creating A2EInference",
|
|
5554
|
+
logger20.info("Creating A2EInference", platformInfo);
|
|
5433
5555
|
return new A2EInference({
|
|
5434
5556
|
modelUrl,
|
|
5435
5557
|
externalDataUrl: config.externalDataUrl,
|
|
@@ -5805,16 +5927,28 @@ async function loadOrt(wasmPaths, isIOSDevice) {
|
|
|
5805
5927
|
// ort.webgpu.min.js crashes WebKit's JIT compiler.
|
|
5806
5928
|
var isSafariWorker = typeof navigator !== 'undefined' && /safari/i.test(navigator.userAgent) && !/chrome|crios|fxios|chromium|edg/i.test(navigator.userAgent);
|
|
5807
5929
|
var hasWebGPU = false;
|
|
5808
|
-
|
|
5930
|
+
var webgpuReason = '';
|
|
5931
|
+
if (isIOSDevice) {
|
|
5932
|
+
webgpuReason = 'iOS device';
|
|
5933
|
+
} else if (isSafariWorker) {
|
|
5934
|
+
webgpuReason = 'Safari (JSEP/ASYNCIFY crash)';
|
|
5935
|
+
} else if (typeof navigator === 'undefined' || !navigator.gpu) {
|
|
5936
|
+
webgpuReason = 'navigator.gpu unavailable';
|
|
5937
|
+
} else {
|
|
5809
5938
|
try {
|
|
5810
5939
|
var adapter = await navigator.gpu.requestAdapter();
|
|
5811
5940
|
if (adapter) {
|
|
5812
5941
|
hasWebGPU = true;
|
|
5942
|
+
} else {
|
|
5943
|
+
webgpuReason = 'requestAdapter returned null';
|
|
5813
5944
|
}
|
|
5814
5945
|
} catch (e) {
|
|
5815
|
-
|
|
5946
|
+
webgpuReason = 'requestAdapter failed: ' + String(e);
|
|
5816
5947
|
}
|
|
5817
5948
|
}
|
|
5949
|
+
if (!hasWebGPU && webgpuReason) {
|
|
5950
|
+
console.warn('[UnifiedWorker] WebGPU unavailable: ' + webgpuReason + ', falling back to WASM');
|
|
5951
|
+
}
|
|
5818
5952
|
|
|
5819
5953
|
var ortUrl;
|
|
5820
5954
|
if (hasWebGPU) {
|
|
@@ -6299,7 +6433,12 @@ var UnifiedInferenceWorker = class {
|
|
|
6299
6433
|
span?.setAttributes({ "worker.init_time_ms": loadTimeMs, "worker.backend": this._workerBackend });
|
|
6300
6434
|
span?.end();
|
|
6301
6435
|
} catch (error) {
|
|
6302
|
-
|
|
6436
|
+
const err = error instanceof Error ? error : new Error(String(error));
|
|
6437
|
+
const isTimeout = err.message.includes("timed out");
|
|
6438
|
+
if (isTimeout) {
|
|
6439
|
+
logger21.error("Worker init timed out", { code: "OMOTE_INF_003", timeoutMs: INIT_TIMEOUT_MS });
|
|
6440
|
+
}
|
|
6441
|
+
span?.endWithError(err);
|
|
6303
6442
|
this.cleanup();
|
|
6304
6443
|
throw error;
|
|
6305
6444
|
}
|
|
@@ -6683,7 +6822,7 @@ var TTSSpeaker = class {
|
|
|
6683
6822
|
async connect(tts, config) {
|
|
6684
6823
|
logger22.info("Connecting TTS...");
|
|
6685
6824
|
const span = getTelemetry()?.startSpan("TTSSpeaker.connect");
|
|
6686
|
-
const connectStart =
|
|
6825
|
+
const connectStart = getClock().now();
|
|
6687
6826
|
this.tts = tts;
|
|
6688
6827
|
if (!tts.isLoaded) {
|
|
6689
6828
|
await tts.load();
|
|
@@ -6692,7 +6831,7 @@ var TTSSpeaker = class {
|
|
|
6692
6831
|
if (!hasLam) {
|
|
6693
6832
|
this._audioOnly = true;
|
|
6694
6833
|
this.scheduler = new AudioScheduler({ sampleRate: tts.sampleRate });
|
|
6695
|
-
getTelemetry()?.recordHistogram(MetricNames.TTS_CONNECT_LATENCY,
|
|
6834
|
+
getTelemetry()?.recordHistogram(MetricNames.TTS_CONNECT_LATENCY, getClock().now() - connectStart);
|
|
6696
6835
|
span?.end();
|
|
6697
6836
|
logger22.info("TTS connected (audio-only mode)");
|
|
6698
6837
|
return;
|
|
@@ -6726,7 +6865,7 @@ var TTSSpeaker = class {
|
|
|
6726
6865
|
neutralTransitionMs: config?.neutralTransitionMs
|
|
6727
6866
|
});
|
|
6728
6867
|
await this.ttsPlayback.initialize();
|
|
6729
|
-
getTelemetry()?.recordHistogram(MetricNames.TTS_CONNECT_LATENCY,
|
|
6868
|
+
getTelemetry()?.recordHistogram(MetricNames.TTS_CONNECT_LATENCY, getClock().now() - connectStart);
|
|
6730
6869
|
span?.end();
|
|
6731
6870
|
logger22.info("TTS connected (lip sync mode)");
|
|
6732
6871
|
}
|
|
@@ -6761,7 +6900,7 @@ var TTSSpeaker = class {
|
|
|
6761
6900
|
const span = getTelemetry()?.startSpan("TTSSpeaker.speak", {
|
|
6762
6901
|
"text.length": text.length
|
|
6763
6902
|
});
|
|
6764
|
-
const speakStart =
|
|
6903
|
+
const speakStart = getClock().now();
|
|
6765
6904
|
try {
|
|
6766
6905
|
if (this._audioOnly) {
|
|
6767
6906
|
await this.speakAudioOnly(text, abort, options?.voice);
|
|
@@ -6771,7 +6910,7 @@ var TTSSpeaker = class {
|
|
|
6771
6910
|
voice: options?.voice
|
|
6772
6911
|
});
|
|
6773
6912
|
}
|
|
6774
|
-
getTelemetry()?.recordHistogram(MetricNames.TTS_SPEAK_LATENCY,
|
|
6913
|
+
getTelemetry()?.recordHistogram(MetricNames.TTS_SPEAK_LATENCY, getClock().now() - speakStart);
|
|
6775
6914
|
span?.end();
|
|
6776
6915
|
} catch (err) {
|
|
6777
6916
|
span?.endWithError(err instanceof Error ? err : new Error(String(err)));
|
|
@@ -6901,42 +7040,42 @@ var TTSSpeaker = class {
|
|
|
6901
7040
|
end: async () => {
|
|
6902
7041
|
if (ended) return;
|
|
6903
7042
|
ended = true;
|
|
6904
|
-
|
|
6905
|
-
|
|
6906
|
-
if (this.currentAbort === abort) this.currentAbort = null;
|
|
6907
|
-
return;
|
|
6908
|
-
}
|
|
6909
|
-
if (buffer.trim()) {
|
|
6910
|
-
enqueueSentence(buffer.trim());
|
|
6911
|
-
buffer = "";
|
|
6912
|
-
}
|
|
6913
|
-
await processChain;
|
|
6914
|
-
if (abort.signal.aborted) {
|
|
6915
|
-
this._isSpeaking = false;
|
|
6916
|
-
if (this.currentAbort === abort) this.currentAbort = null;
|
|
6917
|
-
return;
|
|
6918
|
-
}
|
|
6919
|
-
await pipeline.end();
|
|
6920
|
-
await new Promise((resolve) => {
|
|
6921
|
-
let resolved = false;
|
|
6922
|
-
const done = () => {
|
|
6923
|
-
if (resolved) return;
|
|
6924
|
-
resolved = true;
|
|
6925
|
-
unsubC();
|
|
6926
|
-
unsubS();
|
|
6927
|
-
abort.signal.removeEventListener("abort", done);
|
|
6928
|
-
resolve();
|
|
6929
|
-
};
|
|
7043
|
+
const unsubs = [];
|
|
7044
|
+
try {
|
|
6930
7045
|
if (abort.signal.aborted) {
|
|
6931
|
-
resolve();
|
|
6932
7046
|
return;
|
|
6933
7047
|
}
|
|
6934
|
-
|
|
6935
|
-
|
|
6936
|
-
|
|
6937
|
-
|
|
6938
|
-
|
|
6939
|
-
|
|
7048
|
+
if (buffer.trim()) {
|
|
7049
|
+
enqueueSentence(buffer.trim());
|
|
7050
|
+
buffer = "";
|
|
7051
|
+
}
|
|
7052
|
+
await processChain;
|
|
7053
|
+
if (abort.signal.aborted) {
|
|
7054
|
+
return;
|
|
7055
|
+
}
|
|
7056
|
+
await pipeline.end();
|
|
7057
|
+
await new Promise((resolve) => {
|
|
7058
|
+
let resolved = false;
|
|
7059
|
+
const done = () => {
|
|
7060
|
+
if (resolved) return;
|
|
7061
|
+
resolved = true;
|
|
7062
|
+
resolve();
|
|
7063
|
+
};
|
|
7064
|
+
if (abort.signal.aborted) {
|
|
7065
|
+
resolve();
|
|
7066
|
+
return;
|
|
7067
|
+
}
|
|
7068
|
+
unsubs.push(pipeline.on("playback:complete", done));
|
|
7069
|
+
unsubs.push(pipeline.on("playback:stop", done));
|
|
7070
|
+
const onAbort = () => done();
|
|
7071
|
+
abort.signal.addEventListener("abort", onAbort);
|
|
7072
|
+
unsubs.push(() => abort.signal.removeEventListener("abort", onAbort));
|
|
7073
|
+
});
|
|
7074
|
+
} finally {
|
|
7075
|
+
unsubs.forEach((fn) => fn());
|
|
7076
|
+
this._isSpeaking = false;
|
|
7077
|
+
if (this.currentAbort === abort) this.currentAbort = null;
|
|
7078
|
+
}
|
|
6940
7079
|
}
|
|
6941
7080
|
};
|
|
6942
7081
|
}
|
|
@@ -7627,14 +7766,14 @@ function createKokoroTTS(config = {}) {
|
|
|
7627
7766
|
logger24.info("iOS + unified worker: creating KokoroTTSUnifiedAdapter (off-main-thread ONNX)");
|
|
7628
7767
|
return new KokoroTTSUnifiedAdapter(config.unifiedWorker, config);
|
|
7629
7768
|
}
|
|
7630
|
-
logger24.info("iOS
|
|
7769
|
+
logger24.info("iOS: creating KokoroTTSInference (main thread, shared ORT)");
|
|
7631
7770
|
return new KokoroTTSInference(config);
|
|
7632
7771
|
}
|
|
7633
7772
|
if (!KokoroTTSWorker.isSupported()) {
|
|
7634
7773
|
logger24.info("Worker not supported: creating KokoroTTSInference (main thread)");
|
|
7635
7774
|
return new KokoroTTSInference(config);
|
|
7636
7775
|
}
|
|
7637
|
-
logger24.info("Auto
|
|
7776
|
+
logger24.info("Auto: creating KokoroTTSWorker (off-main-thread)");
|
|
7638
7777
|
return new KokoroTTSWorker(config);
|
|
7639
7778
|
}
|
|
7640
7779
|
|
|
@@ -7868,6 +8007,9 @@ var _SenseVoiceInference = class _SenseVoiceInference {
|
|
|
7868
8007
|
// so all future transcribe() calls reject immediately to prevent concurrent access.
|
|
7869
8008
|
this.poisoned = false;
|
|
7870
8009
|
// 10s for SenseVoice (heavier preprocessing)
|
|
8010
|
+
// WebGPU shape change tracking (for dynamic shape warning)
|
|
8011
|
+
this.lastLfrFrames = 0;
|
|
8012
|
+
this.webgpuShapeWarned = false;
|
|
7871
8013
|
// Preprocessing state (loaded once)
|
|
7872
8014
|
this.tokenMap = null;
|
|
7873
8015
|
this.negMean = null;
|
|
@@ -7902,7 +8044,7 @@ var _SenseVoiceInference = class _SenseVoiceInference {
|
|
|
7902
8044
|
throw new Error("Model already loaded. Call dispose() first.");
|
|
7903
8045
|
}
|
|
7904
8046
|
this.isLoading = true;
|
|
7905
|
-
const startTime =
|
|
8047
|
+
const startTime = getClock().now();
|
|
7906
8048
|
const telemetry = getTelemetry();
|
|
7907
8049
|
const span = telemetry?.startSpan("SenseVoice.load", {
|
|
7908
8050
|
"model.url": this.config.modelUrl,
|
|
@@ -7969,7 +8111,7 @@ var _SenseVoiceInference = class _SenseVoiceInference {
|
|
|
7969
8111
|
} catch (cmvnErr) {
|
|
7970
8112
|
logger25.warn("Failed to read CMVN from model metadata", { error: cmvnErr });
|
|
7971
8113
|
}
|
|
7972
|
-
const loadTimeMs =
|
|
8114
|
+
const loadTimeMs = getClock().now() - startTime;
|
|
7973
8115
|
logger25.info("SenseVoice model loaded", {
|
|
7974
8116
|
backend: this._backend,
|
|
7975
8117
|
loadTimeMs: Math.round(loadTimeMs),
|
|
@@ -8034,24 +8176,35 @@ var _SenseVoiceInference = class _SenseVoiceInference {
|
|
|
8034
8176
|
"inference.input_samples": audio.length
|
|
8035
8177
|
});
|
|
8036
8178
|
try {
|
|
8037
|
-
const startTime =
|
|
8038
|
-
const preprocessStart =
|
|
8179
|
+
const startTime = getClock().now();
|
|
8180
|
+
const preprocessStart = getClock().now();
|
|
8039
8181
|
const fbank = computeKaldiFbank(audio, 16e3, 80);
|
|
8040
8182
|
const numFrames = fbank.length / 80;
|
|
8041
8183
|
if (numFrames === 0) {
|
|
8042
8184
|
resolve({
|
|
8043
8185
|
text: "",
|
|
8044
|
-
inferenceTimeMs:
|
|
8045
|
-
preprocessTimeMs:
|
|
8186
|
+
inferenceTimeMs: getClock().now() - startTime,
|
|
8187
|
+
preprocessTimeMs: getClock().now() - preprocessStart
|
|
8046
8188
|
});
|
|
8047
8189
|
return;
|
|
8048
8190
|
}
|
|
8049
8191
|
const lfrFeatures = applyLFR(fbank, 80, 7, 6);
|
|
8050
8192
|
const numLfrFrames = lfrFeatures.length / 560;
|
|
8193
|
+
if (this._backend === "webgpu" && this.lastLfrFrames !== 0 && numLfrFrames !== this.lastLfrFrames) {
|
|
8194
|
+
if (!this.webgpuShapeWarned) {
|
|
8195
|
+
this.webgpuShapeWarned = true;
|
|
8196
|
+
logger25.warn("SenseVoice running on WebGPU with variable audio shapes \u2014 risk of kernel crash", {
|
|
8197
|
+
code: ErrorCodes.INF_SHAPE_MISMATCH,
|
|
8198
|
+
previousFrames: this.lastLfrFrames,
|
|
8199
|
+
currentFrames: numLfrFrames
|
|
8200
|
+
});
|
|
8201
|
+
}
|
|
8202
|
+
}
|
|
8203
|
+
this.lastLfrFrames = numLfrFrames;
|
|
8051
8204
|
if (this.negMean && this.invStddev) {
|
|
8052
8205
|
applyCMVN(lfrFeatures, 560, this.negMean, this.invStddev);
|
|
8053
8206
|
}
|
|
8054
|
-
const preprocessTimeMs =
|
|
8207
|
+
const preprocessTimeMs = getClock().now() - preprocessStart;
|
|
8055
8208
|
const ort = this.ort;
|
|
8056
8209
|
const feeds = {
|
|
8057
8210
|
x: new ort.Tensor("float32", lfrFeatures, [1, numLfrFrames, 560]),
|
|
@@ -8081,7 +8234,7 @@ var _SenseVoiceInference = class _SenseVoiceInference {
|
|
|
8081
8234
|
const seqLen = logitsDims[1];
|
|
8082
8235
|
const vocabSize = logitsDims[2];
|
|
8083
8236
|
const decoded = ctcGreedyDecode(logitsData, seqLen, vocabSize, this.tokenMap);
|
|
8084
|
-
const inferenceTimeMs =
|
|
8237
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
8085
8238
|
logger25.trace("Transcription complete", {
|
|
8086
8239
|
text: decoded.text.substring(0, 50),
|
|
8087
8240
|
language: decoded.language,
|
|
@@ -9420,7 +9573,7 @@ var SileroVADInference = class {
|
|
|
9420
9573
|
throw new Error("Model already loaded. Call dispose() first.");
|
|
9421
9574
|
}
|
|
9422
9575
|
this.isLoading = true;
|
|
9423
|
-
const startTime =
|
|
9576
|
+
const startTime = getClock().now();
|
|
9424
9577
|
const telemetry = getTelemetry();
|
|
9425
9578
|
const span = telemetry?.startSpan("SileroVAD.load", {
|
|
9426
9579
|
"model.url": this.config.modelUrl,
|
|
@@ -9452,7 +9605,7 @@ var SileroVADInference = class {
|
|
|
9452
9605
|
const modelData = new Uint8Array(modelBuffer);
|
|
9453
9606
|
this.session = await ort.InferenceSession.create(modelData, sessionOptions);
|
|
9454
9607
|
this.reset();
|
|
9455
|
-
const loadTimeMs =
|
|
9608
|
+
const loadTimeMs = getClock().now() - startTime;
|
|
9456
9609
|
logger28.info("Model loaded successfully", {
|
|
9457
9610
|
backend: this._backend,
|
|
9458
9611
|
loadTimeMs: Math.round(loadTimeMs),
|
|
@@ -9632,7 +9785,7 @@ var SileroVADInference = class {
|
|
|
9632
9785
|
"inference.chunk_size": this.chunkSize
|
|
9633
9786
|
});
|
|
9634
9787
|
try {
|
|
9635
|
-
const startTime =
|
|
9788
|
+
const startTime = getClock().now();
|
|
9636
9789
|
const inputSize = this.contextSize + this.chunkSize;
|
|
9637
9790
|
const inputBuffer = new Float32Array(inputSize);
|
|
9638
9791
|
inputBuffer.set(this.context, 0);
|
|
@@ -9662,7 +9815,7 @@ var SileroVADInference = class {
|
|
|
9662
9815
|
);
|
|
9663
9816
|
}
|
|
9664
9817
|
this.context = audioChunkCopy.slice(-this.contextSize);
|
|
9665
|
-
const inferenceTimeMs =
|
|
9818
|
+
const inferenceTimeMs = getClock().now() - startTime;
|
|
9666
9819
|
const isSpeech = probability > this.config.threshold;
|
|
9667
9820
|
let preSpeechChunks;
|
|
9668
9821
|
if (isSpeech && !this.wasSpeaking) {
|
|
@@ -10477,6 +10630,7 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10477
10630
|
this.lastProgressiveSamples = 0;
|
|
10478
10631
|
// ASR error recovery
|
|
10479
10632
|
this.asrErrorCount = 0;
|
|
10633
|
+
this.progressiveErrorCount = 0;
|
|
10480
10634
|
this.config = config ?? {};
|
|
10481
10635
|
}
|
|
10482
10636
|
/** Current listener state */
|
|
@@ -10669,7 +10823,7 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10669
10823
|
if (result.isSpeech) {
|
|
10670
10824
|
if (!wasSpeaking) {
|
|
10671
10825
|
this.isSpeechActive = true;
|
|
10672
|
-
this.speechStartTime =
|
|
10826
|
+
this.speechStartTime = getClock().now();
|
|
10673
10827
|
this.audioBuffer = [];
|
|
10674
10828
|
this.audioBufferSamples = 0;
|
|
10675
10829
|
this.lastProgressiveResult = null;
|
|
@@ -10708,13 +10862,13 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10708
10862
|
const extended = this.config.silenceTimeoutExtendedMs ?? 700;
|
|
10709
10863
|
const adaptive = this.config.adaptiveTimeout ?? true;
|
|
10710
10864
|
if (!adaptive) return base;
|
|
10711
|
-
const speechDurationMs =
|
|
10865
|
+
const speechDurationMs = getClock().now() - this.speechStartTime;
|
|
10712
10866
|
return speechDurationMs > 3e3 ? extended : base;
|
|
10713
10867
|
}
|
|
10714
10868
|
onSilenceDetected() {
|
|
10715
10869
|
const capturedEpoch = this.epoch;
|
|
10716
10870
|
this.isSpeechActive = false;
|
|
10717
|
-
const durationMs =
|
|
10871
|
+
const durationMs = getClock().now() - this.speechStartTime;
|
|
10718
10872
|
logger31.debug("Speech end", { durationMs: Math.round(durationMs) });
|
|
10719
10873
|
this.emit("speech:end", { durationMs });
|
|
10720
10874
|
this.clearSilenceTimer();
|
|
@@ -10811,7 +10965,15 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10811
10965
|
this.lastProgressiveSamples = snapshotSamples;
|
|
10812
10966
|
this.emit("transcript", { ...result, isFinal: false });
|
|
10813
10967
|
}
|
|
10814
|
-
} catch {
|
|
10968
|
+
} catch (err) {
|
|
10969
|
+
this.progressiveErrorCount = (this.progressiveErrorCount ?? 0) + 1;
|
|
10970
|
+
if (this.progressiveErrorCount % 10 === 1) {
|
|
10971
|
+
logger31.warn("Progressive transcription error", {
|
|
10972
|
+
code: ErrorCodes.SPH_ASR_ERROR,
|
|
10973
|
+
error: String(err),
|
|
10974
|
+
count: this.progressiveErrorCount
|
|
10975
|
+
});
|
|
10976
|
+
}
|
|
10815
10977
|
}
|
|
10816
10978
|
})();
|
|
10817
10979
|
}, intervalMs);
|
|
@@ -10828,7 +10990,7 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10828
10990
|
async transcribeWithTimeout(audio) {
|
|
10829
10991
|
if (!this.asr) return null;
|
|
10830
10992
|
const timeoutMs = this.config.transcriptionTimeoutMs ?? 1e4;
|
|
10831
|
-
const startTime =
|
|
10993
|
+
const startTime = getClock().now();
|
|
10832
10994
|
const span = getTelemetry()?.startSpan("SpeechListener.transcribe", {
|
|
10833
10995
|
"inference.input_samples": audio.length,
|
|
10834
10996
|
"inference.input_duration_ms": audio.length / 16e3 * 1e3
|
|
@@ -10842,7 +11004,7 @@ var _SpeechListener = class _SpeechListener extends EventEmitter {
|
|
|
10842
11004
|
})
|
|
10843
11005
|
]);
|
|
10844
11006
|
clearTimeout(timeoutId);
|
|
10845
|
-
const latency =
|
|
11007
|
+
const latency = getClock().now() - startTime;
|
|
10846
11008
|
this.asrErrorCount = 0;
|
|
10847
11009
|
getTelemetry()?.recordHistogram(MetricNames.VOICE_TRANSCRIPTION_LATENCY, latency);
|
|
10848
11010
|
getTelemetry()?.incrementCounter(MetricNames.VOICE_TRANSCRIPTIONS);
|
|
@@ -11016,11 +11178,11 @@ var InterruptionHandler = class extends EventEmitter {
|
|
|
11016
11178
|
getState() {
|
|
11017
11179
|
return {
|
|
11018
11180
|
isSpeaking: this.isSpeaking,
|
|
11019
|
-
speechDurationMs: this.isSpeaking ?
|
|
11181
|
+
speechDurationMs: this.isSpeaking ? getClock().now() - this.speechStartTime : 0
|
|
11020
11182
|
};
|
|
11021
11183
|
}
|
|
11022
11184
|
onSpeechDetected(rms) {
|
|
11023
|
-
const now =
|
|
11185
|
+
const now = getClock().now();
|
|
11024
11186
|
this.lastSpeechTime = now;
|
|
11025
11187
|
if (this.silenceTimer) {
|
|
11026
11188
|
clearTimeout(this.silenceTimer);
|
|
@@ -11237,7 +11399,7 @@ var SafariSpeechRecognition = class _SafariSpeechRecognition {
|
|
|
11237
11399
|
this.setupEventHandlers();
|
|
11238
11400
|
this.recognition.start();
|
|
11239
11401
|
this.isListening = true;
|
|
11240
|
-
this.startTime =
|
|
11402
|
+
this.startTime = getClock().now();
|
|
11241
11403
|
this.accumulatedText = "";
|
|
11242
11404
|
logger33.info("Speech recognition started", {
|
|
11243
11405
|
language: this.config.language
|
|
@@ -11338,7 +11500,7 @@ var SafariSpeechRecognition = class _SafariSpeechRecognition {
|
|
|
11338
11500
|
const speechResult = {
|
|
11339
11501
|
text: isFinal ? this.accumulatedText.trim() : text,
|
|
11340
11502
|
language: this.config.language,
|
|
11341
|
-
inferenceTimeMs:
|
|
11503
|
+
inferenceTimeMs: getClock().now() - this.startTime,
|
|
11342
11504
|
isFinal,
|
|
11343
11505
|
confidence: alternative.confidence
|
|
11344
11506
|
};
|
|
@@ -11370,13 +11532,13 @@ var SafariSpeechRecognition = class _SafariSpeechRecognition {
|
|
|
11370
11532
|
this.isListening = false;
|
|
11371
11533
|
logger33.info("Speech recognition ended", {
|
|
11372
11534
|
totalText: this.accumulatedText.length,
|
|
11373
|
-
durationMs:
|
|
11535
|
+
durationMs: getClock().now() - this.startTime
|
|
11374
11536
|
});
|
|
11375
11537
|
if (this.stopResolver) {
|
|
11376
11538
|
const result = {
|
|
11377
11539
|
text: this.accumulatedText.trim(),
|
|
11378
11540
|
language: this.config.language,
|
|
11379
|
-
inferenceTimeMs:
|
|
11541
|
+
inferenceTimeMs: getClock().now() - this.startTime,
|
|
11380
11542
|
isFinal: true
|
|
11381
11543
|
};
|
|
11382
11544
|
this.stopResolver(result);
|
|
@@ -11420,6 +11582,303 @@ var SafariSpeechRecognition = class _SafariSpeechRecognition {
|
|
|
11420
11582
|
}
|
|
11421
11583
|
};
|
|
11422
11584
|
|
|
11585
|
+
// src/inference/ElevenLabsTTSBackend.ts
var logger34 = createLogger("ElevenLabsTTS");
var DEFAULT_MODEL = "eleven_multilingual_v2";
var DEFAULT_OUTPUT_FORMAT = "pcm_16000";
var DEFAULT_STABILITY = 0.5;
var DEFAULT_SIMILARITY_BOOST = 0.75;
var DEFAULT_BASE_URL = "https://api.elevenlabs.io";
// Supported raw-PCM output formats mapped to their sample rates (Hz).
var FORMAT_TO_SAMPLE_RATE = {
  pcm_16000: 16e3,
  pcm_22050: 22050,
  pcm_24000: 24e3,
  pcm_44100: 44100
};
/**
 * Cloud TTS backend backed by the ElevenLabs text-to-speech streaming API.
 *
 * Implements the same backend contract as the local TTS engines:
 * `load()` / `isLoaded` / `sampleRate` / `stream()` / `dispose()`.
 * Audio is requested as raw PCM16 and converted to Float32 chunks.
 */
var ElevenLabsTTSBackend = class {
  /**
   * @param config - requires `apiKey` and `voiceId`; optional `model`,
   *   `outputFormat` (one of FORMAT_TO_SAMPLE_RATE keys), `stability`,
   *   `similarityBoost`, `baseUrl`.
   * @throws Error when apiKey/voiceId are missing or outputFormat is unsupported.
   */
  constructor(config) {
    this._isLoaded = false;
    if (!config.apiKey) throw new Error("ElevenLabsTTS: apiKey is required");
    if (!config.voiceId) throw new Error("ElevenLabsTTS: voiceId is required");
    this.apiKey = config.apiKey;
    this.voiceId = config.voiceId;
    this.model = config.model ?? DEFAULT_MODEL;
    this.outputFormat = config.outputFormat ?? DEFAULT_OUTPUT_FORMAT;
    this.stability = config.stability ?? DEFAULT_STABILITY;
    this.similarityBoost = config.similarityBoost ?? DEFAULT_SIMILARITY_BOOST;
    this.baseUrl = config.baseUrl ?? DEFAULT_BASE_URL;
    const rate = FORMAT_TO_SAMPLE_RATE[this.outputFormat];
    if (!rate) {
      throw new Error(
        `ElevenLabsTTS: unsupported outputFormat "${this.outputFormat}". Supported: ${Object.keys(FORMAT_TO_SAMPLE_RATE).join(", ")}`
      );
    }
    this._sampleRate = rate;
  }
  /** Sample rate (Hz) implied by the configured PCM output format. */
  get sampleRate() {
    return this._sampleRate;
  }
  /** True once load() has been called and dispose() has not. */
  get isLoaded() {
    return this._isLoaded;
  }
  // ─── Load ───────────────────────────────────────────────────────────────
  /**
   * No-op for cloud TTS (no model to load).
   * Marks backend as ready.
   */
  async load() {
    this._isLoaded = true;
    logger34.info("ElevenLabs TTS ready", { voiceId: this.voiceId, model: this.model });
  }
  // ─── Stream ─────────────────────────────────────────────────────────────
  /**
   * Stream audio from ElevenLabs for the given text.
   *
   * Uses the streaming endpoint. Yields a single chunk for non-streaming
   * or multiple chunks as response data arrives.
   *
   * @param text - text to synthesize (must be non-empty after trim)
   * @param options - optional `{ signal }` AbortSignal for cancellation
   * @yields `{ audio: Float32Array, duration: number, text: string }`
   * @throws Error on HTTP failure or empty text; AbortError is swallowed.
   */
  async *stream(text, options) {
    if (!this._isLoaded) {
      throw new Error("ElevenLabsTTS: not loaded. Call load() first.");
    }
    const trimmed = text.trim();
    if (trimmed.length === 0) {
      throw new Error("ElevenLabsTTS: text must not be empty");
    }
    const startTime = getClock().now();
    const telemetry = getTelemetry();
    const span = telemetry?.startSpan("ElevenLabsTTS.stream", {
      "tts.text_length": trimmed.length,
      "tts.voice_id": this.voiceId,
      "tts.model": this.model
    });
    const url = `${this.baseUrl}/v1/text-to-speech/${this.voiceId}?output_format=${this.outputFormat}`;
    try {
      const response = await fetch(url, {
        method: "POST",
        headers: {
          "xi-api-key": this.apiKey,
          "Content-Type": "application/json",
          Accept: "audio/pcm"
        },
        body: JSON.stringify({
          text: trimmed,
          model_id: this.model,
          voice_settings: {
            stability: this.stability,
            similarity_boost: this.similarityBoost
          }
        }),
        signal: options?.signal
      });
      if (!response.ok) {
        const errorText = await response.text().catch(() => "unknown");
        const msg = `ElevenLabsTTS: HTTP ${response.status} \u2014 ${this.getHttpErrorMessage(response.status, errorText)}`;
        logger34.error(msg);
        throw new Error(msg);
      }
      if (!response.body) {
        // Non-streaming environments: buffer the whole response and yield once.
        const buffer = await response.arrayBuffer();
        const audio = pcm16ToFloat32(buffer);
        const duration = audio.length / this._sampleRate;
        const latency2 = getClock().now() - startTime;
        span?.setAttributes({ "tts.duration_s": duration, "tts.latency_ms": latency2 });
        span?.end();
        telemetry?.recordHistogram("omote.inference.latency", latency2, {
          model: "elevenlabs-tts",
          backend: "cloud"
        });
        yield { audio, duration, text: trimmed };
        return;
      }
      const reader = response.body.getReader();
      let totalSamples = 0;
      // PCM16 samples are 2 bytes and network reads can split a sample across
      // chunks. Carry the odd trailing byte into the next chunk instead of
      // dropping it (dropping would lose data AND desync every later sample).
      let carry = null;
      try {
        while (true) {
          if (options?.signal?.aborted) {
            reader.cancel();
            logger34.debug("Stream aborted by signal");
            // FIX: end the span on this manual-abort path too (it was only
            // ended on the fetch AbortError path, leaking the span here).
            span?.end();
            return;
          }
          const { done, value } = await reader.read();
          if (done) break;
          if (value && value.byteLength > 0) {
            let chunk = value;
            if (carry) {
              const merged = new Uint8Array(carry.byteLength + value.byteLength);
              merged.set(carry, 0);
              merged.set(value, carry.byteLength);
              chunk = merged;
              carry = null;
            }
            const usableBytes = chunk.byteLength & ~1;
            if (chunk.byteLength > usableBytes) {
              // Keep the unpaired trailing byte for the next iteration.
              carry = chunk.slice(usableBytes);
            }
            if (usableBytes === 0) continue;
            const audio = pcm16ToFloat32(chunk.buffer.slice(chunk.byteOffset, chunk.byteOffset + usableBytes));
            const duration = audio.length / this._sampleRate;
            totalSamples += audio.length;
            yield { audio, duration, text: trimmed };
          }
        }
      } finally {
        reader.releaseLock();
      }
      const latency = getClock().now() - startTime;
      const totalDuration = totalSamples / this._sampleRate;
      logger34.debug("Stream complete", {
        totalDuration: `${totalDuration.toFixed(2)}s`,
        latencyMs: Math.round(latency),
        totalSamples
      });
      span?.setAttributes({ "tts.duration_s": totalDuration, "tts.latency_ms": latency });
      span?.end();
      telemetry?.recordHistogram("omote.inference.latency", latency, {
        model: "elevenlabs-tts",
        backend: "cloud"
      });
      telemetry?.incrementCounter("omote.inference.total", 1, {
        model: "elevenlabs-tts",
        backend: "cloud",
        status: "success"
      });
    } catch (err) {
      if (err instanceof DOMException && err.name === "AbortError") {
        logger34.debug("Stream aborted");
        span?.end();
        return;
      }
      const errMsg = err instanceof Error ? err.message : String(err);
      logger34.error("Stream failed", { error: errMsg });
      span?.endWithError(err instanceof Error ? err : new Error(String(err)));
      telemetry?.incrementCounter("omote.inference.total", 1, {
        model: "elevenlabs-tts",
        backend: "cloud",
        status: "error"
      });
      throw err;
    }
  }
  // ─── Dispose ────────────────────────────────────────────────────────────
  /** Marks the backend unusable; no network resources to release. */
  async dispose() {
    this._isLoaded = false;
    logger34.info("ElevenLabs TTS disposed");
  }
  // ─── Private ────────────────────────────────────────────────────────────
  /** Maps an HTTP status (and response body) to a human-readable error hint. */
  getHttpErrorMessage(status, body) {
    switch (status) {
      case 401:
        return "Unauthorized \u2014 check your API key";
      case 403:
        return "Forbidden \u2014 API key lacks required permissions";
      case 429:
        return "Rate limited \u2014 too many requests";
      case 400:
        return `Bad request \u2014 ${body}`;
      default:
        return body || `HTTP error ${status}`;
    }
  }
};
|
|
11773
|
+
|
|
11774
|
+
// src/inference/PollyTTSBackend.ts
var logger35 = createLogger("PollyTTS");
var DEFAULT_VOICE = "Joanna";
var DEFAULT_SAMPLE_RATE = 16e3;
/**
 * Cloud TTS backend delegating to a consumer-supplied Amazon Polly
 * synthesize function. Conforms to the shared backend contract:
 * `load()` / `isLoaded` / `sampleRate` / `stream()` / `dispose()`.
 */
var PollyTTSBackend = class {
  /**
   * @param config - requires `synthesizeFn(text, voice, sampleRate)`;
   *   optional `voice`, `sampleRate`, `engine`.
   * @throws Error when synthesizeFn is missing.
   */
  constructor(config) {
    this._isLoaded = false;
    if (!config.synthesizeFn) {
      throw new Error("PollyTTS: synthesizeFn is required");
    }
    const { synthesizeFn, voice, sampleRate, engine } = config;
    this.synthesizeFn = synthesizeFn;
    this.voice = voice ?? DEFAULT_VOICE;
    this._sampleRate = sampleRate ?? DEFAULT_SAMPLE_RATE;
    this.engine = engine ?? "neural";
  }
  /** Configured output sample rate (Hz). */
  get sampleRate() {
    return this._sampleRate;
  }
  /** True once load() has been called and dispose() has not. */
  get isLoaded() {
    return this._isLoaded;
  }
  // ─── Load ───────────────────────────────────────────────────────────────
  /**
   * No-op for cloud TTS (no model to load).
   * Marks backend as ready.
   */
  async load() {
    this._isLoaded = true;
    logger35.info("Polly TTS ready", { voice: this.voice, engine: this.engine, sampleRate: this._sampleRate });
  }
  // ─── Stream ─────────────────────────────────────────────────────────────
  /**
   * Synthesize audio via consumer's Polly function.
   *
   * Polly's SynthesizeSpeech is request/response (not streaming for PCM),
   * so this yields a single chunk per call. For long text, consider splitting
   * into sentences on the consumer side.
   *
   * @param text - text to synthesize (must be non-empty after trim)
   * @param options - optional `{ signal, voice }`
   * @yields one `{ audio: Float32Array, duration: number, text: string }`
   * @throws Error on synthesis failure; aborts return silently.
   */
  async *stream(text, options) {
    if (!this._isLoaded) {
      throw new Error("PollyTTS: not loaded. Call load() first.");
    }
    const normalized = text.trim();
    if (normalized.length === 0) {
      throw new Error("PollyTTS: text must not be empty");
    }
    // Bail out before doing any work if the caller already cancelled.
    if (options?.signal?.aborted) {
      return;
    }
    const voiceName = options?.voice ?? this.voice;
    const startTime = getClock().now();
    const telemetry = getTelemetry();
    const span = telemetry?.startSpan("PollyTTS.stream", {
      "tts.text_length": normalized.length,
      "tts.voice": voiceName,
      "tts.engine": this.engine
    });
    try {
      const synthesis = await this.synthesizeFn(normalized, voiceName, this._sampleRate);
      // The caller may have aborted while the request was in flight;
      // discard the result rather than yielding stale audio.
      if (options?.signal?.aborted) {
        span?.end();
        return;
      }
      const audio = pcm16ToFloat32(synthesis.audio);
      const duration = audio.length / this._sampleRate;
      const latency = getClock().now() - startTime;
      logger35.debug("Synthesis complete", {
        voice: voiceName,
        duration: `${duration.toFixed(2)}s`,
        latencyMs: Math.round(latency),
        numSamples: audio.length
      });
      span?.setAttributes({ "tts.duration_s": duration, "tts.latency_ms": latency });
      span?.end();
      telemetry?.recordHistogram("omote.inference.latency", latency, {
        model: "polly-tts",
        backend: "cloud"
      });
      telemetry?.incrementCounter("omote.inference.total", 1, {
        model: "polly-tts",
        backend: "cloud",
        status: "success"
      });
      yield { audio, duration, text: normalized };
    } catch (err) {
      const aborted = err instanceof DOMException && err.name === "AbortError";
      if (aborted) {
        logger35.debug("Synthesis aborted");
        span?.end();
        return;
      }
      const failure = err instanceof Error ? err : new Error(String(err));
      logger35.error("Synthesis failed", { error: err instanceof Error ? err.message : String(err) });
      span?.endWithError(failure);
      telemetry?.incrementCounter("omote.inference.total", 1, {
        model: "polly-tts",
        backend: "cloud",
        status: "error"
      });
      throw err;
    }
  }
  // ─── Dispose ────────────────────────────────────────────────────────────
  /** Marks the backend unusable; nothing external to release. */
  async dispose() {
    this._isLoaded = false;
    logger35.info("Polly TTS disposed");
  }
};
|
|
11881
|
+
|
|
11423
11882
|
// src/inference/ortConfig.ts
|
|
11424
11883
|
var ortCdnBase = null;
|
|
11425
11884
|
function configureOrtCdn(cdnPath) {
|
|
@@ -11433,7 +11892,7 @@ function getOrtCdnBase() {
|
|
|
11433
11892
|
}
|
|
11434
11893
|
|
|
11435
11894
|
// src/emotion/Emotion.ts
|
|
11436
|
-
var
|
|
11895
|
+
var logger36 = createLogger("EmotionController");
|
|
11437
11896
|
var EMOTION_NAMES = [
|
|
11438
11897
|
"amazement",
|
|
11439
11898
|
"anger",
|
|
@@ -11455,7 +11914,7 @@ function createEmotionVector(weights = {}) {
|
|
|
11455
11914
|
if (idx >= 0) {
|
|
11456
11915
|
vector[idx] = Math.max(0, Math.min(1, value));
|
|
11457
11916
|
} else {
|
|
11458
|
-
|
|
11917
|
+
logger36.warn(`Invalid emotion name in createEmotionVector: "${name}"`);
|
|
11459
11918
|
}
|
|
11460
11919
|
}
|
|
11461
11920
|
return vector;
|
|
@@ -11538,7 +11997,7 @@ var EmotionController = class {
|
|
|
11538
11997
|
this.targetEmotion.set(newEmotion);
|
|
11539
11998
|
this.currentEmotion.set(newEmotion);
|
|
11540
11999
|
this.transitionProgress = 1;
|
|
11541
|
-
|
|
12000
|
+
logger36.debug("set", { weights });
|
|
11542
12001
|
}
|
|
11543
12002
|
/**
|
|
11544
12003
|
* Set emotion from preset immediately
|
|
@@ -11548,7 +12007,7 @@ var EmotionController = class {
|
|
|
11548
12007
|
this.targetEmotion.set(newEmotion);
|
|
11549
12008
|
this.currentEmotion.set(newEmotion);
|
|
11550
12009
|
this.transitionProgress = 1;
|
|
11551
|
-
|
|
12010
|
+
logger36.debug("setPreset", { preset });
|
|
11552
12011
|
}
|
|
11553
12012
|
/**
|
|
11554
12013
|
* Transition to new emotion over time
|
|
@@ -11560,9 +12019,9 @@ var EmotionController = class {
|
|
|
11560
12019
|
this.currentEmotion.set(this.emotion);
|
|
11561
12020
|
this.targetEmotion.set(createEmotionVector(weights));
|
|
11562
12021
|
this.transitionDuration = durationMs;
|
|
11563
|
-
this.transitionStartTime =
|
|
12022
|
+
this.transitionStartTime = getClock().now();
|
|
11564
12023
|
this.transitionProgress = 0;
|
|
11565
|
-
|
|
12024
|
+
logger36.debug("transitionTo", { weights, durationMs });
|
|
11566
12025
|
}
|
|
11567
12026
|
/**
|
|
11568
12027
|
* Transition to preset over time
|
|
@@ -11571,7 +12030,7 @@ var EmotionController = class {
|
|
|
11571
12030
|
this.currentEmotion.set(this.emotion);
|
|
11572
12031
|
this.targetEmotion.set(getEmotionPreset(preset));
|
|
11573
12032
|
this.transitionDuration = durationMs;
|
|
11574
|
-
this.transitionStartTime =
|
|
12033
|
+
this.transitionStartTime = getClock().now();
|
|
11575
12034
|
this.transitionProgress = 0;
|
|
11576
12035
|
}
|
|
11577
12036
|
/**
|
|
@@ -11579,7 +12038,7 @@ var EmotionController = class {
|
|
|
11579
12038
|
*/
|
|
11580
12039
|
update() {
|
|
11581
12040
|
if (this.transitionProgress >= 1) return;
|
|
11582
|
-
const elapsed =
|
|
12041
|
+
const elapsed = getClock().now() - this.transitionStartTime;
|
|
11583
12042
|
this.transitionProgress = Math.min(1, elapsed / this.transitionDuration);
|
|
11584
12043
|
}
|
|
11585
12044
|
/**
|
|
@@ -11595,7 +12054,7 @@ var EmotionController = class {
|
|
|
11595
12054
|
this.currentEmotion.fill(0);
|
|
11596
12055
|
this.targetEmotion.fill(0);
|
|
11597
12056
|
this.transitionProgress = 1;
|
|
11598
|
-
|
|
12057
|
+
logger36.debug("reset");
|
|
11599
12058
|
}
|
|
11600
12059
|
};
|
|
11601
12060
|
|
|
@@ -11676,7 +12135,7 @@ var DEFAULT_ANIMATION_CONFIG = {
|
|
|
11676
12135
|
};
|
|
11677
12136
|
|
|
11678
12137
|
// src/animation/AnimationGraph.ts
|
|
11679
|
-
var
|
|
12138
|
+
var logger37 = createLogger("AnimationGraph");
|
|
11680
12139
|
var AnimationGraph = class extends EventEmitter {
|
|
11681
12140
|
constructor(config = {}) {
|
|
11682
12141
|
super();
|
|
@@ -11709,7 +12168,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
11709
12168
|
this.stateEnterTime = Date.now();
|
|
11710
12169
|
this.lastUpdateTime = Date.now();
|
|
11711
12170
|
this.cachedOutput = this.computeOutput();
|
|
11712
|
-
|
|
12171
|
+
logger37.info("constructor", {
|
|
11713
12172
|
initialState: this.config.initialState,
|
|
11714
12173
|
stateCount: this.config.states.length,
|
|
11715
12174
|
transitionCount: this.config.transitions.length
|
|
@@ -11780,7 +12239,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
11780
12239
|
setState(stateName, blendDuration = 300) {
|
|
11781
12240
|
const targetState = this.config.states.find((s) => s.name === stateName);
|
|
11782
12241
|
if (!targetState) {
|
|
11783
|
-
|
|
12242
|
+
logger37.warn(`State '${stateName}' not found`);
|
|
11784
12243
|
return;
|
|
11785
12244
|
}
|
|
11786
12245
|
if (targetState.name === this.currentState.name && !this.isTransitioning) {
|
|
@@ -11858,7 +12317,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
11858
12317
|
(s) => s.name === transition.to
|
|
11859
12318
|
);
|
|
11860
12319
|
if (!targetState) {
|
|
11861
|
-
|
|
12320
|
+
logger37.warn(`Target state '${transition.to}' not found`);
|
|
11862
12321
|
return;
|
|
11863
12322
|
}
|
|
11864
12323
|
const fromState = this.currentState.name;
|
|
@@ -11872,7 +12331,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
11872
12331
|
if (!this.currentState.emotionBlendEnabled) {
|
|
11873
12332
|
this.targetEmotionWeight = 0;
|
|
11874
12333
|
}
|
|
11875
|
-
|
|
12334
|
+
logger37.debug("state transition", {
|
|
11876
12335
|
from: fromState,
|
|
11877
12336
|
to: targetState.name,
|
|
11878
12337
|
trigger: event,
|
|
@@ -11909,7 +12368,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
11909
12368
|
if (this.currentState.timeout <= 0) return;
|
|
11910
12369
|
const elapsed = now - this.stateEnterTime;
|
|
11911
12370
|
if (elapsed >= this.currentState.timeout) {
|
|
11912
|
-
|
|
12371
|
+
logger37.debug("timeout transition", {
|
|
11913
12372
|
state: this.currentState.name,
|
|
11914
12373
|
elapsed,
|
|
11915
12374
|
timeout: this.currentState.timeout
|
|
@@ -12023,7 +12482,7 @@ var AnimationGraph = class extends EventEmitter {
|
|
|
12023
12482
|
|
|
12024
12483
|
// src/animation/ProceduralLifeLayer.ts
|
|
12025
12484
|
var import_simplex_noise = require("simplex-noise");
|
|
12026
|
-
var
|
|
12485
|
+
var logger38 = createLogger("ProceduralLifeLayer");
|
|
12027
12486
|
var simplex2d = (0, import_simplex_noise.createNoise2D)();
|
|
12028
12487
|
var LIFE_BS_INDEX = /* @__PURE__ */ new Map();
|
|
12029
12488
|
for (let i = 0; i < LAM_BLENDSHAPES.length; i++) {
|
|
@@ -12129,7 +12588,7 @@ var ProceduralLifeLayer = class {
|
|
|
12129
12588
|
}
|
|
12130
12589
|
this.blinkInterval = this.nextBlinkInterval();
|
|
12131
12590
|
this.gazeBreakInterval = randomRange(...this.gazeBreakIntervalRange);
|
|
12132
|
-
|
|
12591
|
+
logger38.debug("constructor", {
|
|
12133
12592
|
blinkIntervalRange: this.blinkIntervalRange,
|
|
12134
12593
|
useLogNormalBlinks: this.useLogNormalBlinks,
|
|
12135
12594
|
gazeBreakIntervalRange: this.gazeBreakIntervalRange,
|
|
@@ -12233,7 +12692,7 @@ var ProceduralLifeLayer = class {
|
|
|
12233
12692
|
* Reset all internal state to initial values.
|
|
12234
12693
|
*/
|
|
12235
12694
|
reset() {
|
|
12236
|
-
|
|
12695
|
+
logger38.debug("reset");
|
|
12237
12696
|
this.blinkTimer = 0;
|
|
12238
12697
|
this.blinkInterval = this.nextBlinkInterval();
|
|
12239
12698
|
this.blinkPhase = PHASE_OPEN;
|
|
@@ -12285,7 +12744,7 @@ var ProceduralLifeLayer = class {
|
|
|
12285
12744
|
this.blinkTimer = 0;
|
|
12286
12745
|
this.blinkInterval = this.nextBlinkInterval();
|
|
12287
12746
|
this.asymmetryRight = 0.95 + Math.random() * 0.08;
|
|
12288
|
-
|
|
12747
|
+
logger38.trace("blink", { nextInterval: this.blinkInterval });
|
|
12289
12748
|
}
|
|
12290
12749
|
if (this.blinkPhase > PHASE_OPEN) {
|
|
12291
12750
|
this.blinkProgress += delta;
|
|
@@ -12366,7 +12825,7 @@ var ProceduralLifeLayer = class {
|
|
|
12366
12825
|
this.gazeBreakTargetX = (Math.random() - 0.5) * 2 * amp;
|
|
12367
12826
|
this.gazeBreakTargetY = (Math.random() - 0.5) * amp * 0.4;
|
|
12368
12827
|
this.gazeBreakInterval = randomRange(...params.interval);
|
|
12369
|
-
|
|
12828
|
+
logger38.trace("gaze break", {
|
|
12370
12829
|
targetX: this.gazeBreakTargetX.toFixed(3),
|
|
12371
12830
|
targetY: this.gazeBreakTargetY.toFixed(3),
|
|
12372
12831
|
nextInterval: this.gazeBreakInterval.toFixed(2),
|
|
@@ -12609,7 +13068,7 @@ var ALL_AUS = [...new Set(
|
|
|
12609
13068
|
)];
|
|
12610
13069
|
|
|
12611
13070
|
// src/face/EmotionResolver.ts
|
|
12612
|
-
var
|
|
13071
|
+
var logger39 = createLogger("EmotionResolver");
|
|
12613
13072
|
var BS_INDEX = /* @__PURE__ */ new Map();
|
|
12614
13073
|
for (let i = 0; i < LAM_BLENDSHAPES.length; i++) {
|
|
12615
13074
|
BS_INDEX.set(LAM_BLENDSHAPES[i], i);
|
|
@@ -12636,7 +13095,7 @@ var EmotionResolver = class {
|
|
|
12636
13095
|
if (!emotionWeight || emotionWeight < 0.01) continue;
|
|
12637
13096
|
const auActivations = EMOTION_TO_AU[emotionName];
|
|
12638
13097
|
if (!auActivations) {
|
|
12639
|
-
|
|
13098
|
+
logger39.warn(`Unknown emotion name with no AU mapping: "${emotionName}"`);
|
|
12640
13099
|
continue;
|
|
12641
13100
|
}
|
|
12642
13101
|
for (const activation of auActivations) {
|
|
@@ -12661,7 +13120,7 @@ var EmotionResolver = class {
|
|
|
12661
13120
|
};
|
|
12662
13121
|
|
|
12663
13122
|
// src/face/FaceCompositor.ts
|
|
12664
|
-
var
|
|
13123
|
+
var logger40 = createLogger("FaceCompositor");
|
|
12665
13124
|
function smoothstep(t) {
|
|
12666
13125
|
return t * t * (3 - 2 * t);
|
|
12667
13126
|
}
|
|
@@ -12692,7 +13151,7 @@ var FaceCompositor = class {
|
|
|
12692
13151
|
if (config?.profile) {
|
|
12693
13152
|
this.applyProfileArrays(config.profile);
|
|
12694
13153
|
}
|
|
12695
|
-
|
|
13154
|
+
logger40.debug("constructor", {
|
|
12696
13155
|
emotionSmoothing: this.emotionSmoothing,
|
|
12697
13156
|
hasProfile: !!config?.profile,
|
|
12698
13157
|
hasLifeLayer: !!config?.lifeLayer
|
|
@@ -12708,7 +13167,7 @@ var FaceCompositor = class {
|
|
|
12708
13167
|
* @returns Blendshapes (Float32Array[52] clamped [0,1]) and head rotation deltas
|
|
12709
13168
|
*/
|
|
12710
13169
|
compose(base, input, target) {
|
|
12711
|
-
const composeStart =
|
|
13170
|
+
const composeStart = getClock().now();
|
|
12712
13171
|
const out = target ?? this.outputBuffer;
|
|
12713
13172
|
out.set(base);
|
|
12714
13173
|
const emotion = input.emotion ?? this.stickyEmotion;
|
|
@@ -12755,7 +13214,7 @@ var FaceCompositor = class {
|
|
|
12755
13214
|
}
|
|
12756
13215
|
getTelemetry()?.recordHistogram(
|
|
12757
13216
|
MetricNames.COMPOSITOR_COMPOSE_LATENCY,
|
|
12758
|
-
(
|
|
13217
|
+
(getClock().now() - composeStart) * 1e3
|
|
12759
13218
|
// µs
|
|
12760
13219
|
);
|
|
12761
13220
|
return { blendshapes: out, headDelta: lifeResult.headDelta };
|
|
@@ -12765,7 +13224,7 @@ var FaceCompositor = class {
|
|
|
12765
13224
|
*/
|
|
12766
13225
|
setEmotion(weights) {
|
|
12767
13226
|
this.stickyEmotion = weights;
|
|
12768
|
-
|
|
13227
|
+
logger40.debug("setEmotion", { weights });
|
|
12769
13228
|
}
|
|
12770
13229
|
/**
|
|
12771
13230
|
* Update character profile at runtime.
|
|
@@ -12774,7 +13233,7 @@ var FaceCompositor = class {
|
|
|
12774
13233
|
this.multiplier.fill(1);
|
|
12775
13234
|
this.offset.fill(0);
|
|
12776
13235
|
this.applyProfileArrays(profile);
|
|
12777
|
-
|
|
13236
|
+
logger40.debug("setProfile", {
|
|
12778
13237
|
multiplierKeys: profile.multiplier ? Object.keys(profile.multiplier).length : 0,
|
|
12779
13238
|
offsetKeys: profile.offset ? Object.keys(profile.offset).length : 0
|
|
12780
13239
|
});
|
|
@@ -12788,7 +13247,7 @@ var FaceCompositor = class {
|
|
|
12788
13247
|
this.lifeBuffer.fill(0);
|
|
12789
13248
|
this.stickyEmotion = void 0;
|
|
12790
13249
|
this.lifeLayer.reset();
|
|
12791
|
-
|
|
13250
|
+
logger40.debug("reset");
|
|
12792
13251
|
}
|
|
12793
13252
|
/** Expand partial profile maps into dense Float32Arrays */
|
|
12794
13253
|
applyProfileArrays(profile) {
|
|
@@ -12873,7 +13332,7 @@ function parseEmotionTags(text) {
|
|
|
12873
13332
|
}
|
|
12874
13333
|
|
|
12875
13334
|
// src/character/CharacterController.ts
|
|
12876
|
-
var
|
|
13335
|
+
var logger41 = createLogger("CharacterController");
|
|
12877
13336
|
var FRAME_BUDGET_US = 33e3;
|
|
12878
13337
|
var EMOTION_MAP = {
|
|
12879
13338
|
// Synced with EmotionPresets (packages/core/src/emotion/Emotion.ts)
|
|
@@ -12943,7 +13402,7 @@ var CharacterController = class {
|
|
|
12943
13402
|
this.gazeYawInfluence = config?.gaze?.yawInfluence ?? 0.4;
|
|
12944
13403
|
this.gazePitchInfluence = config?.gaze?.pitchInfluence ?? 0.3;
|
|
12945
13404
|
this.gazeSmoothing = config?.gaze?.smoothing ?? 5;
|
|
12946
|
-
|
|
13405
|
+
logger41.debug("constructor", {
|
|
12947
13406
|
gazeEnabled: this.gazeEnabled,
|
|
12948
13407
|
gazeYawInfluence: this.gazeYawInfluence,
|
|
12949
13408
|
gazePitchInfluence: this.gazePitchInfluence,
|
|
@@ -12958,7 +13417,7 @@ var CharacterController = class {
|
|
|
12958
13417
|
* into a single output frame.
|
|
12959
13418
|
*/
|
|
12960
13419
|
update(input) {
|
|
12961
|
-
const frameStart =
|
|
13420
|
+
const frameStart = getClock().now();
|
|
12962
13421
|
const base = input.baseBlendshapes ?? this.zeroBase;
|
|
12963
13422
|
const eyeTargets = this.computeEyeTargets(
|
|
12964
13423
|
input.cameraWorldPos,
|
|
@@ -12985,7 +13444,7 @@ var CharacterController = class {
|
|
|
12985
13444
|
lifeHeadDelta,
|
|
12986
13445
|
input.avatarRotationY ?? 0
|
|
12987
13446
|
);
|
|
12988
|
-
const frameUs = (
|
|
13447
|
+
const frameUs = (getClock().now() - frameStart) * 1e3;
|
|
12989
13448
|
this.frameTimes[this.frameTimeIdx] = frameUs;
|
|
12990
13449
|
this.frameTimeIdx = (this.frameTimeIdx + 1) % this.frameTimes.length;
|
|
12991
13450
|
if (this.frameTimeFill < this.frameTimes.length) this.frameTimeFill++;
|
|
@@ -13007,13 +13466,13 @@ var CharacterController = class {
|
|
|
13007
13466
|
const resolved = resolveEmotion(emotion);
|
|
13008
13467
|
if (resolved) {
|
|
13009
13468
|
this._compositor.setEmotion(resolved);
|
|
13010
|
-
|
|
13469
|
+
logger41.debug("setEmotion", { emotion, resolved });
|
|
13011
13470
|
}
|
|
13012
13471
|
}
|
|
13013
13472
|
/** Update character profile at runtime. */
|
|
13014
13473
|
setProfile(profile) {
|
|
13015
13474
|
this._compositor.setProfile(profile);
|
|
13016
|
-
|
|
13475
|
+
logger41.debug("setProfile", {
|
|
13017
13476
|
multiplierKeys: profile.multiplier ? Object.keys(profile.multiplier).length : 0,
|
|
13018
13477
|
offsetKeys: profile.offset ? Object.keys(profile.offset).length : 0
|
|
13019
13478
|
});
|
|
@@ -13048,11 +13507,11 @@ var CharacterController = class {
|
|
|
13048
13507
|
this._compositor.reset();
|
|
13049
13508
|
this.gazeHeadYaw = 0;
|
|
13050
13509
|
this.gazeHeadPitch = -0.1;
|
|
13051
|
-
|
|
13510
|
+
logger41.debug("reset");
|
|
13052
13511
|
}
|
|
13053
13512
|
dispose() {
|
|
13054
13513
|
this.reset();
|
|
13055
|
-
|
|
13514
|
+
logger41.debug("dispose");
|
|
13056
13515
|
}
|
|
13057
13516
|
// ---------------------------------------------------------------------------
|
|
13058
13517
|
// Eye angle math (extracted from r3f useGazeTracking.computeEyeTargets)
|
|
@@ -13134,7 +13593,7 @@ var CharacterController = class {
|
|
|
13134
13593
|
};
|
|
13135
13594
|
|
|
13136
13595
|
// src/orchestration/MicLipSync.ts
|
|
13137
|
-
var
|
|
13596
|
+
var logger42 = createLogger("MicLipSync");
|
|
13138
13597
|
var MicLipSync = class extends EventEmitter {
|
|
13139
13598
|
constructor(config) {
|
|
13140
13599
|
super();
|
|
@@ -13153,7 +13612,7 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13153
13612
|
this.vadChunkSize = 0;
|
|
13154
13613
|
this.vadBuffer = null;
|
|
13155
13614
|
this.vadBufferOffset = 0;
|
|
13156
|
-
|
|
13615
|
+
logger42.info("MicLipSync created", {
|
|
13157
13616
|
sampleRate: config.sampleRate ?? 16e3,
|
|
13158
13617
|
micChunkSize: config.micChunkSize ?? 512,
|
|
13159
13618
|
hasVAD: !!config.vad,
|
|
@@ -13175,12 +13634,12 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13175
13634
|
this._currentFrame = scaled;
|
|
13176
13635
|
if (!this._firstFrameEmitted) {
|
|
13177
13636
|
this._firstFrameEmitted = true;
|
|
13178
|
-
|
|
13637
|
+
logger42.trace("First blendshape frame emitted");
|
|
13179
13638
|
}
|
|
13180
13639
|
this.emit("frame", { blendshapes: scaled, rawBlendshapes: raw });
|
|
13181
13640
|
},
|
|
13182
13641
|
onError: (error) => {
|
|
13183
|
-
|
|
13642
|
+
logger42.error("A2E inference error", { message: error.message });
|
|
13184
13643
|
this.emit("error", error);
|
|
13185
13644
|
}
|
|
13186
13645
|
});
|
|
@@ -13188,7 +13647,9 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13188
13647
|
const float32 = int16ToFloat32(pcm);
|
|
13189
13648
|
this.processor.pushAudio(float32);
|
|
13190
13649
|
if (this.vad) {
|
|
13191
|
-
this.vadQueue = this.vadQueue.then(() => this.processVAD(float32)).catch(() => {
|
|
13650
|
+
this.vadQueue = this.vadQueue.then(() => this.processVAD(float32)).catch((err) => {
|
|
13651
|
+
logger42.warn("VAD processing error", { error: String(err), code: ErrorCodes.SPH_VAD_ERROR });
|
|
13652
|
+
this.emit("error", err instanceof Error ? err : new Error(String(err)));
|
|
13192
13653
|
});
|
|
13193
13654
|
}
|
|
13194
13655
|
});
|
|
@@ -13223,7 +13684,7 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13223
13684
|
/** Start microphone capture and inference loop */
|
|
13224
13685
|
async start() {
|
|
13225
13686
|
if (this._state === "active") return;
|
|
13226
|
-
|
|
13687
|
+
logger42.info("Starting MicLipSync");
|
|
13227
13688
|
getTelemetry()?.incrementCounter(MetricNames.MIC_SESSIONS);
|
|
13228
13689
|
await this.mic.start();
|
|
13229
13690
|
this.processor.startDrip();
|
|
@@ -13233,7 +13694,7 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13233
13694
|
/** Stop microphone and inference */
|
|
13234
13695
|
stop() {
|
|
13235
13696
|
if (this._state === "idle") return;
|
|
13236
|
-
|
|
13697
|
+
logger42.info("Stopping MicLipSync");
|
|
13237
13698
|
this.processor.stopDrip();
|
|
13238
13699
|
this.mic.stop();
|
|
13239
13700
|
this._isSpeaking = false;
|
|
@@ -13275,14 +13736,15 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13275
13736
|
const wasSpeaking = this._isSpeaking;
|
|
13276
13737
|
this._isSpeaking = result.isSpeech;
|
|
13277
13738
|
if (!wasSpeaking && result.isSpeech) {
|
|
13278
|
-
this.speechStartTime =
|
|
13739
|
+
this.speechStartTime = getClock().now();
|
|
13279
13740
|
this.emit("speech:start");
|
|
13280
13741
|
} else if (wasSpeaking && !result.isSpeech) {
|
|
13281
|
-
const durationMs =
|
|
13742
|
+
const durationMs = getClock().now() - this.speechStartTime;
|
|
13282
13743
|
this.emit("speech:end", { durationMs });
|
|
13283
13744
|
}
|
|
13284
13745
|
} catch (err) {
|
|
13285
|
-
|
|
13746
|
+
logger42.warn("VAD process error", { error: String(err), code: ErrorCodes.SPH_VAD_ERROR });
|
|
13747
|
+
this.emit("error", err instanceof Error ? err : new Error(String(err)));
|
|
13286
13748
|
}
|
|
13287
13749
|
this.vadBufferOffset = 0;
|
|
13288
13750
|
}
|
|
@@ -13299,7 +13761,7 @@ var MicLipSync = class extends EventEmitter {
|
|
|
13299
13761
|
};
|
|
13300
13762
|
|
|
13301
13763
|
// src/orchestration/VoicePipeline.ts
|
|
13302
|
-
var
|
|
13764
|
+
var logger43 = createLogger("VoicePipeline");
|
|
13303
13765
|
var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
13304
13766
|
constructor(config) {
|
|
13305
13767
|
super();
|
|
@@ -13331,6 +13793,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13331
13793
|
this.lastProgressiveSamples = 0;
|
|
13332
13794
|
// ASR error recovery
|
|
13333
13795
|
this.asrErrorCount = 0;
|
|
13796
|
+
this.progressiveErrorCount = 0;
|
|
13334
13797
|
// Response abort
|
|
13335
13798
|
this.responseAbortController = null;
|
|
13336
13799
|
// Listener cleanup
|
|
@@ -13374,7 +13837,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13374
13837
|
if (typeof requestAnimationFrame !== "undefined") {
|
|
13375
13838
|
await new Promise((r) => requestAnimationFrame(() => r()));
|
|
13376
13839
|
}
|
|
13377
|
-
|
|
13840
|
+
logger43.debug("Creating PlaybackPipeline", {
|
|
13378
13841
|
neutralTransitionEnabled: this.config.neutralTransitionEnabled ?? true,
|
|
13379
13842
|
audioDelayMs: this.config.audioDelayMs,
|
|
13380
13843
|
chunkTargetMs: this.config.chunkTargetMs
|
|
@@ -13414,8 +13877,9 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13414
13877
|
this.setState("ready");
|
|
13415
13878
|
} catch (error) {
|
|
13416
13879
|
const err = error instanceof Error ? error : new Error(String(error));
|
|
13880
|
+
span?.setAttributes({ "error.type": ErrorTypes.MODEL });
|
|
13417
13881
|
span?.endWithError(err);
|
|
13418
|
-
|
|
13882
|
+
logger43.error("Model loading failed", { message: err.message });
|
|
13419
13883
|
this.emit("error", err);
|
|
13420
13884
|
this.setState("error");
|
|
13421
13885
|
throw err;
|
|
@@ -13429,7 +13893,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13429
13893
|
const { backends } = this.config;
|
|
13430
13894
|
if (!backends) throw new Error("No backends config");
|
|
13431
13895
|
this.emitProgress("Loading models", 0, 1, 0);
|
|
13432
|
-
|
|
13896
|
+
logger43.info("Loading from pre-built backends");
|
|
13433
13897
|
const toLoad = [];
|
|
13434
13898
|
if (!backends.asr.isLoaded) toLoad.push(backends.asr.load());
|
|
13435
13899
|
if (!backends.lam.isLoaded) toLoad.push(backends.lam.load());
|
|
@@ -13463,7 +13927,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13463
13927
|
} else if (UnifiedInferenceWorker.isSupported()) {
|
|
13464
13928
|
this.unifiedWorker = new UnifiedInferenceWorker();
|
|
13465
13929
|
await this.unifiedWorker.init();
|
|
13466
|
-
|
|
13930
|
+
logger43.info("Created internal unified worker", { backend: this.unifiedWorker.backend });
|
|
13467
13931
|
}
|
|
13468
13932
|
}
|
|
13469
13933
|
this.emitProgress("Loading models", 0, 3, 0);
|
|
@@ -13500,17 +13964,17 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13500
13964
|
throw asrResult.reason;
|
|
13501
13965
|
}
|
|
13502
13966
|
this.asr = asr;
|
|
13503
|
-
|
|
13967
|
+
logger43.info("SenseVoice loaded");
|
|
13504
13968
|
if (vadResult.status === "rejected") {
|
|
13505
13969
|
throw vadResult.reason;
|
|
13506
13970
|
}
|
|
13507
13971
|
this.vad = vad;
|
|
13508
|
-
|
|
13972
|
+
logger43.info("Silero VAD loaded");
|
|
13509
13973
|
if (lamResult.status === "rejected") {
|
|
13510
13974
|
throw lamResult.reason;
|
|
13511
13975
|
}
|
|
13512
13976
|
this.lam = lam;
|
|
13513
|
-
|
|
13977
|
+
logger43.info("LAM loaded");
|
|
13514
13978
|
} finally {
|
|
13515
13979
|
clearInterval(progressInterval);
|
|
13516
13980
|
}
|
|
@@ -13518,7 +13982,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13518
13982
|
if (this.isLocalMode) {
|
|
13519
13983
|
const localConfig = this.config;
|
|
13520
13984
|
if (localConfig.ttsConfig && !localConfig.tts) {
|
|
13521
|
-
|
|
13985
|
+
logger43.info("Creating Kokoro TTS from config", {
|
|
13522
13986
|
hasUnifiedWorker: !!this.unifiedWorker,
|
|
13523
13987
|
voice: localConfig.ttsConfig.defaultVoice
|
|
13524
13988
|
});
|
|
@@ -13528,7 +13992,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13528
13992
|
});
|
|
13529
13993
|
}
|
|
13530
13994
|
if (localConfig.tts && !localConfig.ttsConfig && isIOS()) {
|
|
13531
|
-
|
|
13995
|
+
logger43.warn(
|
|
13532
13996
|
"External TTS on iOS creates a separate ORT WASM instance, risking OOM. Prefer ttsConfig for automatic unified worker integration."
|
|
13533
13997
|
);
|
|
13534
13998
|
}
|
|
@@ -13536,9 +14000,9 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13536
14000
|
throw new Error("VoicePipeline local mode requires either tts or ttsConfig");
|
|
13537
14001
|
}
|
|
13538
14002
|
if (!localConfig.tts.isLoaded) {
|
|
13539
|
-
|
|
14003
|
+
logger43.info("Loading local TTS model...");
|
|
13540
14004
|
await localConfig.tts.load();
|
|
13541
|
-
|
|
14005
|
+
logger43.info("Local TTS model loaded");
|
|
13542
14006
|
}
|
|
13543
14007
|
}
|
|
13544
14008
|
this.emitProgress("Loading models", 100, 3, 3);
|
|
@@ -13554,8 +14018,8 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13554
14018
|
this.epoch++;
|
|
13555
14019
|
this._sessionId = crypto.randomUUID();
|
|
13556
14020
|
this.asrErrorCount = 0;
|
|
13557
|
-
|
|
13558
|
-
|
|
14021
|
+
logger43.info("Starting voice pipeline", { sessionId: this._sessionId });
|
|
14022
|
+
logger43.debug("Pipeline mode", { mode: this.isLocalMode ? "local" : "cloud" });
|
|
13559
14023
|
this.mic = new MicrophoneCapture(this.omoteEvents, {
|
|
13560
14024
|
sampleRate: 16e3,
|
|
13561
14025
|
chunkSize: 512
|
|
@@ -13568,11 +14032,11 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13568
14032
|
this.emit("audio:level", level);
|
|
13569
14033
|
});
|
|
13570
14034
|
await this.mic.start();
|
|
13571
|
-
|
|
14035
|
+
logger43.debug("Microphone started");
|
|
13572
14036
|
this.setState("listening");
|
|
13573
14037
|
}
|
|
13574
14038
|
stop() {
|
|
13575
|
-
|
|
14039
|
+
logger43.info("Stopping voice pipeline", { sessionId: this._sessionId });
|
|
13576
14040
|
this.stopped = true;
|
|
13577
14041
|
this.epoch++;
|
|
13578
14042
|
this.clearSilenceTimer();
|
|
@@ -13601,7 +14065,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13601
14065
|
this.playback?.setProfile(profile);
|
|
13602
14066
|
}
|
|
13603
14067
|
async dispose() {
|
|
13604
|
-
|
|
14068
|
+
logger43.debug("Disposing VoicePipeline");
|
|
13605
14069
|
this.stop();
|
|
13606
14070
|
this.epoch++;
|
|
13607
14071
|
await Promise.allSettled([
|
|
@@ -13635,19 +14099,20 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13635
14099
|
if (result.isSpeech) {
|
|
13636
14100
|
if (!wasSpeaking) {
|
|
13637
14101
|
this.isSpeaking = true;
|
|
13638
|
-
this.speechStartTime =
|
|
14102
|
+
this.speechStartTime = getClock().now();
|
|
13639
14103
|
this.audioBuffer = [];
|
|
13640
14104
|
this.audioBufferSamples = 0;
|
|
13641
14105
|
this.lastProgressiveResult = null;
|
|
13642
14106
|
this.lastProgressiveSamples = 0;
|
|
13643
|
-
|
|
14107
|
+
this.progressiveErrorCount = 0;
|
|
14108
|
+
logger43.debug("VAD speech start");
|
|
13644
14109
|
this.emit("speech:start");
|
|
13645
14110
|
this.startProgressiveTranscription();
|
|
13646
14111
|
}
|
|
13647
14112
|
this.audioBuffer.push(new Float32Array(samples));
|
|
13648
14113
|
this.audioBufferSamples += samples.length;
|
|
13649
14114
|
if (this.audioBufferSamples >= _VoicePipeline.MAX_AUDIO_BUFFER_SAMPLES) {
|
|
13650
|
-
|
|
14115
|
+
logger43.warn("Audio buffer exceeded max, forcing transcription flush");
|
|
13651
14116
|
this.onSilenceDetected();
|
|
13652
14117
|
return;
|
|
13653
14118
|
}
|
|
@@ -13663,7 +14128,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13663
14128
|
}
|
|
13664
14129
|
}
|
|
13665
14130
|
} catch (err) {
|
|
13666
|
-
|
|
14131
|
+
logger43.warn("VAD error", { error: String(err) });
|
|
13667
14132
|
}
|
|
13668
14133
|
}
|
|
13669
14134
|
// ---------------------------------------------------------------------------
|
|
@@ -13674,18 +14139,18 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13674
14139
|
const extended = this.config.silenceTimeoutExtendedMs ?? 700;
|
|
13675
14140
|
const adaptive = this.config.adaptiveTimeout ?? true;
|
|
13676
14141
|
if (!adaptive) return base;
|
|
13677
|
-
const speechDurationMs =
|
|
14142
|
+
const speechDurationMs = getClock().now() - this.speechStartTime;
|
|
13678
14143
|
return speechDurationMs > 3e3 ? extended : base;
|
|
13679
14144
|
}
|
|
13680
14145
|
onSilenceDetected() {
|
|
13681
14146
|
const capturedEpoch = this.epoch;
|
|
13682
14147
|
this.isSpeaking = false;
|
|
13683
|
-
const durationMs =
|
|
13684
|
-
|
|
14148
|
+
const durationMs = getClock().now() - this.speechStartTime;
|
|
14149
|
+
logger43.debug("VAD speech end", { durationMs: Math.round(durationMs) });
|
|
13685
14150
|
this.emit("speech:end", { durationMs });
|
|
13686
14151
|
this.clearSilenceTimer();
|
|
13687
14152
|
this.processEndOfSpeech(capturedEpoch).catch((err) => {
|
|
13688
|
-
|
|
14153
|
+
logger43.error("End of speech processing failed", { error: String(err) });
|
|
13689
14154
|
if (this.epoch === capturedEpoch && !this.stopped) {
|
|
13690
14155
|
this.emit("error", err instanceof Error ? err : new Error(String(err)));
|
|
13691
14156
|
this.setState("listening");
|
|
@@ -13699,7 +14164,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13699
14164
|
const turnSpan = getTelemetry()?.startSpan("VoicePipeline.turn", {
|
|
13700
14165
|
"session.id": this._sessionId ?? ""
|
|
13701
14166
|
});
|
|
13702
|
-
const turnStart =
|
|
14167
|
+
const turnStart = getClock().now();
|
|
13703
14168
|
if (this.progressivePromise) {
|
|
13704
14169
|
try {
|
|
13705
14170
|
await this.progressivePromise;
|
|
@@ -13724,7 +14189,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13724
14189
|
const minEnergy = this.config.minAudioEnergy ?? 0.02;
|
|
13725
14190
|
const durationSec = totalSamples / 16e3;
|
|
13726
14191
|
if (durationSec < minDuration) {
|
|
13727
|
-
|
|
14192
|
+
logger43.info("Audio too short, discarding", { durationSec });
|
|
13728
14193
|
turnSpan?.end();
|
|
13729
14194
|
this.setState("listening");
|
|
13730
14195
|
return;
|
|
@@ -13735,7 +14200,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13735
14200
|
}
|
|
13736
14201
|
rms = Math.sqrt(rms / fullAudio.length);
|
|
13737
14202
|
if (rms < minEnergy) {
|
|
13738
|
-
|
|
14203
|
+
logger43.info("Audio too quiet, discarding", { rms });
|
|
13739
14204
|
turnSpan?.end();
|
|
13740
14205
|
this.setState("listening");
|
|
13741
14206
|
return;
|
|
@@ -13746,12 +14211,12 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13746
14211
|
const coverageThreshold = this.config.progressiveCoverageThreshold ?? 0.8;
|
|
13747
14212
|
if (this.lastProgressiveResult && this.lastProgressiveResult.text.trim().length > 0 && this.lastProgressiveSamples >= totalSamples * coverageThreshold) {
|
|
13748
14213
|
transcript = { ...this.lastProgressiveResult, isFinal: true };
|
|
13749
|
-
|
|
14214
|
+
logger43.info("Using progressive result", {
|
|
13750
14215
|
coverage: (this.lastProgressiveSamples / totalSamples).toFixed(2),
|
|
13751
14216
|
text: transcript.text
|
|
13752
14217
|
});
|
|
13753
14218
|
} else {
|
|
13754
|
-
|
|
14219
|
+
logger43.debug("Progressive result insufficient, running final transcription", {
|
|
13755
14220
|
samples: totalSamples,
|
|
13756
14221
|
hadProgressive: !!this.lastProgressiveResult
|
|
13757
14222
|
});
|
|
@@ -13766,7 +14231,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13766
14231
|
return;
|
|
13767
14232
|
}
|
|
13768
14233
|
if (!transcript || !transcript.text.trim()) {
|
|
13769
|
-
|
|
14234
|
+
logger43.info("No transcript, resuming listening");
|
|
13770
14235
|
turnSpan?.end();
|
|
13771
14236
|
this.setState("listening");
|
|
13772
14237
|
return;
|
|
@@ -13774,7 +14239,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13774
14239
|
this.emit("transcript", transcript);
|
|
13775
14240
|
getTelemetry()?.recordHistogram(
|
|
13776
14241
|
MetricNames.VOICE_TURN_LATENCY,
|
|
13777
|
-
|
|
14242
|
+
getClock().now() - turnStart,
|
|
13778
14243
|
{ mode: this.isLocalMode ? "local" : "cloud" }
|
|
13779
14244
|
);
|
|
13780
14245
|
await this.callResponseHandler(transcript, capturedEpoch, turnSpan?.getContext());
|
|
@@ -13788,7 +14253,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13788
14253
|
const span = getTelemetry()?.startSpan("VoicePipeline.response", {
|
|
13789
14254
|
"text.length": transcript.text.length
|
|
13790
14255
|
}, parentContext);
|
|
13791
|
-
const responseStart =
|
|
14256
|
+
const responseStart = getClock().now();
|
|
13792
14257
|
this.setState("speaking");
|
|
13793
14258
|
this.interruption?.setAISpeaking(true);
|
|
13794
14259
|
if (transcript.emotion) {
|
|
@@ -13805,7 +14270,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13805
14270
|
}
|
|
13806
14271
|
getTelemetry()?.recordHistogram(
|
|
13807
14272
|
MetricNames.VOICE_RESPONSE_LATENCY,
|
|
13808
|
-
|
|
14273
|
+
getClock().now() - responseStart,
|
|
13809
14274
|
{ mode: this.isLocalMode ? "local" : "cloud" }
|
|
13810
14275
|
);
|
|
13811
14276
|
span?.end();
|
|
@@ -13815,8 +14280,9 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13815
14280
|
return;
|
|
13816
14281
|
}
|
|
13817
14282
|
const err = error instanceof Error ? error : new Error(String(error));
|
|
14283
|
+
span?.setAttributes({ "error.type": ErrorTypes.RUNTIME });
|
|
13818
14284
|
span?.endWithError(err);
|
|
13819
|
-
|
|
14285
|
+
logger43.error("Response handler error", { message: err.message });
|
|
13820
14286
|
this.emit("error", err);
|
|
13821
14287
|
if (this.epoch === capturedEpoch && !this.stopped) {
|
|
13822
14288
|
this.interruption?.setAISpeaking(false);
|
|
@@ -13887,11 +14353,11 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13887
14353
|
// ---------------------------------------------------------------------------
|
|
13888
14354
|
handleInterruption() {
|
|
13889
14355
|
if (this._state !== "speaking") return;
|
|
13890
|
-
|
|
14356
|
+
logger43.info("Interruption triggered");
|
|
13891
14357
|
getTelemetry()?.incrementCounter(MetricNames.VOICE_INTERRUPTIONS);
|
|
13892
14358
|
this.epoch++;
|
|
13893
14359
|
if (this.responseAbortController) {
|
|
13894
|
-
|
|
14360
|
+
logger43.debug("Aborting in-flight response");
|
|
13895
14361
|
}
|
|
13896
14362
|
this.responseAbortController?.abort();
|
|
13897
14363
|
this.playback?.stop();
|
|
@@ -13929,7 +14395,15 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13929
14395
|
this.lastProgressiveSamples = snapshotSamples;
|
|
13930
14396
|
this.emit("transcript", { ...result, isFinal: false });
|
|
13931
14397
|
}
|
|
13932
|
-
} catch {
|
|
14398
|
+
} catch (err) {
|
|
14399
|
+
this.progressiveErrorCount++;
|
|
14400
|
+
if (this.progressiveErrorCount % 10 === 1) {
|
|
14401
|
+
logger43.warn("Progressive transcription error", {
|
|
14402
|
+
code: ErrorCodes.SPH_ASR_ERROR,
|
|
14403
|
+
count: this.progressiveErrorCount,
|
|
14404
|
+
error: String(err)
|
|
14405
|
+
});
|
|
14406
|
+
}
|
|
13933
14407
|
}
|
|
13934
14408
|
})();
|
|
13935
14409
|
}, intervalMs);
|
|
@@ -13945,8 +14419,9 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13945
14419
|
// ---------------------------------------------------------------------------
|
|
13946
14420
|
async transcribeWithTimeout(audio) {
|
|
13947
14421
|
if (!this.asr) return null;
|
|
14422
|
+
const currentEpoch = this.epoch;
|
|
13948
14423
|
const timeoutMs = this.config.transcriptionTimeoutMs ?? 1e4;
|
|
13949
|
-
const startTime =
|
|
14424
|
+
const startTime = getClock().now();
|
|
13950
14425
|
const span = getTelemetry()?.startSpan("VoicePipeline.transcribe", {
|
|
13951
14426
|
"inference.input_samples": audio.length,
|
|
13952
14427
|
"inference.input_duration_ms": audio.length / 16e3 * 1e3
|
|
@@ -13960,7 +14435,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13960
14435
|
})
|
|
13961
14436
|
]);
|
|
13962
14437
|
clearTimeout(timeoutId);
|
|
13963
|
-
const latency =
|
|
14438
|
+
const latency = getClock().now() - startTime;
|
|
13964
14439
|
this.asrErrorCount = 0;
|
|
13965
14440
|
getTelemetry()?.recordHistogram(MetricNames.VOICE_TRANSCRIPTION_LATENCY, latency);
|
|
13966
14441
|
getTelemetry()?.incrementCounter(MetricNames.VOICE_TRANSCRIPTIONS);
|
|
@@ -13974,14 +14449,18 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13974
14449
|
inferenceTimeMs: latency
|
|
13975
14450
|
};
|
|
13976
14451
|
} catch (error) {
|
|
14452
|
+
span?.setAttributes({ "error.type": ErrorTypes.INFERENCE });
|
|
13977
14453
|
span?.endWithError(error instanceof Error ? error : new Error(String(error)));
|
|
13978
14454
|
this.asrErrorCount++;
|
|
13979
|
-
|
|
14455
|
+
logger43.warn("Transcription failed", {
|
|
13980
14456
|
attempt: this.asrErrorCount,
|
|
13981
14457
|
error: String(error)
|
|
13982
14458
|
});
|
|
13983
14459
|
if (this.asrErrorCount >= 3 && this.config.models) {
|
|
13984
|
-
|
|
14460
|
+
if (this.epoch !== currentEpoch) return null;
|
|
14461
|
+
logger43.warn("3 consecutive ASR errors, recreating session", {
|
|
14462
|
+
code: ErrorCodes.SPH_ASR_ERROR
|
|
14463
|
+
});
|
|
13985
14464
|
try {
|
|
13986
14465
|
await this.asr.dispose();
|
|
13987
14466
|
this.asr = createSenseVoice({
|
|
@@ -13991,9 +14470,10 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
13991
14470
|
unifiedWorker: this.unifiedWorker ?? void 0
|
|
13992
14471
|
});
|
|
13993
14472
|
await this.asr.load();
|
|
14473
|
+
if (this.epoch !== currentEpoch) return null;
|
|
13994
14474
|
this.asrErrorCount = 0;
|
|
13995
14475
|
} catch (recreateErr) {
|
|
13996
|
-
|
|
14476
|
+
logger43.error("ASR session recreation failed", { error: String(recreateErr) });
|
|
13997
14477
|
}
|
|
13998
14478
|
}
|
|
13999
14479
|
return null;
|
|
@@ -14022,7 +14502,7 @@ var _VoicePipeline = class _VoicePipeline extends EventEmitter {
|
|
|
14022
14502
|
// ---------------------------------------------------------------------------
|
|
14023
14503
|
setState(state) {
|
|
14024
14504
|
if (this._state === state) return;
|
|
14025
|
-
|
|
14505
|
+
logger43.info("State transition", { from: this._state, to: state });
|
|
14026
14506
|
this._state = state;
|
|
14027
14507
|
this.emit("state", state);
|
|
14028
14508
|
}
|
|
@@ -14041,7 +14521,7 @@ _VoicePipeline.MAX_AUDIO_BUFFER_SAMPLES = 16e3 * 30;
|
|
|
14041
14521
|
var VoicePipeline = _VoicePipeline;
|
|
14042
14522
|
|
|
14043
14523
|
// src/orchestration/VoiceOrchestrator.ts
|
|
14044
|
-
var
|
|
14524
|
+
var logger44 = createLogger("VoiceOrchestrator");
|
|
14045
14525
|
var VoiceOrchestrator = class extends EventEmitter {
|
|
14046
14526
|
constructor() {
|
|
14047
14527
|
super(...arguments);
|
|
@@ -14091,7 +14571,7 @@ var VoiceOrchestrator = class extends EventEmitter {
|
|
|
14091
14571
|
const epoch = ++this.connectEpoch;
|
|
14092
14572
|
this._mode = config.mode ?? "local";
|
|
14093
14573
|
this._sessionId = crypto.randomUUID();
|
|
14094
|
-
|
|
14574
|
+
logger44.info("Connecting voice orchestrator", { mode: this._mode });
|
|
14095
14575
|
if (this._mode === "local") {
|
|
14096
14576
|
const localCfg = config;
|
|
14097
14577
|
this.ttsSpeaker = new TTSSpeaker();
|
|
@@ -14144,7 +14624,7 @@ var VoiceOrchestrator = class extends EventEmitter {
|
|
|
14144
14624
|
} else {
|
|
14145
14625
|
this.wireCloudTranscript(config);
|
|
14146
14626
|
}
|
|
14147
|
-
|
|
14627
|
+
logger44.info("Voice orchestrator connected", { mode: this._mode });
|
|
14148
14628
|
}
|
|
14149
14629
|
async disconnect() {
|
|
14150
14630
|
this.connectEpoch++;
|
|
@@ -14258,7 +14738,7 @@ var VoiceOrchestrator = class extends EventEmitter {
|
|
|
14258
14738
|
await this.speak(text);
|
|
14259
14739
|
}
|
|
14260
14740
|
} catch (e) {
|
|
14261
|
-
|
|
14741
|
+
logger44.error("Voice transcript handler error", { error: String(e) });
|
|
14262
14742
|
} finally {
|
|
14263
14743
|
this.interruption?.setAISpeaking(false);
|
|
14264
14744
|
this.speechListener?.resume();
|
|
@@ -14299,7 +14779,7 @@ var VoiceOrchestrator = class extends EventEmitter {
|
|
|
14299
14779
|
});
|
|
14300
14780
|
} catch (e) {
|
|
14301
14781
|
if (!abortController.signal.aborted) {
|
|
14302
|
-
|
|
14782
|
+
logger44.error("Cloud response handler error", { error: String(e) });
|
|
14303
14783
|
}
|
|
14304
14784
|
} finally {
|
|
14305
14785
|
this.responseAbortController = null;
|
|
@@ -14313,7 +14793,7 @@ var VoiceOrchestrator = class extends EventEmitter {
|
|
|
14313
14793
|
// -------------------------------------------------------------------------
|
|
14314
14794
|
handleInterruption() {
|
|
14315
14795
|
if (this._state !== "speaking") return;
|
|
14316
|
-
|
|
14796
|
+
logger44.info("Interruption triggered");
|
|
14317
14797
|
this.stopSpeaking();
|
|
14318
14798
|
this.speechListener?.resume();
|
|
14319
14799
|
this.setState("listening");
|