open-agents-ai 0.187.277 → 0.187.278

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2)
  1. package/dist/index.js +92 -16
  2. package/package.json +1 -1
package/dist/index.js CHANGED
@@ -294676,6 +294676,8 @@ var init_voice = __esm({
  currentPlayback = null;
  speakQueue = [];
  speaking = false;
+ drainPromise = null;
+ drainResolve = null;
  phonemizeFn = null;
  /** True when current model uses MLX Audio backend */
  mlxActive = false;
@@ -294992,6 +294994,15 @@ var init_voice = __esm({
  const speedFactor = emotion ? emotionToSpeedFactor(emotion, this.starkMode, this.autistMode) : 1;
  this.enqueueSpeech(text, 0.55, 1 + pitchBias, speedFactor, 0.15);
  }
+ /** Wait until the speak queue is fully drained (all audio played). */
+ async waitUntilIdle() {
+ if (!this.speaking && this.speakQueue.length === 0) return;
+ if (this.drainPromise) {
+ await this.drainPromise;
+ } else {
+ await this.sleep(100);
+ }
+ }
  enqueueSpeech(text, volume, pitchFactor, speedFactor = 1, stereoDelayMs = 0.6) {
  if (!this.enabled || !this.ready) return;
  text = sanitizeForTTS(text);
@@ -295190,6 +295201,11 @@ var init_voice = __esm({
  */
  async drainQueue() {
  this.speaking = true;
+ if (!this.drainPromise) {
+ this.drainPromise = new Promise((resolve40) => {
+ this.drainResolve = resolve40;
+ });
+ }
  let isFirst = true;
  let prefetchedWav = null;
  while (this.speakQueue.length > 0) {
@@ -295241,6 +295257,14 @@ var init_voice = __esm({
  }
  }
  this.speaking = false;
+ if (this.drainResolve) {
+ try {
+ this.drainResolve();
+ } catch {
+ }
+ }
+ this.drainResolve = null;
+ this.drainPromise = null;
  }
  sleep(ms) {
  return new Promise((resolve40) => setTimeout(resolve40, ms));
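
The two hunks above add a drain promise to the speech queue: drainQueue() lazily creates the promise when playback starts and resolves it once the queue empties, while waitUntilIdle() awaits that promise (or a short sleep as a last resort). A minimal TypeScript sketch of the same pattern, with a hypothetical SpeechQueue class and a placeholder play() standing in for real TTS playback:

    // Minimal sketch of the drain-promise idle-wait pattern (class and play() are hypothetical).
    class SpeechQueue {
      private queue: string[] = [];
      private speaking = false;
      private drainPromise: Promise<void> | null = null;
      private drainResolve: (() => void) | null = null;

      enqueue(text: string): void {
        this.queue.push(text);
        if (!this.speaking) void this.drain();
      }

      /** Resolves once every queued utterance has finished playing. */
      async waitUntilIdle(): Promise<void> {
        if (!this.speaking && this.queue.length === 0) return;
        if (this.drainPromise) await this.drainPromise;
      }

      private async drain(): Promise<void> {
        this.speaking = true;
        this.drainPromise ??= new Promise((resolve) => (this.drainResolve = resolve));
        while (this.queue.length > 0) {
          const text = this.queue.shift()!;
          await this.play(text); // stand-in for actual audio playback
        }
        this.speaking = false;
        this.drainResolve?.();
        this.drainResolve = null;
        this.drainPromise = null;
      }

      private play(text: string): Promise<void> {
        return new Promise((r) => setTimeout(r, text.length * 10));
      }
    }

Callers can then await queue.waitUntilIdle() instead of guessing how long the audio will take, which is exactly what the voicechat session hunk further down switches to.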
@@ -328218,13 +328242,12 @@ __export(voicechat_exports, {
  VoiceChatSession: () => VoiceChatSession
  });
  import { EventEmitter as EventEmitter10 } from "node:events";
- var VAD_SILENCE_MS, MAX_SEGMENT_MS, SUMMARY_INJECTION_INTERVAL, MAX_CONTEXT_TURNS, SYSTEM_PROMPT2, VoiceChatSession;
+ var VAD_SILENCE_MS, MAX_SEGMENT_MS, MAX_CONTEXT_TURNS, SYSTEM_PROMPT2, VoiceChatSession;
  var init_voicechat = __esm({
  "packages/cli/src/tui/voicechat.ts"() {
  "use strict";
- VAD_SILENCE_MS = 1100;
+ VAD_SILENCE_MS = 2e3;
  MAX_SEGMENT_MS = 6500;
- SUMMARY_INJECTION_INTERVAL = 4;
  MAX_CONTEXT_TURNS = 20;
  SYSTEM_PROMPT2 = `You are a voice assistant having a live spoken conversation. Keep responses extremely brief — 1-2 sentences max. You're speaking aloud, not writing. Be conversational, direct, and helpful. Don't use markdown, bullet points, or formatting — just natural speech. If you don't know something, say so briefly. Do not over-think — respond quickly and concisely.`;
  VoiceChatSession = class extends EventEmitter10 {
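
This hunk raises the end-of-utterance silence threshold from 1100 ms to 2000 ms (written 2e3) and removes SUMMARY_INJECTION_INTERVAL, since summaries are now injected every turn (see the later injectSummary hunk). A small sketch of how two such thresholds typically gate segment finalization; the shouldFinalizeSegment helper and its inputs are hypothetical, not part of the package:

    // Hypothetical helper: finalize a listening segment on sustained silence or a hard time cap.
    const VAD_SILENCE_MS = 2000;  // was 1100 ms in 0.187.277
    const MAX_SEGMENT_MS = 6500;

    function shouldFinalizeSegment(msSinceLastVoice: number, segmentAgeMs: number): boolean {
      return msSinceLastVoice >= VAD_SILENCE_MS || segmentAgeMs >= MAX_SEGMENT_MS;
    }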
@@ -328256,6 +328279,7 @@ var init_voicechat = __esm({
  // Bound handlers for cleanup
  _onTranscript = null;
  _onError = null;
+ _retryMicTimer = null;
  constructor(opts) {
  super();
  this.voice = opts.voice;
@@ -328321,6 +328345,19 @@ var init_voicechat = __esm({
  this._onError = (err) => {
  const msg = err instanceof Error ? err.message : String(err);
  this.onStatus(`ASR error (voicechat continues without mic): ${msg.slice(0, 80)}`);
+ if (this.active && !this._retryMicTimer) {
+ this._retryMicTimer = setTimeout(async () => {
+ this._retryMicTimer = null;
+ if (!this.active) return;
+ try {
+ await this.listen.stop().catch(() => {
+ });
+ await this.listen.start();
+ this.onStatus("Mic auto-recovered — LISTENING");
+ } catch {
+ }
+ }, 1e3);
+ }
  };
  this.listen.on("transcript", this._onTranscript);
  this.listen.on("error", this._onError);
@@ -328422,6 +328459,12 @@ var init_voicechat = __esm({
  this.onUserSpeech(text);
  this.context.push({ role: "user", content: text });
  this.turnCount++;
+ if (this.runner) {
+ try {
+ this.runner.injectUserMessage(`[VOICECHAT] ${text}`);
+ } catch {
+ }
+ }
  while (this.context.length > MAX_CONTEXT_TURNS + 1) {
  this.context.splice(1, 1);
  }
@@ -328443,11 +328486,18 @@ var init_voicechat = __esm({
  this.setState("SPEAKING");
  this.onAgentSpeech(response.trim());
  this.voice.speak(response.trim());
- if (this.runner && this.turnCount % SUMMARY_INJECTION_INTERVAL === 0) {
+ if (this.runner) {
  this.injectSummary();
  }
- const estimatedMs = Math.max(1500, response.length / 5 * (6e4 / 150));
- await new Promise((r2) => setTimeout(r2, estimatedMs));
+ if (typeof this.voice.waitUntilIdle === "function") {
+ try {
+ await this.voice.waitUntilIdle();
+ } catch {
+ }
+ } else {
+ const estimatedMs = Math.max(1500, response.length / 5 * (6e4 / 150));
+ await new Promise((r2) => setTimeout(r2, estimatedMs));
+ }
  }
  } catch (err) {
  if (!this.active) return;
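
The speaking phase previously slept for an estimated duration: response.length / 5 approximates the word count, and 6e4 / 150 is 400 ms per word at 150 words per minute, floored at 1.5 s. It now prefers the new waitUntilIdle() and keeps the estimate only as a fallback for voice engines that lack the method. A restatement of that fallback formula for clarity:

    // Fallback estimate kept for engines without waitUntilIdle():
    // ~5 characters per word, 150 words per minute => 400 ms per word, minimum 1500 ms.
    function estimateSpeechMs(text: string): number {
      return Math.max(1500, (text.length / 5) * (60_000 / 150));
    }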
@@ -328570,13 +328620,19 @@ var init_voicechat = __esm({
  // ---------------------------------------------------------------------------
  injectSummary() {
  if (!this.runner) return;
- const recentTurns = this.context.filter((t2) => t2.role !== "system").slice(-6).map((t2) => `${t2.role === "user" ? "User" : "Assistant"}: ${t2.content}`).join("\n");
+ const recentTurns = this.context.filter((t2) => t2.role !== "system").slice(-8).map((t2) => `${t2.role === "user" ? "User" : "Assistant"}: ${t2.content}`).join("\n");
  this.runner.injectUserMessage(
- `[VOICECHAT SUMMARY] The following is a summary of the recent voice conversation happening in parallel. You don't need to respond to this directly — it's for your awareness. Continue your current task.
+ `[VOICECHAT SUMMARY] Parallel voice liaison update (for awareness only). Continue your current task; do not respond to this directly.

  ${recentTurns}`
  );
  }
+ /** Enqueue narration from main agent events into the voice channel */
+ enqueueAgentNarration(text, subordinate = true) {
+ if (!text || !this.active) return;
+ if (subordinate) this.voice.speakSubordinate(text);
+ else this.voice.speak(text);
+ }
  };
  }
  });
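
With the interval gate gone, injectSummary() now runs after every assistant reply and forwards the last eight non-system turns; the new enqueueAgentNarration() method lets main-agent events speak through the same voice channel. A sketch of the summary payload construction, assuming the { role, content } turn shape used in the diff:

    // Sketch of the summary string handed to runner.injectUserMessage() (turn shape assumed from the diff).
    type Turn = { role: "system" | "user" | "assistant"; content: string };

    function buildVoicechatSummary(context: Turn[]): string {
      const recentTurns = context
        .filter((t) => t.role !== "system")
        .slice(-8)
        .map((t) => `${t.role === "user" ? "User" : "Assistant"}: ${t.content}`)
        .join("\n");
      return "[VOICECHAT SUMMARY] Parallel voice liaison update (for awareness only). " +
        "Continue your current task; do not respond to this directly.\n\n" + recentTurns;
    }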
@@ -330156,6 +330212,17 @@ ${entry.fullContent}`
  }
  });
  }
+ if (voice?.enabled && voice.voiceMode === "voicechat" && _voiceChatSession?.isActive && event.toolName === "task_complete") {
+ const emoStateFinal = emotionEngine?.getState();
+ const emoCtxFinal = emoStateFinal ? { valence: emoStateFinal.valence, arousal: emoStateFinal.arousal, label: emoStateFinal.label, emoji: emoStateFinal.emoji } : void 0;
+ const desc = describeTaskComplete(String(event.content ?? ""), true, vLevel);
+ if (desc) {
+ try {
+ _voiceChatSession.enqueueAgentNarration(desc, false);
+ } catch {
+ }
+ }
+ }
  break;
  }
  case "model_response":
@@ -330237,6 +330304,15 @@ ${entry.fullContent}`
  voice.speak(chatText);
  voice._spokenStreamText = true;
  }
+ } else if (voice?.enabled && voice.voiceMode === "voicechat" && (streamTextBuffer || event.content)) {
+ const chatText = (streamTextBuffer || event.content || "").trim();
+ streamTextBuffer = "";
+ if (chatText.length > 10 && _voiceChatSession?.isActive) {
+ try {
+ _voiceChatSession.enqueueAgentNarration(chatText, false);
+ } catch {
+ }
+ }
  }
  break;
  }
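
In voicechat mode, buffered model text longer than ten characters (and task_complete descriptions, in the hunk before this one) is now routed to the active session as narration rather than spoken directly by the TTS engine. A sketch of that routing check, with the session interface narrowed to the two members the diff relies on:

    // Sketch: hand buffered model output to an active voicechat session (interface narrowed to the diff's usage).
    interface VoiceChatLike {
      isActive: boolean;
      enqueueAgentNarration(text: string, subordinate?: boolean): void;
    }

    function routeModelText(buffer: string, session: VoiceChatLike | null): void {
      const chatText = buffer.trim();
      if (chatText.length > 10 && session?.isActive) {
        try {
          session.enqueueAgentNarration(chatText, false);  // false = speak in the primary voice
        } catch {
          // narration is best-effort; never let it break the event loop
        }
      }
    }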
@@ -331274,7 +331350,7 @@ ${opts.systemPromptAddition}` : `Working directory: ${repoRoot}`;
  autoUpdateTimer.unref();
  const voiceEngine = new VoiceEngine();
  let voiceSession = null;
- let _voiceChatSession = null;
+ let _voiceChatSession2 = null;
  let tunnelGateway = null;
  let p2pGateway = null;
  let peerMesh = null;
@@ -332963,7 +333039,7 @@ Respond concisely and safely. Remember: you are talking to the general public.`;
  },
  // --- /voicechat: Voryn-style state machine voice conversation ---
  async voiceChatStart() {
- if (_voiceChatSession?.isActive) return;
+ if (_voiceChatSession2?.isActive) return;
  if (!voiceEngine.enabled || !voiceEngine.ready) {
  writeContent(() => renderInfo2("Auto-enabling voice for voice chat..."));
  const voiceMsg = await voiceEngine.toggle();
@@ -332980,7 +333056,7 @@ Respond concisely and safely. Remember: you are talking to the general public.`;
  }
  }
  };
- _voiceChatSession = new VoiceChatSession2({
+ _voiceChatSession2 = new VoiceChatSession2({
  voice: voiceEngine,
  listen: listenEng,
  backendUrl: currentConfig.backendUrl,
@@ -333005,16 +333081,16 @@ Respond concisely and safely. Remember: you are talking to the general public.`;
  writeContent(() => renderInfo2(`\x1B[38;5;243m[voicechat] ${state}\x1B[0m`));
  }
  });
- await _voiceChatSession.start();
+ await _voiceChatSession2.start();
  },
  async voiceChatStop() {
- if (_voiceChatSession?.isActive) {
- await _voiceChatSession.stop();
- _voiceChatSession = null;
+ if (_voiceChatSession2?.isActive) {
+ await _voiceChatSession2.stop();
+ _voiceChatSession2 = null;
  }
  },
  isVoiceChatActive() {
- return _voiceChatSession?.isActive ?? false;
+ return _voiceChatSession2?.isActive ?? false;
  },
  async exposeStart(kindOrUrl, authKey, transport, fullAccess, passthrough, loadbalance) {
  const knownKinds = ["ollama", "vllm", "llvm", "passthrough"];
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
  "name": "open-agents-ai",
- "version": "0.187.277",
+ "version": "0.187.278",
  "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
  "type": "module",
  "main": "./dist/index.js",