npm - open-agents-ai - Versions diffs - 0.187.254 → 0.187.255 - Mend

open-agents-ai 0.187.254 → 0.187.255

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (2)

package/dist/index.js +45 -7
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -299450,6 +299450,7 @@ var init_voice = __esm({
        * - "action": only narrate tool calls/results (current default behavior)
        * - "chat": only speak streamed model text responses (normal pitch/volume)
        * - "verbose": both chat + action (chat at normal tone, actions at subordinate volume)
+       * - "voicechat": live mic + TTS conversation via sub agent (no tool narration)
        */
       voiceMode = "action";
       /**
@@ -302916,20 +302917,35 @@ async function handleSlashCommand(input, ctx3) {
         }
         if (arg.startsWith("mode")) {
           const modeArg = arg.replace(/^mode\s*/, "").trim().toLowerCase();
-          if (modeArg === "chat" || modeArg === "action" || modeArg === "verbose") {
+          if (modeArg === "chat" || modeArg === "action" || modeArg === "verbose" || modeArg === "voicechat") {
             ctx3.voiceSetMode?.(modeArg);
             save2({ voiceMode: modeArg });
+            if (modeArg === "voicechat" && ctx3.voiceChatStart && !ctx3.isVoiceChatActive?.()) {
+              try {
+                await ctx3.voiceChatStart();
+              } catch (err) {
+                renderWarning(`Voice chat mic failed: ${err instanceof Error ? err.message : String(err)}`);
+              }
+            }
+            if (modeArg !== "voicechat" && ctx3.isVoiceChatActive?.()) {
+              try {
+                await ctx3.voiceChatStop?.();
+              } catch {
+              }
+            }
             const modeDesc = {
               chat: "chat — speaks model responses only",
               action: "action — speaks tool call narrations only",
-              verbose: "verbose — speaks both model responses and tool narrations"
+              verbose: "verbose — speaks both model responses and tool narrations",
+              voicechat: "voicechat — live mic + TTS conversation via sub agent"
             };
             renderInfo(`Voice mode: ${modeDesc[modeArg]}${hasLocal ? " (project-local)" : ""}`);
           } else {
-            renderInfo("Usage: /voice mode <chat|action|verbose>");
-            renderInfo("  chat    — speaks streamed model text responses at normal pitch");
-            renderInfo("  action  — speaks tool call descriptions with emotion-modulated pitch");
-            renderInfo("  verbose — speaks both (chat at normal tone, actions at variable pitch)");
+            renderInfo("Usage: /voice mode <chat|action|verbose|voicechat>");
+            renderInfo("  chat      — speaks streamed model text responses at normal pitch");
+            renderInfo("  action    — speaks tool call descriptions with emotion-modulated pitch");
+            renderInfo("  verbose   — speaks both (chat at normal tone, actions at variable pitch)");
+            renderInfo("  voicechat — live mic + TTS back-and-forth conversation");
             const current = ctx3.voiceGetMode?.() ?? "action";
             renderInfo(`Current mode: ${current}`);
           }
@@ -305105,7 +305121,8 @@ async function handleVoiceMenu(ctx3, save2, hasLocal) {
         const modeItems = [
           { key: "chat", label: "Chat", detail: "speaks streamed model text at normal pitch" },
           { key: "action", label: "Action", detail: "speaks tool call narrations with emotion pitch" },
-          { key: "verbose", label: "Verbose", detail: "speaks both chat and actions" }
+          { key: "verbose", label: "Verbose", detail: "speaks both chat and actions" },
+          { key: "voicechat", label: "Voice Chat", detail: "live mic + TTS conversation alongside agent" }
         ];
         const modeResult = await tuiSelect({
           items: modeItems,
@@ -305119,6 +305136,18 @@ async function handleVoiceMenu(ctx3, save2, hasLocal) {
           const mode = modeResult.key;
           ctx3.voiceSetMode?.(mode);
           save2({ voiceMode: mode });
+          if (mode === "voicechat" && ctx3.voiceChatStart && !ctx3.isVoiceChatActive?.()) {
+            try {
+              await ctx3.voiceChatStart();
+            } catch {
+            }
+          }
+          if (mode !== "voicechat" && ctx3.isVoiceChatActive?.()) {
+            try {
+              await ctx3.voiceChatStop?.();
+            } catch {
+            }
+          }
         }
         continue;
       }
@@ -327029,6 +327058,7 @@ var init_voicechat = __esm({
       silenceTimeout;
       onStatus;
       onUserSpeech;
+      onPartialTranscript;
       onAgentSpeech;
       transcriptBuffer = "";
       silenceTimer = null;
@@ -327046,6 +327076,8 @@ var init_voicechat = __esm({
         });
         this.onUserSpeech = opts.onUserSpeech ?? (() => {
         });
+        this.onPartialTranscript = opts.onPartialTranscript ?? (() => {
+        });
         this.onAgentSpeech = opts.onAgentSpeech ?? (() => {
         });
       }
@@ -327065,6 +327097,7 @@ var init_voicechat = __esm({
           const { text, isFinal } = evt;
           if (!text?.trim()) return;
           this.transcriptBuffer = text.trim();
+          this.onPartialTranscript(this.transcriptBuffer);
           if (this.silenceTimer) clearTimeout(this.silenceTimer);
           if (isFinal || this.silenceTimeout === 0) {
             this.submitTranscript();
@@ -331414,6 +331447,11 @@ Respond concisely and safely. Remember: you are talking to the general public.`;
         onUserSpeech(text) {
           writeContent(() => renderInfo(`\x1B[38;5;45m[you]\x1B[0m ${text}`));
         },
+        onPartialTranscript(text) {
+          writeContent(() => {
+            process.stdout.write(`\r\x1B[2K\x1B[38;5;243m  [hearing] ${text.slice(0, 70)}\x1B[0m`);
+          });
+        },
         onAgentSpeech(text) {
           writeContent(() => renderInfo(`\x1B[38;5;178m[agent]\x1B[0m ${text.slice(0, 120)}`));
         }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "open-agents-ai",
-  "version": "0.187.254",
+  "version": "0.187.255",
   "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
   "type": "module",
   "main": "./dist/index.js",