npm - @absolutejs/voice - Versions diffs - 0.0.22-beta.591 → 0.0.22-beta.593 - Mend

@absolutejs/voice 0.0.22-beta.591 → 0.0.22-beta.593

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/dist/index.js CHANGED Viewed

@@ -3753,7 +3753,8 @@ var normalizeText2 = (text) => text.trim().replace(/\s+/g, " ");
 var getAudioChunkDurationMs = (chunk) => chunk.byteLength / (DEFAULT_FORMAT.sampleRateHz * DEFAULT_FORMAT.channels * 2) * 1000;
 var getBufferedAudioDurationMs = (chunks) => chunks.reduce((total, chunk) => total + getAudioChunkDurationMs(chunk), 0);
 var STREAM_SENTENCE_BOUNDARY = /[.!?\u2026]['")\]]*\s/;
-var MAX_TTS_CHUNK_CHARS = 220;
+var STREAM_CLAUSE_BOUNDARY = /[,;:]\s/g;
+var MAX_TTS_CHUNK_CHARS = 320;
 var nextSpeakableBoundary = (buffer) => {
   const match = STREAM_SENTENCE_BOUNDARY.exec(buffer);
   return match ? match.index + match[0].length : -1;
@@ -3762,6 +3763,12 @@ var softCutBoundary = (buffer) => {
   if (buffer.length < MAX_TTS_CHUNK_CHARS)
     return -1;
   const window2 = buffer.slice(0, MAX_TTS_CHUNK_CHARS);
+  let lastClause = -1;
+  for (const match of window2.matchAll(STREAM_CLAUSE_BOUNDARY)) {
+    lastClause = match.index + match[0].length;
+  }
+  if (lastClause > 0)
+    return lastClause;
   const lastSpace = window2.lastIndexOf(" ");
   return lastSpace > 0 ? lastSpace + 1 : MAX_TTS_CHUNK_CHARS;
 };
@@ -6282,9 +6289,21 @@ var createVoiceSession = (options) => {
         amdFirstAudioAt = Date.now();
       }
       speechDetected = true;
-      clearSilenceTimer();
       kickCallSilenceWatchdog();
       backchannelDriver?.noteSpeech();
+      const latest = await readSession();
+      const sttQuietMs = latest.currentTurn.lastTranscriptAt !== undefined ? Date.now() - latest.currentTurn.lastTranscriptAt : Number.POSITIVE_INFINITY;
+      const hasTurnTextDespiteNoise = Boolean(buildTurnText(latest.currentTurn.transcripts, latest.currentTurn.partialText, {
+        partialEndedAtMs: latest.currentTurn.partialEndedAt,
+        partialStartedAtMs: latest.currentTurn.partialStartedAt
+      }));
+      if (hasTurnTextDespiteNoise && sttQuietMs >= turnDetection.silenceMs) {
+        if (!silenceTimer) {
+          scheduleSilenceCommit(0);
+        }
+      } else {
+        clearSilenceTimer();
+      }
     } else if (speechDetected) {
       backchannelDriver?.noteSilence();
       const currentSession = await readSession();

package/dist/testing/index.js CHANGED Viewed

@@ -5980,7 +5980,8 @@ var normalizeText2 = (text) => text.trim().replace(/\s+/g, " ");
 var getAudioChunkDurationMs = (chunk) => chunk.byteLength / (DEFAULT_FORMAT.sampleRateHz * DEFAULT_FORMAT.channels * 2) * 1000;
 var getBufferedAudioDurationMs = (chunks) => chunks.reduce((total, chunk) => total + getAudioChunkDurationMs(chunk), 0);
 var STREAM_SENTENCE_BOUNDARY = /[.!?\u2026]['")\]]*\s/;
-var MAX_TTS_CHUNK_CHARS = 220;
+var STREAM_CLAUSE_BOUNDARY = /[,;:]\s/g;
+var MAX_TTS_CHUNK_CHARS = 320;
 var nextSpeakableBoundary = (buffer) => {
   const match = STREAM_SENTENCE_BOUNDARY.exec(buffer);
   return match ? match.index + match[0].length : -1;
@@ -5989,6 +5990,12 @@ var softCutBoundary = (buffer) => {
   if (buffer.length < MAX_TTS_CHUNK_CHARS)
     return -1;
   const window2 = buffer.slice(0, MAX_TTS_CHUNK_CHARS);
+  let lastClause = -1;
+  for (const match of window2.matchAll(STREAM_CLAUSE_BOUNDARY)) {
+    lastClause = match.index + match[0].length;
+  }
+  if (lastClause > 0)
+    return lastClause;
   const lastSpace = window2.lastIndexOf(" ");
   return lastSpace > 0 ? lastSpace + 1 : MAX_TTS_CHUNK_CHARS;
 };
@@ -8509,9 +8516,21 @@ var createVoiceSession = (options) => {
         amdFirstAudioAt = Date.now();
       }
       speechDetected = true;
-      clearSilenceTimer();
       kickCallSilenceWatchdog();
       backchannelDriver?.noteSpeech();
+      const latest = await readSession();
+      const sttQuietMs = latest.currentTurn.lastTranscriptAt !== undefined ? Date.now() - latest.currentTurn.lastTranscriptAt : Number.POSITIVE_INFINITY;
+      const hasTurnTextDespiteNoise = Boolean(buildTurnText(latest.currentTurn.transcripts, latest.currentTurn.partialText, {
+        partialEndedAtMs: latest.currentTurn.partialEndedAt,
+        partialStartedAtMs: latest.currentTurn.partialStartedAt
+      }));
+      if (hasTurnTextDespiteNoise && sttQuietMs >= turnDetection.silenceMs) {
+        if (!silenceTimer) {
+          scheduleSilenceCommit(0);
+        }
+      } else {
+        clearSilenceTimer();
+      }
     } else if (speechDetected) {
       backchannelDriver?.noteSilence();
       const currentSession = await readSession();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@absolutejs/voice",
-  "version": "0.0.22-beta.591",
+  "version": "0.0.22-beta.593",
   "description": "Voice primitives and Elysia plugin for AbsoluteJS",
   "repository": {
     "type": "git",