npm - voicesmith-mcp - Versions diffs - 1.0.11 → 1.0.12 - Mend

voicesmith-mcp 1.0.11 → 1.0.12

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json +1 -1
package/stt/__pycache__/mic_capture.cpython-314.pyc +0 -0
package/stt/mic_capture.py +16 -0

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "voicesmith-mcp",
-  "version": "1.0.11",
+  "version": "1.0.12",
   "description": "Local AI voice for coding assistants — TTS & STT via MCP. Kokoro ONNX + faster-whisper, fully offline.",
   "bin": {
     "voicesmith-mcp": "bin/cli.js"

package/stt/__pycache__/mic_capture.cpython-314.pyc CHANGED Viewed

Binary file

package/stt/mic_capture.py CHANGED Viewed

@@ -61,6 +61,11 @@ class MicCapture:
         silence_duration = 0.0
         loop = asyncio.get_event_loop()
+        # Reset VAD state — the LSTM hidden state and context window must
+        # be cleared between recordings to avoid stale state from previous
+        # audio affecting speech detection.
+        vad.reset()
         stream = None
         try:
             stream = sd.InputStream(
@@ -73,6 +78,17 @@ class MicCapture:
             stream.start()
             logger.info("Microphone recording started")
+            # Discard the first ~200ms of audio to avoid picking up residual
+            # speaker output (Tink sound or TTS playback that just finished).
+            # This prevents VAD from detecting speaker bleed as "speech" and
+            # then cutting off when the bleed stops.
+            flush_chunks = int(0.2 * self._sample_rate / 512)  # ~6 chunks
+            for _ in range(flush_chunks):
+                try:
+                    self._audio_queue.get(timeout=0.1)
+                except queue.Empty:
+                    break
             start_time = asyncio.get_event_loop().time()
             while not self._stop_flag: