PyPI - agent-cli - Versions diffs - 0.70.2__py3-none-any.whl → 0.72.1__py3-none-any.whl - Mend

agent-cli 0.70.2__py3-none-any.whl → 0.72.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (35) hide show

agent_cli/_extras.json +4 -3
agent_cli/_requirements/memory.txt +14 -1
agent_cli/_requirements/rag.txt +14 -1
agent_cli/_requirements/vad.txt +1 -85
agent_cli/_requirements/wyoming.txt +71 -0
agent_cli/agents/assistant.py +24 -28
agent_cli/agents/autocorrect.py +30 -4
agent_cli/agents/chat.py +45 -15
agent_cli/agents/memory/__init__.py +19 -1
agent_cli/agents/memory/add.py +3 -3
agent_cli/agents/memory/proxy.py +20 -11
agent_cli/agents/rag_proxy.py +42 -10
agent_cli/agents/speak.py +23 -3
agent_cli/agents/transcribe.py +21 -3
agent_cli/agents/transcribe_daemon.py +34 -22
agent_cli/agents/voice_edit.py +18 -10
agent_cli/cli.py +25 -2
agent_cli/config_cmd.py +30 -11
agent_cli/core/deps.py +6 -3
agent_cli/core/transcription_logger.py +1 -1
agent_cli/core/vad.py +6 -24
agent_cli/dev/cli.py +295 -65
agent_cli/docs_gen.py +18 -8
agent_cli/install/extras.py +44 -13
agent_cli/install/hotkeys.py +22 -11
agent_cli/install/services.py +54 -14
agent_cli/opts.py +43 -22
agent_cli/server/cli.py +128 -62
agent_cli/server/proxy/api.py +77 -19
agent_cli/services/__init__.py +46 -5
{agent_cli-0.70.2.dist-info → agent_cli-0.72.1.dist-info}/METADATA +627 -246
{agent_cli-0.70.2.dist-info → agent_cli-0.72.1.dist-info}/RECORD +35 -34
{agent_cli-0.70.2.dist-info → agent_cli-0.72.1.dist-info}/WHEEL +0 -0
{agent_cli-0.70.2.dist-info → agent_cli-0.72.1.dist-info}/entry_points.txt +0 -0
{agent_cli-0.70.2.dist-info → agent_cli-0.72.1.dist-info}/licenses/LICENSE +0 -0

agent_cli/core/vad.py CHANGED Viewed

@@ -3,38 +3,22 @@
 from __future__ import annotations
 import logging
-import urllib.request
 from collections import deque
-from pathlib import Path
 from agent_cli import constants
 try:
     import numpy as np
-    import torch
+    from silero_vad_lite import SileroVAD
 except ImportError as e:
     msg = (
-        "silero-vad is required for the transcribe-daemon command. "
+        "silero-vad-lite is required for the transcribe-daemon command. "
         "Install it with: `pip install agent-cli[vad]` or `uv sync --extra vad`."
     )
     raise ImportError(msg) from e
 LOGGER = logging.getLogger(__name__)
-_SILERO_VAD_ONNX_URL = (
-    "https://github.com/snakers4/silero-vad/raw/master/src/silero_vad/data/silero_vad.onnx"
-)
-def _get_model_path() -> Path:
-    """Get the path to the Silero VAD ONNX model, downloading if needed."""
-    cache_dir = Path.home() / ".cache" / "silero-vad"
-    cache_dir.mkdir(parents=True, exist_ok=True)
-    model_path = cache_dir / "silero_vad.onnx"
-    if not model_path.exists():
-        urllib.request.urlretrieve(_SILERO_VAD_ONNX_URL, model_path)  # noqa: S310
-    return model_path
 class VoiceActivityDetector:
     """Silero VAD-based voice activity detection for audio segmentation.
@@ -56,8 +40,6 @@ class VoiceActivityDetector:
             msg = f"Sample rate must be 8000 or 16000, got {sample_rate}"
             raise ValueError(msg)
-        from silero_vad.utils_vad import OnnxWrapper  # noqa: PLC0415
         self.sample_rate = sample_rate
         self.threshold = threshold
         self.silence_threshold_ms = silence_threshold_ms
@@ -74,7 +56,7 @@ class VoiceActivityDetector:
         )
         # Model and state
-        self._model = OnnxWrapper(str(_get_model_path()))
+        self._model = SileroVAD(sample_rate=sample_rate)
         self._pre_speech_buffer: deque[bytes] = deque(maxlen=pre_speech_windows)
         self._pending = bytearray()
         self._audio_buffer = bytearray()
@@ -92,7 +74,7 @@ class VoiceActivityDetector:
     def reset(self) -> None:
         """Reset VAD state for a new recording session."""
-        self._model.reset_states()
+        self._model = SileroVAD(sample_rate=self.sample_rate)
         self._pre_speech_buffer.clear()
         self._pending.clear()
         self._audio_buffer.clear()
@@ -103,7 +85,7 @@ class VoiceActivityDetector:
     def _is_speech(self, window: bytes) -> bool:
         """Check if audio window contains speech."""
         audio = np.frombuffer(window, dtype=np.int16).astype(np.float32) / 32768.0
-        prob = float(self._model(torch.from_numpy(audio), self.sample_rate).item())
+        prob = self._model.process(audio)
         LOGGER.debug("Speech prob: %.3f, threshold: %.2f", prob, self.threshold)
         return prob >= self.threshold
@@ -154,7 +136,7 @@ class VoiceActivityDetector:
                     self._silence_samples = 0
                     self._speech_samples = 0
                     self._audio_buffer.clear()
-                    self._model.reset_states()
+                    self._model = SileroVAD(sample_rate=self.sample_rate)
             else:
                 # Not speaking - maintain rolling pre-speech buffer (auto-limited by deque maxlen)
                 self._pre_speech_buffer.append(window)

agent-cli 0.70.2__py3-none-any.whl → 0.72.1__py3-none-any.whl

agent-cli 0.70.2__py3-none-any.whl → 0.72.1__py3-none-any.whl