PyPI - agent-cli - Versions diffs - 0.70.5__py3-none-any.whl - Mend

agent-cli 0.70.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

agent_cli/__init__.py +5 -0
agent_cli/__main__.py +6 -0
agent_cli/_extras.json +14 -0
agent_cli/_requirements/.gitkeep +0 -0
agent_cli/_requirements/audio.txt +79 -0
agent_cli/_requirements/faster-whisper.txt +215 -0
agent_cli/_requirements/kokoro.txt +425 -0
agent_cli/_requirements/llm.txt +183 -0
agent_cli/_requirements/memory.txt +355 -0
agent_cli/_requirements/mlx-whisper.txt +222 -0
agent_cli/_requirements/piper.txt +176 -0
agent_cli/_requirements/rag.txt +402 -0
agent_cli/_requirements/server.txt +154 -0
agent_cli/_requirements/speed.txt +77 -0
agent_cli/_requirements/vad.txt +155 -0
agent_cli/_requirements/wyoming.txt +71 -0
agent_cli/_tools.py +368 -0
agent_cli/agents/__init__.py +23 -0
agent_cli/agents/_voice_agent_common.py +136 -0
agent_cli/agents/assistant.py +383 -0
agent_cli/agents/autocorrect.py +284 -0
agent_cli/agents/chat.py +496 -0
agent_cli/agents/memory/__init__.py +31 -0
agent_cli/agents/memory/add.py +190 -0
agent_cli/agents/memory/proxy.py +160 -0
agent_cli/agents/rag_proxy.py +128 -0
agent_cli/agents/speak.py +209 -0
agent_cli/agents/transcribe.py +671 -0
agent_cli/agents/transcribe_daemon.py +499 -0
agent_cli/agents/voice_edit.py +291 -0
agent_cli/api.py +22 -0
agent_cli/cli.py +106 -0
agent_cli/config.py +503 -0
agent_cli/config_cmd.py +307 -0
agent_cli/constants.py +27 -0
agent_cli/core/__init__.py +1 -0
agent_cli/core/audio.py +461 -0
agent_cli/core/audio_format.py +299 -0
agent_cli/core/chroma.py +88 -0
agent_cli/core/deps.py +191 -0
agent_cli/core/openai_proxy.py +139 -0
agent_cli/core/process.py +195 -0
agent_cli/core/reranker.py +120 -0
agent_cli/core/sse.py +87 -0
agent_cli/core/transcription_logger.py +70 -0
agent_cli/core/utils.py +526 -0
agent_cli/core/vad.py +175 -0
agent_cli/core/watch.py +65 -0
agent_cli/dev/__init__.py +14 -0
agent_cli/dev/cli.py +1588 -0
agent_cli/dev/coding_agents/__init__.py +19 -0
agent_cli/dev/coding_agents/aider.py +24 -0
agent_cli/dev/coding_agents/base.py +167 -0
agent_cli/dev/coding_agents/claude.py +39 -0
agent_cli/dev/coding_agents/codex.py +24 -0
agent_cli/dev/coding_agents/continue_dev.py +15 -0
agent_cli/dev/coding_agents/copilot.py +24 -0
agent_cli/dev/coding_agents/cursor_agent.py +48 -0
agent_cli/dev/coding_agents/gemini.py +28 -0
agent_cli/dev/coding_agents/opencode.py +15 -0
agent_cli/dev/coding_agents/registry.py +49 -0
agent_cli/dev/editors/__init__.py +19 -0
agent_cli/dev/editors/base.py +89 -0
agent_cli/dev/editors/cursor.py +15 -0
agent_cli/dev/editors/emacs.py +46 -0
agent_cli/dev/editors/jetbrains.py +56 -0
agent_cli/dev/editors/nano.py +31 -0
agent_cli/dev/editors/neovim.py +33 -0
agent_cli/dev/editors/registry.py +59 -0
agent_cli/dev/editors/sublime.py +20 -0
agent_cli/dev/editors/vim.py +42 -0
agent_cli/dev/editors/vscode.py +15 -0
agent_cli/dev/editors/zed.py +20 -0
agent_cli/dev/project.py +568 -0
agent_cli/dev/registry.py +52 -0
agent_cli/dev/skill/SKILL.md +141 -0
agent_cli/dev/skill/examples.md +571 -0
agent_cli/dev/terminals/__init__.py +19 -0
agent_cli/dev/terminals/apple_terminal.py +82 -0
agent_cli/dev/terminals/base.py +56 -0
agent_cli/dev/terminals/gnome.py +51 -0
agent_cli/dev/terminals/iterm2.py +84 -0
agent_cli/dev/terminals/kitty.py +77 -0
agent_cli/dev/terminals/registry.py +48 -0
agent_cli/dev/terminals/tmux.py +58 -0
agent_cli/dev/terminals/warp.py +132 -0
agent_cli/dev/terminals/zellij.py +78 -0
agent_cli/dev/worktree.py +856 -0
agent_cli/docs_gen.py +417 -0
agent_cli/example-config.toml +185 -0
agent_cli/install/__init__.py +5 -0
agent_cli/install/common.py +89 -0
agent_cli/install/extras.py +174 -0
agent_cli/install/hotkeys.py +48 -0
agent_cli/install/services.py +87 -0
agent_cli/memory/__init__.py +7 -0
agent_cli/memory/_files.py +250 -0
agent_cli/memory/_filters.py +63 -0
agent_cli/memory/_git.py +157 -0
agent_cli/memory/_indexer.py +142 -0
agent_cli/memory/_ingest.py +408 -0
agent_cli/memory/_persistence.py +182 -0
agent_cli/memory/_prompt.py +91 -0
agent_cli/memory/_retrieval.py +294 -0
agent_cli/memory/_store.py +169 -0
agent_cli/memory/_streaming.py +44 -0
agent_cli/memory/_tasks.py +48 -0
agent_cli/memory/api.py +113 -0
agent_cli/memory/client.py +272 -0
agent_cli/memory/engine.py +361 -0
agent_cli/memory/entities.py +43 -0
agent_cli/memory/models.py +112 -0
agent_cli/opts.py +433 -0
agent_cli/py.typed +0 -0
agent_cli/rag/__init__.py +3 -0
agent_cli/rag/_indexer.py +67 -0
agent_cli/rag/_indexing.py +226 -0
agent_cli/rag/_prompt.py +30 -0
agent_cli/rag/_retriever.py +156 -0
agent_cli/rag/_store.py +48 -0
agent_cli/rag/_utils.py +218 -0
agent_cli/rag/api.py +175 -0
agent_cli/rag/client.py +299 -0
agent_cli/rag/engine.py +302 -0
agent_cli/rag/models.py +55 -0
agent_cli/scripts/.runtime/.gitkeep +0 -0
agent_cli/scripts/__init__.py +1 -0
agent_cli/scripts/check_plugin_skill_sync.py +50 -0
agent_cli/scripts/linux-hotkeys/README.md +63 -0
agent_cli/scripts/linux-hotkeys/toggle-autocorrect.sh +45 -0
agent_cli/scripts/linux-hotkeys/toggle-transcription.sh +58 -0
agent_cli/scripts/linux-hotkeys/toggle-voice-edit.sh +58 -0
agent_cli/scripts/macos-hotkeys/README.md +45 -0
agent_cli/scripts/macos-hotkeys/skhd-config-example +5 -0
agent_cli/scripts/macos-hotkeys/toggle-autocorrect.sh +12 -0
agent_cli/scripts/macos-hotkeys/toggle-transcription.sh +37 -0
agent_cli/scripts/macos-hotkeys/toggle-voice-edit.sh +37 -0
agent_cli/scripts/nvidia-asr-server/README.md +99 -0
agent_cli/scripts/nvidia-asr-server/pyproject.toml +27 -0
agent_cli/scripts/nvidia-asr-server/server.py +255 -0
agent_cli/scripts/nvidia-asr-server/shell.nix +32 -0
agent_cli/scripts/nvidia-asr-server/uv.lock +4654 -0
agent_cli/scripts/run-openwakeword.sh +11 -0
agent_cli/scripts/run-piper-windows.ps1 +30 -0
agent_cli/scripts/run-piper.sh +24 -0
agent_cli/scripts/run-whisper-linux.sh +40 -0
agent_cli/scripts/run-whisper-macos.sh +6 -0
agent_cli/scripts/run-whisper-windows.ps1 +51 -0
agent_cli/scripts/run-whisper.sh +9 -0
agent_cli/scripts/run_faster_whisper_server.py +136 -0
agent_cli/scripts/setup-linux-hotkeys.sh +72 -0
agent_cli/scripts/setup-linux.sh +108 -0
agent_cli/scripts/setup-macos-hotkeys.sh +61 -0
agent_cli/scripts/setup-macos.sh +76 -0
agent_cli/scripts/setup-windows.ps1 +63 -0
agent_cli/scripts/start-all-services-windows.ps1 +53 -0
agent_cli/scripts/start-all-services.sh +178 -0
agent_cli/scripts/sync_extras.py +138 -0
agent_cli/server/__init__.py +3 -0
agent_cli/server/cli.py +721 -0
agent_cli/server/common.py +222 -0
agent_cli/server/model_manager.py +288 -0
agent_cli/server/model_registry.py +225 -0
agent_cli/server/proxy/__init__.py +3 -0
agent_cli/server/proxy/api.py +444 -0
agent_cli/server/streaming.py +67 -0
agent_cli/server/tts/__init__.py +3 -0
agent_cli/server/tts/api.py +335 -0
agent_cli/server/tts/backends/__init__.py +82 -0
agent_cli/server/tts/backends/base.py +139 -0
agent_cli/server/tts/backends/kokoro.py +403 -0
agent_cli/server/tts/backends/piper.py +253 -0
agent_cli/server/tts/model_manager.py +201 -0
agent_cli/server/tts/model_registry.py +28 -0
agent_cli/server/tts/wyoming_handler.py +249 -0
agent_cli/server/whisper/__init__.py +3 -0
agent_cli/server/whisper/api.py +413 -0
agent_cli/server/whisper/backends/__init__.py +89 -0
agent_cli/server/whisper/backends/base.py +97 -0
agent_cli/server/whisper/backends/faster_whisper.py +225 -0
agent_cli/server/whisper/backends/mlx.py +270 -0
agent_cli/server/whisper/languages.py +116 -0
agent_cli/server/whisper/model_manager.py +157 -0
agent_cli/server/whisper/model_registry.py +28 -0
agent_cli/server/whisper/wyoming_handler.py +203 -0
agent_cli/services/__init__.py +343 -0
agent_cli/services/_wyoming_utils.py +64 -0
agent_cli/services/asr.py +506 -0
agent_cli/services/llm.py +228 -0
agent_cli/services/tts.py +450 -0
agent_cli/services/wake_word.py +142 -0
agent_cli-0.70.5.dist-info/METADATA +2118 -0
agent_cli-0.70.5.dist-info/RECORD +196 -0
agent_cli-0.70.5.dist-info/WHEEL +4 -0
agent_cli-0.70.5.dist-info/entry_points.txt +4 -0
agent_cli-0.70.5.dist-info/licenses/LICENSE +21 -0

agent_cli/core/utils.py ADDED Viewed

@@ -0,0 +1,526 @@
+"""Utility functions for agent CLI operations."""
+from __future__ import annotations
+import asyncio
+import json
+import logging
+import os
+import signal
+import sys
+import time
+from contextlib import (
+    AbstractContextManager,
+    asynccontextmanager,
+    contextmanager,
+    nullcontext,
+    suppress,
+)
+from typing import TYPE_CHECKING, Any
+from rich.console import Console
+from rich.live import Live
+from rich.panel import Panel
+from rich.spinner import Spinner
+from rich.status import Status
+from rich.table import Table
+from rich.text import Text
+from . import process
+SECONDS_PER_MINUTE = 60
+MINUTES_PER_HOUR = 60
+HOURS_PER_DAY = 24
+if TYPE_CHECKING:
+    from collections.abc import AsyncGenerator, Coroutine, Generator, Iterator
+    from datetime import timedelta
+    from logging import Handler
+    from pathlib import Path
+console = Console()
+err_console = Console(stderr=True)
+def enable_json_mode() -> None:
+    """Silence the shared Rich ``console`` for JSON mode.
+    Call this early in a command when the --json flag is set. It sets
+    ``quiet`` on the module-level ``console`` only, so all subsequent
+    ``console.print()`` calls are silenced; ``err_console`` is not modified here.
+    """
+    console.quiet = True
+class InteractiveStopEvent:
+    """A stop event with reset capability for chat agents."""
+    def __init__(self, process_name: str | None = None) -> None:
+        """Initialize the chat stop event."""
+        self._event = asyncio.Event()
+        self._sigint_count = 0
+        self._ctrl_c_pressed = False
+        self._process_name = process_name
+    def is_set(self) -> bool:
+        """Check if the stop event is set or stop file exists (Windows)."""
+        if self._event.is_set():
+            return True
+        # On Windows, also check for stop file (cross-process signaling)
+        if self._process_name is not None and process.check_stop_file(self._process_name):
+            self._event.set()  # Set the event so subsequent checks are fast
+            return True
+        return False
+    def set(self) -> None:
+        """Set the stop event."""
+        self._event.set()
+    def clear(self) -> None:
+        """Clear the stop event and reset interrupt count for next iteration."""
+        self._event.clear()
+        self._sigint_count = 0
+        self._ctrl_c_pressed = False
+    def increment_sigint_count(self) -> int:
+        """Increment and return the SIGINT count."""
+        self._sigint_count += 1
+        self._ctrl_c_pressed = True
+        return self._sigint_count
+    @property
+    def ctrl_c_pressed(self) -> bool:
+        """Check if Ctrl+C was pressed."""
+        return self._ctrl_c_pressed
+def atomic_write_text(path: Path, content: str, encoding: str = "utf-8") -> None:
+    """Write text to a file atomically using a temporary file and rename."""
+    # Create a temp file in the same directory to ensure atomic rename works
+    temp_file = path.with_suffix(f"{path.suffix}.tmp")
+    try:
+        temp_file.write_text(content, encoding=encoding)
+        temp_file.replace(path)
+    except Exception:
+        if temp_file.exists():
+            temp_file.unlink()
+        raise
+def format_timedelta_to_ago(td: timedelta) -> str:
+    """Format a timedelta into a human-readable 'ago' string."""
+    seconds = int(td.total_seconds())
+    minutes, seconds = divmod(seconds, 60)
+    hours, minutes = divmod(minutes, 60)
+    days, hours = divmod(hours, 24)
+    if days > 0:
+        return f"{days} day{'s' if days != 1 else ''} ago"
+    if hours > 0:
+        return f"{hours} hour{'s' if hours != 1 else ''} ago"
+    if minutes > 0:
+        return f"{minutes} minute{'s' if minutes != 1 else ''} ago"
+    return f"{seconds} second{'s' if seconds != 1 else ''} ago"
+def format_short_timedelta(delta: timedelta) -> str:
+    """Format a timedelta into a compact 'Xm Ys' string."""
+    total_seconds = max(0, int(delta.total_seconds()))
+    if total_seconds < SECONDS_PER_MINUTE:
+        return f"{total_seconds}s"
+    minutes, seconds = divmod(total_seconds, SECONDS_PER_MINUTE)
+    if minutes < MINUTES_PER_HOUR:
+        return f"{minutes}m {seconds}s" if seconds else f"{minutes}m"
+    hours, minutes = divmod(minutes, MINUTES_PER_HOUR)
+    if hours < HOURS_PER_DAY:
+        return f"{hours}h {minutes}m"
+    days, hours = divmod(hours, HOURS_PER_DAY)
+    return f"{days}d {hours}h"
+def iter_lines_from_file_end(path: Path, chunk_size: int) -> Iterator[str]:
+    """Yield lines from the end of a file in reverse order."""
+    if chunk_size <= 0:
+        msg = "chunk_size must be positive"
+        raise ValueError(msg)
+    with path.open("rb") as file:
+        file.seek(0, os.SEEK_END)
+        position = file.tell()
+        buffer = b""
+        while position > 0:
+            read_size = min(chunk_size, position)
+            position -= read_size
+            file.seek(position)
+            chunk = file.read(read_size)
+            buffer = chunk + buffer
+            while True:
+                newline_idx = buffer.rfind(b"\n")
+                if newline_idx == -1:
+                    break
+                line_bytes = buffer[newline_idx + 1 :].strip()
+                buffer = buffer[:newline_idx]
+                if line_bytes:
+                    yield line_bytes.decode("utf-8", errors="ignore")
+            if position == 0:
+                final_line = buffer.strip()
+                if final_line:
+                    yield final_line.decode("utf-8", errors="ignore")
+                buffer = b""
+def parse_json_line(line: str) -> dict[str, Any] | None:
+    """Parse a JSON line and return a dictionary, or None if invalid."""
+    try:
+        return json.loads(line)
+    except json.JSONDecodeError:
+        return None
+def _create_spinner(text: str, style: str) -> Spinner:
+    """Creates a default spinner."""
+    return Spinner("dots", text=Text(text, style=style))
+def create_status(text: str, style: str = "bold yellow") -> Status:
+    """Creates a default status with spinner."""
+    spinner_text = Text(text, style=style)
+    return Status(spinner_text, console=console, spinner="dots")
+def print_input_panel(
+    text: str,
+    title: str = "Input",
+    subtitle: str = "",
+    style: str = "bold blue",
+) -> None:
+    """Prints a panel with the input text."""
+    console.print(Panel(text, title=title, subtitle=subtitle, border_style=style))
+def print_output_panel(
+    text: str,
+    title: str = "Output",
+    subtitle: str = "",
+    style: str = "bold green",
+) -> None:
+    """Prints a panel with the output text."""
+    console.print(Panel(text, title=title, subtitle=subtitle, border_style=style))
+def print_error_message(message: str, suggestion: str | None = None) -> None:
+    """Prints an error message in a panel with rich markup support."""
+    error_text = Text.from_markup(message)
+    if suggestion:
+        error_text.append("\n\n")
+        error_text.append(suggestion)
+    console.print(Panel(error_text, title="Error", border_style="bold red"))
+def print_with_style(message: str, style: str = "bold green") -> None:
+    """Prints a status message."""
+    console.print(f"[{style}]{message}[/{style}]")
+def print_device_index(input_device_index: int | None, input_device_name: str | None) -> None:
+    """Prints the device index."""
+    if input_device_index is not None:
+        name = input_device_name or "Unknown Device"
+        print_with_style(f"Using {name} device with index {input_device_index}")
+def get_clipboard_text(*, quiet: bool = False) -> str | None:
+    """Get text from clipboard, with an optional status message."""
+    import pyperclip  # noqa: PLC0415
+    text = pyperclip.paste()
+    if not text:
+        if not quiet:
+            print_with_style("Clipboard is empty.", style="yellow")
+        return None
+    return text
+@contextmanager
+def signal_handling_context(
+    logger: logging.Logger,
+    quiet: bool = False,
+    process_name: str | None = None,
+) -> Generator[InteractiveStopEvent, None, None]:
+    """Context manager for graceful signal handling with double Ctrl+C support.
+    Sets up handlers for SIGINT (Ctrl+C) and SIGTERM (kill command):
+    - First Ctrl+C: Graceful shutdown with warning message
+    - Second Ctrl+C: Force exit with code 130
+    - SIGTERM: Immediate graceful shutdown
+    On Windows, also monitors for a stop file (cross-process signaling).
+    Args:
+        logger: Logger instance for recording events
+        quiet: Whether to suppress console output
+        process_name: Optional process name for stop file monitoring (Windows)
+    Yields:
+        stop_event: InteractiveStopEvent that gets set when shutdown is requested
+    """
+    stop_event = InteractiveStopEvent(process_name=process_name)
+    def _sigint_handler() -> None:
+        sigint_count = stop_event.increment_sigint_count()
+        if sigint_count == 1:
+            logger.info("First Ctrl+C received. Processing transcription.")
+            # The Ctrl+C message will be shown by the ASR function
+            stop_event.set()
+        else:
+            logger.info("Second Ctrl+C received. Force exiting.")
+            if not quiet:
+                console.print("\n[red]Force exit![/red]")
+            sys.exit(130)  # Standard exit code for Ctrl+C
+    def _sigterm_handler() -> None:
+        logger.info("SIGTERM received. Stopping process.")
+        stop_event.set()
+    loop = asyncio.get_running_loop()
+    restore_handlers: dict[signal.Signals, Any] = {}
+    def _register_async_handlers() -> None:
+        """Register signal handlers using asyncio loop (Unix)."""
+        loop.add_signal_handler(signal.SIGINT, _sigint_handler)
+        loop.add_signal_handler(signal.SIGTERM, _sigterm_handler)
+    def _register_sync_handlers() -> None:
+        """Register signal handlers using standard signal module (Windows)."""
+        logger.debug("Using sync signal handlers (Windows platform).")
+        def register(signum: signal.Signals, handler: Any) -> None:
+            restore_handlers[signum] = signal.getsignal(signum)
+            signal.signal(signum, handler)
+        register(signal.SIGINT, lambda *_: _sigint_handler())
+        register(signal.SIGTERM, lambda *_: _sigterm_handler())
+    if sys.platform == "win32":
+        _register_sync_handlers()
+    else:
+        _register_async_handlers()
+    try:
+        yield stop_event
+    finally:
+        for signum, previous in restore_handlers.items():
+            signal.signal(signum, previous)
+def stop_or_status_or_toggle(
+    process_name: str,
+    which: str,
+    stop: bool,
+    status: bool,
+    toggle: bool,
+    *,
+    quiet: bool = False,
+) -> bool:
+    """Handle process control for a given process name."""
+    if stop:
+        if process.kill_process(process_name):
+            if not quiet:
+                print_with_style(f"✅ {which.capitalize()} stopped.")
+        elif not quiet:
+            print_with_style(f"⚠️  No {which} is running.", style="yellow")
+        return True
+    if status:
+        if process.is_process_running(process_name):
+            pid = process.read_pid_file(process_name)
+            if not quiet:
+                print_with_style(f"✅ {which.capitalize()} is running (PID: {pid}).")
+        elif not quiet:
+            print_with_style(f"⚠️ {which.capitalize()} is not running.", style="yellow")
+        return True
+    if toggle:
+        if process.is_process_running(process_name):
+            if process.kill_process(process_name) and not quiet:
+                print_with_style(f"✅ {which.capitalize()} stopped.")
+            return True
+        if not quiet:
+            print_with_style(f"⚠️ {which.capitalize()} is not running.", style="yellow")
+    return False
+def maybe_live(use_live: bool) -> AbstractContextManager[Live | None]:
+    """Create a live context manager if use_live is True."""
+    if use_live:
+        return Live(_create_spinner("Initializing", "blue"), console=console, transient=True)
+    return nullcontext()
+@asynccontextmanager
+async def live_timer(
+    live: Live,
+    base_message: str,
+    *,
+    quiet: bool = False,
+    style: str = "blue",
+    stop_event: InteractiveStopEvent | None = None,
+) -> AsyncGenerator[None, None]:
+    """Async context manager that automatically manages a timer for a Live display.
+    Args:
+        live: Live instance to update (or None to do nothing)
+        base_message: Base message to display
+        style: Rich style for the text
+        quiet: If True, don't show any display
+        stop_event: Optional stop event to check for Ctrl+C
+    Usage:
+        async with live_timer(live, "🤖 Processing", style="bold yellow"):
+            # Do your work here, timer updates automatically
+            await some_operation()
+    """
+    if quiet:
+        yield
+        return
+    # Start the timer task
+    start_time = time.monotonic()
+    async def update_timer() -> None:
+        """Update the timer display."""
+        while True:
+            elapsed = time.monotonic() - start_time
+            # Check if Ctrl+C was pressed
+            if stop_event and stop_event.ctrl_c_pressed:
+                ctrl_c_text = Text(
+                    "Ctrl+C pressed. Processing transcription... (Press Ctrl+C again to force exit)",
+                    style="yellow",
+                )
+                live.update(ctrl_c_text)
+            else:
+                spinner = _create_spinner(f"{base_message}... ({elapsed:.1f}s)", style)
+                live.update(spinner)
+            await asyncio.sleep(0.1)
+    timer_task = asyncio.create_task(update_timer())
+    try:
+        yield
+    finally:
+        # Clean up timer task automatically
+        timer_task.cancel()
+        with suppress(asyncio.CancelledError):
+            await timer_task
+        if not quiet:
+            live.update("")
+def setup_logging(log_level: str, log_file: str | None, *, quiet: bool) -> None:
+    """Sets up logging based on parsed arguments."""
+    handlers: list[Handler] = []
+    if not quiet:
+        handlers.append(logging.StreamHandler())
+    if log_file:
+        handlers.append(logging.FileHandler(log_file, mode="w"))
+    logging.basicConfig(
+        level=log_level.upper(),
+        format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
+        handlers=handlers,
+    )
+async def manage_send_receive_tasks(
+    send_task_coro: Coroutine,
+    receive_task_coro: Coroutine,
+    *,
+    return_when: str = asyncio.ALL_COMPLETED,
+) -> tuple[asyncio.Task, asyncio.Task]:
+    """Manage send and receive tasks with proper cancellation.
+    Args:
+        send_task_coro: Send task coroutine
+        receive_task_coro: Receive task coroutine
+        return_when: When to return (e.g., asyncio.ALL_COMPLETED)
+    Returns:
+        Tuple of (send_task, receive_task) - both completed or cancelled
+    """
+    send_task = asyncio.create_task(send_task_coro)
+    recv_task = asyncio.create_task(receive_task_coro)
+    _done, pending = await asyncio.wait(
+        [send_task, recv_task],
+        return_when=return_when,
+    )
+    # Cancel any pending tasks
+    for task in pending:
+        task.cancel()
+    return send_task, recv_task
+def print_command_line_args(
+    args: dict[str, str | int | bool | None],
+) -> None:
+    """Print command line arguments in a formatted way."""
+    from agent_cli import opts  # noqa: PLC0415
+    table = Table(title="Command Line Arguments", show_header=True, header_style="bold magenta")
+    table.add_column("Parameter", style="cyan", no_wrap=True)
+    table.add_column("Value", style="green")
+    table.add_column("Type", style="dim")
+    sorted_args = sorted(args.items())
+    categories: dict[str, list[tuple[str, str | int | bool | None]]] = {}
+    for key, value in sorted_args:
+        if key == "ctx":
+            continue
+        try:
+            category = getattr(opts, key.upper()).rich_help_panel
+        except AttributeError:
+            category = "Other"
+        if category not in categories:
+            categories[category] = []
+        categories[category].append((key, value))
+    sorted_categories = sorted(categories.items())
+    for category, items in sorted_categories:
+        if not items:
+            continue
+        # Add a separator row for the category
+        table.add_row(f"[bold yellow]── {category} ──[/bold yellow]", "", "")
+        for key, value in items:
+            if value is None:
+                formatted_value = "[dim]None[/dim]"
+            elif isinstance(value, bool):
+                formatted_value = "[green]✓[/green]" if value else "[red]✗[/red]"
+            elif isinstance(value, str) and not value:
+                formatted_value = "[dim]<empty>[/dim]"
+            else:
+                formatted_value = str(value)
+            type_name = type(value).__name__
+            if value is None:
+                type_name = "NoneType"
+            table.add_row(key, formatted_value, f"[dim]{type_name}[/dim]")
+    # Print the table
+    console.print()
+    console.print(table)
+    console.print()

agent_cli/core/vad.py ADDED Viewed

@@ -0,0 +1,175 @@
+"""Voice Activity Detection using Silero VAD for speech segmentation."""
+from __future__ import annotations
+import logging
+import urllib.request
+from collections import deque
+from pathlib import Path
+from agent_cli import constants
+try:
+    import numpy as np
+    import torch
+except ImportError as e:
+    msg = (
+        "silero-vad is required for the transcribe-daemon command. "
+        "Install it with: `pip install agent-cli[vad]` or `uv sync --extra vad`."
+    )
+    raise ImportError(msg) from e
+LOGGER = logging.getLogger(__name__)
+_SILERO_VAD_ONNX_URL = (
+    "https://github.com/snakers4/silero-vad/raw/master/src/silero_vad/data/silero_vad.onnx"
+)
+def _get_model_path() -> Path:
+    """Get the path to the Silero VAD ONNX model, downloading if needed."""
+    cache_dir = Path.home() / ".cache" / "silero-vad"
+    cache_dir.mkdir(parents=True, exist_ok=True)
+    model_path = cache_dir / "silero_vad.onnx"
+    if not model_path.exists():
+        urllib.request.urlretrieve(_SILERO_VAD_ONNX_URL, model_path)  # noqa: S310
+    return model_path
+class VoiceActivityDetector:
+    """Silero VAD-based voice activity detection for audio segmentation.
+    Processes audio chunks and emits complete speech segments when silence
+    is detected after speech.
+    Incoming bytes are cut into fixed-size windows, each window is classified as
+    speech or not, and a small state machine (idle -> speaking -> idle) collects
+    the windows of one utterance. Audio is handled as 16-bit samples (2 bytes each).
+    """
+    def __init__(
+        self,
+        sample_rate: int = constants.AUDIO_RATE,
+        threshold: float = 0.3,
+        silence_threshold_ms: int = 1000,
+        min_speech_duration_ms: int = 250,
+        pre_speech_buffer_ms: int = 300,
+    ) -> None:
+        """Initialize VAD with configurable thresholds.
+        Args:
+            sample_rate: Audio sample rate in Hz; must be 8000 or 16000.
+            threshold: Minimum model probability for a window to count as speech.
+            silence_threshold_ms: Silence after speech that ends a segment.
+            min_speech_duration_ms: Minimum accumulated speech for a segment to
+                be emitted; shorter segments are dropped.
+            pre_speech_buffer_ms: Audio kept from before speech onset and
+                prepended to the segment (at least one window).
+        Raises:
+            ValueError: If ``sample_rate`` is not 8000 or 16000.
+        """
+        if sample_rate not in (8000, 16000):
+            msg = f"Sample rate must be 8000 or 16000, got {sample_rate}"
+            raise ValueError(msg)
+        # Imported lazily, after validation, so a bad sample rate fails first.
+        from silero_vad.utils_vad import OnnxWrapper  # noqa: PLC0415
+        self.sample_rate = sample_rate
+        self.threshold = threshold
+        self.silence_threshold_ms = silence_threshold_ms
+        self.min_speech_duration_ms = min_speech_duration_ms
+        # Window size: 512 samples @ 16kHz, 256 @ 8kHz (Silero requirement)
+        self.window_size_samples = 512 if sample_rate == 16000 else 256  # noqa: PLR2004
+        self.window_size_bytes = self.window_size_samples * 2  # 16-bit audio
+        # Pre-speech buffer size in windows
+        pre_speech_windows = max(
+            1,
+            (pre_speech_buffer_ms * sample_rate // 1000) // self.window_size_samples,
+        )
+        # Model and state
+        self._model = OnnxWrapper(str(_get_model_path()))
+        # Rolling history of the most recent non-speech windows while idle.
+        self._pre_speech_buffer: deque[bytes] = deque(maxlen=pre_speech_windows)
+        # Bytes received but not yet forming a complete window.
+        self._pending = bytearray()
+        # Audio of the segment currently being recorded.
+        self._audio_buffer = bytearray()
+        self._is_speaking = False
+        # Consecutive silence (in samples) since the last speech window.
+        self._silence_samples = 0
+        # Total speech (in samples) in the current segment.
+        self._speech_samples = 0
+    @property
+    def _silence_threshold_samples(self) -> int:
+        """``silence_threshold_ms`` converted to a sample count."""
+        return self.silence_threshold_ms * self.sample_rate // 1000
+    @property
+    def _min_speech_samples(self) -> int:
+        """``min_speech_duration_ms`` converted to a sample count."""
+        return self.min_speech_duration_ms * self.sample_rate // 1000
+    def reset(self) -> None:
+        """Reset VAD state for a new recording session.
+        Clears the model state and every buffer, including partial-window bytes.
+        """
+        self._model.reset_states()
+        self._pre_speech_buffer.clear()
+        self._pending.clear()
+        self._audio_buffer.clear()
+        self._is_speaking = False
+        self._silence_samples = 0
+        self._speech_samples = 0
+    def _is_speech(self, window: bytes) -> bool:
+        """Check if audio window contains speech.
+        The window is read as int16 samples and scaled by 1/32768 to float32
+        before being passed to the model together with the sample rate.
+        """
+        audio = np.frombuffer(window, dtype=np.int16).astype(np.float32) / 32768.0
+        prob = float(self._model(torch.from_numpy(audio), self.sample_rate).item())
+        LOGGER.debug("Speech prob: %.3f, threshold: %.2f", prob, self.threshold)
+        return prob >= self.threshold
+    def process_chunk(self, chunk: bytes) -> tuple[bool, bytes | None]:
+        """Process audio chunk and detect speech segments.
+        Returns (is_speaking, completed_segment_or_none).
+        The chunk may have any length; bytes that do not fill a whole window are
+        kept for the next call. A segment is returned once the silence threshold
+        is reached after speech, with the trailing silence trimmed off.
+        Note: if more than one segment completes within a single call, only the
+        last one is returned, because ``completed_segment`` is overwritten.
+        """
+        self._pending.extend(chunk)
+        completed_segment: bytes | None = None
+        ws = self.window_size_bytes
+        # Process complete windows
+        while len(self._pending) >= ws:
+            window = bytes(self._pending[:ws])
+            del self._pending[:ws]
+            if self._is_speech(window):
+                if not self._is_speaking:
+                    # Speech just started - prepend pre-speech buffer
+                    self._is_speaking = True
+                    self._audio_buffer.clear()
+                    for pre in self._pre_speech_buffer:
+                        self._audio_buffer.extend(pre)
+                    self._pre_speech_buffer.clear()
+                    self._silence_samples = 0
+                    self._speech_samples = 0
+                self._audio_buffer.extend(window)
+                # Any speech window restarts the silence countdown.
+                self._silence_samples = 0
+                self._speech_samples += self.window_size_samples
+            elif self._is_speaking:
+                # Silence during speech
+                self._audio_buffer.extend(window)
+                self._silence_samples += self.window_size_samples
+                if self._silence_samples >= self._silence_threshold_samples:
+                    # Segment complete - trim trailing silence
+                    # Segments with too little speech are dropped (nothing emitted).
+                    if self._speech_samples >= self._min_speech_samples:
+                        # Byte length of the silent windows at the end of the buffer.
+                        trailing = (self._silence_samples // self.window_size_samples) * ws
+                        completed_segment = bytes(
+                            self._audio_buffer[:-trailing] if trailing else self._audio_buffer,
+                        )
+                    # Reset for next segment
+                    self._is_speaking = False
+                    self._silence_samples = 0
+                    self._speech_samples = 0
+                    self._audio_buffer.clear()
+                    self._model.reset_states()
+            else:
+                # Not speaking - maintain rolling pre-speech buffer (auto-limited by deque maxlen)
+                self._pre_speech_buffer.append(window)
+        return self._is_speaking, completed_segment
+    def flush(self) -> bytes | None:
+        """Flush any remaining buffered speech when stream ends.
+        Returns the in-progress segment (trailing silence not trimmed) if speech
+        is active and long enough, otherwise None. The detector is reset either
+        way, which also discards any partial-window bytes.
+        """
+        if self._is_speaking and self._speech_samples >= self._min_speech_samples:
+            result = bytes(self._audio_buffer)
+            self.reset()
+            return result
+        self.reset()
+        return None
+    def get_segment_duration_seconds(self, segment: bytes) -> float:
+        """Calculate duration of audio segment in seconds.
+        Treats every 2 bytes as one sample at ``sample_rate``.
+        NOTE(review): this presumes single-channel audio - confirm with callers.
+        """
+        return len(segment) // 2 / self.sample_rate