llmcode-cli 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- llm_code/__init__.py +2 -0
- llm_code/analysis/__init__.py +6 -0
- llm_code/analysis/cache.py +33 -0
- llm_code/analysis/engine.py +256 -0
- llm_code/analysis/go_rules.py +114 -0
- llm_code/analysis/js_rules.py +84 -0
- llm_code/analysis/python_rules.py +311 -0
- llm_code/analysis/rules.py +140 -0
- llm_code/analysis/rust_rules.py +108 -0
- llm_code/analysis/universal_rules.py +111 -0
- llm_code/api/__init__.py +0 -0
- llm_code/api/client.py +90 -0
- llm_code/api/errors.py +73 -0
- llm_code/api/openai_compat.py +390 -0
- llm_code/api/provider.py +35 -0
- llm_code/api/sse.py +52 -0
- llm_code/api/types.py +140 -0
- llm_code/cli/__init__.py +0 -0
- llm_code/cli/commands.py +70 -0
- llm_code/cli/image.py +122 -0
- llm_code/cli/render.py +214 -0
- llm_code/cli/status_line.py +79 -0
- llm_code/cli/streaming.py +92 -0
- llm_code/cli/tui_main.py +220 -0
- llm_code/computer_use/__init__.py +11 -0
- llm_code/computer_use/app_detect.py +49 -0
- llm_code/computer_use/app_tier.py +57 -0
- llm_code/computer_use/coordinator.py +99 -0
- llm_code/computer_use/input_control.py +71 -0
- llm_code/computer_use/screenshot.py +93 -0
- llm_code/cron/__init__.py +13 -0
- llm_code/cron/parser.py +145 -0
- llm_code/cron/scheduler.py +135 -0
- llm_code/cron/storage.py +126 -0
- llm_code/enterprise/__init__.py +1 -0
- llm_code/enterprise/audit.py +59 -0
- llm_code/enterprise/auth.py +26 -0
- llm_code/enterprise/oidc.py +95 -0
- llm_code/enterprise/rbac.py +65 -0
- llm_code/harness/__init__.py +5 -0
- llm_code/harness/config.py +33 -0
- llm_code/harness/engine.py +129 -0
- llm_code/harness/guides.py +41 -0
- llm_code/harness/sensors.py +68 -0
- llm_code/harness/templates.py +84 -0
- llm_code/hida/__init__.py +1 -0
- llm_code/hida/classifier.py +187 -0
- llm_code/hida/engine.py +49 -0
- llm_code/hida/profiles.py +95 -0
- llm_code/hida/types.py +28 -0
- llm_code/ide/__init__.py +1 -0
- llm_code/ide/bridge.py +80 -0
- llm_code/ide/detector.py +76 -0
- llm_code/ide/server.py +169 -0
- llm_code/logging.py +29 -0
- llm_code/lsp/__init__.py +0 -0
- llm_code/lsp/client.py +298 -0
- llm_code/lsp/detector.py +42 -0
- llm_code/lsp/manager.py +56 -0
- llm_code/lsp/tools.py +288 -0
- llm_code/marketplace/__init__.py +0 -0
- llm_code/marketplace/builtin_registry.py +102 -0
- llm_code/marketplace/installer.py +162 -0
- llm_code/marketplace/plugin.py +78 -0
- llm_code/marketplace/registry.py +360 -0
- llm_code/mcp/__init__.py +0 -0
- llm_code/mcp/bridge.py +87 -0
- llm_code/mcp/client.py +117 -0
- llm_code/mcp/health.py +120 -0
- llm_code/mcp/manager.py +214 -0
- llm_code/mcp/oauth.py +219 -0
- llm_code/mcp/transport.py +254 -0
- llm_code/mcp/types.py +53 -0
- llm_code/remote/__init__.py +0 -0
- llm_code/remote/client.py +136 -0
- llm_code/remote/protocol.py +22 -0
- llm_code/remote/server.py +275 -0
- llm_code/remote/ssh_proxy.py +56 -0
- llm_code/runtime/__init__.py +0 -0
- llm_code/runtime/auto_commit.py +56 -0
- llm_code/runtime/auto_diagnose.py +62 -0
- llm_code/runtime/checkpoint.py +70 -0
- llm_code/runtime/checkpoint_recovery.py +142 -0
- llm_code/runtime/compaction.py +35 -0
- llm_code/runtime/compressor.py +415 -0
- llm_code/runtime/config.py +533 -0
- llm_code/runtime/context.py +49 -0
- llm_code/runtime/conversation.py +921 -0
- llm_code/runtime/cost_tracker.py +126 -0
- llm_code/runtime/dream.py +127 -0
- llm_code/runtime/file_protection.py +150 -0
- llm_code/runtime/hardware.py +85 -0
- llm_code/runtime/hooks.py +223 -0
- llm_code/runtime/indexer.py +230 -0
- llm_code/runtime/knowledge_compiler.py +232 -0
- llm_code/runtime/memory.py +132 -0
- llm_code/runtime/memory_layers.py +467 -0
- llm_code/runtime/memory_lint.py +252 -0
- llm_code/runtime/model_aliases.py +37 -0
- llm_code/runtime/ollama.py +93 -0
- llm_code/runtime/overlay.py +124 -0
- llm_code/runtime/permissions.py +200 -0
- llm_code/runtime/plan.py +45 -0
- llm_code/runtime/prompt.py +238 -0
- llm_code/runtime/repo_map.py +174 -0
- llm_code/runtime/sandbox.py +116 -0
- llm_code/runtime/session.py +268 -0
- llm_code/runtime/skill_resolver.py +61 -0
- llm_code/runtime/skills.py +133 -0
- llm_code/runtime/speculative.py +75 -0
- llm_code/runtime/streaming_executor.py +216 -0
- llm_code/runtime/telemetry.py +196 -0
- llm_code/runtime/token_budget.py +26 -0
- llm_code/runtime/vcr.py +142 -0
- llm_code/runtime/vision.py +102 -0
- llm_code/swarm/__init__.py +1 -0
- llm_code/swarm/backend_subprocess.py +108 -0
- llm_code/swarm/backend_tmux.py +103 -0
- llm_code/swarm/backend_worktree.py +306 -0
- llm_code/swarm/checkpoint.py +74 -0
- llm_code/swarm/coordinator.py +236 -0
- llm_code/swarm/mailbox.py +88 -0
- llm_code/swarm/manager.py +202 -0
- llm_code/swarm/memory_sync.py +80 -0
- llm_code/swarm/recovery.py +21 -0
- llm_code/swarm/team.py +67 -0
- llm_code/swarm/types.py +31 -0
- llm_code/task/__init__.py +16 -0
- llm_code/task/diagnostics.py +93 -0
- llm_code/task/manager.py +162 -0
- llm_code/task/types.py +112 -0
- llm_code/task/verifier.py +104 -0
- llm_code/tools/__init__.py +0 -0
- llm_code/tools/agent.py +145 -0
- llm_code/tools/agent_roles.py +82 -0
- llm_code/tools/base.py +94 -0
- llm_code/tools/bash.py +565 -0
- llm_code/tools/computer_use_tools.py +278 -0
- llm_code/tools/coordinator_tool.py +75 -0
- llm_code/tools/cron_create.py +90 -0
- llm_code/tools/cron_delete.py +49 -0
- llm_code/tools/cron_list.py +51 -0
- llm_code/tools/deferred.py +92 -0
- llm_code/tools/dump.py +116 -0
- llm_code/tools/edit_file.py +282 -0
- llm_code/tools/git_tools.py +531 -0
- llm_code/tools/glob_search.py +112 -0
- llm_code/tools/grep_search.py +144 -0
- llm_code/tools/ide_diagnostics.py +59 -0
- llm_code/tools/ide_open.py +58 -0
- llm_code/tools/ide_selection.py +52 -0
- llm_code/tools/memory_tools.py +138 -0
- llm_code/tools/multi_edit.py +143 -0
- llm_code/tools/notebook_edit.py +107 -0
- llm_code/tools/notebook_read.py +81 -0
- llm_code/tools/parsing.py +63 -0
- llm_code/tools/read_file.py +154 -0
- llm_code/tools/registry.py +58 -0
- llm_code/tools/search_backends/__init__.py +56 -0
- llm_code/tools/search_backends/brave.py +56 -0
- llm_code/tools/search_backends/duckduckgo.py +129 -0
- llm_code/tools/search_backends/searxng.py +71 -0
- llm_code/tools/search_backends/tavily.py +73 -0
- llm_code/tools/swarm_create.py +109 -0
- llm_code/tools/swarm_delete.py +95 -0
- llm_code/tools/swarm_list.py +44 -0
- llm_code/tools/swarm_message.py +109 -0
- llm_code/tools/task_close.py +79 -0
- llm_code/tools/task_plan.py +79 -0
- llm_code/tools/task_verify.py +90 -0
- llm_code/tools/tool_search.py +65 -0
- llm_code/tools/web_common.py +258 -0
- llm_code/tools/web_fetch.py +223 -0
- llm_code/tools/web_search.py +280 -0
- llm_code/tools/write_file.py +118 -0
- llm_code/tui/__init__.py +1 -0
- llm_code/tui/app.py +2432 -0
- llm_code/tui/chat_view.py +82 -0
- llm_code/tui/chat_widgets.py +309 -0
- llm_code/tui/header_bar.py +46 -0
- llm_code/tui/input_bar.py +349 -0
- llm_code/tui/keybindings.py +142 -0
- llm_code/tui/marketplace.py +210 -0
- llm_code/tui/status_bar.py +72 -0
- llm_code/tui/theme.py +96 -0
- llm_code/utils/__init__.py +0 -0
- llm_code/utils/diff.py +111 -0
- llm_code/utils/errors.py +70 -0
- llm_code/utils/hyperlink.py +73 -0
- llm_code/utils/notebook.py +179 -0
- llm_code/utils/search.py +69 -0
- llm_code/utils/text_normalize.py +28 -0
- llm_code/utils/version_check.py +62 -0
- llm_code/vim/__init__.py +4 -0
- llm_code/vim/engine.py +51 -0
- llm_code/vim/motions.py +172 -0
- llm_code/vim/operators.py +183 -0
- llm_code/vim/text_objects.py +139 -0
- llm_code/vim/transitions.py +279 -0
- llm_code/vim/types.py +68 -0
- llm_code/voice/__init__.py +1 -0
- llm_code/voice/languages.py +43 -0
- llm_code/voice/recorder.py +136 -0
- llm_code/voice/stt.py +36 -0
- llm_code/voice/stt_anthropic.py +66 -0
- llm_code/voice/stt_google.py +32 -0
- llm_code/voice/stt_whisper.py +52 -0
- llmcode_cli-1.0.0.dist-info/METADATA +524 -0
- llmcode_cli-1.0.0.dist-info/RECORD +212 -0
- llmcode_cli-1.0.0.dist-info/WHEEL +4 -0
- llmcode_cli-1.0.0.dist-info/entry_points.txt +2 -0
- llmcode_cli-1.0.0.dist-info/licenses/LICENSE +21 -0
|
@@ -0,0 +1,92 @@
|
|
|
1
|
+
"""Incremental Markdown renderer for streaming LLM output."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import re
|
|
5
|
+
|
|
6
|
+
from rich.console import Console
|
|
7
|
+
from rich.markdown import Markdown
|
|
8
|
+
from rich.syntax import Syntax
|
|
9
|
+
|
|
10
|
+
# Matches a complete fenced code block: ```lang\ncode``` (language tag optional).
# Group 1 = language tag, group 2 = code body; DOTALL lets the body span lines.
_CODE_BLOCK_RE = re.compile(r"^```(\w*)\n(.*?)```\s*$", re.DOTALL)
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
class IncrementalMarkdownRenderer:
    """Render streaming LLM token output incrementally with Rich.

    Tokens accumulate in an internal buffer. After every feed the buffer is
    scanned for blocks that are already complete and can be printed:

    * a fenced code block (opening ``` through closing ```), or
    * a paragraph / heading / list terminated by a blank line (``\\n\\n``).

    ``finish()`` prints whatever is still buffered and resets state.
    """

    def __init__(self, console: Console) -> None:
        self._console = console
        self._buffer = ""
        self._in_code_block = False

    def feed(self, token: str) -> None:
        """Append *token* to the buffer and emit any completed blocks."""
        self._buffer += token
        self._try_flush()

    def finish(self) -> None:
        """Emit whatever remains in the buffer, then reset all state."""
        if self._buffer.strip():
            self._render_block(self._buffer)
        self._buffer = ""
        self._in_code_block = False

    def _try_flush(self) -> None:
        """Pop and render every complete block currently in the buffer."""
        while True:
            if self._in_code_block:
                # Search for the closing fence, skipping the opening ```.
                closing = self._buffer.find("```", 3)
                if closing < 0:
                    break  # fence not closed yet; wait for more tokens
                cut = closing + 3
                # Swallow any newlines that immediately follow the fence.
                while cut < len(self._buffer) and self._buffer[cut] == "\n":
                    cut += 1
                chunk, self._buffer = self._buffer[:cut], self._buffer[cut:]
                self._in_code_block = False
                self._render_block(chunk)
                continue

            # Entering a code block?
            if self._buffer.startswith("```"):
                self._in_code_block = True
                continue  # re-run the loop in code-block mode

            # Otherwise look for a completed paragraph.
            boundary = self._buffer.find("\n\n")
            if boundary < 0:
                break  # no complete paragraph yet

            chunk = self._buffer[: boundary + 2]
            self._buffer = self._buffer[boundary + 2 :]

            # The remainder may itself begin a code block.
            if self._buffer.startswith("```"):
                self._in_code_block = True

            text = chunk.strip()
            if text:
                self._render_block(text)

    def _render_block(self, block: str) -> None:
        """Print one block: fenced code via Syntax, anything else via Markdown."""
        text = block.strip()
        if not text:
            return

        fence = _CODE_BLOCK_RE.match(text)
        if fence is None:
            self._console.print(Markdown(text))
        else:
            language = fence.group(1) or "text"
            self._console.print(Syntax(fence.group(2), language, theme="monokai"))
|
llm_code/cli/tui_main.py
ADDED
|
@@ -0,0 +1,220 @@
|
|
|
1
|
+
"""Entry point for llm-code."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import os
|
|
5
|
+
from pathlib import Path
|
|
6
|
+
|
|
7
|
+
import click
|
|
8
|
+
|
|
9
|
+
# Accepted values for the --permission CLI option.
_PERMISSION_CHOICES = ["prompt", "auto_accept", "read_only", "workspace_write", "full_access"]
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
@click.command()
@click.argument("prompt", required=False)
@click.option("--model", "-m", default=None, help="Model name to use")
@click.option("--api", default=None, help="API base URL")
@click.option("--api-key", default=None, help="API key (or set LLM_API_KEY env var)")
@click.option("--provider", type=click.Choice(["ollama"]), default=None, help="LLM provider shortcut")
@click.option(
    "--permission",
    type=click.Choice(_PERMISSION_CHOICES),
    default=None,
    help="Permission mode",
)
@click.option("--budget", type=int, default=None, help="Token budget target")
@click.option("--verbose", "-v", is_flag=True, help="Enable verbose logging")
@click.option("--serve", is_flag=True, help="Start as remote server")
@click.option("--port", type=int, default=8765, help="Server port (for --serve)")
@click.option("--connect", default=None, help="Connect to remote server (host:port)")
@click.option("--ssh", default=None, help="SSH to remote host and connect (user@host)")
@click.option("--replay", default=None, help="Replay a VCR recording file (.jsonl)")
@click.option("--replay-speed", type=float, default=1.0, help="Playback speed for --replay (0 = instant)")
@click.option("--resume", default=None, help="Resume from a checkpoint (session_id or 'last')")
def main(
    prompt: str | None,
    model: str | None,
    api: str | None,
    api_key: str | None,
    provider: str | None,
    permission: str | None,
    budget: int | None,
    verbose: bool = False,
    serve: bool = False,
    port: int = 8765,
    connect: str | None = None,
    ssh: str | None = None,
    replay: str | None = None,
    replay_speed: float = 1.0,
    resume: str | None = None,
) -> None:
    """llm-code: AI coding assistant CLI."""
    # NOTE(review): `prompt` is accepted but never referenced in this body —
    # presumably forwarded to the TUI some other way; confirm.
    # Heavy imports are deferred into the function so `--help` stays fast.
    from llm_code.logging import setup_logging
    from llm_code.runtime.config import load_config

    setup_logging(verbose=verbose)
    cwd = Path.cwd()

    # Build CLI overrides (highest-precedence configuration layer).
    cli_overrides: dict = {}
    if model:
        cli_overrides["model"] = model
    if api:
        cli_overrides.setdefault("provider", {})["base_url"] = api
    if api_key:
        # Exported via the environment so API clients can read it later.
        os.environ["LLM_API_KEY"] = api_key
    if permission:
        cli_overrides.setdefault("permissions", {})["mode"] = permission

    # Ollama provider setup: probe the server and (interactively) pick a model.
    if provider == "ollama":
        ollama_result = _run_ollama_setup(
            api_override=api,
            model_override=model,
        )
        if ollama_result is None:
            click.echo("Error: Cannot connect to Ollama at localhost:11434", err=True)
            click.echo("Make sure Ollama is running: ollama serve", err=True)
            raise SystemExit(1)
        selected_model, base_url = ollama_result
        cli_overrides["model"] = selected_model
        cli_overrides.setdefault("provider", {})["base_url"] = base_url

    # Merge user-level, project-level, local, and CLI configuration layers.
    user_dir = Path.home() / ".llm-code"
    config = load_config(
        user_dir=user_dir,
        project_dir=cwd,
        local_path=cwd / ".llm-code" / "config.json",
        cli_overrides=cli_overrides,
    )

    import asyncio

    # --replay: print recorded VCR events to stdout and exit (no TUI).
    if replay:
        from llm_code.runtime.vcr import VCRPlayer
        player = VCRPlayer(Path(replay))
        summary = player.summary()
        print(f"Replaying: {replay}")
        print(f" events={summary['event_count']} duration={summary['duration']:.1f}s")
        print()
        for event in player.replay(speed=replay_speed):
            print(f"[{event.type:15s}] {event.data}")
        return

    # --serve: run as a remote server instead of the local TUI.
    if serve:
        from llm_code.remote.server import RemoteServer
        server = RemoteServer(host="0.0.0.0", port=port, config=config)
        asyncio.run(server.start())
        return

    # --connect: attach to an already-running remote server.
    if connect:
        from llm_code.remote.client import RemoteClient
        client = RemoteClient(connect)
        asyncio.run(client.connect())
        return

    # --ssh: connect through an SSH proxy to a remote host.
    if ssh:
        from llm_code.remote.ssh_proxy import ssh_connect
        asyncio.run(ssh_connect(ssh, port=port))
        return

    # Resolve resume session if requested.
    resume_session = None
    if resume:
        from llm_code.runtime.checkpoint_recovery import CheckpointRecovery
        checkpoints_dir = Path.home() / ".llm-code" / "checkpoints"
        recovery = CheckpointRecovery(checkpoints_dir)
        if resume == "last":
            resume_session = recovery.detect_last_checkpoint()
        else:
            resume_session = recovery.load_checkpoint(resume)
        if resume_session is None:
            print(f"[warning] No checkpoint found for: {resume}")
        else:
            print(f"Resuming session {resume_session.id} ({len(resume_session.messages)} messages)")

    # Textual fullscreen TUI (default and only UI mode)
    # NOTE(review): `resume_session` is resolved above but is not passed to the
    # TUI constructor here — verify the resumed messages are actually used.
    from llm_code.tui.app import LLMCodeTUI
    app = LLMCodeTUI(config=config, cwd=cwd, budget=budget)
    app.run()
|
|
139
|
+
|
|
140
|
+
|
|
141
|
+
# Default base URL of a locally running Ollama server.
_OLLAMA_DEFAULT_URL = "http://localhost:11434"
|
|
142
|
+
|
|
143
|
+
|
|
144
|
+
def _run_ollama_setup(
    api_override: str | None = None,
    model_override: str | None = None,
) -> tuple[str, str] | None:
    """Probe a local Ollama server and pick a model.

    Returns ``(model_name, openai_compatible_base_url)`` on success, or
    ``None`` when the server is unreachable or has no models installed.
    When several models are available the user is prompted to choose one.
    """
    import asyncio as _asyncio

    base_url = api_override or _OLLAMA_DEFAULT_URL

    async def _setup() -> tuple[str, str] | None:
        from llm_code.runtime.hardware import detect_vram_gb
        from llm_code.runtime.ollama import OllamaClient, sort_models_for_selection

        client = OllamaClient(base_url=base_url)
        try:
            if not await client.probe():
                return None

            # Ollama exposes an OpenAI-compatible API under /v1.
            openai_url = f"{base_url}/v1"

            if model_override:
                return (model_override, openai_url)

            available = await client.list_models()
            if not available:
                click.echo("No models found in Ollama. Download one first:", err=True)
                click.echo(" ollama pull qwen3:1.7b", err=True)
                return None

            if len(available) == 1:
                only = available[0]
                click.echo(f"Using Ollama model: {only.name}")
                return (only.name, openai_url)

            # Several models: rank by VRAM fit and let the user choose.
            vram = detect_vram_gb()
            ranked = sort_models_for_selection(available, vram)
            click.echo(_format_model_list(ranked, vram))

            answer = click.prompt("Select model", default="1")
            picked = ranked[0]  # fallback for invalid / out-of-range input
            try:
                pos = int(answer) - 1
            except ValueError:
                pos = -1
            if 0 <= pos < len(ranked):
                picked = ranked[pos]

            click.echo(f"Using: {picked.name}")
            return (picked.name, openai_url)
        finally:
            await client.close()

    return _asyncio.run(_setup())
|
|
196
|
+
|
|
197
|
+
|
|
198
|
+
def _format_model_list(
|
|
199
|
+
models: list,
|
|
200
|
+
vram_gb: float | None,
|
|
201
|
+
) -> str:
|
|
202
|
+
"""Format models as a numbered list with VRAM annotations."""
|
|
203
|
+
lines = ["\nAvailable Ollama models:\n"]
|
|
204
|
+
|
|
205
|
+
for i, model in enumerate(models, 1):
|
|
206
|
+
size_str = f"~{model.estimated_vram_gb:.0f}GB"
|
|
207
|
+
prefix = " "
|
|
208
|
+
suffix = ""
|
|
209
|
+
|
|
210
|
+
if vram_gb is not None:
|
|
211
|
+
if model.is_recommended(vram_gb):
|
|
212
|
+
prefix = "★ "
|
|
213
|
+
suffix = " Recommended"
|
|
214
|
+
elif not model.fits_in_vram(vram_gb):
|
|
215
|
+
suffix = " ⚠️ May exceed available VRAM"
|
|
216
|
+
|
|
217
|
+
lines.append(f" {prefix}{i}) {model.name:<20s} ({size_str}){suffix}")
|
|
218
|
+
|
|
219
|
+
lines.append("")
|
|
220
|
+
return "\n".join(lines)
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
"""Computer use — GUI automation for llm-code."""
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
def is_available() -> bool:
    """Return True if pyautogui and Pillow are importable."""
    try:
        import PIL  # noqa: F401
        import pyautogui  # noqa: F401
    except ImportError:
        return False
    return True
|
|
@@ -0,0 +1,49 @@
|
|
|
1
|
+
"""Detect the frontmost application on macOS."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import asyncio
|
|
5
|
+
import subprocess
|
|
6
|
+
from dataclasses import dataclass
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
@dataclass(frozen=True)
class AppInfo:
    """Information about a running application."""

    # Display name of the application, as reported by System Events.
    name: str
    # macOS bundle identifier; empty string when unknown.
    bundle_id: str
    # Unix process id; 0 when unknown.
    pid: int
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def _get_via_osascript() -> AppInfo:
    """Use osascript to get frontmost app info.

    Runs a small AppleScript that reports the frontmost process as a single
    "name|bundle_id|pid" line, then parses it into an AppInfo.

    Raises:
        RuntimeError: if osascript exits non-zero or its output cannot be
            split into at least three "|"-separated fields.
    """
    # NOTE(review): only the first `set fp ...` statement sits inside the
    # `tell application "System Events" to` form; the later `name of fp` etc.
    # rely on `fp` being a fully-qualified object reference — confirm this
    # resolves correctly on all supported macOS versions.
    script = (
        'tell application "System Events" to '
        'set fp to first process whose frontmost is true\n'
        'set n to name of fp\n'
        'set b to bundle identifier of fp\n'
        'set p to unix id of fp\n'
        'return n & "|" & b & "|" & (p as text)'
    )
    result = subprocess.run(
        ["osascript", "-e", script],
        capture_output=True, text=True, timeout=5,
    )
    if result.returncode != 0:
        raise RuntimeError(f"osascript failed: {result.stderr}")
    # NOTE(review): only the first three "|"-separated fields are used; an app
    # name containing "|" would shift the fields — presumed rare, verify.
    parts = result.stdout.strip().split("|")
    if len(parts) < 3:
        raise RuntimeError(f"Unexpected osascript output: {result.stdout}")
    return AppInfo(name=parts[0], bundle_id=parts[1], pid=int(parts[2]))
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
def get_frontmost_app_sync() -> AppInfo:
    """Get frontmost app, with fallback to Unknown on any error.

    Never raises: any failure (osascript missing, timeout, parse error)
    yields a placeholder AppInfo with name "Unknown".
    """
    try:
        info = _get_via_osascript()
    except Exception:
        info = AppInfo(name="Unknown", bundle_id="", pid=0)
    return info
|
|
45
|
+
|
|
46
|
+
|
|
47
|
+
async def get_frontmost_app() -> AppInfo:
    """Async wrapper for get_frontmost_app_sync (runs it in a worker thread)."""
    info = await asyncio.to_thread(get_frontmost_app_sync)
    return info
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
"""App-aware tier classification and permission enforcement for computer use."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import fnmatch
|
|
5
|
+
from dataclasses import dataclass
|
|
6
|
+
|
|
7
|
+
from llm_code.computer_use.app_detect import AppInfo
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
@dataclass(frozen=True)
class AppTierRule:
    """Maps a bundle_id glob pattern to a tier."""

    # fnmatch-style glob matched against AppInfo.bundle_id.
    pattern: str
    # Tier granted when the pattern matches (a key of TIER_PERMISSIONS).
    tier: str
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
# Built-in bundle-id rules: browsers are limited to the "read" tier,
# terminals and IDEs to "click". Anything unmatched falls through to
# "full" (see AppTierClassifier.classify).
DEFAULT_RULES: tuple[AppTierRule, ...] = (
    AppTierRule("com.apple.Safari*", "read"),
    AppTierRule("com.google.Chrome*", "read"),
    AppTierRule("org.mozilla.firefox*", "read"),
    AppTierRule("company.thebrowser.Browser*", "read"),
    AppTierRule("com.microsoft.edgemac*", "read"),
    AppTierRule("com.apple.Terminal*", "click"),
    AppTierRule("com.googlecode.iterm2*", "click"),
    AppTierRule("com.microsoft.VSCode*", "click"),
    AppTierRule("com.jetbrains.*", "click"),
)
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
# Action names permitted at each tier; consulted by the coordinator before
# any GUI action is performed. "read" allows observation only, "click" adds
# pointer actions, "full" adds keyboard input and dragging.
TIER_PERMISSIONS: dict[str, frozenset[str]] = {
    "read": frozenset({"screenshot", "get_frontmost_app"}),
    "click": frozenset({"screenshot", "get_frontmost_app", "left_click", "scroll"}),
    "full": frozenset({
        "screenshot", "get_frontmost_app", "left_click", "right_click",
        "double_click", "drag", "scroll", "type", "key", "hotkey",
    }),
}
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
class AppTierDenied(Exception):
    """Raised when an action is not permitted for the frontmost app's tier."""

    def __init__(self, app: str, tier: str, action: str, hint: str = "") -> None:
        self.app = app
        self.tier = tier
        self.action = action
        self.hint = hint
        message = f"Action '{action}' denied for app '{app}' (tier='{tier}'). {hint}"
        super().__init__(message)
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
@dataclass(frozen=True)
class AppTierClassifier:
    """Resolves an application to a permission tier via glob rules."""

    # Ordered rules; the first matching pattern wins.
    rules: tuple[AppTierRule, ...]

    def classify(self, app: AppInfo) -> str:
        """Return the tier for *app*; unmatched apps default to "full"."""
        matched = next(
            (rule.tier for rule in self.rules
             if fnmatch.fnmatch(app.bundle_id, rule.pattern)),
            None,
        )
        return "full" if matched is None else matched
|
|
@@ -0,0 +1,99 @@
|
|
|
1
|
+
"""Coordinator that composes screenshot + input for tool actions."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import time
|
|
5
|
+
from typing import TYPE_CHECKING
|
|
6
|
+
|
|
7
|
+
if TYPE_CHECKING:
|
|
8
|
+
from llm_code.runtime.config import ComputerUseConfig
|
|
9
|
+
|
|
10
|
+
from llm_code.computer_use.app_detect import get_frontmost_app_sync
|
|
11
|
+
from llm_code.computer_use.app_tier import (
|
|
12
|
+
DEFAULT_RULES,
|
|
13
|
+
TIER_PERMISSIONS,
|
|
14
|
+
AppTierClassifier,
|
|
15
|
+
AppTierDenied,
|
|
16
|
+
AppTierRule,
|
|
17
|
+
)
|
|
18
|
+
from llm_code.computer_use.input_control import (
|
|
19
|
+
keyboard_hotkey,
|
|
20
|
+
keyboard_type,
|
|
21
|
+
mouse_click,
|
|
22
|
+
mouse_drag,
|
|
23
|
+
scroll,
|
|
24
|
+
)
|
|
25
|
+
from llm_code.computer_use.screenshot import take_screenshot_base64
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
class ComputerUseCoordinator:
    """Orchestrates GUI actions with follow-up screenshots and app-aware tier enforcement.

    Every public action:
      1. verifies computer use is enabled in config,
      2. checks the frontmost app's tier permits the requested action,
      3. performs the action,
      4. waits ``screenshot_delay`` seconds and returns a fresh screenshot.
    """

    def __init__(self, config: "ComputerUseConfig") -> None:
        self._config = config
        # User-configured tier rules take precedence over the built-in
        # defaults; malformed entries (non-dict or missing keys) are skipped.
        user_rules = tuple(
            AppTierRule(pattern=r["pattern"], tier=r["tier"])
            for r in self._config.app_tiers
            if isinstance(r, dict) and "pattern" in r and "tier" in r
        )
        self._classifier = AppTierClassifier(rules=user_rules + DEFAULT_RULES)

    def _ensure_enabled(self) -> None:
        """Raise RuntimeError unless computer use is enabled in config."""
        if not self._config.enabled:
            raise RuntimeError("Computer use is not enabled. Set computer_use.enabled=true in config.")

    def _check_tier(self, action: str) -> None:
        """Raise AppTierDenied if *action* is not allowed for the frontmost app.

        The hint steers the model toward a safer equivalent tool when the
        action is blocked (browser tools for "read" apps, Bash for terminals).
        """
        app = get_frontmost_app_sync()
        tier = self._classifier.classify(app)
        if action not in TIER_PERMISSIONS[tier]:
            hint = ""
            if tier == "read":
                hint = "Use MCP browser tools (chrome-devtools) instead."
            elif tier == "click" and action in ("type", "key", "hotkey"):
                hint = "Use the Bash tool instead for terminal input."
            raise AppTierDenied(app=app.name, tier=tier, action=action, hint=hint)

    def _delay_then_screenshot(self) -> str:
        """Sleep the configured delay (if any), then capture a base64 screenshot."""
        if self._config.screenshot_delay > 0:
            time.sleep(self._config.screenshot_delay)
        return take_screenshot_base64()

    def screenshot(self) -> dict:
        """Capture the screen without performing any input action."""
        self._ensure_enabled()
        self._check_tier("screenshot")
        img = self._delay_then_screenshot()
        return {"screenshot_base64": img}

    def click_and_observe(self, x: int, y: int, button: str = "left") -> dict:
        """Click at (x, y) with *button*, then return a follow-up screenshot."""
        self._ensure_enabled()
        # Bug fix: gate on the permission that matches the actual button.
        # Previously any button was checked against "left_click", so a right
        # click slipped through in "click"-tier apps that only permit
        # left_click (see TIER_PERMISSIONS).
        action = "left_click" if button == "left" else "right_click"
        self._check_tier(action)
        mouse_click(x, y, button=button)
        img = self._delay_then_screenshot()
        return {"action": "click", "x": x, "y": y, "button": button, "screenshot_base64": img}

    def type_and_observe(self, text: str) -> dict:
        """Type *text*, then return a follow-up screenshot."""
        self._ensure_enabled()
        self._check_tier("type")
        keyboard_type(text)
        img = self._delay_then_screenshot()
        return {"action": "type", "text": text, "screenshot_base64": img}

    def hotkey_and_observe(self, *keys: str) -> dict:
        """Press a key combination, then return a follow-up screenshot."""
        self._ensure_enabled()
        self._check_tier("hotkey")
        keyboard_hotkey(*keys)
        img = self._delay_then_screenshot()
        return {"action": "hotkey", "keys": list(keys), "screenshot_base64": img}

    def scroll_and_observe(self, clicks: int, x: int | None = None, y: int | None = None) -> dict:
        """Scroll the wheel (optionally at (x, y)), then return a screenshot."""
        self._ensure_enabled()
        self._check_tier("scroll")
        scroll(clicks, x=x, y=y)
        img = self._delay_then_screenshot()
        return {"action": "scroll", "clicks": clicks, "screenshot_base64": img}

    def drag_and_observe(self, start_x: int, start_y: int, offset_x: int, offset_y: int, duration: float = 0.5) -> dict:
        """Drag from (start_x, start_y) by (offset_x, offset_y), then screenshot."""
        self._ensure_enabled()
        self._check_tier("drag")
        mouse_drag(start_x, start_y, offset_x, offset_y, duration=duration)
        img = self._delay_then_screenshot()
        return {"action": "drag", "start_x": start_x, "start_y": start_y, "offset_x": offset_x, "offset_y": offset_y, "screenshot_base64": img}
|
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
"""Mouse and keyboard control via pyautogui (lazy import)."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
_DEFAULT_DELAY = 0.05  # seconds between synthetic input actions (50 ms)
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
def _get_pyautogui():
|
|
8
|
+
"""Lazy import pyautogui with clear error on missing dep."""
|
|
9
|
+
try:
|
|
10
|
+
import pyautogui
|
|
11
|
+
return pyautogui
|
|
12
|
+
except ImportError as exc:
|
|
13
|
+
raise RuntimeError(
|
|
14
|
+
"pyautogui is required for input control. "
|
|
15
|
+
"Install with: pip install llm-code[computer-use]"
|
|
16
|
+
) from exc
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
def mouse_move(x: int, y: int) -> None:
    """Move the mouse cursor to screen position (x, y)."""
    _get_pyautogui().moveTo(x, y, duration=_DEFAULT_DELAY)
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def mouse_click(x: int, y: int, button: str = "left") -> None:
    """Click at screen position (x, y) using the given mouse button."""
    _get_pyautogui().click(x, y, button=button)
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
def mouse_double_click(x: int, y: int) -> None:
    """Double-click at screen position (x, y)."""
    _get_pyautogui().doubleClick(x, y)
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
def mouse_drag(
    start_x: int,
    start_y: int,
    offset_x: int,
    offset_y: int,
    duration: float = 0.5,
    button: str = "left",
) -> None:
    """Drag from (start_x, start_y) by a relative (offset_x, offset_y).

    Positions the cursor first, then performs the relative drag while
    holding *button*.
    """
    gui = _get_pyautogui()
    gui.moveTo(start_x, start_y, duration=_DEFAULT_DELAY)
    gui.drag(offset_x, offset_y, duration=duration, button=button)
|
|
49
|
+
|
|
50
|
+
|
|
51
|
+
def keyboard_type(text: str) -> None:
    """Type *text* character by character with a small inter-key delay.

    Uses ``pyautogui.write`` — the current, documented name for the
    deprecated ``typewrite`` alias; behavior is identical.
    """
    pag = _get_pyautogui()
    pag.write(text, interval=_DEFAULT_DELAY)
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
def keyboard_hotkey(*keys: str) -> None:
    """Press a keyboard shortcut, e.g. ``keyboard_hotkey('ctrl', 'c')``."""
    _get_pyautogui().hotkey(*keys)
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
def scroll(clicks: int, x: int | None = None, y: int | None = None) -> None:
    """Scroll the mouse wheel (positive = up, negative = down).

    When x/y are given, scrolling happens at that screen position.
    """
    pag = _get_pyautogui()
    position = {name: value for name, value in (("x", x), ("y", y)) if value is not None}
    pag.scroll(clicks, **position)
|
|
@@ -0,0 +1,93 @@
|
|
|
1
|
+
"""Cross-platform screenshot capture."""
|
|
2
|
+
from __future__ import annotations
|
|
3
|
+
|
|
4
|
+
import base64
|
|
5
|
+
import platform
|
|
6
|
+
import subprocess
|
|
7
|
+
import tempfile
|
|
8
|
+
from pathlib import Path
|
|
9
|
+
from typing import Tuple
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
def take_screenshot(region: Tuple[int, int, int, int] | None = None) -> bytes:
    """Capture the screen and return raw PNG bytes.

    Args:
        region: Optional (x, y, width, height) crop region.

    Returns:
        PNG image bytes.

    Platform strategy:
        macOS -> screencapture CLI
        Linux -> scrot CLI
        Windows -> mss library (lazy import)
    """
    backends = {
        "Darwin": _capture_macos,
        "Linux": _capture_linux,
        "Windows": _capture_windows,
    }
    system = platform.system()
    capture = backends.get(system)
    if capture is None:
        raise RuntimeError(f"Unsupported platform for screenshots: {system}")
    return capture(region)
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
def take_screenshot_base64(region: Tuple[int, int, int, int] | None = None) -> str:
    """Capture the screen and return it as a base64-encoded PNG string."""
    png = take_screenshot(region)
    return base64.b64encode(png).decode("ascii")
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
def _capture_macos(region: Tuple[int, int, int, int] | None) -> bytes:
    """Capture the screen via the macOS ``screencapture`` CLI.

    Writes to a temporary PNG, reads it back, and always removes the temp
    file — previously the file leaked when screencapture failed or timed out.

    Raises:
        subprocess.CalledProcessError / subprocess.TimeoutExpired on failure.
    """
    with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
        tmp_path = Path(tmp.name)

    cmd = ["screencapture", "-x"]  # -x: do not play the shutter sound
    if region:
        x, y, w, h = region
        cmd.extend(["-R", f"{x},{y},{w},{h}"])
    cmd.append(str(tmp_path))

    try:
        subprocess.run(cmd, check=True, timeout=10)
        return tmp_path.read_bytes()
    finally:
        # Clean up even when screencapture fails or the read raises.
        tmp_path.unlink(missing_ok=True)
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
def _capture_linux(region: Tuple[int, int, int, int] | None) -> bytes:
    """Capture the screen via the Linux ``scrot`` CLI.

    Writes to a temporary PNG, reads it back, and always removes the temp
    file — previously the file leaked when scrot failed or timed out.

    Raises:
        subprocess.CalledProcessError / subprocess.TimeoutExpired on failure.
    """
    with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
        tmp_path = Path(tmp.name)

    cmd = ["scrot"]
    if region:
        x, y, w, h = region
        cmd.extend(["-a", f"{x},{y},{w},{h}"])  # -a: autoselect region
    cmd.append(str(tmp_path))

    try:
        subprocess.run(cmd, check=True, timeout=10)
        return tmp_path.read_bytes()
    finally:
        # Clean up even when scrot fails or the read raises.
        tmp_path.unlink(missing_ok=True)
|
|
74
|
+
|
|
75
|
+
|
|
76
|
+
def _capture_windows(region: Tuple[int, int, int, int] | None) -> bytes:
    """Capture the screen on Windows via the ``mss`` library (lazy import).

    Raises:
        RuntimeError: with install instructions when mss is missing.
    """
    try:
        import mss
        import mss.tools
    except ImportError as exc:
        raise RuntimeError(
            "mss is required for Windows screenshots. "
            "Install with: pip install llm-code[computer-use]"
        ) from exc

    with mss.mss() as grabber:
        if region:
            left, top, width, height = region
            bbox = {"top": top, "left": left, "width": width, "height": height}
        else:
            bbox = grabber.monitors[1]  # index 1 is the primary monitor in mss
        shot = grabber.grab(bbox)
        return mss.tools.to_png(shot.rgb, shot.size)
|