PyPI - hud-python - Versions diffs - 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl - Mend

hud-python 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (130)

hud/__init__.py +22 -22
hud/agents/__init__.py +13 -15
hud/agents/base.py +599 -599
hud/agents/claude.py +373 -373
hud/agents/langchain.py +261 -250
hud/agents/misc/__init__.py +7 -7
hud/agents/misc/response_agent.py +82 -80
hud/agents/openai.py +352 -352
hud/agents/openai_chat_generic.py +154 -154
hud/agents/tests/__init__.py +1 -1
hud/agents/tests/test_base.py +742 -742
hud/agents/tests/test_claude.py +324 -324
hud/agents/tests/test_client.py +363 -363
hud/agents/tests/test_openai.py +237 -237
hud/cli/__init__.py +617 -617
hud/cli/__main__.py +8 -8
hud/cli/analyze.py +371 -371
hud/cli/analyze_metadata.py +230 -230
hud/cli/build.py +498 -427
hud/cli/clone.py +185 -185
hud/cli/cursor.py +92 -92
hud/cli/debug.py +392 -392
hud/cli/docker_utils.py +83 -83
hud/cli/init.py +280 -281
hud/cli/interactive.py +353 -353
hud/cli/mcp_server.py +764 -756
hud/cli/pull.py +330 -336
hud/cli/push.py +404 -370
hud/cli/remote_runner.py +311 -311
hud/cli/runner.py +160 -160
hud/cli/tests/__init__.py +3 -3
hud/cli/tests/test_analyze.py +284 -284
hud/cli/tests/test_cli_init.py +265 -265
hud/cli/tests/test_cli_main.py +27 -27
hud/cli/tests/test_clone.py +142 -142
hud/cli/tests/test_cursor.py +253 -253
hud/cli/tests/test_debug.py +453 -453
hud/cli/tests/test_mcp_server.py +139 -139
hud/cli/tests/test_utils.py +388 -388
hud/cli/utils.py +263 -263
hud/clients/README.md +143 -143
hud/clients/__init__.py +16 -16
hud/clients/base.py +378 -379
hud/clients/fastmcp.py +222 -222
hud/clients/mcp_use.py +298 -278
hud/clients/tests/__init__.py +1 -1
hud/clients/tests/test_client_integration.py +111 -111
hud/clients/tests/test_fastmcp.py +342 -342
hud/clients/tests/test_protocol.py +188 -188
hud/clients/utils/__init__.py +1 -1
hud/clients/utils/retry_transport.py +160 -160
hud/datasets.py +327 -322
hud/misc/__init__.py +1 -1
hud/misc/claude_plays_pokemon.py +292 -292
hud/otel/__init__.py +35 -35
hud/otel/collector.py +142 -142
hud/otel/config.py +164 -164
hud/otel/context.py +536 -536
hud/otel/exporters.py +366 -366
hud/otel/instrumentation.py +97 -97
hud/otel/processors.py +118 -118
hud/otel/tests/__init__.py +1 -1
hud/otel/tests/test_processors.py +197 -197
hud/server/__init__.py +5 -5
hud/server/context.py +114 -114
hud/server/helper/__init__.py +5 -5
hud/server/low_level.py +132 -132
hud/server/server.py +170 -166
hud/server/tests/__init__.py +3 -3
hud/settings.py +73 -73
hud/shared/__init__.py +5 -5
hud/shared/exceptions.py +180 -180
hud/shared/requests.py +264 -264
hud/shared/tests/test_exceptions.py +157 -157
hud/shared/tests/test_requests.py +275 -275
hud/telemetry/__init__.py +25 -25
hud/telemetry/instrument.py +379 -379
hud/telemetry/job.py +309 -309
hud/telemetry/replay.py +74 -74
hud/telemetry/trace.py +83 -83
hud/tools/__init__.py +33 -33
hud/tools/base.py +365 -365
hud/tools/bash.py +161 -161
hud/tools/computer/__init__.py +15 -15
hud/tools/computer/anthropic.py +437 -437
hud/tools/computer/hud.py +376 -376
hud/tools/computer/openai.py +295 -295
hud/tools/computer/settings.py +82 -82
hud/tools/edit.py +314 -314
hud/tools/executors/__init__.py +30 -30
hud/tools/executors/base.py +539 -539
hud/tools/executors/pyautogui.py +621 -621
hud/tools/executors/tests/__init__.py +1 -1
hud/tools/executors/tests/test_base_executor.py +338 -338
hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
hud/tools/executors/xdo.py +511 -511
hud/tools/playwright.py +412 -412
hud/tools/tests/__init__.py +3 -3
hud/tools/tests/test_base.py +282 -282
hud/tools/tests/test_bash.py +158 -158
hud/tools/tests/test_bash_extended.py +197 -197
hud/tools/tests/test_computer.py +425 -425
hud/tools/tests/test_computer_actions.py +34 -34
hud/tools/tests/test_edit.py +259 -259
hud/tools/tests/test_init.py +27 -27
hud/tools/tests/test_playwright_tool.py +183 -183
hud/tools/tests/test_tools.py +145 -145
hud/tools/tests/test_utils.py +156 -156
hud/tools/types.py +72 -72
hud/tools/utils.py +50 -50
hud/types.py +136 -136
hud/utils/__init__.py +10 -10
hud/utils/async_utils.py +65 -65
hud/utils/design.py +236 -168
hud/utils/mcp.py +55 -55
hud/utils/progress.py +149 -149
hud/utils/telemetry.py +66 -66
hud/utils/tests/test_async_utils.py +173 -173
hud/utils/tests/test_init.py +17 -17
hud/utils/tests/test_progress.py +261 -261
hud/utils/tests/test_telemetry.py +82 -82
hud/utils/tests/test_version.py +8 -8
hud/version.py +7 -7
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/METADATA +10 -8
hud_python-0.4.3.dist-info/RECORD +131 -0
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/licenses/LICENSE +21 -21
hud/agents/art.py +0 -101
hud_python-0.4.1.dist-info/RECORD +0 -132
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/WHEEL +0 -0
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/entry_points.txt +0 -0

hud/cli/debug.py CHANGED Viewed

@@ -1,392 +1,392 @@
-"""Debug command implementation for MCP environments."""
-# ruff: noqa: G004
-from __future__ import annotations
-import asyncio
-import json
-import subprocess
-import threading
-import time
-from rich.console import Console
-from hud.clients import MCPClient
-from hud.utils.design import HUDDesign
-from .utils import CaptureLogger, Colors, analyze_error_for_hints
-console = Console()
-async def debug_mcp_stdio(command: list[str], logger: CaptureLogger, max_phase: int = 5) -> int:
-    """
-    Debug any stdio-based MCP server step by step.
-    Args:
-        command: Command and arguments to run the MCP server
-        logger: CaptureLogger instance for output
-        max_phase: Maximum phase to run (1-5, default 5 for all phases)
-    Returns:
-        Number of phases completed (0-5)
-    """
-    # Create design instance for initial output (before logger takes over)
-    if logger.print_output:
-        design = HUDDesign()
-        design.header("MCP Server Debugger", icon="🔍")
-        design.dim_info("Command:", " ".join(command))
-        design.dim_info("Time:", time.strftime("%Y-%m-%d %H:%M:%S"))
-        # Explain color coding using Rich formatting
-        design.info("\nColor Key:")
-        console.print("  [bold]■[/bold] Commands (bold)")
-        console.print("  [rgb(192,150,12)]■[/rgb(192,150,12)] STDIO (MCP protocol)")
-        console.print("  [dim]■[/dim] STDERR (server logs)")
-        console.print("  [green]■[/green] Success messages")
-        console.print("  [red]■[/red] Error messages")
-        console.print("  ■ Info messages")
-    phases_completed = 0
-    total_phases = 5
-    start_time = time.time()
-    # Phase 1: Basic Server Test
-    logger.phase(1, "Basic Server Startup Test")
-    try:
-        # Test if command runs at all
-        test_cmd = command + (["echo", "Server OK"] if "docker" in command[0] else [])
-        logger.command([*test_cmd[:3], "..."] if len(test_cmd) > 3 else test_cmd)
-        result = subprocess.run(  # noqa: S603, ASYNC221
-            command[:1],
-            capture_output=True,
-            text=True,
-            timeout=2,
-            encoding="utf-8",
-            errors="replace",
-        )
-        if result.returncode == 0 or "usage" in result.stderr.lower():
-            logger.success("Command executable found")
-            phases_completed = 1
-        else:
-            logger.error(f"Command failed with exit code {result.returncode}")
-            if result.stderr:
-                logger._log(
-                    f"Error output: {result.stderr}", Colors.RED if logger.print_output else ""
-                )
-                hint = analyze_error_for_hints(result.stderr)
-                if hint:
-                    logger.hint(hint)
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-        # Check if we should stop here
-        if max_phase <= 1:
-            logger.info(f"Stopping at phase {max_phase} as requested")
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-    except FileNotFoundError:
-        logger.error(f"Command not found: {command[0]}")
-        logger.hint("Ensure the command is installed and in PATH")
-        logger.progress_bar(phases_completed, total_phases)
-        return phases_completed
-    except Exception as e:
-        logger.error(f"Startup test failed: {e}")
-        logger.progress_bar(phases_completed, total_phases)
-        return phases_completed
-    # Phase 2: MCP Initialize Test
-    logger.phase(2, "MCP Server Initialize Test")
-    logger.info("STDIO is used for MCP protocol, STDERR for server logs")
-    init_request = {
-        "jsonrpc": "2.0",
-        "id": 1,
-        "method": "initialize",
-        "params": {
-            "protocolVersion": "2024-11-05",
-            "capabilities": {"roots": {"listChanged": True}},
-            "clientInfo": {"name": "DebugClient", "version": "1.0.0"},
-        },
-    }
-    try:
-        logger.command(command)
-        logger.stdio(f"Sending: {json.dumps(init_request)}")
-        proc = subprocess.Popen(  # noqa: S603, ASYNC220
-            command,
-            stdin=subprocess.PIPE,
-            stdout=subprocess.PIPE,
-            stderr=subprocess.PIPE,
-            text=True,
-            bufsize=1,
-            encoding="utf-8",
-            errors="replace",  # Replace invalid chars with � on Windows
-        )
-        # Ensure pipes are available
-        if proc.stdin is None or proc.stdout is None or proc.stderr is None:
-            raise RuntimeError("Failed to create subprocess pipes")
-        # Send initialize
-        proc.stdin.write(json.dumps(init_request) + "\n")
-        proc.stdin.flush()
-        # Collect stderr in background
-        stderr_lines = []
-        def read_stderr() -> None:
-            if proc.stderr is None:
-                return
-            for line in proc.stderr:
-                line = line.rstrip()
-                if line:
-                    logger.stderr(line)
-                    stderr_lines.append(line)
-        stderr_thread = threading.Thread(target=read_stderr)
-        stderr_thread.daemon = True
-        stderr_thread.start()
-        # Wait for response
-        response = None
-        start = time.time()
-        while time.time() - start < 15:
-            line = proc.stdout.readline()
-            if line:
-                try:
-                    response = json.loads(line)
-                    if response.get("id") == 1:
-                        logger.stdio(f"Received: {json.dumps(response)}")
-                        break
-                except Exception as e:
-                    logger.error(f"Failed to parse MCP response: {e}")
-                    continue
-        if response and "result" in response:
-            logger.success("MCP server initialized successfully")
-            server_info = response["result"].get("serverInfo", {})
-            logger.info(
-                f"Server: {server_info.get('name', 'Unknown')} v{server_info.get('version', '?')}"
-            )
-            # Show capabilities
-            caps = response["result"].get("capabilities", {})
-            if caps:
-                logger.info(f"Capabilities: {', '.join(caps.keys())}")
-            phases_completed = 2
-        else:
-            logger.error("No valid MCP response received")
-            # Analyze stderr for hints
-            if stderr_lines:
-                all_stderr = "\n".join(stderr_lines)
-                hint = analyze_error_for_hints(all_stderr)
-                if hint:
-                    logger.hint(hint)
-            else:
-                logger.hint("""MCP requires clean stdout. Ensure:
-   - All print() statements use file=sys.stderr
-   - Logging is configured to use stderr
-   - No libraries are printing to stdout""")
-            logger.progress_bar(phases_completed, total_phases)
-            proc.terminate()
-            try:
-                proc.wait(timeout=5)
-            except subprocess.TimeoutExpired:
-                proc.kill()
-                proc.wait()
-            return phases_completed
-        proc.terminate()
-        try:
-            proc.wait(timeout=5)
-        except subprocess.TimeoutExpired:
-            proc.kill()
-            proc.wait()
-        # Check if we should stop here
-        if phases_completed >= max_phase:
-            logger.info(f"Stopping at phase {max_phase} as requested")
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-    except Exception as e:
-        logger.error(f"MCP test failed: {e}")
-        hint = analyze_error_for_hints(str(e))
-        if hint:
-            logger.hint(hint)
-        logger.progress_bar(phases_completed, total_phases)
-        return phases_completed
-    # Phase 3: Tool Discovery
-    logger.phase(3, "MCP Tool Discovery Test")
-    client = None
-    try:
-        # Create MCP config for the command
-        mcp_config = {
-            "test": {"command": command[0], "args": command[1:] if len(command) > 1 else []}
-        }
-        logger.command(command)
-        logger.info("Creating MCP client via hud...")
-        client = MCPClient(mcp_config=mcp_config, verbose=False, auto_trace=False)
-        await client.initialize()
-        # Wait for initialization
-        logger.info("Waiting for server initialization...")
-        await asyncio.sleep(5)
-        # Get tools
-        tools = await client.list_tools()
-        if tools:
-            logger.success(f"Found {len(tools)} tools")
-            # Check for lifecycle tools
-            tool_names = [t.name for t in tools]
-            has_setup = "setup" in tool_names
-            has_evaluate = "evaluate" in tool_names
-            logger.info(
-                f"Lifecycle tools: setup={'✅' if has_setup else '❌'}, evaluate={'✅' if has_evaluate else '❌'}"  # noqa: E501
-            )
-            # Check for interaction tools
-            interaction_tools = [
-                name
-                for name in tool_names
-                if name in ["computer", "playwright", "click", "type", "interact", "move"]
-            ]
-            if interaction_tools:
-                logger.info(f"Interaction tools: {', '.join(interaction_tools)}")
-            # List all tools
-            logger.info(f"All tools: {', '.join(tool_names)}")
-            # Try to list resources
-            try:
-                resources = await client.list_resources()
-                if resources:
-                    logger.info(
-                        f"Found {len(resources)} resources: {', '.join(str(r.uri) for r in resources[:3])}..."  # noqa: E501
-                    )
-            except Exception as e:
-                logger.error(f"Failed to list resources: {e}")
-            phases_completed = 3
-        else:
-            logger.error("No tools found")
-            logger.hint("""No tools found. Ensure:
-   - @mcp.tool() decorator is used on functions
-   - Tools are registered before mcp.run()
-   - No import errors preventing tool registration""")
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-        # Check if we should stop here
-        if phases_completed >= max_phase:
-            logger.info(f"Stopping at phase {max_phase} as requested")
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-        # Phase 4: Remote Deployment Readiness
-        logger.phase(4, "Remote Deployment Readiness")
-        # Test if setup/evaluate exist
-        if "setup" in tool_names:
-            try:
-                logger.info("Testing setup tool...")
-                await client.call_tool(name="setup", arguments={})
-                logger.success("Setup tool responded")
-            except Exception as e:
-                logger.info(f"Setup tool test: {e}")
-        if "evaluate" in tool_names:
-            try:
-                logger.info("Testing evaluate tool...")
-                await client.call_tool(name="evaluate", arguments={})
-                logger.success("Evaluate tool responded")
-            except Exception as e:
-                logger.info(f"Evaluate tool test: {e}")
-        # Performance check
-        init_time = time.time() - start_time
-        logger.info(f"Total initialization time: {init_time:.2f}s")
-        if init_time > 30:
-            logger.error("Initialization took >30s - may be too slow")
-            logger.hint("Consider optimizing startup time")
-        phases_completed = 4
-        # Check if we should stop here
-        if phases_completed >= max_phase:
-            logger.info(f"Stopping at phase {max_phase} as requested")
-            logger.progress_bar(phases_completed, total_phases)
-            return phases_completed
-        # Phase 5: Concurrent Clients
-        logger.phase(5, "Concurrent Clients Testing")
-        concurrent_clients = []
-        try:
-            logger.info("Creating 3 concurrent MCP clients...")
-            for i in range(3):
-                client_config = {
-                    f"test_concurrent_{i}": {
-                        "command": command[0],
-                        "args": command[1:] if len(command) > 1 else [],
-                    }
-                }
-                concurrent_client = MCPClient(
-                    mcp_config=client_config, verbose=False, auto_trace=False
-                )
-                await concurrent_client.initialize()
-                concurrent_clients.append(concurrent_client)
-                logger.info(f"Client {i + 1} connected")
-            logger.success("All concurrent clients connected")
-            # Clean shutdown
-            for i, c in enumerate(concurrent_clients):
-                await c.shutdown()
-                logger.info(f"Client {i + 1} disconnected")
-            phases_completed = 5
-        except Exception as e:
-            logger.error(f"Concurrent test failed: {e}")
-        finally:
-            for c in concurrent_clients:
-                try:
-                    await c.shutdown()
-                except Exception as e:
-                    logger.error(f"Failed to close client: {e}")
-    except Exception as e:
-        logger.error(f"Tool discovery failed: {e}")
-        logger.progress_bar(phases_completed, total_phases)
-        return phases_completed
-    finally:
-        # Ensure client is closed even on exceptions
-        if client:
-            try:
-                await client.shutdown()
-            except Exception:
-                logger.error("Failed to close client")
-    logger.progress_bar(phases_completed, total_phases)
-    return phases_completed
+"""Debug command implementation for MCP environments."""
+# ruff: noqa: G004
+from __future__ import annotations
+import asyncio
+import json
+import subprocess
+import threading
+import time
+from rich.console import Console
+from hud.clients import MCPClient
+from hud.utils.design import HUDDesign
+from .utils import CaptureLogger, Colors, analyze_error_for_hints
+console = Console()
+async def debug_mcp_stdio(command: list[str], logger: CaptureLogger, max_phase: int = 5) -> int:
+    """
+    Debug any stdio-based MCP server step by step.
+    Args:
+        command: Command and arguments to run the MCP server
+        logger: CaptureLogger instance for output
+        max_phase: Maximum phase to run (1-5, default 5 for all phases)
+    Returns:
+        Number of phases completed (0-5)
+    """
+    # Create design instance for initial output (before logger takes over)
+    if logger.print_output:
+        design = HUDDesign()
+        design.header("MCP Server Debugger", icon="🔍")
+        design.dim_info("Command:", " ".join(command))
+        design.dim_info("Time:", time.strftime("%Y-%m-%d %H:%M:%S"))
+        # Explain color coding using Rich formatting
+        design.info("\nColor Key:")
+        console.print("  [bold]■[/bold] Commands (bold)")
+        console.print("  [rgb(192,150,12)]■[/rgb(192,150,12)] STDIO (MCP protocol)")
+        console.print("  [dim]■[/dim] STDERR (server logs)")
+        console.print("  [green]■[/green] Success messages")
+        console.print("  [red]■[/red] Error messages")
+        console.print("  ■ Info messages")
+    phases_completed = 0
+    total_phases = 5
+    start_time = time.time()
+    # Phase 1: Basic Server Test
+    logger.phase(1, "Basic Server Startup Test")
+    try:
+        # Test if command runs at all
+        test_cmd = command + (["echo", "Server OK"] if "docker" in command[0] else [])
+        logger.command([*test_cmd[:3], "..."] if len(test_cmd) > 3 else test_cmd)
+        result = subprocess.run(  # noqa: S603, ASYNC221
+            command[:1],
+            capture_output=True,
+            text=True,
+            timeout=2,
+            encoding="utf-8",
+            errors="replace",
+        )
+        if result.returncode == 0 or "usage" in result.stderr.lower():
+            logger.success("Command executable found")
+            phases_completed = 1
+        else:
+            logger.error(f"Command failed with exit code {result.returncode}")
+            if result.stderr:
+                logger._log(
+                    f"Error output: {result.stderr}", Colors.RED if logger.print_output else ""
+                )
+                hint = analyze_error_for_hints(result.stderr)
+                if hint:
+                    logger.hint(hint)
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+        # Check if we should stop here
+        if max_phase <= 1:
+            logger.info(f"Stopping at phase {max_phase} as requested")
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+    except FileNotFoundError:
+        logger.error(f"Command not found: {command[0]}")
+        logger.hint("Ensure the command is installed and in PATH")
+        logger.progress_bar(phases_completed, total_phases)
+        return phases_completed
+    except Exception as e:
+        logger.error(f"Startup test failed: {e}")
+        logger.progress_bar(phases_completed, total_phases)
+        return phases_completed
+    # Phase 2: MCP Initialize Test
+    logger.phase(2, "MCP Server Initialize Test")
+    logger.info("STDIO is used for MCP protocol, STDERR for server logs")
+    init_request = {
+        "jsonrpc": "2.0",
+        "id": 1,
+        "method": "initialize",
+        "params": {
+            "protocolVersion": "2024-11-05",
+            "capabilities": {"roots": {"listChanged": True}},
+            "clientInfo": {"name": "DebugClient", "version": "1.0.0"},
+        },
+    }
+    try:
+        logger.command(command)
+        logger.stdio(f"Sending: {json.dumps(init_request)}")
+        proc = subprocess.Popen(  # noqa: S603, ASYNC220
+            command,
+            stdin=subprocess.PIPE,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            text=True,
+            bufsize=1,
+            encoding="utf-8",
+            errors="replace",  # Replace invalid chars with � on Windows
+        )
+        # Ensure pipes are available
+        if proc.stdin is None or proc.stdout is None or proc.stderr is None:
+            raise RuntimeError("Failed to create subprocess pipes")
+        # Send initialize
+        proc.stdin.write(json.dumps(init_request) + "\n")
+        proc.stdin.flush()
+        # Collect stderr in background
+        stderr_lines = []
+        def read_stderr() -> None:
+            if proc.stderr is None:
+                return
+            for line in proc.stderr:
+                line = line.rstrip()
+                if line:
+                    logger.stderr(line)
+                    stderr_lines.append(line)
+        stderr_thread = threading.Thread(target=read_stderr)
+        stderr_thread.daemon = True
+        stderr_thread.start()
+        # Wait for response
+        response = None
+        start = time.time()
+        while time.time() - start < 15:
+            line = proc.stdout.readline()
+            if line:
+                try:
+                    response = json.loads(line)
+                    if response.get("id") == 1:
+                        logger.stdio(f"Received: {json.dumps(response)}")
+                        break
+                except Exception as e:
+                    logger.error(f"Failed to parse MCP response: {e}")
+                    continue
+        if response and "result" in response:
+            logger.success("MCP server initialized successfully")
+            server_info = response["result"].get("serverInfo", {})
+            logger.info(
+                f"Server: {server_info.get('name', 'Unknown')} v{server_info.get('version', '?')}"
+            )
+            # Show capabilities
+            caps = response["result"].get("capabilities", {})
+            if caps:
+                logger.info(f"Capabilities: {', '.join(caps.keys())}")
+            phases_completed = 2
+        else:
+            logger.error("No valid MCP response received")
+            # Analyze stderr for hints
+            if stderr_lines:
+                all_stderr = "\n".join(stderr_lines)
+                hint = analyze_error_for_hints(all_stderr)
+                if hint:
+                    logger.hint(hint)
+            else:
+                logger.hint("""MCP requires clean stdout. Ensure:
+   - All print() statements use file=sys.stderr
+   - Logging is configured to use stderr
+   - No libraries are printing to stdout""")
+            logger.progress_bar(phases_completed, total_phases)
+            proc.terminate()
+            try:
+                proc.wait(timeout=5)
+            except subprocess.TimeoutExpired:
+                proc.kill()
+                proc.wait()
+            return phases_completed
+        proc.terminate()
+        try:
+            proc.wait(timeout=5)
+        except subprocess.TimeoutExpired:
+            proc.kill()
+            proc.wait()
+        # Check if we should stop here
+        if phases_completed >= max_phase:
+            logger.info(f"Stopping at phase {max_phase} as requested")
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+    except Exception as e:
+        logger.error(f"MCP test failed: {e}")
+        hint = analyze_error_for_hints(str(e))
+        if hint:
+            logger.hint(hint)
+        logger.progress_bar(phases_completed, total_phases)
+        return phases_completed
+    # Phase 3: Tool Discovery
+    logger.phase(3, "MCP Tool Discovery Test")
+    client = None
+    try:
+        # Create MCP config for the command
+        mcp_config = {
+            "test": {"command": command[0], "args": command[1:] if len(command) > 1 else []}
+        }
+        logger.command(command)
+        logger.info("Creating MCP client via hud...")
+        client = MCPClient(mcp_config=mcp_config, verbose=False, auto_trace=False)
+        await client.initialize()
+        # Wait for initialization
+        logger.info("Waiting for server initialization...")
+        await asyncio.sleep(5)
+        # Get tools
+        tools = await client.list_tools()
+        if tools:
+            logger.success(f"Found {len(tools)} tools")
+            # Check for lifecycle tools
+            tool_names = [t.name for t in tools]
+            has_setup = "setup" in tool_names
+            has_evaluate = "evaluate" in tool_names
+            logger.info(
+                f"Lifecycle tools: setup={'✅' if has_setup else '❌'}, evaluate={'✅' if has_evaluate else '❌'}"  # noqa: E501
+            )
+            # Check for interaction tools
+            interaction_tools = [
+                name
+                for name in tool_names
+                if name in ["computer", "playwright", "click", "type", "interact", "move"]
+            ]
+            if interaction_tools:
+                logger.info(f"Interaction tools: {', '.join(interaction_tools)}")
+            # List all tools
+            logger.info(f"All tools: {', '.join(tool_names)}")
+            # Try to list resources
+            try:
+                resources = await client.list_resources()
+                if resources:
+                    logger.info(
+                        f"Found {len(resources)} resources: {', '.join(str(r.uri) for r in resources[:3])}..."  # noqa: E501
+                    )
+            except Exception as e:
+                logger.error(f"Failed to list resources: {e}")
+            phases_completed = 3
+        else:
+            logger.error("No tools found")
+            logger.hint("""No tools found. Ensure:
+   - @mcp.tool() decorator is used on functions
+   - Tools are registered before mcp.run()
+   - No import errors preventing tool registration""")
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+        # Check if we should stop here
+        if phases_completed >= max_phase:
+            logger.info(f"Stopping at phase {max_phase} as requested")
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+        # Phase 4: Remote Deployment Readiness
+        logger.phase(4, "Remote Deployment Readiness")
+        # Test if setup/evaluate exist
+        if "setup" in tool_names:
+            try:
+                logger.info("Testing setup tool...")
+                await client.call_tool(name="setup", arguments={})
+                logger.success("Setup tool responded")
+            except Exception as e:
+                logger.info(f"Setup tool test: {e}")
+        if "evaluate" in tool_names:
+            try:
+                logger.info("Testing evaluate tool...")
+                await client.call_tool(name="evaluate", arguments={})
+                logger.success("Evaluate tool responded")
+            except Exception as e:
+                logger.info(f"Evaluate tool test: {e}")
+        # Performance check
+        init_time = time.time() - start_time
+        logger.info(f"Total initialization time: {init_time:.2f}s")
+        if init_time > 30:
+            logger.error("Initialization took >30s - may be too slow")
+            logger.hint("Consider optimizing startup time")
+        phases_completed = 4
+        # Check if we should stop here
+        if phases_completed >= max_phase:
+            logger.info(f"Stopping at phase {max_phase} as requested")
+            logger.progress_bar(phases_completed, total_phases)
+            return phases_completed
+        # Phase 5: Concurrent Clients
+        logger.phase(5, "Concurrent Clients Testing")
+        concurrent_clients = []
+        try:
+            logger.info("Creating 3 concurrent MCP clients...")
+            for i in range(3):
+                client_config = {
+                    f"test_concurrent_{i}": {
+                        "command": command[0],
+                        "args": command[1:] if len(command) > 1 else [],
+                    }
+                }
+                concurrent_client = MCPClient(
+                    mcp_config=client_config, verbose=False, auto_trace=False
+                )
+                await concurrent_client.initialize()
+                concurrent_clients.append(concurrent_client)
+                logger.info(f"Client {i + 1} connected")
+            logger.success("All concurrent clients connected")
+            # Clean shutdown
+            for i, c in enumerate(concurrent_clients):
+                await c.shutdown()
+                logger.info(f"Client {i + 1} disconnected")
+            phases_completed = 5
+        except Exception as e:
+            logger.error(f"Concurrent test failed: {e}")
+        finally:
+            for c in concurrent_clients:
+                try:
+                    await c.shutdown()
+                except Exception as e:
+                    logger.error(f"Failed to close client: {e}")
+    except Exception as e:
+        logger.error(f"Tool discovery failed: {e}")
+        logger.progress_bar(phases_completed, total_phases)
+        return phases_completed
+    finally:
+        # Ensure client is closed even on exceptions
+        if client:
+            try:
+                await client.shutdown()
+            except Exception:
+                logger.error("Failed to close client")
+    logger.progress_bar(phases_completed, total_phases)
+    return phases_completed

hud-python 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl

Potentially problematic release.

hud-python 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl