PyPI - hud-python - Versions diffs - 0.4.45__py3-none-any.whl → 0.5.1__py3-none-any.whl - Mend

hud-python 0.4.45__py3-none-any.whl → 0.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (274) hide show

hud/__init__.py +27 -7
hud/agents/__init__.py +11 -5
hud/agents/base.py +220 -500
hud/agents/claude.py +200 -240
hud/agents/gemini.py +275 -0
hud/agents/gemini_cua.py +335 -0
hud/agents/grounded_openai.py +98 -100
hud/agents/misc/integration_test_agent.py +51 -20
hud/agents/misc/response_agent.py +41 -36
hud/agents/openai.py +291 -292
hud/agents/{openai_chat_generic.py → openai_chat.py} +80 -34
hud/agents/operator.py +211 -0
hud/agents/tests/conftest.py +133 -0
hud/agents/tests/test_base.py +300 -622
hud/agents/tests/test_base_runtime.py +233 -0
hud/agents/tests/test_claude.py +379 -210
hud/agents/tests/test_client.py +9 -10
hud/agents/tests/test_gemini.py +369 -0
hud/agents/tests/test_grounded_openai_agent.py +65 -50
hud/agents/tests/test_openai.py +376 -140
hud/agents/tests/test_operator.py +362 -0
hud/agents/tests/test_run_eval.py +179 -0
hud/cli/__init__.py +461 -545
hud/cli/analyze.py +43 -5
hud/cli/build.py +664 -110
hud/cli/debug.py +8 -5
hud/cli/dev.py +882 -734
hud/cli/eval.py +782 -668
hud/cli/flows/dev.py +167 -0
hud/cli/flows/init.py +191 -0
hud/cli/flows/tasks.py +153 -56
hud/cli/flows/templates.py +151 -0
hud/cli/flows/tests/__init__.py +1 -0
hud/cli/flows/tests/test_dev.py +126 -0
hud/cli/init.py +60 -58
hud/cli/push.py +29 -11
hud/cli/rft.py +311 -0
hud/cli/rft_status.py +145 -0
hud/cli/tests/test_analyze.py +5 -5
hud/cli/tests/test_analyze_metadata.py +3 -2
hud/cli/tests/test_analyze_module.py +120 -0
hud/cli/tests/test_build.py +108 -6
hud/cli/tests/test_build_failure.py +41 -0
hud/cli/tests/test_build_module.py +50 -0
hud/cli/tests/test_cli_init.py +6 -1
hud/cli/tests/test_cli_more_wrappers.py +30 -0
hud/cli/tests/test_cli_root.py +140 -0
hud/cli/tests/test_convert.py +361 -0
hud/cli/tests/test_debug.py +12 -10
hud/cli/tests/test_dev.py +197 -0
hud/cli/tests/test_eval.py +251 -0
hud/cli/tests/test_eval_bedrock.py +51 -0
hud/cli/tests/test_init.py +124 -0
hud/cli/tests/test_main_module.py +11 -5
hud/cli/tests/test_mcp_server.py +12 -100
hud/cli/tests/test_push_happy.py +74 -0
hud/cli/tests/test_push_wrapper.py +23 -0
hud/cli/tests/test_registry.py +1 -1
hud/cli/tests/test_utils.py +1 -1
hud/cli/{rl → utils}/celebrate.py +14 -12
hud/cli/utils/config.py +18 -1
hud/cli/utils/docker.py +130 -4
hud/cli/utils/env_check.py +9 -9
hud/cli/utils/git.py +136 -0
hud/cli/utils/interactive.py +39 -5
hud/cli/utils/metadata.py +69 -0
hud/cli/utils/runner.py +1 -1
hud/cli/utils/server.py +2 -2
hud/cli/utils/source_hash.py +3 -3
hud/cli/utils/tasks.py +4 -1
hud/cli/utils/tests/__init__.py +0 -0
hud/cli/utils/tests/test_config.py +58 -0
hud/cli/utils/tests/test_docker.py +93 -0
hud/cli/utils/tests/test_docker_hints.py +71 -0
hud/cli/utils/tests/test_env_check.py +74 -0
hud/cli/utils/tests/test_environment.py +42 -0
hud/cli/utils/tests/test_git.py +142 -0
hud/cli/utils/tests/test_interactive_module.py +60 -0
hud/cli/utils/tests/test_local_runner.py +50 -0
hud/cli/utils/tests/test_logging_utils.py +23 -0
hud/cli/utils/tests/test_metadata.py +49 -0
hud/cli/utils/tests/test_package_runner.py +35 -0
hud/cli/utils/tests/test_registry_utils.py +49 -0
hud/cli/utils/tests/test_remote_runner.py +25 -0
hud/cli/utils/tests/test_runner_modules.py +52 -0
hud/cli/utils/tests/test_source_hash.py +36 -0
hud/cli/utils/tests/test_tasks.py +80 -0
hud/cli/utils/version_check.py +258 -0
hud/cli/{rl → utils}/viewer.py +2 -2
hud/clients/README.md +12 -11
hud/clients/__init__.py +4 -3
hud/clients/base.py +166 -26
hud/clients/environment.py +51 -0
hud/clients/fastmcp.py +13 -6
hud/clients/mcp_use.py +40 -15
hud/clients/tests/test_analyze_scenarios.py +206 -0
hud/clients/tests/test_protocol.py +9 -3
hud/datasets/__init__.py +23 -20
hud/datasets/loader.py +327 -0
hud/datasets/runner.py +192 -105
hud/datasets/tests/__init__.py +0 -0
hud/datasets/tests/test_loader.py +221 -0
hud/datasets/tests/test_utils.py +315 -0
hud/datasets/utils.py +270 -90
hud/environment/__init__.py +50 -0
hud/environment/connection.py +206 -0
hud/environment/connectors/__init__.py +33 -0
hud/environment/connectors/base.py +68 -0
hud/environment/connectors/local.py +177 -0
hud/environment/connectors/mcp_config.py +109 -0
hud/environment/connectors/openai.py +101 -0
hud/environment/connectors/remote.py +172 -0
hud/environment/environment.py +694 -0
hud/environment/integrations/__init__.py +45 -0
hud/environment/integrations/adk.py +67 -0
hud/environment/integrations/anthropic.py +196 -0
hud/environment/integrations/gemini.py +92 -0
hud/environment/integrations/langchain.py +82 -0
hud/environment/integrations/llamaindex.py +68 -0
hud/environment/integrations/openai.py +238 -0
hud/environment/mock.py +306 -0
hud/environment/router.py +112 -0
hud/environment/scenarios.py +493 -0
hud/environment/tests/__init__.py +1 -0
hud/environment/tests/test_connection.py +317 -0
hud/environment/tests/test_connectors.py +218 -0
hud/environment/tests/test_environment.py +161 -0
hud/environment/tests/test_integrations.py +257 -0
hud/environment/tests/test_local_connectors.py +201 -0
hud/environment/tests/test_scenarios.py +280 -0
hud/environment/tests/test_tools.py +208 -0
hud/environment/types.py +23 -0
hud/environment/utils/__init__.py +35 -0
hud/environment/utils/formats.py +215 -0
hud/environment/utils/schema.py +171 -0
hud/environment/utils/tool_wrappers.py +113 -0
hud/eval/__init__.py +67 -0
hud/eval/context.py +674 -0
hud/eval/display.py +299 -0
hud/eval/instrument.py +185 -0
hud/eval/manager.py +466 -0
hud/eval/parallel.py +268 -0
hud/eval/task.py +340 -0
hud/eval/tests/__init__.py +1 -0
hud/eval/tests/test_context.py +178 -0
hud/eval/tests/test_eval.py +210 -0
hud/eval/tests/test_manager.py +152 -0
hud/eval/tests/test_parallel.py +168 -0
hud/eval/tests/test_task.py +145 -0
hud/eval/types.py +63 -0
hud/eval/utils.py +183 -0
hud/patches/__init__.py +19 -0
hud/patches/mcp_patches.py +151 -0
hud/patches/warnings.py +54 -0
hud/samples/browser.py +4 -4
hud/server/__init__.py +2 -1
hud/server/low_level.py +2 -1
hud/server/router.py +164 -0
hud/server/server.py +567 -80
hud/server/tests/test_mcp_server_integration.py +11 -11
hud/server/tests/test_mcp_server_more.py +1 -1
hud/server/tests/test_server_extra.py +2 -0
hud/settings.py +45 -3
hud/shared/exceptions.py +36 -10
hud/shared/hints.py +26 -1
hud/shared/requests.py +15 -3
hud/shared/tests/test_exceptions.py +40 -31
hud/shared/tests/test_hints.py +167 -0
hud/telemetry/__init__.py +20 -19
hud/telemetry/exporter.py +201 -0
hud/telemetry/instrument.py +158 -253
hud/telemetry/tests/test_eval_telemetry.py +356 -0
hud/telemetry/tests/test_exporter.py +258 -0
hud/telemetry/tests/test_instrument.py +401 -0
hud/tools/__init__.py +16 -2
hud/tools/apply_patch.py +639 -0
hud/tools/base.py +54 -4
hud/tools/bash.py +2 -2
hud/tools/computer/__init__.py +4 -0
hud/tools/computer/anthropic.py +2 -2
hud/tools/computer/gemini.py +385 -0
hud/tools/computer/hud.py +23 -6
hud/tools/computer/openai.py +20 -21
hud/tools/computer/qwen.py +434 -0
hud/tools/computer/settings.py +37 -0
hud/tools/edit.py +3 -7
hud/tools/executors/base.py +4 -2
hud/tools/executors/pyautogui.py +1 -1
hud/tools/grounding/grounded_tool.py +13 -18
hud/tools/grounding/grounder.py +10 -31
hud/tools/grounding/tests/test_grounded_tool.py +26 -44
hud/tools/jupyter.py +330 -0
hud/tools/playwright.py +18 -3
hud/tools/shell.py +308 -0
hud/tools/tests/test_apply_patch.py +718 -0
hud/tools/tests/test_computer.py +4 -9
hud/tools/tests/test_computer_actions.py +24 -2
hud/tools/tests/test_jupyter_tool.py +181 -0
hud/tools/tests/test_shell.py +596 -0
hud/tools/tests/test_submit.py +85 -0
hud/tools/tests/test_types.py +193 -0
hud/tools/types.py +21 -1
hud/types.py +167 -57
hud/utils/__init__.py +2 -0
hud/utils/env.py +67 -0
hud/utils/hud_console.py +61 -3
hud/utils/mcp.py +15 -58
hud/utils/strict_schema.py +162 -0
hud/utils/tests/test_init.py +1 -2
hud/utils/tests/test_mcp.py +1 -28
hud/utils/tests/test_pretty_errors.py +186 -0
hud/utils/tests/test_tool_shorthand.py +154 -0
hud/utils/tests/test_version.py +1 -1
hud/utils/types.py +20 -0
hud/version.py +1 -1
hud_python-0.5.1.dist-info/METADATA +264 -0
hud_python-0.5.1.dist-info/RECORD +299 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.1.dist-info}/WHEEL +1 -1
hud/agents/langchain.py +0 -261
hud/agents/lite_llm.py +0 -72
hud/cli/rl/__init__.py +0 -180
hud/cli/rl/config.py +0 -101
hud/cli/rl/display.py +0 -133
hud/cli/rl/gpu.py +0 -63
hud/cli/rl/gpu_utils.py +0 -321
hud/cli/rl/local_runner.py +0 -595
hud/cli/rl/presets.py +0 -96
hud/cli/rl/remote_runner.py +0 -463
hud/cli/rl/rl_api.py +0 -150
hud/cli/rl/vllm.py +0 -177
hud/cli/rl/wait_utils.py +0 -89
hud/datasets/parallel.py +0 -687
hud/misc/__init__.py +0 -1
hud/misc/claude_plays_pokemon.py +0 -292
hud/otel/__init__.py +0 -35
hud/otel/collector.py +0 -142
hud/otel/config.py +0 -181
hud/otel/context.py +0 -570
hud/otel/exporters.py +0 -369
hud/otel/instrumentation.py +0 -135
hud/otel/processors.py +0 -121
hud/otel/tests/__init__.py +0 -1
hud/otel/tests/test_processors.py +0 -197
hud/rl/README.md +0 -30
hud/rl/__init__.py +0 -1
hud/rl/actor.py +0 -176
hud/rl/buffer.py +0 -405
hud/rl/chat_template.jinja +0 -101
hud/rl/config.py +0 -192
hud/rl/distributed.py +0 -132
hud/rl/learner.py +0 -637
hud/rl/tests/__init__.py +0 -1
hud/rl/tests/test_learner.py +0 -186
hud/rl/train.py +0 -382
hud/rl/types.py +0 -101
hud/rl/utils/start_vllm_server.sh +0 -30
hud/rl/utils.py +0 -524
hud/rl/vllm_adapter.py +0 -143
hud/telemetry/job.py +0 -352
hud/telemetry/replay.py +0 -74
hud/telemetry/tests/test_replay.py +0 -40
hud/telemetry/tests/test_trace.py +0 -63
hud/telemetry/trace.py +0 -158
hud/utils/agent_factories.py +0 -86
hud/utils/async_utils.py +0 -65
hud/utils/group_eval.py +0 -223
hud/utils/progress.py +0 -149
hud/utils/tasks.py +0 -127
hud/utils/tests/test_async_utils.py +0 -173
hud/utils/tests/test_progress.py +0 -261
hud_python-0.4.45.dist-info/METADATA +0 -552
hud_python-0.4.45.dist-info/RECORD +0 -228
{hud_python-0.4.45.dist-info → hud_python-0.5.1.dist-info}/entry_points.txt +0 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.1.dist-info}/licenses/LICENSE +0 -0

hud/cli/utils/version_check.py ADDED Viewed

@@ -0,0 +1,258 @@
+"""Version checking utilities for HUD CLI.
+This module handles checking for updates to the hud-python package
+and prompting users to upgrade when a new version is available.
+Features:
+- Checks PyPI for the latest version of hud-python
+- Caches results for 6 hours to avoid excessive API calls
+- Displays a friendly prompt when an update is available
+- Can be disabled with HUD_SKIP_VERSION_CHECK=1 environment variable
+The version check runs automatically at the start of most CLI commands,
+but is skipped for help and version commands to keep them fast.
+"""
+from __future__ import annotations
+import contextlib
+import json
+import logging
+import os
+import time
+from pathlib import Path
+from typing import NamedTuple
+import httpx
+from packaging import version
+from hud.utils.hud_console import HUDConsole
+# Logger for version checking
+logger = logging.getLogger(__name__)
+# Cache location for version check data
+CACHE_DIR = Path.home() / ".hud" / ".cache"
+VERSION_CACHE_FILE = CACHE_DIR / "version_check.json"
+# Cache duration in seconds (6 hours)
+CACHE_DURATION = 6 * 60 * 60
+# PyPI API URL for package info
+PYPI_URL = "https://pypi.org/pypi/hud-python/json"
+class VersionInfo(NamedTuple):
+    """Version information from PyPI."""
+    latest: str
+    current: str
+    is_outdated: bool
+    checked_at: float
+def _get_current_version() -> str:
+    """Get the currently installed version of hud-python."""
+    try:
+        from hud import __version__
+        return __version__
+    except ImportError:
+        return "unknown"
+def _fetch_latest_version() -> str | None:
+    """Fetch the latest version from PyPI.
+    Returns:
+        The latest version string, or None if the request fails.
+    """
+    try:
+        with httpx.Client(timeout=3.0) as client:
+            response = client.get(PYPI_URL)
+            if response.status_code == 200:
+                data = response.json()
+                return data["info"]["version"]
+    except Exception:  # noqa: S110
+        # Silently fail - we don't want to disrupt the user's workflow
+        # if PyPI is down or there's a network issue
+        pass
+    return None
+def _load_cache() -> VersionInfo | None:
+    """Load cached version information.
+    Returns:
+        Cached VersionInfo if valid, None otherwise.
+    """
+    if not VERSION_CACHE_FILE.exists():
+        return None
+    try:
+        with open(VERSION_CACHE_FILE) as f:
+            data = json.load(f)
+        # Check if cache is still valid
+        if time.time() - data["checked_at"] > CACHE_DURATION:
+            return None
+        return VersionInfo(
+            latest=data["latest"],
+            current=data["current"],
+            is_outdated=data["is_outdated"],
+            checked_at=data["checked_at"],
+        )
+    except Exception:
+        # If cache is corrupted, return None
+        return None
+def _save_cache(info: VersionInfo) -> None:
+    """Save version information to cache.
+    Args:
+        info: Version information to cache.
+    """
+    try:
+        # Create cache directory if it doesn't exist
+        CACHE_DIR.mkdir(parents=True, exist_ok=True)
+        with open(VERSION_CACHE_FILE, "w") as f:
+            json.dump(
+                {
+                    "latest": info.latest,
+                    "current": info.current,
+                    "is_outdated": info.is_outdated,
+                    "checked_at": info.checked_at,
+                },
+                f,
+            )
+    except Exception:  # noqa: S110
+        # Silently fail if we can't write cache
+        pass
+def _compare_versions(current: str, latest: str) -> bool:
+    """Compare versions to determine if an update is available.
+    Args:
+        current: Current version string
+        latest: Latest version string
+    Returns:
+        True if latest is newer than current, False otherwise.
+    """
+    if current == "unknown":
+        return False
+    try:
+        current_v = version.parse(current)
+        latest_v = version.parse(latest)
+        return latest_v > current_v
+    except Exception:
+        # If we can't parse versions, assume no update needed
+        return False
+def check_for_updates() -> VersionInfo | None:
+    """Check for updates to hud-python.
+    This function checks PyPI for the latest version and caches the result
+    for 6 hours to avoid excessive API calls.
+    Returns:
+        VersionInfo if check succeeds, None otherwise.
+    """
+    # Check if we're in CI/testing environment
+    if os.environ.get("CI") or os.environ.get("HUD_SKIP_VERSION_CHECK"):
+        return None
+    # Get current version first
+    current = _get_current_version()
+    if current == "unknown":
+        return None
+    # Try to load from cache
+    cached_info = _load_cache()
+    # If cache exists but current version has changed (user upgraded), invalidate cache
+    if cached_info and cached_info.current != current:
+        cached_info = None  # Force fresh check
+    if cached_info:
+        # Update the current version in the cached info to reflect reality
+        # but keep the cached latest version and timestamp
+        return VersionInfo(
+            latest=cached_info.latest,
+            current=current,  # Use actual current version, not cached
+            is_outdated=_compare_versions(current, cached_info.latest),
+            checked_at=cached_info.checked_at,
+        )
+    # Fetch latest version from PyPI
+    latest = _fetch_latest_version()
+    if not latest:
+        return None
+    # Compare versions
+    is_outdated = _compare_versions(current, latest)
+    # Create version info
+    info = VersionInfo(
+        latest=latest,
+        current=current,
+        is_outdated=is_outdated,
+        checked_at=time.time(),
+    )
+    # Save to cache
+    _save_cache(info)
+    return info
+def display_update_prompt(console: HUDConsole | None = None) -> None:
+    """Display update prompt if a new version is available.
+    This function checks for updates and displays a prompt to the user
+    if their version is outdated.
+    Args:
+        console: HUDConsole instance for output. If None, creates a new one.
+    """
+    if console is None:
+        console = HUDConsole(logger=logger)
+    try:
+        info = check_for_updates()
+        if info and info.is_outdated:
+            # Create update message
+            update_msg = (
+                f"🆕 A new version of hud-python is available: "
+                f"[bold cyan]{info.latest}[/bold cyan] "
+                f"(current: [dim]{info.current}[/dim])\n"
+                f"   Run: [bold yellow]uv tool upgrade hud-python[/bold yellow] to update"
+            )
+            # Display using console info
+            console.info(f"[yellow]{update_msg}[/yellow]")
+    except Exception:  # noqa: S110
+        # Never let version checking disrupt the user's workflow
+        pass
+def force_version_check() -> VersionInfo | None:
+    """Force a version check, bypassing the cache.
+    This is useful for explicit version checks or testing.
+    Returns:
+        VersionInfo if check succeeds, None otherwise.
+    """
+    # Clear the cache to force a fresh check
+    if VERSION_CACHE_FILE.exists():
+        with contextlib.suppress(Exception):
+            VERSION_CACHE_FILE.unlink()
+    return check_for_updates()

hud/cli/{rl → utils}/viewer.py RENAMED Viewed

@@ -1,4 +1,4 @@
-"""Inline JSON preview with expandable view for RL flow.
+"""Inline JSON preview with expandable view.
 Uses minimal terminal interaction for inline display.
 """
@@ -46,7 +46,7 @@ def _truncate_value(value: Any, max_len: int = 60) -> str:
         if len(value) > max_len:
             return value[:max_len] + "…"
         return value
-    elif isinstance(value, (dict, list)):
+    elif isinstance(value, dict | list):
         s = json.dumps(value, separators=(",", ":"))
         if len(s) > max_len:
             return s[:max_len] + "…"

hud/clients/README.md CHANGED Viewed

@@ -7,8 +7,8 @@ This directory contains the MCP client implementations for HUD SDK. The architec
 ```
 hud/clients/
 ├── base.py          # Protocol definition and base class
-├── mcp_use.py       # MCP-use based implementation (legacy)
-├── fastmcp.py       # FastMCP based implementation (modern)
+├── mcp_use.py       # MCP-use based implementation (default)
+├── fastmcp.py       # FastMCP based implementation (alternative)
 └── __init__.py      # Exports and default client
 ```
@@ -30,15 +30,15 @@ class AgentMCPClient(Protocol):
 ## Available Implementations
-### 1. MCPUseHUDClient
+### 1. MCPUseHUDClient (Default)
 - Based on the `mcp_use` library
 - Supports multiple concurrent server connections
 - Battle-tested and stable
 - Good for complex multi-server setups
-### 2. FastMCPHUDClient (Default)
+### 2. FastMCPHUDClient
 - Based on the `fastmcp` library
-- Modern, clean API with better error handling
+- Alternative implementation with different transport handling
 - Supports various transports (HTTP, WebSocket, stdio, in-memory)
 - Better type safety and structured data support
@@ -47,7 +47,7 @@ class AgentMCPClient(Protocol):
 ### Basic Usage
 ```python
-from hud.clients import MCPUseHUDClient, FastMCPHUDClient
+from hud.clients import MCPClient, FastMCPHUDClient
 # Configuration works for both clients
 mcp_config = {
@@ -57,10 +57,10 @@ mcp_config = {
     }
 }
-# Option 1: MCP-use client
-client = MCPUseHUDClient(mcp_config)
+# Default client (MCPUseHUDClient)
+client = MCPClient(mcp_config)
-# Option 2: FastMCP client
+# Alternative: FastMCP client
 client = FastMCPHUDClient(mcp_config)
 # Both use the same API
@@ -73,13 +73,14 @@ async with client:
 ```python
 from hud.agents import ClaudeAgent
+from hud.clients import MCPClient
 # Either client works with agents
-client = FastMCPHUDClient(mcp_config)
+client = MCPClient(mcp_config)
 agent = ClaudeAgent(
     mcp_client=client,
-    model="claude-3-7-sonnet-20250219"
+    model="claude-sonnet-4-5"
 )
 # Agent works identically with either client

hud/clients/__init__.py CHANGED Viewed

@@ -3,15 +3,16 @@
 from __future__ import annotations
 from .base import AgentMCPClient, BaseHUDClient
+from .environment import EnvironmentClient
 from .fastmcp import FastMCPHUDClient
-from .mcp_use import MCPUseHUDClient
-# Default to MCP-use for new features
-MCPClient = MCPUseHUDClient
+# Default to FastMCP client (no optional dependencies)
+MCPClient = FastMCPHUDClient
 __all__ = [
     "AgentMCPClient",
     "BaseHUDClient",
+    "EnvironmentClient",
     "FastMCPHUDClient",
     "MCPClient",
 ]

hud/clients/base.py CHANGED Viewed

@@ -12,7 +12,6 @@ from mcp.types import Implementation
 from hud.shared.exceptions import HudAuthenticationError, HudException
 from hud.types import MCPToolCall, MCPToolResult
 from hud.utils.hud_console import HUDConsole
-from hud.utils.mcp import setup_hud_telemetry
 from hud.version import __version__ as hud_version
 if TYPE_CHECKING:
@@ -86,7 +85,6 @@ class BaseHUDClient(AgentMCPClient):
         mcp_config: dict[str, dict[str, Any]] | None = None,
         verbose: bool = False,
         strict_validation: bool = False,
-        auto_trace: bool = True,
     ) -> None:
         """
         Initialize base client.
@@ -99,11 +97,11 @@ class BaseHUDClient(AgentMCPClient):
         self.verbose = verbose
         self._mcp_config = mcp_config
         self._strict_validation = strict_validation
-        self._auto_trace = auto_trace
-        self._auto_trace_cm: Any | None = None  # Store auto-created trace context manager
         self._initialized = False
         self._telemetry_data = {}  # Initialize telemetry data
+        self._cached_resources: list[types.Resource] = []  # Cache for resources
+        self._cached_prompts: list[types.Prompt] = []  # Cache for prompts
         if self.verbose:
             self._setup_verbose_logging()
@@ -126,8 +124,6 @@ class BaseHUDClient(AgentMCPClient):
                 "Either pass it to the constructor or call initialize with a configuration"
             )
-        self._auto_trace_cm = setup_hud_telemetry(self._mcp_config, auto_trace=self._auto_trace)
         hud_console.debug("Initializing MCP client...")
         try:
@@ -135,18 +131,18 @@ class BaseHUDClient(AgentMCPClient):
             for server_config in self._mcp_config.values():
                 url = server_config.get("url", "")
                 headers = server_config.get("headers", {})
-                if "mcp.hud.so" in url and len(headers.get("Authorization", "")) < 10:
+                if "mcp.hud.ai" in url and len(headers.get("Authorization", "")) < 10:
                     raise HudAuthenticationError(
                         f'Sending authorization "{headers.get("Authorization", "")}", which may'
                         " be incomplete. Ensure HUD_API_KEY environment variable is set or send it"
-                        " as a header. You can get an API key at https://hud.so"
+                        " as a header. You can get an API key at https://hud.ai"
                     )
             # Subclasses implement connection
             await self._connect(self._mcp_config)
         except HudException:
             raise
         except Exception as e:
-            # Auto-converts to appropriate HUD exception type with hints
+            hud_console.error(f"Failed to initialize MCP client: {e}")
             raise HudException from e
         # Common hud behavior - fetch telemetry
@@ -156,21 +152,12 @@ class BaseHUDClient(AgentMCPClient):
     async def shutdown(self) -> None:
         """Disconnect from the MCP server."""
-        # Clean up auto-created trace if any
-        if self._auto_trace_cm:
-            try:
-                self._auto_trace_cm.__exit__(None, None, None)
-                hud_console.info("Closed auto-created trace")
-            except Exception as e:
-                hud_console.warning(f"Failed to close auto-created trace: {e}")
-            finally:
-                self._auto_trace_cm = None
-        # Disconnect from server
         if self._initialized:
             await self._disconnect()
             self._initialized = False
-            hud_console.info("Shutdown completed")
+            self._cached_resources.clear()
+            self._cached_prompts.clear()
+            hud_console.info("Environment Shutdown completed")
         else:
             hud_console.debug("Client was not initialized, skipping disconnect")
@@ -211,11 +198,41 @@ class BaseHUDClient(AgentMCPClient):
         """List all available tools."""
         raise NotImplementedError
-    @abstractmethod
     async def list_resources(self) -> list[types.Resource]:
-        """List all available resources."""
+        """List all available resources.
+        Uses cached resources if available, otherwise fetches from the server.
+        Returns:
+            List of available resources.
+        """
+        # If cache is empty, populate it
+        if not self._cached_resources:
+            self._cached_resources = await self._list_resources_impl()
+        return self._cached_resources
+    @abstractmethod
+    async def _list_resources_impl(self) -> list[types.Resource]:
+        """Implementation-specific resource listing. Subclasses must implement this."""
         raise NotImplementedError
+    async def list_prompts(self) -> list[types.Prompt]:
+        """List all available prompts.
+        Uses cached prompts if available, otherwise fetches from the server.
+        Prompts are optional in MCP; default implementation returns an empty list.
+        """
+        if not self._cached_prompts:
+            self._cached_prompts = await self._list_prompts_impl()
+        return self._cached_prompts
+    async def _list_prompts_impl(self) -> list[types.Prompt]:
+        """Implementation-specific prompt listing (optional).
+        Subclasses can override to support prompt discovery.
+        """
+        return []
     @abstractmethod
     async def _call_tool(self, tool_call: MCPToolCall) -> MCPToolResult:
         """Execute a tool by name."""
@@ -270,6 +287,17 @@ class BaseHUDClient(AgentMCPClient):
     async def _fetch_telemetry(self) -> None:
         """Common telemetry fetching for all hud clients."""
         try:
+            # Get resources (will use cache if available, otherwise fetch)
+            resources = await self.list_resources()
+            telemetry_available = any(
+                str(resource.uri) == "telemetry://live" for resource in resources
+            )
+            if not telemetry_available:
+                if self.verbose:
+                    hud_console.debug("Telemetry resource not available from server")
+                return
             # Try to read telemetry resource directly
             result = await self.read_resource("telemetry://live")
             if result and result.contents:
@@ -321,6 +349,9 @@ class BaseHUDClient(AgentMCPClient):
             "hub_tools": {},
             "telemetry": self._telemetry_data,
             "resources": [],
+            "prompts": [],
+            "scenarios": [],
+            "verbose": self.verbose,
             "metadata": {
                 "servers": list(self._mcp_config.keys()),  # type: ignore
                 "initialized": self._initialized,
@@ -333,7 +364,7 @@ class BaseHUDClient(AgentMCPClient):
             tool_info = {
                 "name": tool.name,
                 "description": tool.description,
-                "input_schema": tool.inputSchema,
+                "inputSchema": tool.inputSchema,
             }
             analysis["tools"].append(tool_info)
@@ -352,16 +383,125 @@ class BaseHUDClient(AgentMCPClient):
         try:
             resources = await self.list_resources()
             for resource in resources:
-                resource_info = {
+                resource_info: dict[str, Any] = {
                     "uri": str(resource.uri),
                     "name": resource.name,
                     "description": resource.description,
                     "mime_type": getattr(resource, "mimeType", None),
                 }
+                # Include meta field if present (contains scenario source code)
+                meta = getattr(resource, "meta", None)
+                if meta:
+                    resource_info["meta"] = meta
                 analysis["resources"].append(resource_info)
         except Exception as e:
             if self.verbose:
-                hud_console.debug(f"Could not list resources: {e}")
+                hud_console.debug("Could not list resources: " + str(e))
+        # Get all prompts (optional)
+        try:
+            prompts = await self.list_prompts()
+            for prompt in prompts:
+                raw_args = getattr(prompt, "arguments", []) or []
+                args: list[dict[str, Any]] = [
+                    {
+                        "name": getattr(a, "name", None),
+                        "required": getattr(a, "required", None),
+                        "description": getattr(a, "description", None),
+                    }
+                    for a in raw_args
+                ]
+                prompt_info: dict[str, Any] = {
+                    "name": prompt.name,
+                    "description": prompt.description,
+                    "arguments": args,
+                }
+                # Include meta field if present
+                meta = getattr(prompt, "meta", None)
+                if meta:
+                    prompt_info["meta"] = meta
+                    # Merge type/default info from meta.arguments into the arguments array
+                    if isinstance(meta, dict) and "arguments" in meta:
+                        meta_args = {a["name"]: a for a in meta["arguments"] if "name" in a}
+                        for arg in args:
+                            arg_name = arg.get("name")
+                            if arg_name and arg_name in meta_args:
+                                meta_arg = meta_args[arg_name]
+                                if "default" in meta_arg:
+                                    arg["default"] = meta_arg["default"]
+                                if "type" in meta_arg:
+                                    arg["type"] = meta_arg["type"]
+                                if "inputSchema" in meta_arg:
+                                    arg["inputSchema"] = meta_arg["inputSchema"]
+                analysis["prompts"].append(prompt_info)
+        except Exception as e:
+            if self.verbose:
+                hud_console.debug("Could not list prompts: " + str(e))
+        # Derive "scenarios" from Environment.@scenario prompts/resources.
+        # A scenario is exposed as:
+        # - Prompt: name "{env}:{scenario}" with description prefix "[Setup]"
+        # - Resource: uri "{env}:{scenario}" with description prefix "[Evaluate]"
+        # Both prompt and resource contain meta.code with the scenario source code
+        scenarios_by_id: dict[str, dict[str, Any]] = {}
+        for p in analysis.get("prompts", []):
+            desc = (p.get("description") or "").strip()
+            if not desc.startswith("[Setup]"):
+                continue
+            scenario_id = p.get("name")
+            if not scenario_id:
+                continue
+            env_name, scenario_name = ([*scenario_id.split(":", 1), ""])[:2]
+            scenario_info: dict[str, Any] = {
+                "id": scenario_id,
+                "env": env_name,
+                "name": scenario_name or scenario_id,
+                "setup_description": desc,
+                "arguments": p.get("arguments") or [],
+                "has_setup_prompt": True,
+                "has_evaluate_resource": False,
+            }
+            # Extract code from meta field if present
+            meta = p.get("meta")
+            if meta and isinstance(meta, dict) and "code" in meta:
+                scenario_info["code"] = meta["code"]
+            scenarios_by_id[scenario_id] = scenario_info
+        for r in analysis.get("resources", []):
+            desc = (r.get("description") or "").strip()
+            if not desc.startswith("[Evaluate]"):
+                continue
+            scenario_id = r.get("uri")
+            if not scenario_id:
+                continue
+            env_name, scenario_name = ([*scenario_id.split(":", 1), ""])[:2]
+            if scenario_id not in scenarios_by_id:
+                scenarios_by_id[scenario_id] = {
+                    "id": scenario_id,
+                    "env": env_name,
+                    "name": scenario_name or scenario_id,
+                    "arguments": [],
+                    "has_setup_prompt": False,
+                    "has_evaluate_resource": True,
+                }
+            scenarios_by_id[scenario_id]["evaluate_description"] = desc
+            scenarios_by_id[scenario_id]["has_evaluate_resource"] = True
+            # Extract code from meta field if not already present (from prompt)
+            meta = r.get("meta")
+            if (
+                meta
+                and isinstance(meta, dict)
+                and "code" in meta
+                and "code" not in scenarios_by_id[scenario_id]
+            ):
+                scenarios_by_id[scenario_id]["code"] = meta["code"]
+        analysis["scenarios"] = sorted(
+            scenarios_by_id.values(),
+            key=lambda s: (str(s.get("env") or ""), str(s.get("name") or "")),
+        )
         return analysis

hud-python 0.4.45__py3-none-any.whl → 0.5.1__py3-none-any.whl

hud-python 0.4.45__py3-none-any.whl → 0.5.1__py3-none-any.whl