PyPI - hud-python - Versions diffs - 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl - Mend

hud-python 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (16) hide show

hud/agent/claude_plays_pokemon.py +2 -1
hud/env/remote_docker_client.py +2 -2
hud/job.py +9 -9
hud/server/requests.py +26 -4
hud/settings.py +1 -1
hud/taskset.py +16 -4
hud/telemetry/context.py +33 -57
hud/telemetry/instrumentation/mcp.py +0 -3
hud/telemetry/tests/test_context.py +7 -3
hud/types.py +1 -1
hud/utils/tests/test_version.py +1 -1
hud/version.py +1 -1
{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/METADATA +18 -18
{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/RECORD +16 -16
{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/WHEEL +0 -0
{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/licenses/LICENSE +0 -0

hud/agent/claude_plays_pokemon.py CHANGED Viewed

@@ -11,6 +11,7 @@ from anthropic.types.beta import (
     BetaImageBlockParam,
 )
+from hud.adapters.common.types import CLA
 from hud.agent import Agent
 from hud.adapters import Adapter
 from hud.settings import settings
@@ -128,7 +129,7 @@ def extract_json_from_response(response: str) -> str:
     return response.strip()
-class ClaudePlaysPokemon(Agent[AsyncAnthropic, None]):
+class ClaudePlaysPokemon(Agent[AsyncAnthropic, CLA]):
     """AI agent that plays Pokémon games using Claude."""
     def __init__(

hud/env/remote_docker_client.py CHANGED Viewed

@@ -113,8 +113,8 @@ class RemoteDockerClient(DockerClient):
         logger.info("Creating remote environment")
-        true_gym_id = await get_gym_id("local-docker")
-        # true_gym_id = await get_gym_id("docker")
+        # true_gym_id = await get_gym_id("local-docker")
+        true_gym_id = await get_gym_id("docker")
         # augment metadata with dockerfile
         if "environment_config" not in metadata:

hud/job.py CHANGED Viewed

@@ -1,12 +1,12 @@
 from __future__ import annotations
 import asyncio
-import datetime
 import functools
 import inspect
 import logging
 import sys
 from collections.abc import Callable, Coroutine
+from datetime import datetime
 from typing import TYPE_CHECKING, Any, TypeVar, cast
 from pydantic import BaseModel, PrivateAttr, TypeAdapter
@@ -44,7 +44,7 @@ class Job(BaseModel):
     id: str
     name: str
     metadata: dict[str, Any] | None = None
-    created_at: datetime.datetime
+    created_at: datetime
     status: str
     # Internal cache for trajectories
@@ -164,13 +164,15 @@ async def create_job(
     # If not, we might need to make a subsequent GET request
     job_data = data  # Adjust if the API response structure is different
+    created_at = datetime.fromisoformat(job_data["created_at"].replace("Z", "+00:00"))
     logger.info("View job at https://app.hud.so/jobs/%s.", job_data["id"])
     return Job(
         id=job_data["id"],
         name=job_data["name"],
         metadata=job_data.get("metadata", {}),  # Ensure metadata is dict
-        created_at=datetime.datetime.fromisoformat(job_data["created_at"]),  # Parse datetime
+        created_at=created_at,  # Parse datetime
         status=job_data["status"],
     )
@@ -379,7 +381,7 @@ async def _execute_task(
                         "type": "step_error",
                         "step": step + 1,
                         "error": str(agent_step_err),
-                        "timestamp": datetime.datetime.now().isoformat(),
+                        "timestamp": datetime.now().isoformat(),
                     }
                 )
                 continue
@@ -413,7 +415,7 @@ async def _execute_task(
                         "task_id": task_id,
                         "type": "evaluation_error",
                         "error": str(eval_err),
-                        "timestamp": datetime.datetime.now().isoformat(),
+                        "timestamp": datetime.now().isoformat(),
                     }
                 )
@@ -427,7 +429,7 @@ async def _execute_task(
                 "task_id": task_id,
                 "type": "setup_error",
                 "error": str(e),
-                "timestamp": datetime.datetime.now().isoformat(),
+                "timestamp": datetime.now().isoformat(),
             }
         )
@@ -447,7 +449,7 @@ async def _execute_task(
                         "task_id": task_id,
                         "type": "env_close_error",
                         "error": str(close_err),
-                        "timestamp": datetime.datetime.now().isoformat(),
+                        "timestamp": datetime.now().isoformat(),
                     }
                 )
@@ -532,8 +534,6 @@ async def run_job(
     Returns:
         The created Job object with errors stored in job.errors.
     """
-    hud_logger = logging.getLogger("hud")
-    hud_logger.setLevel(logging.CRITICAL)
     tasks_to_run: list[Task] = []
     created_job: Job | None = None

hud/server/requests.py CHANGED Viewed

@@ -6,6 +6,7 @@ from __future__ import annotations
 import asyncio
 import logging
+import ssl
 import time
 from typing import Any
@@ -20,7 +21,7 @@ from hud.exceptions import (
 # Set up logger
 logger = logging.getLogger("hud.http")
-logger.setLevel(logging.DEBUG)
+logger.setLevel(logging.INFO)
 # Long running requests can take up to 10 minutes.
@@ -37,7 +38,7 @@ async def _handle_retry(
 ) -> None:
     """Helper function to handle retry logic and logging."""
     retry_time = retry_delay * (2 ** (attempt - 1))  # Exponential backoff
-    logger.warning(
+    logger.debug(
         "%s from %s, retrying in %.2f seconds (attempt %d/%d)",
         error_msg,
         url,
@@ -140,6 +141,12 @@ async def make_request(
                     continue
                 else:
                     raise HudNetworkError(f"Network error: {e!s}") from None
+            except ssl.SSLError as e:
+                if attempt <= max_retries:
+                    await _handle_retry(attempt, max_retries, retry_delay, url, f"SSL error: {e}")
+                    continue
+                else:
+                    raise HudNetworkError(f"SSL error: {e!s}") from None
             except Exception as e:
                 raise HudRequestError(f"Unexpected error: {e!s}") from None
         raise HudRequestError(f"Request failed after {max_retries} retries with unknown error")
@@ -201,7 +208,7 @@ def make_request_sync(
                 # Check if we got a retriable status code
                 if response.status_code in retry_status_codes and attempt <= max_retries:
                     retry_time = retry_delay * (2 ** (attempt - 1))  # Exponential backoff
-                    logger.warning(
+                    logger.debug(
                         "Received status %d from %s, retrying in %.2f seconds (attempt %d/%d)",
                         response.status_code,
                         url,
@@ -222,7 +229,7 @@ def make_request_sync(
             except httpx.RequestError as e:
                 if attempt <= max_retries:
                     retry_time = retry_delay * (2 ** (attempt - 1))
-                    logger.warning(
+                    logger.debug(
                         "Network error %s from %s, retrying in %.2f seconds (attempt %d/%d)",
                         str(e),
                         url,
@@ -234,6 +241,21 @@ def make_request_sync(
                     continue
                 else:
                     raise HudNetworkError(f"Network error: {e!s}") from None
+            except ssl.SSLError as e:
+                if attempt <= max_retries:
+                    retry_time = retry_delay * (2 ** (attempt - 1))  # Exponential backoff
+                    logger.debug(
+                        "SSL error %s from %s, retrying in %.2f seconds (attempt %d/%d)",
+                        str(e),
+                        url,
+                        retry_time,
+                        attempt,
+                        max_retries,
+                    )
+                    time.sleep(retry_time)
+                    continue
+                else:
+                    raise HudNetworkError(f"SSL error: {e!s}") from None
             except Exception as e:
                 raise HudRequestError(f"Unexpected error: {e!s}") from None
         raise HudRequestError(f"Request failed after {max_retries} retries with unknown error")

hud/settings.py CHANGED Viewed

@@ -15,7 +15,7 @@ class Settings(BaseSettings):
     model_config = SettingsConfigDict(env_file=".env", env_file_encoding="utf-8", extra="allow")
     base_url: str = Field(
-        default="https://orcstaging.hud.so/hud-gym/api",
+        default="https://orchestration.hud.so/hud-gym/api",
         description="Base URL for the HUD API",
         validation_alias="base_url",
     )

hud/taskset.py CHANGED Viewed

@@ -86,15 +86,27 @@ class TaskSet(BaseModel):
         # Convert all tasks to expanded configs
         processed_tasks = []
         for task in self.tasks:
-            setup_config = create_remote_config(None, task.setup, REMOTE_SETUP)[0].args[0]
-            evaluate_config = create_remote_config(None, task.evaluate, REMOTE_EVALUATE)[0].args[0]
+            if task.setup is not None:
+                setup_config = (
+                    create_remote_config(None, task.setup, REMOTE_SETUP)[0].args[0].model_dump()
+                )
+            else:
+                setup_config = None
+            if task.evaluate is not None:
+                evaluate_config = (
+                    create_remote_config(None, task.evaluate, REMOTE_EVALUATE)[0]
+                    .args[0]
+                    .model_dump()
+                )
+            else:
+                evaluate_config = None
             processed_tasks.append(
                 {
                     "prompt": task.prompt,
                     "gym": task.gym,
-                    "setup": setup_config.model_dump(),
-                    "evaluate": evaluate_config.model_dump(),
+                    "setup": setup_config,
+                    "evaluate": evaluate_config,
                     "config": task.config,
                 }
             )

hud/telemetry/context.py CHANGED Viewed

@@ -2,6 +2,7 @@ from __future__ import annotations
 import contextvars
 import logging
+from collections import defaultdict
 from datetime import datetime
 from typing import Any, TypeVar
@@ -11,7 +12,6 @@ from hud.telemetry.mcp_models import (
     MCPNotificationCall,
     MCPRequestCall,
     MCPResponseCall,
-    MCPTelemetryRecord,
     StatusType,
 )
@@ -21,9 +21,8 @@ logger = logging.getLogger("hud.telemetry")
 current_task_run_id: contextvars.ContextVar[str | None] = contextvars.ContextVar(
     "current_task_run_id", default=None
 )
-mcp_calls_buffer: contextvars.ContextVar[list[BaseMCPCall] | None] = contextvars.ContextVar(
-    "mcp_calls_buffer", default=None
-)
+# NEW: Global dictionary for buffering, keyed by task_run_id
+_GLOBAL_MCP_CALL_BUFFERS: defaultdict[str, list[BaseMCPCall]] = defaultdict(list)
 is_root_trace: contextvars.ContextVar[bool] = contextvars.ContextVar("is_root_trace", default=False)
 # Maximum buffer size before automatic flush
@@ -35,51 +34,37 @@ T = TypeVar("T", bound=BaseMCPCall)
 def get_current_task_run_id() -> str | None:
     """Get the task_run_id for the current trace context."""
-    value = current_task_run_id.get()
-    # Convert empty string sentinel back to None
-    return None if value == "" else value
+    return current_task_run_id.get()
 def set_current_task_run_id(task_run_id: str | None) -> None:
     """Set the task_run_id for the current trace context."""
-    # Handle None value by using empty string as sentinel
-    value_to_set = "" if task_run_id is None else task_run_id
-    current_task_run_id.set(value_to_set)
+    current_task_run_id.set(task_run_id)
 def buffer_mcp_call(record: BaseMCPCall | dict[str, Any]) -> None:
-    """
-    Add an MCP call to the buffer for the current trace.
-    Args:
-        record: Either a Pydantic model instance or dictionary with MCP call data
-    """
-    # Only buffer if we have an active trace
     task_run_id = get_current_task_run_id()
-    if task_run_id is not None and task_run_id != "":
-        buffer = mcp_calls_buffer.get()
-        if buffer is None:
-            buffer = []
-        # Convert dictionary to proper model if needed
-        if isinstance(record, dict):
-            record = BaseMCPCall.from_dict(record)
+    if not task_run_id:
+        logger.warning(
+            "BUFFER_MCP_CALL: No task_run_id. Skipping buffer for %s", type(record).__name__
+        )
+        return
-        # Ensure the record has the current task_run_id
-        if record.task_run_id != task_run_id:
-            # Create a copy with the current task_run_id
-            record_dict = record.model_dump()
-            record_dict["task_run_id"] = task_run_id
-            record = BaseMCPCall.from_dict(record_dict)
+    # Ensure 'record' is a Pydantic model instance from here
+    if isinstance(record, dict):
+        try:
+            record_model = BaseMCPCall.from_dict(record)
+            record = record_model
+        except Exception as e_conv:
+            logger.exception("BUFFER_MCP_CALL: Failed to convert dict to BaseMCPCall: %s", e_conv)
+            return
-        # Add to buffer
-        buffer.append(record)
-        mcp_calls_buffer.set(buffer)
+    _GLOBAL_MCP_CALL_BUFFERS[task_run_id].append(record)
+    buffer_len = len(_GLOBAL_MCP_CALL_BUFFERS[task_run_id])
-        # Auto-flush if buffer gets too large
-        if len(buffer) >= MAX_BUFFER_SIZE:
-            logger.debug("MCP calls buffer reached size %d, auto-flushing", len(buffer))
-            flush_buffer(export=True)
+    if buffer_len >= MAX_BUFFER_SIZE:
+        flush_buffer(export=True)
 def flush_buffer(export: bool = False) -> list[BaseMCPCall]:
@@ -92,25 +77,16 @@ def flush_buffer(export: bool = False) -> list[BaseMCPCall]:
     Returns:
         The list of buffered MCP calls
     """
-    buffer = mcp_calls_buffer.get()
-    if buffer is None:
-        buffer = []
-    # Reset buffer to empty list
-    mcp_calls_buffer.set([])
-    if export and buffer and len(buffer) > 0:
-        task_id = buffer[0].task_run_id if buffer else None
-        if task_id:
-            logger.debug("Exporting %d MCP calls for task run %s", len(buffer), task_id)
-            # Create a telemetry record for export
-            _telemetry_record = MCPTelemetryRecord(task_run_id=task_id, records=buffer)
-            # In the future, we could call an export function here
-            # For now, just log that we have telemetry
-            logger.debug("MCP telemetry record created with %d calls", len(buffer))
-        else:
-            logger.warning("No task_run_id found in buffer, skipping export")
-    return buffer
+    task_run_id = get_current_task_run_id()
+    if not task_run_id:
+        logger.warning("FLUSH_BUFFER: No current task_run_id. Cannot flush.")
+        return []
+    buffer_for_task = _GLOBAL_MCP_CALL_BUFFERS.pop(
+        task_run_id, []
+    )  # Get and remove the list for this task
+    return buffer_for_task  # Return the flushed items
 def create_request_record(
@@ -150,6 +126,7 @@ def create_response_record(
         is_error=is_error,
         **kwargs,
     )
     buffer_mcp_call(record)
     return record
@@ -189,5 +166,4 @@ def create_manual_test_record(**custom_data: Any) -> MCPManualTestCall | None:
 def reset_context() -> None:
     """Reset all telemetry context variables. Useful for test isolation."""
     set_current_task_run_id(None)
-    mcp_calls_buffer.set([])
     is_root_trace.set(False)

hud/telemetry/instrumentation/mcp.py CHANGED Viewed

@@ -31,9 +31,6 @@ from hud.telemetry.mcp_models import DirectionType, MCPCallType, MCPManualTestCa
 logger = logging.getLogger(__name__)
-# Ensure no OTel imports remain
-# from opentelemetry import context as otel_context, propagate # Should be removed
 class MCPInstrumentor:
     """

hud/telemetry/tests/test_context.py CHANGED Viewed

@@ -140,9 +140,13 @@ class TestMCPCallBuffer:
         # Flush should return all calls from both tasks
         result = flush_buffer()
-        assert len(result) == 2
-        assert result[0] == mock_call_1
-        assert result[1] == mock_call_2
+        assert len(result) == 1
+        assert result[0] == mock_call_2
+        set_current_task_run_id("task-1")
+        result2 = flush_buffer()
+        assert len(result2) == 1
+        assert result2[0] == mock_call_1
     def test_buffer_mcp_call_without_task_id(self):
         """Test adding MCP call when no task run ID is set."""

hud/types.py CHANGED Viewed

@@ -48,7 +48,7 @@ class EnvironmentStatus(str, enum.Enum):
 # Available HUD gyms
-ServerGym: TypeAlias = Literal["qa", "hud-browser", "hud-ubuntu", "OSWorld-Ubuntu"]
+ServerGym: TypeAlias = Literal["qa", "hud-browser", "OSWorld-Ubuntu"]
 # Gyms can be either custom or server-side
 Gym: TypeAlias = CustomGym | ServerGym

hud/utils/tests/test_version.py CHANGED Viewed

@@ -5,4 +5,4 @@ def test_import():
     """Test that the package can be imported."""
     import hud
-    assert hud.__version__ == "0.2.5"
+    assert hud.__version__ == "0.2.6"

hud/version.py CHANGED Viewed

@@ -4,4 +4,4 @@ Version information for the HUD SDK.
 from __future__ import annotations
-__version__ = "0.2.5"
+__version__ = "0.2.6"

{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: hud-python
-Version: 0.2.5
+Version: 0.2.6
 Summary: SDK for the HUD evaluation platform.
 Project-URL: Homepage, https://github.com/hud-evals/hud-sdk
 Project-URL: Bug Tracker, https://github.com/hud-evals/hud-sdk/issues
@@ -74,17 +74,17 @@ Description-Content-Type: text/markdown
 </div>
 <h3>
-Create, evaluate, and improve AI agents across web browsers, desktop environments, and custom scenarios.
+Evaluate your Computer Use AI agents across web browsers, desktop environments, and custom scenarios.
 </h3>
-> ### 🚀 Are you a startup building agents?
->
-> [📅 Hop on a call ](https://cal.com/jay-ram-z6st6w/demo) or [📧 founders@hud.so](mailto:founders@hud.so)
->
-> We're here to help with eval strategies, custom environments, or improving your agent architecture!
+### 🚀 Are you a startup building agents?
+[📅 Hop on a call](https://cal.com/jay-ram-z6st6w/demo) or [📧 founders@hud.so](mailto:founders@hud.so)
-> **Early Release Notice**: This SDK is currently in early release status. The API is evolving and may change in future releases as we gather feedback and improve functionality.
+We're here to help with eval strategies, custom environments, or improving your agent architecture!
+> **Early Release Notice**: We'd love to hear your feedback in [Issues](https://github.com/hud-evals/hud-sdk/issues), as the SDK is still evolving!
 [![PyPI version](https://img.shields.io/pypi/v/hud-python)](https://pypi.org/project/hud-python/)
@@ -132,23 +132,23 @@ with hud.trace("my-agent-run"):
     result = await agent.run(task)
 ```
-## API Key Setup
-Before getting started, you'll need to obtain an API key:
+## Quick Start
-1. Visit [app.hud.so](https://app.hud.so) to create a free account and generate your API key
-2. Set it in your environment or .env file:
+### Installation
 ```bash
-export HUD_API_KEY=your_api_key_here
+pip install hud-python
 ```
-## Quick Start
+### API Key Setup
-### Installation
+Before getting started, you'll need to obtain an API key:
+1. Visit [app.hud.so](https://app.hud.so) to create a free account and generate your API key
+2. Set it in your environment or .env file:
 ```bash
-pip install hud-python
+export HUD_API_KEY=your_api_key_here
 ```
 ### Simple Browser Example with Claude Computer Use
@@ -269,4 +269,4 @@ If you use this SDK in your research, please cite it as follows:
   url = {https://github.com/hud-evals/hud-sdk},
   langid = {en}
 }
-```
+```

{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/RECORD RENAMED Viewed

@@ -1,13 +1,13 @@
 hud/__init__.py,sha256=6PlxwtjYyaqk6UAyHLJZhsiHRlgndH-Jja9f9BtInUY,1063
 hud/exceptions.py,sha256=pifKvSqxj9_g4NfARVyH5a-lTThhi9XW06tIXaBakQw,5526
 hud/gym.py,sha256=Dl7nur2QTxoVNAcWIvFjuGAbKmoc7CVgjV5gWd35usU,4544
-hud/job.py,sha256=uSF5o5WTgk8d0UxpQ6YlNcw7fXDUaN8Lpu0RL6xbHNc,25188
-hud/settings.py,sha256=B3uBiZMhJzsy4Wd41bioN31CQRNfyBN52hLQnkLaJPU,1507
+hud/job.py,sha256=bd88L83L3uqdXE7B3Bjsk8hGk95OggJiLjItFsZXDoQ,25116
+hud/settings.py,sha256=3zALwVbPTaDc01-dR_-rGsrDfc-ieMIcmO5avv6S2Y0,1510
 hud/task.py,sha256=AMmJLYl3BjX8TfBY4ZuR_QIXhTkWDX-4C_Pbi3HziVg,5505
-hud/taskset.py,sha256=WvmwlqnbPbZshZXAfl9qSFeV89k5gHJE4rvluvgz5hk,4581
+hud/taskset.py,sha256=ou2Ivulv392txtDvXDpvJAgHj_4h2LZNBaxpeC_mRnw,4903
 hud/trajectory.py,sha256=OrcRbxK_ejFp1VhJCjZnM1WCmCXxEOK4CxNjCngcsjo,3721
-hud/types.py,sha256=kk93J7DJIL574vZIKhx3Ka1wRxQ3ZAXOaYhdecufuUo,1822
-hud/version.py,sha256=sQ1p2i655QksGNtiO7-7ybulzQTw0yiFR_QM9mRm5hk,104
+hud/types.py,sha256=O8eotDLw4onwRreX9xLPZ2T11qf8wwUidaqGI7jvagY,1808
+hud/version.py,sha256=4c7HS3iYXZGe4vuaPb8pgYwVInf3F3G95h0PITpm6aw,104
 hud/adapters/__init__.py,sha256=zz24KdC_e9TJPgWo6y57_8SzevEE5ak4Cm6tXzMxwRk,266
 hud/adapters/claude/__init__.py,sha256=i7QEF-29FLb9qxp1eYtXs-adIk_tG54tL-9g6d3xodk,100
 hud/adapters/claude/adapter.py,sha256=_qUD0iu0_Y_8yuhrsZw2E5wNv8RB-Aa7BqclAmNHdtI,6096
@@ -25,7 +25,7 @@ hud/adapters/operator/tests/test_adapter.py,sha256=4RAXwyxAtkh-1Mlt1zJayRkcv3LWa
 hud/agent/__init__.py,sha256=_OxMG3UW1vXSuixdpo09b1jexfWcUbfK44zto8t6_LE,453
 hud/agent/base.py,sha256=d7eMoRPepVSCFUyU1oV1hGvyff8rsPtXDelVcJlEF7Y,4022
 hud/agent/claude.py,sha256=bXgdzlZHaIHaxrGIYt6w1kEh5oHFDT5P2u304swi8wU,7529
-hud/agent/claude_plays_pokemon.py,sha256=cZ_hlYGux16Ucjvj_DOnFgGvu9q93PWriPIQPrifxiY,9968
+hud/agent/claude_plays_pokemon.py,sha256=H1AIXb6qNE-45G5CdBgsDGTMXOgjg44wGtySgeKgeq4,10009
 hud/agent/langchain.py,sha256=iuMpu-k55Qic0LCzfOR0Wa5kDhIv7zHCc8et3axypus,8833
 hud/agent/operator.py,sha256=Bji_v6NB-hUyTe1otdpEc3Hb0ZpyQbuL_iZu5irYFe4,8612
 hud/agent/misc/__init__.py,sha256=-ftYH1T5r7fXKKra6d8jXYmUz9KOTmYwBrPJU-V3S7g,71
@@ -38,7 +38,7 @@ hud/env/docker_client.py,sha256=-nQLGeRl9GLJKEku1eIBL3RQuteIPLrecjVHxzSD_vU,1046
 hud/env/environment.py,sha256=hSJh5KaiGuWw4IEV1IHNDVjOxyoyOxhHkavGj_5RBbQ,15154
 hud/env/local_docker_client.py,sha256=bcgmmRJGX1--bf0-5Zlk59l2W0PvABnDn4FWZKvXjjk,9565
 hud/env/remote_client.py,sha256=gjCzcuotvDC7GraVBBT2Tix5GKpntwtldv5PqnXx8wk,6109
-hud/env/remote_docker_client.py,sha256=khdAaNfwdiG6pl6XKGHI6pFqMSPBn0brQPZ-09XhZ-c,9484
+hud/env/remote_docker_client.py,sha256=ZLqbd6IeU9BDndjwanmJN3_1CEsrCkntumGavLiPi88,9484
 hud/evaluators/__init__.py,sha256=V5nktEAw3EDn2Y537pjia5Y1IjdLBIPrDjTs6YTCdX4,153
 hud/evaluators/base.py,sha256=ALO9Rj-R_9HtHIHYp84bsQQD12De0XnCTwad78_T5-k,771
 hud/evaluators/inspect.py,sha256=ZvrTXLpgibyvQ5aNXAMP4quyXISrRQHg9besDcuCx7U,692
@@ -51,19 +51,19 @@ hud/evaluators/tests/test_judge.py,sha256=c1GaAeq_WpBVgBlx-gQncHrOPokzKNxlbgiC8W
 hud/evaluators/tests/test_match.py,sha256=C04GoluyT9i41YZ65xEjN7tKHQbENbrpNhNtUd4ivmA,3919
 hud/evaluators/tests/test_remote.py,sha256=YdJpyyuRLkYP0e3jTUkD3zobS2WHQPePn8yBZtYOIN4,3243
 hud/server/__init__.py,sha256=IPxPCqtPLguryN-nBq78Sakypw2bRiE2iHv3SXG8YRk,139
-hud/server/requests.py,sha256=U0WEeY8AzsLMSICebxQyF0FEbXpKieh-3Qnisd0C6a4,7881
+hud/server/requests.py,sha256=AnFW4ELojjvfF6xjS2no6_fg4Rph2aR2hjPzYTede0Q,8841
 hud/server/tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 hud/server/tests/test_requests.py,sha256=63YCbykcib5MxKxm-OgHJPLX3QC7hmgIwnWaYukVM6s,9077
 hud/telemetry/__init__.py,sha256=ky48kuZD3Bt0vOf9FwZwkV_ka7O26Tvcxh7p1lMpsMk,582
 hud/telemetry/_trace.py,sha256=W7S6CxwtmjNl4OZbA1SQHXsaNm072J9c-fjPjQomgOY,5135
-hud/telemetry/context.py,sha256=pFwst_TLo6izM_k2h--y_qg7uZovdJ36GC7aeaZHMiE,6309
+hud/telemetry/context.py,sha256=PNbfrMgjeRTTg0nUKXYCflqn71I_cSjU8LXdvouUfc4,5209
 hud/telemetry/exporter.py,sha256=l-r7mADcHpn6i9hhB407hx3HS4khfbhuwX0txJ2X0VQ,17986
 hud/telemetry/mcp_models.py,sha256=YIArMtCVfC4NVvaEmUYs_kxDs0GQ-xtFFmB8jEGKaag,11342
 hud/telemetry/instrumentation/__init__.py,sha256=vHmSqaJMMehgRNn6EN2SMoYDD12rSHkLeVmj7Uy1my0,88
-hud/telemetry/instrumentation/mcp.py,sha256=ugkcP0V0UNO6Zy4zueF1jPr4jdqLXF81H8HNwHhcDzI,22041
+hud/telemetry/instrumentation/mcp.py,sha256=xGAMdhTgM1ixHiDX7xkS9Ax1NCjK3u7pLWIbIh8WZIA,21925
 hud/telemetry/instrumentation/registry.py,sha256=UVaSsEA693lvKYd5R3n3ve6GcAB1fwqubRwIVeZiNmo,1821
 hud/telemetry/tests/__init__.py,sha256=QMN8OzfrBUDbQESwrwHCqXLdDwCjYWX8BJcpeLUJfqA,33
-hud/telemetry/tests/test_context.py,sha256=ZQ8ubuTRQoiMq-L3Zl-Ucy8Ma1a--z1gdFoAnFO3m3Q,6421
+hud/telemetry/tests/test_context.py,sha256=BGRDlXXC_VbpD4cYl_o9gRQDDKb2ox1das_ZuX14NC8,6531
 hud/telemetry/tests/test_trace.py,sha256=JzmjNRtHdQFPqLm7hOPastENg-hMJo9p8bbxJ77iXyc,10687
 hud/utils/__init__.py,sha256=oSl_gGoS272X2VFnBYX8hLxcP2xgGoBYQXAuLhtQgw8,260
 hud/utils/common.py,sha256=R83ntEtKr8KXG1mKcy0I_OllFHkDrPMysPhW12uBckc,3926
@@ -76,9 +76,9 @@ hud/utils/tests/test_common.py,sha256=gbYpQKBNdbCcEH0v1UZpxLt_NW2T5sETMIJKvy8S8p
 hud/utils/tests/test_config.py,sha256=dPlXYWuMrxX-NOYbf0vdJ27TJpfacKG8eiKOSGOcfDU,4079
 hud/utils/tests/test_progress.py,sha256=QunwDgi_heQXhDgmC25zgjr-sFUu5FdJ_1aYigMKeIc,6351
 hud/utils/tests/test_telemetry.py,sha256=t0An1RTBaE0dZVEpF4uwuq5k1R-PXFR5k4u71h60tx8,1224
-hud/utils/tests/test_version.py,sha256=CPQuXvuX4wOLxEvIKxaaEOLjxVCx_WjCv0XyokJM3X8,159
+hud/utils/tests/test_version.py,sha256=wDkcJbOW78FEZpIGKXST347GOm3o_NBVONZ3RhkYIM4,159
 hud/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-hud_python-0.2.5.dist-info/METADATA,sha256=s6u-MGNcVTbnhFqnzdodctjywOzGx7OMzAPMivBfeaI,9511
-hud_python-0.2.5.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-hud_python-0.2.5.dist-info/licenses/LICENSE,sha256=yIzBheVUf86FC1bztAcr7RYWWNxyd3B-UJQ3uddg1HA,1078
-hud_python-0.2.5.dist-info/RECORD,,
+hud_python-0.2.6.dist-info/METADATA,sha256=xXaqxhBWDKs-vkGiCi19m4wBSbbuehk4fEd1zP5Ufbg,9469
+hud_python-0.2.6.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+hud_python-0.2.6.dist-info/licenses/LICENSE,sha256=yIzBheVUf86FC1bztAcr7RYWWNxyd3B-UJQ3uddg1HA,1078
+hud_python-0.2.6.dist-info/RECORD,,

{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/WHEEL RENAMED Viewed

File without changes

{hud_python-0.2.5.dist-info → hud_python-0.2.6.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

hud-python 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl

Potentially problematic release.

hud-python 0.2.5__py3-none-any.whl → 0.2.6__py3-none-any.whl