PyPI - hud-python - Versions diffs - 0.4.0__py3-none-any.whl → 0.4.2__py3-none-any.whl - Mend

hud-python 0.4.0__py3-none-any.whl → 0.4.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (130) hide show

hud/__init__.py +22 -22
hud/agents/__init__.py +13 -17
hud/agents/base.py +599 -599
hud/agents/claude.py +373 -373
hud/agents/langchain.py +250 -250
hud/agents/misc/__init__.py +7 -7
hud/agents/misc/response_agent.py +80 -80
hud/agents/openai.py +352 -352
hud/agents/openai_chat_generic.py +154 -154
hud/agents/tests/__init__.py +1 -1
hud/agents/tests/test_base.py +742 -742
hud/agents/tests/test_claude.py +324 -324
hud/agents/tests/test_client.py +363 -363
hud/agents/tests/test_openai.py +237 -237
hud/cli/__init__.py +617 -617
hud/cli/__main__.py +8 -8
hud/cli/analyze.py +371 -371
hud/cli/analyze_metadata.py +230 -230
hud/cli/build.py +427 -427
hud/cli/clone.py +185 -185
hud/cli/cursor.py +92 -92
hud/cli/debug.py +392 -392
hud/cli/docker_utils.py +83 -83
hud/cli/init.py +281 -281
hud/cli/interactive.py +353 -353
hud/cli/mcp_server.py +789 -756
hud/cli/pull.py +336 -336
hud/cli/push.py +370 -379
hud/cli/remote_runner.py +311 -311
hud/cli/runner.py +160 -160
hud/cli/tests/__init__.py +3 -3
hud/cli/tests/test_analyze.py +284 -284
hud/cli/tests/test_cli_init.py +265 -265
hud/cli/tests/test_cli_main.py +27 -27
hud/cli/tests/test_clone.py +142 -142
hud/cli/tests/test_cursor.py +253 -253
hud/cli/tests/test_debug.py +453 -453
hud/cli/tests/test_mcp_server.py +139 -139
hud/cli/tests/test_utils.py +388 -388
hud/cli/utils.py +263 -263
hud/clients/README.md +143 -143
hud/clients/__init__.py +16 -16
hud/clients/base.py +379 -354
hud/clients/fastmcp.py +202 -202
hud/clients/mcp_use.py +278 -278
hud/clients/tests/__init__.py +1 -1
hud/clients/tests/test_client_integration.py +111 -111
hud/clients/tests/test_fastmcp.py +342 -342
hud/clients/tests/test_protocol.py +188 -188
hud/clients/utils/__init__.py +1 -1
hud/clients/utils/retry_transport.py +160 -160
hud/datasets.py +322 -322
hud/misc/__init__.py +1 -1
hud/misc/claude_plays_pokemon.py +292 -292
hud/otel/__init__.py +35 -35
hud/otel/collector.py +142 -142
hud/otel/config.py +164 -164
hud/otel/context.py +536 -536
hud/otel/exporters.py +366 -366
hud/otel/instrumentation.py +97 -97
hud/otel/processors.py +118 -118
hud/otel/tests/__init__.py +1 -1
hud/otel/tests/test_processors.py +197 -197
hud/server/__init__.py +5 -5
hud/server/context.py +114 -114
hud/server/helper/__init__.py +5 -5
hud/server/low_level.py +132 -132
hud/server/server.py +170 -166
hud/server/tests/__init__.py +3 -3
hud/settings.py +73 -73
hud/shared/__init__.py +5 -5
hud/shared/exceptions.py +180 -180
hud/shared/requests.py +264 -264
hud/shared/tests/test_exceptions.py +157 -157
hud/shared/tests/test_requests.py +275 -275
hud/telemetry/__init__.py +25 -25
hud/telemetry/instrument.py +379 -379
hud/telemetry/job.py +309 -309
hud/telemetry/replay.py +74 -74
hud/telemetry/trace.py +83 -83
hud/tools/__init__.py +33 -33
hud/tools/base.py +365 -365
hud/tools/bash.py +161 -161
hud/tools/computer/__init__.py +15 -15
hud/tools/computer/anthropic.py +437 -437
hud/tools/computer/hud.py +376 -376
hud/tools/computer/openai.py +295 -295
hud/tools/computer/settings.py +82 -82
hud/tools/edit.py +314 -314
hud/tools/executors/__init__.py +30 -30
hud/tools/executors/base.py +539 -539
hud/tools/executors/pyautogui.py +621 -621
hud/tools/executors/tests/__init__.py +1 -1
hud/tools/executors/tests/test_base_executor.py +338 -338
hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
hud/tools/executors/xdo.py +511 -511
hud/tools/playwright.py +412 -412
hud/tools/tests/__init__.py +3 -3
hud/tools/tests/test_base.py +282 -282
hud/tools/tests/test_bash.py +158 -158
hud/tools/tests/test_bash_extended.py +197 -197
hud/tools/tests/test_computer.py +425 -425
hud/tools/tests/test_computer_actions.py +34 -34
hud/tools/tests/test_edit.py +259 -259
hud/tools/tests/test_init.py +27 -27
hud/tools/tests/test_playwright_tool.py +183 -183
hud/tools/tests/test_tools.py +145 -145
hud/tools/tests/test_utils.py +156 -156
hud/tools/types.py +72 -72
hud/tools/utils.py +50 -50
hud/types.py +136 -136
hud/utils/__init__.py +10 -10
hud/utils/async_utils.py +65 -65
hud/utils/design.py +168 -168
hud/utils/mcp.py +55 -55
hud/utils/progress.py +149 -149
hud/utils/telemetry.py +66 -66
hud/utils/tests/test_async_utils.py +173 -173
hud/utils/tests/test_init.py +17 -17
hud/utils/tests/test_progress.py +261 -261
hud/utils/tests/test_telemetry.py +82 -82
hud/utils/tests/test_version.py +8 -8
hud/version.py +7 -7
{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/METADATA +23 -19
hud_python-0.4.2.dist-info/RECORD +131 -0
{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/licenses/LICENSE +21 -21
hud/agents/art.py +0 -101
hud_python-0.4.0.dist-info/RECORD +0 -132
{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/WHEEL +0 -0
{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/entry_points.txt +0 -0

hud/utils/tests/test_telemetry.py CHANGED Viewed

@@ -1,82 +1,82 @@
-from __future__ import annotations
-from unittest.mock import patch
-from hud.utils.telemetry import stream
-def test_stream():
-    html_content = stream("https://example.com")
-    assert html_content is not None
-    assert "<div style=" in html_content
-    assert 'src="https://example.com"' in html_content
-def test_stream_with_display_exception():
-    """Test stream when IPython display raises an exception."""
-    with (
-        patch("IPython.display.display", side_effect=Exception("Display error")),
-        patch("hud.utils.telemetry.logger") as mock_logger,
-    ):
-        html_content = stream("https://example.com")
-        # Should still return the HTML content
-        assert html_content is not None
-        assert 'src="https://example.com"' in html_content
-        # Should log the warning
-        mock_logger.warning.assert_called_once()
-        args = mock_logger.warning.call_args[0]
-        assert "Display error" in str(args[0])
-def test_display_screenshot():
-    from hud.utils.telemetry import display_screenshot
-    # This is a simple 1x1 transparent PNG image in base64 format
-    base64_image = (
-        "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8z8BQDwAEhQGAhKmMIQ"
-        "AAABJRU5ErkJggg=="
-    )
-    html_content = display_screenshot(base64_image)
-    assert html_content is not None
-    assert "<div style=" in html_content
-    assert "width: 960px" in html_content
-    assert "height: 540px" in html_content
-    assert f"data:image/png;base64,{base64_image}" in html_content
-    # Test with custom dimensions
-    custom_html = display_screenshot(base64_image, width=800, height=600)
-    assert "width: 800px" in custom_html
-    assert "height: 600px" in custom_html
-    # Test with data URI already included
-    data_uri = f"data:image/png;base64,{base64_image}"
-    uri_html = display_screenshot(data_uri)
-    assert data_uri in uri_html
-def test_display_screenshot_with_exception():
-    """Test display_screenshot when IPython display raises an exception."""
-    from hud.utils.telemetry import display_screenshot
-    base64_image = (
-        "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8z8BQDwAEhQGAhKmMIQ"
-        "AAABJRU5ErkJggg=="
-    )
-    with (
-        patch("IPython.display.display", side_effect=Exception("Display error")),
-        patch("hud.utils.telemetry.logger") as mock_logger,
-    ):
-        html_content = display_screenshot(base64_image)
-        # Should still return the HTML content
-        assert html_content is not None
-        assert f"data:image/png;base64,{base64_image}" in html_content
-        # Should log the warning
-        mock_logger.warning.assert_called_once()
-        args = mock_logger.warning.call_args[0]
-        assert "Display error" in str(args[0])
+from __future__ import annotations
+from unittest.mock import patch
+from hud.utils.telemetry import stream
+def test_stream():
+    html_content = stream("https://example.com")
+    assert html_content is not None
+    assert "<div style=" in html_content
+    assert 'src="https://example.com"' in html_content
+def test_stream_with_display_exception():
+    """Test stream when IPython display raises an exception."""
+    with (
+        patch("IPython.display.display", side_effect=Exception("Display error")),
+        patch("hud.utils.telemetry.logger") as mock_logger,
+    ):
+        html_content = stream("https://example.com")
+        # Should still return the HTML content
+        assert html_content is not None
+        assert 'src="https://example.com"' in html_content
+        # Should log the warning
+        mock_logger.warning.assert_called_once()
+        args = mock_logger.warning.call_args[0]
+        assert "Display error" in str(args[0])
+def test_display_screenshot():
+    from hud.utils.telemetry import display_screenshot
+    # This is a simple 1x1 transparent PNG image in base64 format
+    base64_image = (
+        "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8z8BQDwAEhQGAhKmMIQ"
+        "AAABJRU5ErkJggg=="
+    )
+    html_content = display_screenshot(base64_image)
+    assert html_content is not None
+    assert "<div style=" in html_content
+    assert "width: 960px" in html_content
+    assert "height: 540px" in html_content
+    assert f"data:image/png;base64,{base64_image}" in html_content
+    # Test with custom dimensions
+    custom_html = display_screenshot(base64_image, width=800, height=600)
+    assert "width: 800px" in custom_html
+    assert "height: 600px" in custom_html
+    # Test with data URI already included
+    data_uri = f"data:image/png;base64,{base64_image}"
+    uri_html = display_screenshot(data_uri)
+    assert data_uri in uri_html
+def test_display_screenshot_with_exception():
+    """Test display_screenshot when IPython display raises an exception."""
+    from hud.utils.telemetry import display_screenshot
+    base64_image = (
+        "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8z8BQDwAEhQGAhKmMIQ"
+        "AAABJRU5ErkJggg=="
+    )
+    with (
+        patch("IPython.display.display", side_effect=Exception("Display error")),
+        patch("hud.utils.telemetry.logger") as mock_logger,
+    ):
+        html_content = display_screenshot(base64_image)
+        # Should still return the HTML content
+        assert html_content is not None
+        assert f"data:image/png;base64,{base64_image}" in html_content
+        # Should log the warning
+        mock_logger.warning.assert_called_once()
+        args = mock_logger.warning.call_args[0]
+        assert "Display error" in str(args[0])

hud/utils/tests/test_version.py CHANGED Viewed

@@ -1,8 +1,8 @@
-from __future__ import annotations
-def test_import():
-    """Test that the package can be imported."""
-    import hud
-    assert hud.__version__ == "0.4.0"
+from __future__ import annotations
+def test_import():
+    """Test that the package can be imported."""
+    import hud
+    assert hud.__version__ == "0.4.2"

hud/version.py CHANGED Viewed

@@ -1,7 +1,7 @@
-"""
-Version information for the HUD SDK.
-"""
-from __future__ import annotations
-__version__ = "0.4.0"
+"""
+Version information for the HUD SDK.
+"""
+from __future__ import annotations
+__version__ = "0.4.2"

{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: hud-python
-Version: 0.4.0
+Version: 0.4.2
 Summary: SDK for the HUD platform.
 Project-URL: Homepage, https://github.com/hud-evals/hud-python
 Project-URL: Bug Tracker, https://github.com/hud-evals/hud-python/issues
@@ -114,10 +114,10 @@ OSS RL environment + evals toolkit. Wrap software as environments, run benchmark
 ## Highlights
-- 🚀 **[MCP-native connectivity](https://docs.hud.so/core-concepts/mcp-protocol)** – any agent can call any hud environment.
+- 🚀 **[MCP environment skeleton](https://docs.hud.so/core-concepts/mcp-protocol)** – any agent can call any environment.
 - ⚡️ **[Live telemetry](https://app.hud.so)** – inspect every tool call, observation, and reward in real time.
 - 🗂️ **[Public benchmarks](https://app.hud.so/leaderboards)** – OSWorld-Verified, SheetBench-50, and more.
-- 🌱 **[Reinforcement learning built-in](rl/)** – Verifiers gym pipelines for GRPO training.
+- 🌱 **[Reinforcement learning built-in](rl/)** – Verifiers gym pipelines for GRPO on any environment.
 - 🌐 **[Cloud browsers](environments/remote_browser/)** – AnchorBrowser, Steel, BrowserBase integrations for browser automation.
 - 🛠️ **[Hot-reload dev loop](environments/README.md#phase-5-hot-reload-development-with-cursor-agent)** – `hud dev` for iterating on environments without rebuilds.
@@ -129,11 +129,12 @@ OSS RL environment + evals toolkit. Wrap software as environments, run benchmark
 # Core installation - MCP servers, telemetry, basic tools for environment design
 pip install hud-python
-# Agent installation - Adds AI providers, telemetry, datasets
+# Agent installation - Adds AI providers, datasets
 pip install "hud-python[agent]"
 # CLI utilities
 uv tool install hud-python
+# uv tool update-shell
 # From source (latest)
 git clone https://github.com/hud-evals/hud-python
@@ -151,7 +152,7 @@ For a tutorial that explains the agent and evaluation design, run ([see quicksta
 uvx hud-python quickstart
 ```
-Or just write your own agent loop (more [examples here](examples/)):
+Or just write your own agent loop (more [examples here](examples/)).
 ```python
 import asyncio, hud, os
@@ -162,19 +163,20 @@ from hud.datasets import Task  # See docs: https://docs.hud.so/reference/tasks
 async def main() -> None:
     with hud.trace("Quick Start 2048"): # All telemetry works for any MCP-based agent (see https://app.hud.so)
-        task = Task(
-            prompt="Reach 64 in 2048.",
-            mcp_config={
+        task = {
+            "prompt": "Reach 64 in 2048.",
+            "mcp_config": {
                 "hud": {
-                    "url": "https://mcp.hud.so",  # HUD's cloud MCP server (see https://docs.hud.so/core-concepts/architecture)
+                    "url": "https://mcp.hud.so/v3/mcp",  # HUD's cloud MCP server (see https://docs.hud.so/core-concepts/architecture)
                     "headers": {
-                        "Authorization": f"Bearer {os.getenv('HUD_API_KEY')}",  # Get your key at https://app.hud.so
-                        "Mcp-Image": "hudpython/hud-text-2048:v1.1"  # Docker image from https://hub.docker.com/u/hudpython
+                        "Authorization": f"Bearer {settings.api_key}",  # Get your key at https://app.hud.so
+                        "Mcp-Image": "hudpython/hud-text-2048:v1.2"  # Docker image from https://hub.docker.com/u/hudpython
                     }
                 }
             },
-            evaluate_tool={"name": "evaluate", "arguments": {"name": "max_number", "target": 64}},
-        )
+            "evaluate_tool": {"name": "evaluate", "arguments": {"name": "max_number", "arguments": {"target": 64}}},
+        }
+        task = Task(**task)
         # 1. Define the client explicitly:
         client = MCPClient(mcp_config=task.mcp_config)
@@ -189,16 +191,18 @@ async def main() -> None:
         # result = await ClaudeAgent().run(task)
         print(f"Reward: {result.reward}")
-        await client.close()
+        await client.shutdown()
 asyncio.run(main())
 ```
-> Every HUD environment is MCP-based and interactable from anywhere. Requires `HUD_API_KEY` and `ANTHROPIC_API_KEY`.
+The above example let's the agent play 2048 ([See replay](https://app.hud.so/trace/6feed7bd-5f67-4d66-b77f-eb1e3164604f))
+![Agent playing 2048](https://raw.githubusercontent.com/hud-evals/hud-python/main/docs/src/images/2048_1.gif)
 ## Reinforcement Learning with GRPO
-This is a Qwen-2.5-3B agent training a policy on the [`text-2048`](environments/text_2048/) environment using [Verifiers](rl/verifiers/):
+This is a Qwen-2.5-3B agent training a policy on the [`text-2048`](environments/text_2048/) environment (see above) using [Verifiers](rl/README):
 ![RL curve](https://raw.githubusercontent.com/hud-evals/hud-python/main/docs/src/images/rl_2.png)
@@ -206,8 +210,8 @@ To start training, check out the [`rl/README.md`](rl/README.md) folder:
 ```bash
 git clone https://github.com/hud-evals/hud-python
-cd hud-python
-python rl/verifiers/train_2048.py
+cd hud-python/rl
+python train_2048.py
 ```
 Any hud MCP environment and evaluation works with our RL pipeline. Even our remote configurations!
@@ -346,7 +350,7 @@ result = await ClaudeAgent().run({  # See all agents: https://docs.hud.so/refere
     "prompt": "Please explore this environment",
     "mcp_config": {
         "my-environment": {
-            "url": "https://mcp.hud.so",
+            "url": "https://mcp.hud.so/v3/mcp",
             "headers": {
                 "Authorization": f"Bearer {os.getenv('HUD_API_KEY')}",
                 "Mcp-Image": "my-name/my-environment:latest"

hud_python-0.4.2.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,131 @@
+hud/__init__.py,sha256=BjAhZtsHbGN371Q8t3o4v4jltedkmDE85xW0yOILU9g,397
+hud/datasets.py,sha256=3QIZyAdbzlSghE44EIhehWOAoE8CPvLyS40FM2X2a4U,11892
+hud/settings.py,sha256=WIJDsyrfwBZGcaGT46YUOpW8xjBZl3siXXprd92ASAg,2039
+hud/types.py,sha256=pQWOPYXUZ2hhK0h-AHBc3DCj5tkbRXHqKZnsQQIcSFA,4237
+hud/version.py,sha256=npIZLGW0QouBuUp2GO8yLq33HW7-l4Zd9UXWHtiYJos,104
+hud/agents/__init__.py,sha256=UoIkljWdbq4bM0LD-mSaw6w826EqdEjOk7r6glNYwYQ,286
+hud/agents/base.py,sha256=OdvuPMMZFGMft5PEkImjs_nWi-05hJyGJMBSOGbtxBo,22258
+hud/agents/claude.py,sha256=snbYFPW-KAkw4n9Rdz7dC2f46RuSHJKC53HPm8SucFM,14273
+hud/agents/langchain.py,sha256=FTofalIKYZEM7W2AQ1OErk8Jdo47V4tDT7xaiR8RDsA,9129
+hud/agents/openai.py,sha256=kHG73mohO4uru49qmQiygUFt0eDCGJU06weqIUwTO3Y,14323
+hud/agents/openai_chat_generic.py,sha256=jTJ-KY6HkglPK0iwZH5v3PVnaUjDsWc9IbRo3AbXlyE,5322
+hud/agents/misc/__init__.py,sha256=BYi4Ytp9b_vycpZFXnr5Oyw6ncKLNNGml8Jrb7bWUb4,136
+hud/agents/misc/response_agent.py,sha256=qqvRSH-e5NaLXXUFSt3aXZauDE8JlWAabMymrJr9bd4,3036
+hud/agents/tests/__init__.py,sha256=W-O-_4i34d9TTyEHV-O_q1Ai1gLhzwDaaPo02_TWQIY,34
+hud/agents/tests/test_base.py,sha256=F39ajSqASGUbPyPoWSY9KARFav62qNTK74W11Tr1Tg4,28970
+hud/agents/tests/test_claude.py,sha256=wqEKlzEvx8obz1sSm4NY0j-Zyt1qWNfDOmRqYIuAEd0,13069
+hud/agents/tests/test_client.py,sha256=Sk5bGZw2hL5GsVi2LMp9tsLngl5ZQ18pkpeeQmts0ao,13908
+hud/agents/tests/test_openai.py,sha256=VcAUMcmwWttOxy9CCSu8QFIvAHG8ZMLUdQMeP04oK9Q,9026
+hud/cli/__init__.py,sha256=IsP148YyCod5gC-CduIN6MGGCLsITBe-kEtzE4NqbLo,21734
+hud/cli/__main__.py,sha256=fDH7XITyuDITwSDIVwRso06aouADO0CzTHKqp5TOwJE,143
+hud/cli/analyze.py,sha256=G-tjT1xLPLcYhDhZEaI7TAIS0z0OACUksnGFoAWd2ag,14416
+hud/cli/analyze_metadata.py,sha256=Mgs_je-XbPulG6noRLRNXe3_3a1eb20Cvxz5OQJ2NeU,8262
+hud/cli/build.py,sha256=4wMigENf6dpL9Eu0wN9SvgGWMHIh85IEJ1WKuNyVrfs,14263
+hud/cli/clone.py,sha256=AwVDIuhr8mHb1oT2Af2HrD25SiTdwATpE6zd93vzLgA,6099
+hud/cli/cursor.py,sha256=fy850p0rVp5k_1wwOCI7rK1SggbselJrywFInSQ2gio,3009
+hud/cli/debug.py,sha256=pa24bP4KVE0vdvrODuN57i2t8YDHxKJgwzXy7eD2tBE,13613
+hud/cli/docker_utils.py,sha256=5k5sXtI4V5d4VWRJR6lzVRy_Hu8Wf1nLsmW-dBNW0cM,2695
+hud/cli/init.py,sha256=wbGfKx-A17mSYw1aubRT3Ggt12A3PIkvZL6aW0AxoxU,7780
+hud/cli/interactive.py,sha256=w1fAoefizNKqjcl5Fi5EgEsUdPpXKcCFuU-Z-S3CL9o,12863
+hud/cli/mcp_server.py,sha256=ZdJA8M8DtLvda4xQOQ0MuEOTvRR8_ZEIaIW-Qs8DfZ0,29609
+hud/cli/pull.py,sha256=SmbaHXaDKgazovYbw4we1og1qtT-B4opEjiDOlaNZcs,11939
+hud/cli/push.py,sha256=Cbjiy0AAcvgFcatAz3H2t3IhxsHMbLlc0WcdQwXe9V0,14163
+hud/cli/remote_runner.py,sha256=X01x6DeVkyc9HgxVCGEZJxEhhVPvHpAMoeYR44R8_BQ,9405
+hud/cli/runner.py,sha256=ukEr6ZmD5rs-taoEBu0P_-hr275d-ZE5_WAR-dvSqrw,4888
+hud/cli/utils.py,sha256=ZgjjKVPAa7dcfJ6SMBrdfZ63d1UnnhYC-zeh7gFBXsI,8841
+hud/cli/tests/__init__.py,sha256=ZrGVkmH7DHXGqOvjOSNGZeMYaFIRB2K8c6hwr8FPJ-8,68
+hud/cli/tests/test_analyze.py,sha256=1VGIjpvZXD6N4j2yRoVddug2jQ6tJn41NWw-ScAVztw,10971
+hud/cli/tests/test_cli_init.py,sha256=_H0bAn5_skJ91Zj8P5P_wtZoPWvrN7jMhPZvmnnf0n8,11289
+hud/cli/tests/test_cli_main.py,sha256=0wMho9p9NcGjp0jLiUtCQh_FYdbMaCJtSY3sBbSgPwA,697
+hud/cli/tests/test_clone.py,sha256=oC2mf-41QQVc7ODJkjrWbVPNMB2fDW3nZ6jY6w93gvQ,4458
+hud/cli/tests/test_cursor.py,sha256=cvQ6dudMGmY4LifaJKm9iRIRvqvbFwibZgowd5goWPY,9815
+hud/cli/tests/test_debug.py,sha256=FPKWeKgOSBXoMyRphb0Q52QiJSNbGAS40f9r3ZVSMBE,18028
+hud/cli/tests/test_mcp_server.py,sha256=e5fh6AUcqdv0jp0rJ8VL-DdJ-1nNgS85N8Ua53ehdgo,4378
+hud/cli/tests/test_utils.py,sha256=dKmHgyLtDEqKVXlvs5tyNHyHhpBlZHUpmJF-iUraBVM,13466
+hud/clients/README.md,sha256=XNE3mch95ozDgVqfwCGcrhlHY9CwT1GKfNANNboowto,3826
+hud/clients/__init__.py,sha256=bcPIa7dwH5ENsjh7CzjsJ84fm7Ma93NBc2lGfSjGAKM,328
+hud/clients/base.py,sha256=vm8pQS7lwbfhOUyZsti94yzig6dcWIa6NOO3wwhl39w,13497
+hud/clients/fastmcp.py,sha256=kpVwgyltQB_gCeoD0kU9HYC1RHELaib-675qPztwfRg,8125
+hud/clients/mcp_use.py,sha256=G7jnfsFvGgye-LxyEMobgL47wxZ-Id1aq_5AQLuEaBE,11024
+hud/clients/tests/__init__.py,sha256=sKOtJFFa4mDIXh1U6O8ZUHjigE8CiRMQ2PzJTIBZuVE,33
+hud/clients/tests/test_client_integration.py,sha256=kohU6jfCNfwSnAushHeB1_CmDlRfQc7VBL0GEdJYSeI,4198
+hud/clients/tests/test_fastmcp.py,sha256=4q3TzDjuieTZa89taiNJIrzbUncNkYOG4MaubypA21k,13030
+hud/clients/tests/test_protocol.py,sha256=aK4CS4g3j1D5jPo83ykzZuHUvcZFAulYtIq9T9Hb_fQ,6640
+hud/clients/utils/__init__.py,sha256=ucYJqOVpEsN-D9OFE2YTNLG628MgxcZAzfYhnbzx02k,32
+hud/clients/utils/retry_transport.py,sha256=-DyiXTtNBqHMg6Xb340q0wTyYv6qVPQv1zyJskD4JrE,5358
+hud/misc/__init__.py,sha256=m_pprQQ-G-Y0Sd0NEiR8MtAMbElnuFZ2OWT8TXrw7c4,43
+hud/misc/claude_plays_pokemon.py,sha256=IthAkjDVr2Q-GNvX-QLJyMzN7-0pHqqJbagGNv2m7yo,10453
+hud/otel/__init__.py,sha256=ii17ayoWiS5vAhA7UAmZ8TkmP52gs2pWyHsD46-uYbE,1003
+hud/otel/collector.py,sha256=jLZymZ8r7xt2VDuWexfbnT7PY1-0aiyLMgjBy8KDY1M,4497
+hud/otel/config.py,sha256=6np_C2UXhtKHHjY41HQxZElua2Eh_EUCBiRB_YuiSuc,6249
+hud/otel/context.py,sha256=C9MvO99cRSNNDEDC7ehO3eoTPnb6J7AemUYvEp57yEU,17774
+hud/otel/exporters.py,sha256=TP7SF6ySCP-gFV1i-u5-HbpYsK3n9GP3OjW_ZBfsj-w,14246
+hud/otel/instrumentation.py,sha256=ieKHEnMMSMZxPYvZokYJG-UQYXTNyEnaYG1lGY4zIHA,3575
+hud/otel/processors.py,sha256=yI5BWsDBMEPfwMzD-iWbJd4KWH3qUDSe-5-C1yT6fjU,4615
+hud/otel/tests/__init__.py,sha256=VNJKBMaxTtbn7trW-1Ph50zCvCok_wTSGcI1HD6GOLA,43
+hud/otel/tests/test_processors.py,sha256=np0R4ssd9j6LJSJykJ5bNjl0POwNYNhgb7BqOZHwcMY,6778
+hud/server/__init__.py,sha256=8LUwgsXO8xiViWP7uImDwcOsWLu01r5F4r8U8qH3rSY,91
+hud/server/context.py,sha256=6bCdSzv1FGyItu9472HbbYef279H7QuMGJDR8EtYg5Y,3210
+hud/server/low_level.py,sha256=XYs2pOJ9kN4OcJ6ahDmXM5mWkzq5wJLpKFInUYrWEok,4701
+hud/server/server.py,sha256=3IfYyxVfdlh-mVSiBqDQSkWM2gH8NoPjrULvOSW-VI0,6598
+hud/server/helper/__init__.py,sha256=ZxO8VP3RZEBBp-q65VixuhzQgqEPSVzW0hEY9J9QqDA,116
+hud/server/tests/__init__.py,sha256=eEYYkxX5Hz9woXVOBJ2H2_CQoEih0vH6nRt3sH2Z8v8,49
+hud/shared/__init__.py,sha256=IPxPCqtPLguryN-nBq78Sakypw2bRiE2iHv3SXG8YRk,139
+hud/shared/exceptions.py,sha256=Xna_pdEK_ESwkcffsRmT5GXq4xSHLV5cu7Qu3MjstSE,5516
+hud/shared/requests.py,sha256=og2jEbBHCebrg4kiBShunWKMaxQSaO2V7SHU5HPslHg,8848
+hud/shared/tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+hud/shared/tests/test_exceptions.py,sha256=7lzEYHblbKguXHJPyy7J6dUsPFrufos6H5Cliopy6TM,5315
+hud/shared/tests/test_requests.py,sha256=nKFcSN1sjrOouVU2xik9lE5Wxapy3EWsO8iIXrM_Sts,9114
+hud/telemetry/__init__.py,sha256=pPqkq4XekqJEkzwoCwGHGAv1NcytZ55yIB1aLxBpo6U,663
+hud/telemetry/instrument.py,sha256=m3u6YK02PTk39Jr4L3se7l-cYyKx0maCaqf5Z5JqWNA,14096
+hud/telemetry/job.py,sha256=DSZU_yVpag4VOGkCC5egcjVYuZ02nuzMqFZCgJqcQvM,9998
+hud/telemetry/replay.py,sha256=YW17s314s5Wy6Rl8MXHqg1FU8EF9_XcHBMJI0rrkyS4,2306
+hud/telemetry/trace.py,sha256=gem9pcioNI71hLs18vNidv-7KAZBJAn35stjVvOu_Ic,2208
+hud/tools/__init__.py,sha256=f7M3MkPEgoUsNPanLBUJKA_Y3a30arPf5bHdIwyXQZU,905
+hud/tools/base.py,sha256=avk6dLHEmlOMfozTzga4SbjCuAN0n5zyLwIn6OfLN60,14984
+hud/tools/bash.py,sha256=LJViMGb3lTGBm_gequVVTM7ySh1Xh9bOOIZXU29Lmrw,5209
+hud/tools/edit.py,sha256=N0AYFXp07-vAJy2li7lvHOL6hfgJOU4LL3iLSZrbRWU,12745
+hud/tools/playwright.py,sha256=lF7NxyEu8YbB7tpmCoTf8p9HxIrejahC67x3Xs0Jjb4,15007
+hud/tools/types.py,sha256=g-CWnUUDSxxIfUy54S1bpY1nfTzdYO1R_nPKYReABjQ,2734
+hud/tools/utils.py,sha256=bfVyYMcBOJvr1QdptCjVb6jaHVGIL5WUxmY59kzMekQ,1447
+hud/tools/computer/__init__.py,sha256=3tQBXPtGX0WPCwFXzEs3-duwg0rPEgj_0-K7aHskeQE,367
+hud/tools/computer/anthropic.py,sha256=oJfNMnjNFAn9mW1xY1nbWnTY2IqwFqdDR0mWSf8lu-s,17352
+hud/tools/computer/hud.py,sha256=kleQcW1qaBqQGC5iNK-0wOUHiCWvMSxKZNR4FEOPJg4,16240
+hud/tools/computer/openai.py,sha256=QEsF45LWOHftDrAoIOnCFZZT1cL--s-ArSov5aluWb8,11189
+hud/tools/computer/settings.py,sha256=b1XJsEQjB9qhN1xHfVENATkzinEebe0ZPyLzMgCGkKY,2763
+hud/tools/executors/__init__.py,sha256=jHxfus9SLhkL6YGtebR5RyKYyVAix3yu5EkUp2Q27Kg,732
+hud/tools/executors/base.py,sha256=VP2SiIEBSXvklnkasGxVuy-OmDMd9rjuxZh_YuUQH7A,14481
+hud/tools/executors/pyautogui.py,sha256=11eUQJAgFmHxwd9INAb2L9tgBmEv2Vgn0cwhwvGKlC8,22361
+hud/tools/executors/xdo.py,sha256=vc3ciSojmJ58HoL1VC2MC-F_KFrk4_YQHmoJp4rgv1k,18136
+hud/tools/executors/tests/__init__.py,sha256=opFpGSH6cEqIZgt9izXd3Yt85pC7xkxiYmOZQTHf4AY,32
+hud/tools/executors/tests/test_base_executor.py,sha256=toINFwhKyjWrsiOKpIOcCwUo_sUkuukycNcNHfXBOfo,12468
+hud/tools/executors/tests/test_pyautogui_executor.py,sha256=Shv6pnWtlsMXBMlN5DjlttCu6rZ1H447d1QZumduOnU,6640
+hud/tools/tests/__init__.py,sha256=eEYYkxX5Hz9woXVOBJ2H2_CQoEih0vH6nRt3sH2Z8v8,49
+hud/tools/tests/test_base.py,sha256=m6EelJ47F_hMqvRjrr6vEdiW1AtLgz3ZH1V1IUzTxzI,8983
+hud/tools/tests/test_bash.py,sha256=-g9a6sYgKKXRXmqYGYQBgpKEF_OlKE_uDDQXYMx6rT0,5113
+hud/tools/tests/test_bash_extended.py,sha256=G1pgl2e7_7ILYYS2FE6pTwI3_IPzmkPjBjGnxMGwGq8,7000
+hud/tools/tests/test_computer.py,sha256=BmrX2PV3wzHC4-xPJnWvenDV_kWt8LF8ia0kELBgHho,16394
+hud/tools/tests/test_computer_actions.py,sha256=YtUNFL7anhpXrcvg8EoUY1CqIV-TAAyaNFLZO9CiJ40,1194
+hud/tools/tests/test_edit.py,sha256=pHw1MSs-P8mDKrwKUDW77vQfoMNwmbrEBt_MkKr2rE0,9734
+hud/tools/tests/test_init.py,sha256=fl4Tf4IUUFOKhdSRHu9GE4mkaTDiXw-2auxj4s84HuE,698
+hud/tools/tests/test_playwright_tool.py,sha256=0va9IuZ7P5vXZDzan_sn-89ahu3piQMQDaiREzEvXNc,6736
+hud/tools/tests/test_tools.py,sha256=paz28V98Am-oR7MBJPDgY-BRV14HQo_0F6X5JIC8aic,4563
+hud/tools/tests/test_utils.py,sha256=oYxEnLpSA5sEeYFGUTj74QRNv0AHP3AjmYYHXgIW0BY,5496
+hud/utils/__init__.py,sha256=ckuIzwqgTxkzASa04XTPsOu_TqsRYUKBWUYfcSi3Xnc,164
+hud/utils/async_utils.py,sha256=5cKrJcnaHV2eJNxeyx0r7fPcdPTDBK7kM9-nLaF51X4,2409
+hud/utils/design.py,sha256=JZu4Fgfr_sOpH90oi1pu__woV56jPutCKsKAcmkHsUc,4987
+hud/utils/mcp.py,sha256=0r9_ffRObfAb6Zx6PRDJP6ibOTewOsQxJU0K-6JPveM,1847
+hud/utils/progress.py,sha256=suikwFM8sdSfkV10nAOEaInDhG4XKgOSvFePg4jSj1A,5927
+hud/utils/telemetry.py,sha256=hrVIx2rUjSGyy9IVxTZ_3Jii83PiHjyFRd5ls2whimM,1863
+hud/utils/tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+hud/utils/tests/test_async_utils.py,sha256=RkdSnYErRV3Jn7dfg6CPlcE1RSUL__2B627oIqAyy1s,5945
+hud/utils/tests/test_init.py,sha256=2QLQSGgyP9wJhOvPCusm_zjJad0qApOZi1BXpxcdHXQ,383
+hud/utils/tests/test_progress.py,sha256=QSF7Kpi03Ff_l3mAeqW9qs1nhK50j9vBiSobZq7T4f4,7394
+hud/utils/tests/test_telemetry.py,sha256=5jl7bEx8C8b-FfFUko5pf4UY-mPOR-9HaeL98dGtVHM,2781
+hud/utils/tests/test_version.py,sha256=jy8VM-qboqR_TWjmFy3hCw93dCZsguyIgBsqNmUtzM4,159
+hud/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+hud_python-0.4.2.dist-info/METADATA,sha256=fTLXYCnwj5LOHUKjMeKQmmRFJ2BgWYCrcPBWD4c2Fng,19675
+hud_python-0.4.2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+hud_python-0.4.2.dist-info/entry_points.txt,sha256=jJbodNFg1m0-CDofe5AHvB4zKBq7sSdP97-ohaQ3ae4,63
+hud_python-0.4.2.dist-info/licenses/LICENSE,sha256=yIzBheVUf86FC1bztAcr7RYWWNxyd3B-UJQ3uddg1HA,1078
+hud_python-0.4.2.dist-info/RECORD,,

{hud_python-0.4.0.dist-info → hud_python-0.4.2.dist-info}/licenses/LICENSE RENAMED Viewed

@@ -1,21 +1,21 @@
-MIT License
-Copyright (c) 2025 Human Union Data, Inc
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-The above copyright notice and this permission notice shall be included in all
-copies or substantial portions of the Software.
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-SOFTWARE.
+MIT License
+Copyright (c) 2025 Human Union Data, Inc
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

hud/agents/art.py DELETED Viewed

@@ -1,101 +0,0 @@
-"""Adapter that plugs a *Trainable* ART model into the HUD MCPAgent stack.
-This extends GenericOpenAIChatAgent to collect messages_and_choices during
-execution for ART training.
-"""
-from __future__ import annotations
-import logging
-from typing import TYPE_CHECKING, Any
-import hud
-from .openai_chat_generic import GenericOpenAIChatAgent
-if TYPE_CHECKING:
-    import mcp.types as types
-    from hud.clients import AgentMCPClient
-    from hud.types import AgentResponse
-logger = logging.getLogger(__name__)
-system_prompt = (
-    "You are an MCP (Model Context Protocol) agent.\n\n"
-    "Use MCP tools through the server to complete your task.\n\n"
-    "You have a total of {MAX_STEPS} steps."
-)
-class ArtHUDAgent(GenericOpenAIChatAgent):
-    """Use an ART *TrainableModel* as the LLM behind a HUD `MCPAgent`.
-    This agent collects messages_and_choices during execution for ART training.
-    """
-    def __init__(self, art_model: Any, mcp_client: AgentMCPClient, **agent_kwargs: Any) -> None:
-        # Use ART's openai_client() method to get proper timeouts and patching
-        openai_client = art_model.openai_client()
-        super().__init__(
-            mcp_client=mcp_client,
-            openai_client=openai_client,
-            model_name=art_model.get_inference_name(),
-            logprobs=True,
-            **agent_kwargs,
-        )
-        self.system_prompt = system_prompt
-        self.art_model = art_model
-        self.messages_and_choices: list[Any] = []  # Collect for ART training
-        logger.info(
-            "ArtHUDAgent initialised with model '%s' (project=%s)",
-            art_model.name,
-            getattr(art_model, "project", "unknown"),
-        )
-    async def get_system_messages(self) -> list[Any]:
-        """Get system messages for ART."""
-        messages = await super().get_system_messages()
-        # Store initial messages as dicts for ART
-        self.messages_and_choices.extend(messages)
-        return messages
-    async def format_blocks(self, blocks: list[types.ContentBlock]) -> list[Any]:
-        """Format blocks for ART."""
-        messages = await super().format_blocks(blocks)
-        # Store initial messages as dicts for ART
-        self.messages_and_choices.extend(messages)
-        return messages
-    @hud.instrument(
-        span_type="agent",
-        record_args=False,  # Messages can be large
-        record_result=True,
-    )
-    async def get_response(self, messages: list[Any]) -> AgentResponse:
-        """Get model response and store the Choice for ART."""
-        # Call parent's get_model_response
-        result = await super().get_response(messages)
-        # Extract and store the Choice from the raw response
-        if result.raw and hasattr(result.raw, "choices") and result.raw.choices:
-            choice = result.raw.choices[0]
-            # Ensure the message has content (required for ART tokenization)
-            if choice.message and choice.message.content is None:
-                choice.message.content = ""
-            self.messages_and_choices.append(choice)
-        return result
-    async def format_tool_results(
-        self, tool_calls: list[Any], tool_results: list[Any]
-    ) -> list[Any]:
-        """Format tool results and store them for ART."""
-        tool_messages = await super().format_tool_results(tool_calls, tool_results)
-        # Store tool messages for ART
-        self.messages_and_choices.extend(tool_messages)
-        return tool_messages

hud-python 0.4.0__py3-none-any.whl → 0.4.2__py3-none-any.whl

Potentially problematic release.

hud-python 0.4.0__py3-none-any.whl → 0.4.2__py3-none-any.whl