PyPI - hud-python - Versions diffs - 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl - Mend

hud-python 0.4.1py3-none-any.whl → 0.4.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (130) hide show

hud/__init__.py +22 -22
hud/agents/__init__.py +13 -15
hud/agents/base.py +599 -599
hud/agents/claude.py +373 -373
hud/agents/langchain.py +261 -250
hud/agents/misc/__init__.py +7 -7
hud/agents/misc/response_agent.py +82 -80
hud/agents/openai.py +352 -352
hud/agents/openai_chat_generic.py +154 -154
hud/agents/tests/__init__.py +1 -1
hud/agents/tests/test_base.py +742 -742
hud/agents/tests/test_claude.py +324 -324
hud/agents/tests/test_client.py +363 -363
hud/agents/tests/test_openai.py +237 -237
hud/cli/__init__.py +617 -617
hud/cli/__main__.py +8 -8
hud/cli/analyze.py +371 -371
hud/cli/analyze_metadata.py +230 -230
hud/cli/build.py +498 -427
hud/cli/clone.py +185 -185
hud/cli/cursor.py +92 -92
hud/cli/debug.py +392 -392
hud/cli/docker_utils.py +83 -83
hud/cli/init.py +280 -281
hud/cli/interactive.py +353 -353
hud/cli/mcp_server.py +764 -756
hud/cli/pull.py +330 -336
hud/cli/push.py +404 -370
hud/cli/remote_runner.py +311 -311
hud/cli/runner.py +160 -160
hud/cli/tests/__init__.py +3 -3
hud/cli/tests/test_analyze.py +284 -284
hud/cli/tests/test_cli_init.py +265 -265
hud/cli/tests/test_cli_main.py +27 -27
hud/cli/tests/test_clone.py +142 -142
hud/cli/tests/test_cursor.py +253 -253
hud/cli/tests/test_debug.py +453 -453
hud/cli/tests/test_mcp_server.py +139 -139
hud/cli/tests/test_utils.py +388 -388
hud/cli/utils.py +263 -263
hud/clients/README.md +143 -143
hud/clients/__init__.py +16 -16
hud/clients/base.py +378 -379
hud/clients/fastmcp.py +222 -222
hud/clients/mcp_use.py +298 -278
hud/clients/tests/__init__.py +1 -1
hud/clients/tests/test_client_integration.py +111 -111
hud/clients/tests/test_fastmcp.py +342 -342
hud/clients/tests/test_protocol.py +188 -188
hud/clients/utils/__init__.py +1 -1
hud/clients/utils/retry_transport.py +160 -160
hud/datasets.py +327 -322
hud/misc/__init__.py +1 -1
hud/misc/claude_plays_pokemon.py +292 -292
hud/otel/__init__.py +35 -35
hud/otel/collector.py +142 -142
hud/otel/config.py +164 -164
hud/otel/context.py +536 -536
hud/otel/exporters.py +366 -366
hud/otel/instrumentation.py +97 -97
hud/otel/processors.py +118 -118
hud/otel/tests/__init__.py +1 -1
hud/otel/tests/test_processors.py +197 -197
hud/server/__init__.py +5 -5
hud/server/context.py +114 -114
hud/server/helper/__init__.py +5 -5
hud/server/low_level.py +132 -132
hud/server/server.py +170 -166
hud/server/tests/__init__.py +3 -3
hud/settings.py +73 -73
hud/shared/__init__.py +5 -5
hud/shared/exceptions.py +180 -180
hud/shared/requests.py +264 -264
hud/shared/tests/test_exceptions.py +157 -157
hud/shared/tests/test_requests.py +275 -275
hud/telemetry/__init__.py +25 -25
hud/telemetry/instrument.py +379 -379
hud/telemetry/job.py +309 -309
hud/telemetry/replay.py +74 -74
hud/telemetry/trace.py +83 -83
hud/tools/__init__.py +33 -33
hud/tools/base.py +365 -365
hud/tools/bash.py +161 -161
hud/tools/computer/__init__.py +15 -15
hud/tools/computer/anthropic.py +437 -437
hud/tools/computer/hud.py +376 -376
hud/tools/computer/openai.py +295 -295
hud/tools/computer/settings.py +82 -82
hud/tools/edit.py +314 -314
hud/tools/executors/__init__.py +30 -30
hud/tools/executors/base.py +539 -539
hud/tools/executors/pyautogui.py +621 -621
hud/tools/executors/tests/__init__.py +1 -1
hud/tools/executors/tests/test_base_executor.py +338 -338
hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
hud/tools/executors/xdo.py +511 -511
hud/tools/playwright.py +412 -412
hud/tools/tests/__init__.py +3 -3
hud/tools/tests/test_base.py +282 -282
hud/tools/tests/test_bash.py +158 -158
hud/tools/tests/test_bash_extended.py +197 -197
hud/tools/tests/test_computer.py +425 -425
hud/tools/tests/test_computer_actions.py +34 -34
hud/tools/tests/test_edit.py +259 -259
hud/tools/tests/test_init.py +27 -27
hud/tools/tests/test_playwright_tool.py +183 -183
hud/tools/tests/test_tools.py +145 -145
hud/tools/tests/test_utils.py +156 -156
hud/tools/types.py +72 -72
hud/tools/utils.py +50 -50
hud/types.py +136 -136
hud/utils/__init__.py +10 -10
hud/utils/async_utils.py +65 -65
hud/utils/design.py +236 -168
hud/utils/mcp.py +55 -55
hud/utils/progress.py +149 -149
hud/utils/telemetry.py +66 -66
hud/utils/tests/test_async_utils.py +173 -173
hud/utils/tests/test_init.py +17 -17
hud/utils/tests/test_progress.py +261 -261
hud/utils/tests/test_telemetry.py +82 -82
hud/utils/tests/test_version.py +8 -8
hud/version.py +7 -7
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/METADATA +10 -8
hud_python-0.4.3.dist-info/RECORD +131 -0
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/licenses/LICENSE +21 -21
hud/agents/art.py +0 -101
hud_python-0.4.1.dist-info/RECORD +0 -132
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/WHEEL +0 -0
{hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/entry_points.txt +0 -0

hud/agents/tests/test_claude.py CHANGED Viewed

@@ -1,324 +1,324 @@
-"""Tests for Claude MCP Agent implementation."""
-from __future__ import annotations
-from typing import TYPE_CHECKING, cast
-from unittest.mock import AsyncMock, MagicMock, patch
-import pytest
-from anthropic import BadRequestError
-from mcp import types
-from hud.agents.claude import (
-    ClaudeAgent,
-    base64_to_content_block,
-    text_to_content_block,
-    tool_use_content_block,
-)
-from hud.types import MCPToolCall, MCPToolResult
-if TYPE_CHECKING:
-    from anthropic.types.beta import BetaImageBlockParam, BetaMessageParam, BetaTextBlockParam
-class TestClaudeHelperFunctions:
-    """Test helper functions for Claude message formatting."""
-    def test_base64_to_content_block(self):
-        """Test base64 image conversion."""
-        base64_data = "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNkYPhfDwAChwGA60e6kgAAAABJRU5ErkJggg=="  # noqa: E501
-        result = base64_to_content_block(base64_data)
-        assert result["type"] == "image"
-        assert result["source"]["type"] == "base64"
-        assert result["source"]["media_type"] == "image/png"
-        assert result["source"]["data"] == base64_data
-    def test_text_to_content_block(self):
-        """Test text conversion."""
-        text = "Hello, world!"
-        result = text_to_content_block(text)
-        assert result["type"] == "text"
-        assert result["text"] == text
-    def test_tool_use_content_block(self):
-        """Test tool result content block creation."""
-        tool_use_id = "tool_123"
-        content: list[BetaTextBlockParam | BetaImageBlockParam] = [
-            text_to_content_block("Result text")
-        ]
-        result = tool_use_content_block(tool_use_id, content)
-        assert result["type"] == "tool_result"
-        assert result["tool_use_id"] == tool_use_id
-        assert result["content"] == content  # type: ignore
-class TestClaudeAgent:
-    """Test ClaudeAgent class."""
-    @pytest.fixture
-    def mock_mcp_client(self):
-        """Create a mock MCP client."""
-        mcp_client = MagicMock()
-        return mcp_client
-    @pytest.fixture
-    def mock_anthropic(self):
-        """Create a mock Anthropic client."""
-        with patch("hud.agents.claude.AsyncAnthropic") as mock:
-            client = AsyncMock()
-            # Add beta attribute with messages
-            client.beta = AsyncMock()
-            client.beta.messages = AsyncMock()
-            mock.return_value = client
-            yield client
-    @pytest.mark.asyncio
-    async def test_init(self, mock_mcp_client, mock_anthropic):
-        """Test agent initialization."""
-        # Test with provided model_client
-        mock_model_client = MagicMock()
-        agent = ClaudeAgent(
-            mcp_client=mock_mcp_client,
-            model_client=mock_model_client,
-            model="claude-3-opus-20240229",
-            max_tokens=1000,
-        )
-        assert agent.model_name == "claude-3-opus-20240229"
-        assert agent.max_tokens == 1000
-        assert agent.anthropic_client == mock_model_client
-    @pytest.mark.asyncio
-    async def test_init_without_model_client(self, mock_mcp_client):
-        """Test agent initialization without model client."""
-        with patch("hud.settings.settings.anthropic_api_key", "test_key"):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model="claude-3-opus-20240229")
-            assert agent.model_name == "claude-3-opus-20240229"
-            assert agent.anthropic_client is not None
-    @pytest.mark.asyncio
-    async def test_format_blocks(self, mock_mcp_client):
-        """Test formatting content blocks into Claude messages."""
-        mock_model_client = MagicMock()
-        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
-        # Test with text only
-        text_blocks: list[types.ContentBlock] = [
-            types.TextContent(type="text", text="Hello, Claude!")
-        ]
-        messages = await agent.format_blocks(text_blocks)
-        assert len(messages) == 1
-        assert messages[0]["role"] == "user"
-        content = messages[0]["content"]
-        assert isinstance(content, list)
-        assert len(content) == 1
-        assert content[0]["type"] == "text"
-        assert content[0]["text"] == "Hello, Claude!"
-        # Test with screenshot
-        image_blocks: list[types.ContentBlock] = [
-            types.TextContent(type="text", text="Look at this"),
-            types.ImageContent(type="image", data="base64data", mimeType="image/png"),
-        ]
-        messages = await agent.format_blocks(image_blocks)
-        assert len(messages) == 1
-        assert messages[0]["role"] == "user"
-        content = messages[0]["content"]
-        assert isinstance(content, list)
-        assert len(content) == 2
-        # Content blocks are in order
-        assert content[0]["type"] == "text"
-        assert content[0]["text"] == "Look at this"
-        assert content[1]["type"] == "image"
-        assert content[1]["source"]["data"] == "base64data"
-    @pytest.mark.asyncio
-    async def test_format_tool_results_method(self, mock_mcp_client):
-        """Test the agent's format_tool_results method."""
-        mock_model_client = MagicMock()
-        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
-        tool_calls = [
-            MCPToolCall(name="test_tool", arguments={}, id="id1"),
-        ]
-        tool_results = [
-            MCPToolResult(content=[types.TextContent(type="text", text="Success")], isError=False),
-        ]
-        messages = await agent.format_tool_results(tool_calls, tool_results)
-        # format_tool_results returns a single user message with tool result content
-        assert len(messages) == 1
-        assert messages[0]["role"] == "user"
-        # The content is wrapped in a tool result block
-        content = list(messages[0]["content"])
-        assert len(content) == 1
-        assert content[0]["type"] == "tool_result"  # type: ignore
-        assert content[0]["tool_use_id"] == "id1"  # type: ignore
-        # The actual content is nested inside
-        inner_content = list(content[0]["content"])  # type: ignore
-        assert inner_content[0]["type"] == "text"  # type: ignore
-        assert inner_content[0]["text"] == "Success"  # type: ignore
-    @pytest.mark.asyncio
-    async def test_get_response(self, mock_mcp_client, mock_anthropic):
-        """Test getting model response from Claude API."""
-        # Disable telemetry for this test to avoid backend configuration issues
-        with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
-            # Mock the API response
-            mock_response = MagicMock()
-            # Create text block
-            text_block = MagicMock()
-            text_block.type = "text"
-            text_block.text = "Hello!"
-            # Create tool use block
-            tool_block = MagicMock()
-            tool_block.type = "tool_use"
-            tool_block.id = "tool_123"
-            tool_block.name = "test_tool"
-            tool_block.input = {"param": "value"}
-            mock_response.content = [text_block, tool_block]
-            mock_response.usage = MagicMock(input_tokens=10, output_tokens=20)
-            mock_anthropic.beta.messages.create = AsyncMock(return_value=mock_response)
-            messages = [
-                cast(
-                    "BetaMessageParam",
-                    {"role": "user", "content": [{"type": "text", "text": "Hi"}]},
-                )
-            ]
-            response = await agent.get_response(messages)
-            assert response.content == "Hello!"
-            assert len(response.tool_calls) == 1
-            assert response.tool_calls[0].name == "test_tool"
-            assert response.tool_calls[0].arguments == {"param": "value"}
-            # The test was checking for Claude-specific attributes that aren't part of ModelResponse
-            # These would need to be accessed from the original Claude response if needed
-            # Verify API was called correctly
-            mock_anthropic.beta.messages.create.assert_called_once()
-    @pytest.mark.asyncio
-    async def test_get_model_response_text_only(self, mock_mcp_client, mock_anthropic):
-        """Test getting text-only response."""
-        # Disable telemetry for this test to avoid backend configuration issues
-        with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
-            mock_response = MagicMock()
-            # Create text block
-            text_block = MagicMock()
-            text_block.type = "text"
-            text_block.text = "Just text"
-            mock_response.content = [text_block]
-            mock_response.usage = MagicMock(input_tokens=5, output_tokens=10)
-            mock_anthropic.beta.messages.create = AsyncMock(return_value=mock_response)
-            messages = [
-                cast(
-                    "BetaMessageParam",
-                    {"role": "user", "content": [{"type": "text", "text": "Hi"}]},
-                )
-            ]
-            response = await agent.get_response(messages)
-            assert response.content == "Just text"
-            assert response.tool_calls == []
-    @pytest.mark.asyncio
-    async def test_get_model_response_error(self, mock_mcp_client, mock_anthropic):
-        """Test handling API errors."""
-        # Disable telemetry for this test to avoid backend configuration issues
-        with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
-            # Mock API error
-            mock_anthropic.beta.messages.create = AsyncMock(
-                side_effect=BadRequestError(
-                    message="Invalid request",
-                    response=MagicMock(status_code=400),
-                    body={"error": {"message": "Invalid request"}},
-                )
-            )
-            messages = [{"role": "user", "content": [{"type": "text", "text": "Hi"}]}]
-            with pytest.raises(BadRequestError):
-                await agent.get_response(messages)  # type: ignore
-    # This test is commented out as it's testing complex integration scenarios
-    # that may have changed in the implementation
-    # @pytest.mark.asyncio
-    # async def test_run_with_tools(self, mock_mcp_client, mock_anthropic):
-    #     """Test running agent with tool usage."""
-    #     # Disable telemetry for this test to avoid backend configuration issues
-    #     with patch("hud.settings.settings.telemetry_enabled", False):
-    #         agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
-    #         # Mock tool availability
-    #         agent._available_tools = [
-    #             types.Tool(
-    #                 name="calculator", description="Calculator", inputSchema={"type": "object"}
-    #             )
-    #         ]
-    #         agent._tool_map = {
-    #             "calculator": types.Tool(
-    #                 name="calculator", description="Calculator", inputSchema={"type": "object"}
-    #             )
-    #         }
-    #         # Mock initial response with tool use
-    #         initial_response = MagicMock()
-    #         # Create tool use block
-    #         tool_block = MagicMock()
-    #         tool_block.type = "tool_use"
-    #         tool_block.id = "calc_123"
-    #         tool_block.name = "calculator"
-    #         tool_block.input = {"operation": "add", "a": 2, "b": 3}
-    #         initial_response.content = [tool_block]
-    #         initial_response.usage = MagicMock(input_tokens=10, output_tokens=15)
-    #         # Mock follow-up response
-    #         final_response = MagicMock()
-    #         text_block = MagicMock()
-    #         text_block.type = "text"
-    #         text_block.text = "2 + 3 = 5"
-    #         final_response.content = [text_block]
-    #         final_response.usage = MagicMock(input_tokens=20, output_tokens=10)
-    #         mock_anthropic.beta.messages.create = AsyncMock(
-    #             side_effect=[initial_response, final_response]
-    #         )
-    #         # Mock tool execution
-    #         mock_mcp_client.call_tool = AsyncMock(
-    #             return_value=MCPToolResult(
-    #                 content=[types.TextContent(type="text", text="5")], isError=False
-    #             )
-    #         )
-    #         # Mock the mcp_client properties
-    #         mock_mcp_client.mcp_config = {"test_server": {"url": "http://localhost"}}
-    #         mock_mcp_client.list_tools = AsyncMock(return_value=agent._available_tools)
-    #         mock_mcp_client.initialize = AsyncMock()
-    #         # Initialize the agent
-    #         await agent.initialize()
-    #         # Use a string prompt instead of a task
-    #         result = await agent.run("What is 2 + 3?")
-    #         assert result.content == "2 + 3 = 5"
-    #         assert result.done is True
+"""Tests for Claude MCP Agent implementation."""
+from __future__ import annotations
+from typing import TYPE_CHECKING, cast
+from unittest.mock import AsyncMock, MagicMock, patch
+import pytest
+from anthropic import BadRequestError
+from mcp import types
+from hud.agents.claude import (
+    ClaudeAgent,
+    base64_to_content_block,
+    text_to_content_block,
+    tool_use_content_block,
+)
+from hud.types import MCPToolCall, MCPToolResult
+if TYPE_CHECKING:
+    from anthropic.types.beta import BetaImageBlockParam, BetaMessageParam, BetaTextBlockParam
+class TestClaudeHelperFunctions:
+    """Test helper functions for Claude message formatting."""
+    def test_base64_to_content_block(self):
+        """Test base64 image conversion."""
+        base64_data = "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mNkYPhfDwAChwGA60e6kgAAAABJRU5ErkJggg=="  # noqa: E501
+        result = base64_to_content_block(base64_data)
+        assert result["type"] == "image"
+        assert result["source"]["type"] == "base64"
+        assert result["source"]["media_type"] == "image/png"
+        assert result["source"]["data"] == base64_data
+    def test_text_to_content_block(self):
+        """Test text conversion."""
+        text = "Hello, world!"
+        result = text_to_content_block(text)
+        assert result["type"] == "text"
+        assert result["text"] == text
+    def test_tool_use_content_block(self):
+        """Test tool result content block creation."""
+        tool_use_id = "tool_123"
+        content: list[BetaTextBlockParam | BetaImageBlockParam] = [
+            text_to_content_block("Result text")
+        ]
+        result = tool_use_content_block(tool_use_id, content)
+        assert result["type"] == "tool_result"
+        assert result["tool_use_id"] == tool_use_id
+        assert result["content"] == content  # type: ignore
+class TestClaudeAgent:
+    """Test ClaudeAgent class."""
+    @pytest.fixture
+    def mock_mcp_client(self):
+        """Create a mock MCP client."""
+        mcp_client = MagicMock()
+        return mcp_client
+    @pytest.fixture
+    def mock_anthropic(self):
+        """Create a mock Anthropic client."""
+        with patch("hud.agents.claude.AsyncAnthropic") as mock:
+            client = AsyncMock()
+            # Add beta attribute with messages
+            client.beta = AsyncMock()
+            client.beta.messages = AsyncMock()
+            mock.return_value = client
+            yield client
+    @pytest.mark.asyncio
+    async def test_init(self, mock_mcp_client, mock_anthropic):
+        """Test agent initialization."""
+        # Test with provided model_client
+        mock_model_client = MagicMock()
+        agent = ClaudeAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_model_client,
+            model="claude-3-opus-20240229",
+            max_tokens=1000,
+        )
+        assert agent.model_name == "claude-3-opus-20240229"
+        assert agent.max_tokens == 1000
+        assert agent.anthropic_client == mock_model_client
+    @pytest.mark.asyncio
+    async def test_init_without_model_client(self, mock_mcp_client):
+        """Test agent initialization without model client."""
+        with patch("hud.settings.settings.anthropic_api_key", "test_key"):
+            agent = ClaudeAgent(mcp_client=mock_mcp_client, model="claude-3-opus-20240229")
+            assert agent.model_name == "claude-3-opus-20240229"
+            assert agent.anthropic_client is not None
+    @pytest.mark.asyncio
+    async def test_format_blocks(self, mock_mcp_client):
+        """Test formatting content blocks into Claude messages."""
+        mock_model_client = MagicMock()
+        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
+        # Test with text only
+        text_blocks: list[types.ContentBlock] = [
+            types.TextContent(type="text", text="Hello, Claude!")
+        ]
+        messages = await agent.format_blocks(text_blocks)
+        assert len(messages) == 1
+        assert messages[0]["role"] == "user"
+        content = messages[0]["content"]
+        assert isinstance(content, list)
+        assert len(content) == 1
+        assert content[0]["type"] == "text"
+        assert content[0]["text"] == "Hello, Claude!"
+        # Test with screenshot
+        image_blocks: list[types.ContentBlock] = [
+            types.TextContent(type="text", text="Look at this"),
+            types.ImageContent(type="image", data="base64data", mimeType="image/png"),
+        ]
+        messages = await agent.format_blocks(image_blocks)
+        assert len(messages) == 1
+        assert messages[0]["role"] == "user"
+        content = messages[0]["content"]
+        assert isinstance(content, list)
+        assert len(content) == 2
+        # Content blocks are in order
+        assert content[0]["type"] == "text"
+        assert content[0]["text"] == "Look at this"
+        assert content[1]["type"] == "image"
+        assert content[1]["source"]["data"] == "base64data"
+    @pytest.mark.asyncio
+    async def test_format_tool_results_method(self, mock_mcp_client):
+        """Test the agent's format_tool_results method."""
+        mock_model_client = MagicMock()
+        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
+        tool_calls = [
+            MCPToolCall(name="test_tool", arguments={}, id="id1"),
+        ]
+        tool_results = [
+            MCPToolResult(content=[types.TextContent(type="text", text="Success")], isError=False),
+        ]
+        messages = await agent.format_tool_results(tool_calls, tool_results)
+        # format_tool_results returns a single user message with tool result content
+        assert len(messages) == 1
+        assert messages[0]["role"] == "user"
+        # The content is wrapped in a tool result block
+        content = list(messages[0]["content"])
+        assert len(content) == 1
+        assert content[0]["type"] == "tool_result"  # type: ignore
+        assert content[0]["tool_use_id"] == "id1"  # type: ignore
+        # The actual content is nested inside
+        inner_content = list(content[0]["content"])  # type: ignore
+        assert inner_content[0]["type"] == "text"  # type: ignore
+        assert inner_content[0]["text"] == "Success"  # type: ignore
+    @pytest.mark.asyncio
+    async def test_get_response(self, mock_mcp_client, mock_anthropic):
+        """Test getting model response from Claude API."""
+        # Disable telemetry for this test to avoid backend configuration issues
+        with patch("hud.settings.settings.telemetry_enabled", False):
+            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            # Mock the API response
+            mock_response = MagicMock()
+            # Create text block
+            text_block = MagicMock()
+            text_block.type = "text"
+            text_block.text = "Hello!"
+            # Create tool use block
+            tool_block = MagicMock()
+            tool_block.type = "tool_use"
+            tool_block.id = "tool_123"
+            tool_block.name = "test_tool"
+            tool_block.input = {"param": "value"}
+            mock_response.content = [text_block, tool_block]
+            mock_response.usage = MagicMock(input_tokens=10, output_tokens=20)
+            mock_anthropic.beta.messages.create = AsyncMock(return_value=mock_response)
+            messages = [
+                cast(
+                    "BetaMessageParam",
+                    {"role": "user", "content": [{"type": "text", "text": "Hi"}]},
+                )
+            ]
+            response = await agent.get_response(messages)
+            assert response.content == "Hello!"
+            assert len(response.tool_calls) == 1
+            assert response.tool_calls[0].name == "test_tool"
+            assert response.tool_calls[0].arguments == {"param": "value"}
+            # The test was checking for Claude-specific attributes that aren't part of ModelResponse
+            # These would need to be accessed from the original Claude response if needed
+            # Verify API was called correctly
+            mock_anthropic.beta.messages.create.assert_called_once()
+    @pytest.mark.asyncio
+    async def test_get_model_response_text_only(self, mock_mcp_client, mock_anthropic):
+        """Test getting text-only response."""
+        # Disable telemetry for this test to avoid backend configuration issues
+        with patch("hud.settings.settings.telemetry_enabled", False):
+            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            mock_response = MagicMock()
+            # Create text block
+            text_block = MagicMock()
+            text_block.type = "text"
+            text_block.text = "Just text"
+            mock_response.content = [text_block]
+            mock_response.usage = MagicMock(input_tokens=5, output_tokens=10)
+            mock_anthropic.beta.messages.create = AsyncMock(return_value=mock_response)
+            messages = [
+                cast(
+                    "BetaMessageParam",
+                    {"role": "user", "content": [{"type": "text", "text": "Hi"}]},
+                )
+            ]
+            response = await agent.get_response(messages)
+            assert response.content == "Just text"
+            assert response.tool_calls == []
+    @pytest.mark.asyncio
+    async def test_get_model_response_error(self, mock_mcp_client, mock_anthropic):
+        """Test handling API errors."""
+        # Disable telemetry for this test to avoid backend configuration issues
+        with patch("hud.settings.settings.telemetry_enabled", False):
+            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            # Mock API error
+            mock_anthropic.beta.messages.create = AsyncMock(
+                side_effect=BadRequestError(
+                    message="Invalid request",
+                    response=MagicMock(status_code=400),
+                    body={"error": {"message": "Invalid request"}},
+                )
+            )
+            messages = [{"role": "user", "content": [{"type": "text", "text": "Hi"}]}]
+            with pytest.raises(BadRequestError):
+                await agent.get_response(messages)  # type: ignore
+    # This test is commented out as it's testing complex integration scenarios
+    # that may have changed in the implementation
+    # @pytest.mark.asyncio
+    # async def test_run_with_tools(self, mock_mcp_client, mock_anthropic):
+    #     """Test running agent with tool usage."""
+    #     # Disable telemetry for this test to avoid backend configuration issues
+    #     with patch("hud.settings.settings.telemetry_enabled", False):
+    #         agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+    #         # Mock tool availability
+    #         agent._available_tools = [
+    #             types.Tool(
+    #                 name="calculator", description="Calculator", inputSchema={"type": "object"}
+    #             )
+    #         ]
+    #         agent._tool_map = {
+    #             "calculator": types.Tool(
+    #                 name="calculator", description="Calculator", inputSchema={"type": "object"}
+    #             )
+    #         }
+    #         # Mock initial response with tool use
+    #         initial_response = MagicMock()
+    #         # Create tool use block
+    #         tool_block = MagicMock()
+    #         tool_block.type = "tool_use"
+    #         tool_block.id = "calc_123"
+    #         tool_block.name = "calculator"
+    #         tool_block.input = {"operation": "add", "a": 2, "b": 3}
+    #         initial_response.content = [tool_block]
+    #         initial_response.usage = MagicMock(input_tokens=10, output_tokens=15)
+    #         # Mock follow-up response
+    #         final_response = MagicMock()
+    #         text_block = MagicMock()
+    #         text_block.type = "text"
+    #         text_block.text = "2 + 3 = 5"
+    #         final_response.content = [text_block]
+    #         final_response.usage = MagicMock(input_tokens=20, output_tokens=10)
+    #         mock_anthropic.beta.messages.create = AsyncMock(
+    #             side_effect=[initial_response, final_response]
+    #         )
+    #         # Mock tool execution
+    #         mock_mcp_client.call_tool = AsyncMock(
+    #             return_value=MCPToolResult(
+    #                 content=[types.TextContent(type="text", text="5")], isError=False
+    #             )
+    #         )
+    #         # Mock the mcp_client properties
+    #         mock_mcp_client.mcp_config = {"test_server": {"url": "http://localhost"}}
+    #         mock_mcp_client.list_tools = AsyncMock(return_value=agent._available_tools)
+    #         mock_mcp_client.initialize = AsyncMock()
+    #         # Initialize the agent
+    #         await agent.initialize()
+    #         # Use a string prompt instead of a task
+    #         result = await agent.run("What is 2 + 3?")
+    #         assert result.content == "2 + 3 = 5"
+    #         assert result.done is True

hud-python 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl

Potentially problematic release.

hud-python 0.4.1py3-none-any.whl → 0.4.3py3-none-any.whl