hud-python 0.3.4__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff shows the content of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of hud-python might be problematic.

Files changed (192)
  1. hud/__init__.py +22 -89
  2. hud/agents/__init__.py +17 -0
  3. hud/agents/art.py +101 -0
  4. hud/agents/base.py +599 -0
  5. hud/{mcp → agents}/claude.py +373 -321
  6. hud/{mcp → agents}/langchain.py +250 -250
  7. hud/agents/misc/__init__.py +7 -0
  8. hud/{agent → agents}/misc/response_agent.py +80 -80
  9. hud/{mcp → agents}/openai.py +352 -334
  10. hud/agents/openai_chat_generic.py +154 -0
  11. hud/{mcp → agents}/tests/__init__.py +1 -1
  12. hud/agents/tests/test_base.py +742 -0
  13. hud/agents/tests/test_claude.py +324 -0
  14. hud/{mcp → agents}/tests/test_client.py +363 -324
  15. hud/{mcp → agents}/tests/test_openai.py +237 -238
  16. hud/cli/__init__.py +617 -0
  17. hud/cli/__main__.py +8 -0
  18. hud/cli/analyze.py +371 -0
  19. hud/cli/analyze_metadata.py +230 -0
  20. hud/cli/build.py +427 -0
  21. hud/cli/clone.py +185 -0
  22. hud/cli/cursor.py +92 -0
  23. hud/cli/debug.py +392 -0
  24. hud/cli/docker_utils.py +83 -0
  25. hud/cli/init.py +281 -0
  26. hud/cli/interactive.py +353 -0
  27. hud/cli/mcp_server.py +756 -0
  28. hud/cli/pull.py +336 -0
  29. hud/cli/push.py +379 -0
  30. hud/cli/remote_runner.py +311 -0
  31. hud/cli/runner.py +160 -0
  32. hud/cli/tests/__init__.py +3 -0
  33. hud/cli/tests/test_analyze.py +284 -0
  34. hud/cli/tests/test_cli_init.py +265 -0
  35. hud/cli/tests/test_cli_main.py +27 -0
  36. hud/cli/tests/test_clone.py +142 -0
  37. hud/cli/tests/test_cursor.py +253 -0
  38. hud/cli/tests/test_debug.py +453 -0
  39. hud/cli/tests/test_mcp_server.py +139 -0
  40. hud/cli/tests/test_utils.py +388 -0
  41. hud/cli/utils.py +263 -0
  42. hud/clients/README.md +143 -0
  43. hud/clients/__init__.py +16 -0
  44. hud/clients/base.py +354 -0
  45. hud/clients/fastmcp.py +202 -0
  46. hud/clients/mcp_use.py +278 -0
  47. hud/clients/tests/__init__.py +1 -0
  48. hud/clients/tests/test_client_integration.py +111 -0
  49. hud/clients/tests/test_fastmcp.py +342 -0
  50. hud/clients/tests/test_protocol.py +188 -0
  51. hud/clients/utils/__init__.py +1 -0
  52. hud/clients/utils/retry_transport.py +160 -0
  53. hud/datasets.py +322 -192
  54. hud/misc/__init__.py +1 -0
  55. hud/{agent → misc}/claude_plays_pokemon.py +292 -283
  56. hud/otel/__init__.py +35 -0
  57. hud/otel/collector.py +142 -0
  58. hud/otel/config.py +164 -0
  59. hud/otel/context.py +536 -0
  60. hud/otel/exporters.py +366 -0
  61. hud/otel/instrumentation.py +97 -0
  62. hud/otel/processors.py +118 -0
  63. hud/otel/tests/__init__.py +1 -0
  64. hud/otel/tests/test_processors.py +197 -0
  65. hud/server/__init__.py +5 -5
  66. hud/server/context.py +114 -0
  67. hud/server/helper/__init__.py +5 -0
  68. hud/server/low_level.py +132 -0
  69. hud/server/server.py +166 -0
  70. hud/server/tests/__init__.py +3 -0
  71. hud/settings.py +73 -79
  72. hud/shared/__init__.py +5 -0
  73. hud/{exceptions.py → shared/exceptions.py} +180 -180
  74. hud/{server → shared}/requests.py +264 -264
  75. hud/shared/tests/test_exceptions.py +157 -0
  76. hud/{server → shared}/tests/test_requests.py +275 -275
  77. hud/telemetry/__init__.py +25 -30
  78. hud/telemetry/instrument.py +379 -0
  79. hud/telemetry/job.py +309 -141
  80. hud/telemetry/replay.py +74 -0
  81. hud/telemetry/trace.py +83 -0
  82. hud/tools/__init__.py +33 -34
  83. hud/tools/base.py +365 -65
  84. hud/tools/bash.py +161 -137
  85. hud/tools/computer/__init__.py +15 -13
  86. hud/tools/computer/anthropic.py +437 -414
  87. hud/tools/computer/hud.py +376 -328
  88. hud/tools/computer/openai.py +295 -286
  89. hud/tools/computer/settings.py +82 -0
  90. hud/tools/edit.py +314 -290
  91. hud/tools/executors/__init__.py +30 -30
  92. hud/tools/executors/base.py +539 -532
  93. hud/tools/executors/pyautogui.py +621 -619
  94. hud/tools/executors/tests/__init__.py +1 -1
  95. hud/tools/executors/tests/test_base_executor.py +338 -338
  96. hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
  97. hud/tools/executors/xdo.py +511 -503
  98. hud/tools/{playwright_tool.py → playwright.py} +412 -379
  99. hud/tools/tests/__init__.py +3 -3
  100. hud/tools/tests/test_base.py +282 -0
  101. hud/tools/tests/test_bash.py +158 -152
  102. hud/tools/tests/test_bash_extended.py +197 -0
  103. hud/tools/tests/test_computer.py +425 -52
  104. hud/tools/tests/test_computer_actions.py +34 -34
  105. hud/tools/tests/test_edit.py +259 -240
  106. hud/tools/tests/test_init.py +27 -27
  107. hud/tools/tests/test_playwright_tool.py +183 -183
  108. hud/tools/tests/test_tools.py +145 -157
  109. hud/tools/tests/test_utils.py +156 -156
  110. hud/tools/types.py +72 -0
  111. hud/tools/utils.py +50 -50
  112. hud/types.py +136 -89
  113. hud/utils/__init__.py +10 -16
  114. hud/utils/async_utils.py +65 -0
  115. hud/utils/design.py +168 -0
  116. hud/utils/mcp.py +55 -0
  117. hud/utils/progress.py +149 -149
  118. hud/utils/telemetry.py +66 -66
  119. hud/utils/tests/test_async_utils.py +173 -0
  120. hud/utils/tests/test_init.py +17 -21
  121. hud/utils/tests/test_progress.py +261 -225
  122. hud/utils/tests/test_telemetry.py +82 -37
  123. hud/utils/tests/test_version.py +8 -8
  124. hud/version.py +7 -7
  125. hud_python-0.4.0.dist-info/METADATA +474 -0
  126. hud_python-0.4.0.dist-info/RECORD +132 -0
  127. hud_python-0.4.0.dist-info/entry_points.txt +3 -0
  128. {hud_python-0.3.4.dist-info → hud_python-0.4.0.dist-info}/licenses/LICENSE +21 -21
  129. hud/adapters/__init__.py +0 -8
  130. hud/adapters/claude/__init__.py +0 -5
  131. hud/adapters/claude/adapter.py +0 -180
  132. hud/adapters/claude/tests/__init__.py +0 -1
  133. hud/adapters/claude/tests/test_adapter.py +0 -519
  134. hud/adapters/common/__init__.py +0 -6
  135. hud/adapters/common/adapter.py +0 -178
  136. hud/adapters/common/tests/test_adapter.py +0 -289
  137. hud/adapters/common/types.py +0 -446
  138. hud/adapters/operator/__init__.py +0 -5
  139. hud/adapters/operator/adapter.py +0 -108
  140. hud/adapters/operator/tests/__init__.py +0 -1
  141. hud/adapters/operator/tests/test_adapter.py +0 -370
  142. hud/agent/__init__.py +0 -19
  143. hud/agent/base.py +0 -126
  144. hud/agent/claude.py +0 -271
  145. hud/agent/langchain.py +0 -215
  146. hud/agent/misc/__init__.py +0 -3
  147. hud/agent/operator.py +0 -268
  148. hud/agent/tests/__init__.py +0 -1
  149. hud/agent/tests/test_base.py +0 -202
  150. hud/env/__init__.py +0 -11
  151. hud/env/client.py +0 -35
  152. hud/env/docker_client.py +0 -349
  153. hud/env/environment.py +0 -446
  154. hud/env/local_docker_client.py +0 -358
  155. hud/env/remote_client.py +0 -212
  156. hud/env/remote_docker_client.py +0 -292
  157. hud/gym.py +0 -130
  158. hud/job.py +0 -773
  159. hud/mcp/__init__.py +0 -17
  160. hud/mcp/base.py +0 -631
  161. hud/mcp/client.py +0 -312
  162. hud/mcp/tests/test_base.py +0 -512
  163. hud/mcp/tests/test_claude.py +0 -294
  164. hud/task.py +0 -149
  165. hud/taskset.py +0 -237
  166. hud/telemetry/_trace.py +0 -347
  167. hud/telemetry/context.py +0 -230
  168. hud/telemetry/exporter.py +0 -575
  169. hud/telemetry/instrumentation/__init__.py +0 -3
  170. hud/telemetry/instrumentation/mcp.py +0 -259
  171. hud/telemetry/instrumentation/registry.py +0 -59
  172. hud/telemetry/mcp_models.py +0 -270
  173. hud/telemetry/tests/__init__.py +0 -1
  174. hud/telemetry/tests/test_context.py +0 -210
  175. hud/telemetry/tests/test_trace.py +0 -312
  176. hud/tools/helper/README.md +0 -56
  177. hud/tools/helper/__init__.py +0 -9
  178. hud/tools/helper/mcp_server.py +0 -78
  179. hud/tools/helper/server_initialization.py +0 -115
  180. hud/tools/helper/utils.py +0 -58
  181. hud/trajectory.py +0 -94
  182. hud/utils/agent.py +0 -37
  183. hud/utils/common.py +0 -256
  184. hud/utils/config.py +0 -120
  185. hud/utils/deprecation.py +0 -115
  186. hud/utils/misc.py +0 -53
  187. hud/utils/tests/test_common.py +0 -277
  188. hud/utils/tests/test_config.py +0 -129
  189. hud_python-0.3.4.dist-info/METADATA +0 -284
  190. hud_python-0.3.4.dist-info/RECORD +0 -120
  191. /hud/{adapters/common → shared}/tests/__init__.py +0 -0
  192. {hud_python-0.3.4.dist-info → hud_python-0.4.0.dist-info}/WHEEL +0 -0
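
Taken together, the moves above are a package-level reorganization: the old hud/agent and hud/mcp trees are removed, agents are consolidated under hud/agents, shared helpers move to hud/shared, and new hud/cli, hud/clients and hud/otel packages are added. A rough import-path sketch of that change follows; only the LangChain paths and the LangChainMCPAgent → LangChainAgent rename are confirmed by the hunk shown below, the rest is inferred from the file moves and is an assumption for illustration only.

# Import-path sketch inferred from the file moves listed above (not part of the diff).
try:
    # 0.4.0 layout: agents under hud.agents, shared helpers under hud.shared
    from hud.agents.langchain import LangChainAgent
    from hud.shared import exceptions
except ImportError:
    # 0.3.4 layout: the same code lived under hud.mcp and top-level modules
    from hud.mcp.langchain import LangChainMCPAgent as LangChainAgent
    from hud import exceptions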
hud/{mcp → agents}/langchain.py
@@ -1,250 +1,250 @@
- """LangChain MCP Agent implementation."""
-
- from __future__ import annotations
-
- import logging
- from typing import TYPE_CHECKING, Any
-
- import mcp.types as types
- from langchain.agents import AgentExecutor, create_tool_calling_agent
- from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
- from langchain.schema import AIMessage, BaseMessage, HumanMessage, SystemMessage
- from mcp.types import CallToolRequestParams as MCPToolCall
- from mcp.types import CallToolResult as MCPToolResult
- from mcp_use.adapters.langchain_adapter import LangChainAdapter
-
- if TYPE_CHECKING:
-     from langchain.schema.language_model import BaseLanguageModel
-     from langchain_core.tools import BaseTool
- from .base import BaseMCPAgent, ModelResponse
-
- logger = logging.getLogger(__name__)
-
-
- class LangChainMCPAgent(BaseMCPAgent):
-     """
-     LangChain agent that uses MCP servers for tool execution.
-
-     This agent wraps any LangChain-compatible LLM and provides
-     access to MCP tools through LangChain's tool-calling interface.
-     """
-
-     def __init__(
-         self,
-         llm: BaseLanguageModel,
-         **kwargs: Any,
-     ) -> None:
-         """
-         Initialize LangChain MCP agent.
-
-         Args:
-             llm: Any LangChain-compatible language model
-             **kwargs: Additional arguments passed to BaseMCPAgent
-         """
-         super().__init__(**kwargs)
-
-         self.llm = llm
-         self.adapter = LangChainAdapter(disallowed_tools=self.disallowed_tools)
-         self._langchain_tools: list[BaseTool] | None = None
-
-         self.model_name = (
-             "langchain-" + self.llm.model_name  # type: ignore
-             if hasattr(self.llm, "model_name")
-             else "unknown"
-         )
-
-     def _get_langchain_tools(self) -> list[BaseTool]:
-         """Get or create LangChain tools from MCP tools."""
-         if self._langchain_tools is not None:
-             return self._langchain_tools
-
-         # Create LangChain tools from MCP tools using the adapter
-         self._langchain_tools = []
-
-         # Get tools grouped by connector
-         tools_by_connector = self.get_tools_by_connector()
-
-         # Convert tools using the adapter
-         for connector, tools in tools_by_connector.items():
-             langchain_tools = self.adapter._convert_tools(tools, connector)  # type: ignore[reportAttributeAccessIssue]
-             self._langchain_tools.extend(langchain_tools)
-
-         logger.info("Created %s LangChain tools from MCP tools", len(self._langchain_tools))
-         return self._langchain_tools
-
-     async def create_initial_messages(
-         self, prompt: str, screenshot: str | None
-     ) -> list[BaseMessage]:
-         """Create initial messages for LangChain."""
-         messages = []
-
-         # Add system message
-         system_prompt = self.get_system_prompt()
-         messages.append(SystemMessage(content=system_prompt))
-
-         # Add user message with prompt and optional screenshot
-         if screenshot:
-             # For multimodal models, include the image
-             content = [
-                 {"type": "text", "text": prompt},
-                 {"type": "image_url", "image_url": {"url": f"data:image/png;base64,{screenshot}"}},
-             ]
-             messages.append(HumanMessage(content=content))
-         else:
-             messages.append(HumanMessage(content=prompt))
-
-         return messages
-
-     async def get_model_response(self, messages: list[BaseMessage]) -> ModelResponse:
-         """Get response from LangChain model including any tool calls."""
-         # Get LangChain tools (created lazily)
-         langchain_tools = self._get_langchain_tools()
-
-         # Create a prompt template from current messages
-         # Extract system message if present
-         system_content = "You are a helpful assistant"
-         non_system_messages = []
-
-         for msg in messages:
-             if isinstance(msg, SystemMessage):
-                 system_content = str(msg.content)
-             else:
-                 non_system_messages.append(msg)
-
-         # Create prompt with placeholders
-         prompt = ChatPromptTemplate.from_messages(
-             [
-                 ("system", system_content),
-                 MessagesPlaceholder(variable_name="chat_history"),
-                 MessagesPlaceholder(variable_name="agent_scratchpad"),
-             ]
-         )
-
-         # Create agent with tools
-         agent = create_tool_calling_agent(
-             llm=self.llm,
-             tools=langchain_tools,
-             prompt=prompt,
-         )
-
-         # Create executor
-         executor = AgentExecutor(
-             agent=agent,
-             tools=langchain_tools,
-             verbose=False,
-         )
-
-         # Format the last user message as input
-         last_user_msg = None
-         for msg in reversed(non_system_messages):
-             if isinstance(msg, HumanMessage):
-                 last_user_msg = msg
-                 break
-
-         if not last_user_msg:
-             return ModelResponse(content="No user message found", tool_calls=[], done=True)
-
-         # Extract text from message content
-         input_text = ""
-         if isinstance(last_user_msg.content, str):
-             input_text = last_user_msg.content
-         elif isinstance(last_user_msg.content, list):
-             # Extract text from multimodal content
-             for item in last_user_msg.content:
-                 if isinstance(item, dict) and item.get("type") == "text":
-                     input_text = item.get("text", "")
-                     break
-
-         # Build chat history (exclude last user message and system)
-         chat_history = []
-         for _, msg in enumerate(non_system_messages[:-1]):
-             if isinstance(msg, HumanMessage | AIMessage):
-                 chat_history.append(msg)
-
-         # Execute the agent
-         try:
-             result = await executor.ainvoke(
-                 {
-                     "input": input_text,
-                     "chat_history": chat_history,
-                 }
-             )
-
-             # Process the result
-             output = result.get("output", "")
-
-             # Check if tools were called
-             if result.get("intermediate_steps"):
-                 # Tools were called
-                 tool_calls = []
-                 for action, _ in result["intermediate_steps"]:
-                     if hasattr(action, "tool") and hasattr(action, "tool_input"):
-                         tool_calls.append(
-                             MCPToolCall(
-                                 name=action.tool,
-                                 arguments=action.tool_input,
-                             )
-                         )
-
-                 return ModelResponse(content=output, tool_calls=tool_calls, done=False)
-             else:
-                 # No tools called, just text response
-                 return ModelResponse(content=output, tool_calls=[], done=True)
-
-         except Exception as e:
-             logger.error("Agent execution failed: %s", e)
-             return ModelResponse(content=f"Error: {e!s}", tool_calls=[], done=True)
-
-     async def format_tool_results(
-         self, tool_calls: list[MCPToolCall], tool_results: list[MCPToolResult]
-     ) -> list[BaseMessage]:
-         """Format tool results into LangChain messages."""
-         # Create an AI message with the tool calls and results
-         messages = []
-
-         # First add an AI message indicating tools were called
-         tool_names = [tc.name for tc in tool_calls]
-         ai_content = f"I'll use the following tools: {', '.join(tool_names)}"
-         messages.append(AIMessage(content=ai_content))
-
-         # Build result text from tool results
-         text_parts = []
-         latest_screenshot = None
-
-         for tool_call, result in zip(tool_calls, tool_results, strict=False):
-             if result.isError:
-                 error_text = "Tool execution failed"
-                 for content in result.content:
-                     if isinstance(content, types.TextContent):
-                         error_text = content.text
-                         break
-                 text_parts.append(f"Error - {tool_call.name}: {error_text}")
-             else:
-                 # Process success content
-                 tool_output = []
-                 for content in result.content:
-                     if isinstance(content, types.TextContent):
-                         tool_output.append(content.text)
-                     elif isinstance(content, types.ImageContent):
-                         latest_screenshot = content.data
-
-                 if tool_output:
-                     text_parts.append(f"{tool_call.name}: " + " ".join(tool_output))
-
-         result_text = "\n".join(text_parts) if text_parts else "No output from tools"
-
-         # Then add a human message with the tool results
-         if latest_screenshot:
-             # Include screenshot in multimodal format
-             content = [
-                 {"type": "text", "text": f"Tool results:\n{result_text}"},
-                 {
-                     "type": "image_url",
-                     "image_url": {"url": f"data:image/png;base64,{latest_screenshot}"},
-                 },
-             ]
-             messages.append(HumanMessage(content=content))
-         else:
-             messages.append(HumanMessage(content=f"Tool results:\n{result_text}"))
-
-         return messages
+ """LangChain MCP Agent implementation."""
+
+ from __future__ import annotations
+
+ import logging
+ from typing import TYPE_CHECKING, Any, ClassVar
+
+ import mcp.types as types
+ from langchain.agents import AgentExecutor, create_tool_calling_agent
+ from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
+ from langchain.schema import AIMessage, BaseMessage, HumanMessage, SystemMessage
+ from mcp_use.adapters.langchain_adapter import LangChainAdapter
+
+ import hud
+
+ if TYPE_CHECKING:
+     from langchain.schema.language_model import BaseLanguageModel
+     from langchain_core.tools import BaseTool
+
+ from hud.types import AgentResponse, MCPToolCall, MCPToolResult
+
+ from .base import MCPAgent
+
+ logger = logging.getLogger(__name__)
+
+
+ class LangChainAgent(MCPAgent):
+     """
+     LangChain agent that uses MCP servers for tool execution.
+
+     This agent wraps any LangChain-compatible LLM and provides
+     access to MCP tools through LangChain's tool-calling interface.
+     """
+
+     metadata: ClassVar[dict[str, Any]] = {
+         "display_width": 1920,
+         "display_height": 1080,
+     }
+
+     def __init__(
+         self,
+         llm: BaseLanguageModel,
+         **kwargs: Any,
+     ) -> None:
+         """
+         Initialize LangChain MCP agent.
+
+         Args:
+             llm: Any LangChain-compatible language model
+             **kwargs: Additional arguments passed to BaseMCPAgent
+         """
+         super().__init__(**kwargs)
+
+         self.llm = llm
+         self.adapter = LangChainAdapter(disallowed_tools=self.disallowed_tools)
+         self._langchain_tools: list[BaseTool] | None = None
+
+         self.model_name = (
+             "langchain-" + self.llm.model_name  # type: ignore
+             if hasattr(self.llm, "model_name")
+             else "unknown"
+         )
+
+     def _get_langchain_tools(self) -> list[BaseTool]:
+         """Get or create LangChain tools from MCP tools."""
+         if self._langchain_tools is not None:
+             return self._langchain_tools
+
+         # Create LangChain tools from MCP tools using the adapter
+         self._langchain_tools = []
+
+         # Convert available tools using the adapter; no server grouping
+         langchain_tools = self.adapter._convert_tools(self._available_tools, "default")  # type: ignore[reportAttributeAccessIssue]
+         self._langchain_tools.extend(langchain_tools)
+
+         logger.info("Created %s LangChain tools from MCP tools", len(self._langchain_tools))
+         return self._langchain_tools
+
+     async def get_system_messages(self) -> list[BaseMessage]:
+         """Get system messages for LangChain."""
+         return [SystemMessage(content=self.system_prompt)]
+
+     async def format_blocks(self, blocks: list[types.ContentBlock]) -> list[BaseMessage]:
+         """Create initial messages for LangChain."""
+         messages = []
+         for block in blocks:
+             if isinstance(block, types.TextContent):
+                 messages.append(HumanMessage(content=block.text))
+             elif isinstance(block, types.ImageContent):
+                 messages.append(HumanMessage(content=block.data))
+         return messages
+
+     @hud.instrument(
+         span_type="agent",
+         record_args=False,  # Messages can be large
+         record_result=True,
+     )
+     async def get_response(self, messages: list[BaseMessage]) -> AgentResponse:
+         """Get response from LangChain model including any tool calls."""
+         # Get LangChain tools (created lazily)
+         langchain_tools = self._get_langchain_tools()
+
+         # Create a prompt template from current messages
+         # Extract system message if present
+         system_content = "You are a helpful assistant"
+         non_system_messages = []
+
+         for msg in messages:
+             if isinstance(msg, SystemMessage):
+                 system_content = str(msg.content)
+             else:
+                 non_system_messages.append(msg)
+
+         # Create prompt with placeholders
+         prompt = ChatPromptTemplate.from_messages(
+             [
+                 ("system", system_content),
+                 MessagesPlaceholder(variable_name="chat_history"),
+                 MessagesPlaceholder(variable_name="agent_scratchpad"),
+             ]
+         )
+
+         # Create agent with tools
+         agent = create_tool_calling_agent(
+             llm=self.llm,
+             tools=langchain_tools,
+             prompt=prompt,
+         )
+
+         # Create executor
+         executor = AgentExecutor(
+             agent=agent,
+             tools=langchain_tools,
+             verbose=False,
+         )
+
+         # Format the last user message as input
+         last_user_msg = None
+         for msg in reversed(non_system_messages):
+             if isinstance(msg, HumanMessage):
+                 last_user_msg = msg
+                 break
+
+         if not last_user_msg:
+             return AgentResponse(content="No user message found", tool_calls=[], done=True)
+
+         # Extract text from message content
+         input_text = ""
+         if isinstance(last_user_msg.content, str):
+             input_text = last_user_msg.content
+         elif isinstance(last_user_msg.content, list):
+             # Extract text from multimodal content
+             for item in last_user_msg.content:
+                 if isinstance(item, dict) and item.get("type") == "text":
+                     input_text = item.get("text", "")
+                     break
+
+         # Build chat history (exclude last user message and system)
+         chat_history = []
+         for _, msg in enumerate(non_system_messages[:-1]):
+             if isinstance(msg, HumanMessage | AIMessage):
+                 chat_history.append(msg)
+
+         # Execute the agent
+         try:
+             result = await executor.ainvoke(
+                 {
+                     "input": input_text,
+                     "chat_history": chat_history,
+                 }
+             )
+
+             # Process the result
+             output = result.get("output", "")
+
+             # Check if tools were called
+             if result.get("intermediate_steps"):
+                 # Tools were called
+                 tool_calls = []
+                 for action, _ in result["intermediate_steps"]:
+                     if hasattr(action, "tool") and hasattr(action, "tool_input"):
+                         tool_calls.append(
+                             MCPToolCall(
+                                 name=action.tool,
+                                 arguments=action.tool_input,
+                             )
+                         )
+
+                 return AgentResponse(content=output, tool_calls=tool_calls, done=False)
+             else:
+                 # No tools called, just text response
+                 return AgentResponse(content=output, tool_calls=[], done=True)
+
+         except Exception as e:
+             logger.error("Agent execution failed: %s", e)
+             return AgentResponse(content=f"Error: {e!s}", tool_calls=[], done=True)
+
+     async def format_tool_results(
+         self, tool_calls: list[MCPToolCall], tool_results: list[MCPToolResult]
+     ) -> list[BaseMessage]:
+         """Format tool results into LangChain messages."""
+         # Create an AI message with the tool calls and results
+         messages = []
+
+         # First add an AI message indicating tools were called
+         tool_names = [tc.name for tc in tool_calls]
+         ai_content = f"I'll use the following tools: {', '.join(tool_names)}"
+         messages.append(AIMessage(content=ai_content))
+
+         # Build result text from tool results
+         text_parts = []
+         latest_screenshot = None
+
+         for tool_call, result in zip(tool_calls, tool_results, strict=False):
+             if result.isError:
+                 error_text = "Tool execution failed"
+                 for content in result.content:
+                     if isinstance(content, types.TextContent):
+                         error_text = content.text
+                         break
+                 text_parts.append(f"Error - {tool_call.name}: {error_text}")
+             else:
+                 # Process success content
+                 tool_output = []
+                 for content in result.content:
+                     if isinstance(content, types.TextContent):
+                         tool_output.append(content.text)
+                     elif isinstance(content, types.ImageContent):
+                         latest_screenshot = content.data
+
+                 if tool_output:
+                     text_parts.append(f"{tool_call.name}: " + " ".join(tool_output))
+
+         result_text = "\n".join(text_parts) if text_parts else "No output from tools"
+
+         # Then add a human message with the tool results
+         if latest_screenshot:
+             # Include screenshot in multimodal format
+             content = [
+                 {"type": "text", "text": f"Tool results:\n{result_text}"},
+                 {
+                     "type": "image_url",
+                     "image_url": {"url": f"data:image/png;base64,{latest_screenshot}"},
+                 },
+             ]
+             messages.append(HumanMessage(content=content))
+         else:
+             messages.append(HumanMessage(content=f"Tool results:\n{result_text}"))
+
+         return messages
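
For orientation, a minimal construction sketch of the renamed class, based only on what this hunk shows. The ChatOpenAI model is an assumed stand-in, and whether MCPAgent requires further keyword arguments (for example an MCP client) is not visible here.

# Hypothetical usage sketch; not part of the diff above.
from langchain_openai import ChatOpenAI  # assumed provider; any LangChain-compatible chat model

from hud.agents.langchain import LangChainAgent

# LangChainAgent forwards **kwargs to MCPAgent; any extra kwargs it may need are not shown in this hunk.
agent = LangChainAgent(llm=ChatOpenAI(model="gpt-4o"))

# Per the hunk above, get_response() is wrapped in @hud.instrument and returns an
# AgentResponse whose tool_calls are hud.types.MCPToolCall objects.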
hud/agents/misc/__init__.py
@@ -0,0 +1,7 @@
+ """Miscellaneous agents."""
+
+ from __future__ import annotations
+
+ from .response_agent import ResponseAgent
+
+ __all__ = ["ResponseAgent"]
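
The new __init__ simply re-exports ResponseAgent from hud/agents/misc/response_agent.py, so both import paths below should resolve to the same class (a small sanity-check sketch, not part of the diff):

from hud.agents.misc import ResponseAgent
from hud.agents.misc.response_agent import ResponseAgent as _ResponseAgent

# The package-level name and the module-level name refer to the same object.
assert ResponseAgent is _ResponseAgent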