hud-python 0.4.1__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic.
Files changed (130)
  1. hud/__init__.py +22 -22
  2. hud/agents/__init__.py +13 -15
  3. hud/agents/base.py +599 -599
  4. hud/agents/claude.py +373 -373
  5. hud/agents/langchain.py +261 -250
  6. hud/agents/misc/__init__.py +7 -7
  7. hud/agents/misc/response_agent.py +82 -80
  8. hud/agents/openai.py +352 -352
  9. hud/agents/openai_chat_generic.py +154 -154
  10. hud/agents/tests/__init__.py +1 -1
  11. hud/agents/tests/test_base.py +742 -742
  12. hud/agents/tests/test_claude.py +324 -324
  13. hud/agents/tests/test_client.py +363 -363
  14. hud/agents/tests/test_openai.py +237 -237
  15. hud/cli/__init__.py +617 -617
  16. hud/cli/__main__.py +8 -8
  17. hud/cli/analyze.py +371 -371
  18. hud/cli/analyze_metadata.py +230 -230
  19. hud/cli/build.py +498 -427
  20. hud/cli/clone.py +185 -185
  21. hud/cli/cursor.py +92 -92
  22. hud/cli/debug.py +392 -392
  23. hud/cli/docker_utils.py +83 -83
  24. hud/cli/init.py +280 -281
  25. hud/cli/interactive.py +353 -353
  26. hud/cli/mcp_server.py +764 -756
  27. hud/cli/pull.py +330 -336
  28. hud/cli/push.py +404 -370
  29. hud/cli/remote_runner.py +311 -311
  30. hud/cli/runner.py +160 -160
  31. hud/cli/tests/__init__.py +3 -3
  32. hud/cli/tests/test_analyze.py +284 -284
  33. hud/cli/tests/test_cli_init.py +265 -265
  34. hud/cli/tests/test_cli_main.py +27 -27
  35. hud/cli/tests/test_clone.py +142 -142
  36. hud/cli/tests/test_cursor.py +253 -253
  37. hud/cli/tests/test_debug.py +453 -453
  38. hud/cli/tests/test_mcp_server.py +139 -139
  39. hud/cli/tests/test_utils.py +388 -388
  40. hud/cli/utils.py +263 -263
  41. hud/clients/README.md +143 -143
  42. hud/clients/__init__.py +16 -16
  43. hud/clients/base.py +378 -379
  44. hud/clients/fastmcp.py +222 -222
  45. hud/clients/mcp_use.py +298 -278
  46. hud/clients/tests/__init__.py +1 -1
  47. hud/clients/tests/test_client_integration.py +111 -111
  48. hud/clients/tests/test_fastmcp.py +342 -342
  49. hud/clients/tests/test_protocol.py +188 -188
  50. hud/clients/utils/__init__.py +1 -1
  51. hud/clients/utils/retry_transport.py +160 -160
  52. hud/datasets.py +327 -322
  53. hud/misc/__init__.py +1 -1
  54. hud/misc/claude_plays_pokemon.py +292 -292
  55. hud/otel/__init__.py +35 -35
  56. hud/otel/collector.py +142 -142
  57. hud/otel/config.py +164 -164
  58. hud/otel/context.py +536 -536
  59. hud/otel/exporters.py +366 -366
  60. hud/otel/instrumentation.py +97 -97
  61. hud/otel/processors.py +118 -118
  62. hud/otel/tests/__init__.py +1 -1
  63. hud/otel/tests/test_processors.py +197 -197
  64. hud/server/__init__.py +5 -5
  65. hud/server/context.py +114 -114
  66. hud/server/helper/__init__.py +5 -5
  67. hud/server/low_level.py +132 -132
  68. hud/server/server.py +170 -166
  69. hud/server/tests/__init__.py +3 -3
  70. hud/settings.py +73 -73
  71. hud/shared/__init__.py +5 -5
  72. hud/shared/exceptions.py +180 -180
  73. hud/shared/requests.py +264 -264
  74. hud/shared/tests/test_exceptions.py +157 -157
  75. hud/shared/tests/test_requests.py +275 -275
  76. hud/telemetry/__init__.py +25 -25
  77. hud/telemetry/instrument.py +379 -379
  78. hud/telemetry/job.py +309 -309
  79. hud/telemetry/replay.py +74 -74
  80. hud/telemetry/trace.py +83 -83
  81. hud/tools/__init__.py +33 -33
  82. hud/tools/base.py +365 -365
  83. hud/tools/bash.py +161 -161
  84. hud/tools/computer/__init__.py +15 -15
  85. hud/tools/computer/anthropic.py +437 -437
  86. hud/tools/computer/hud.py +376 -376
  87. hud/tools/computer/openai.py +295 -295
  88. hud/tools/computer/settings.py +82 -82
  89. hud/tools/edit.py +314 -314
  90. hud/tools/executors/__init__.py +30 -30
  91. hud/tools/executors/base.py +539 -539
  92. hud/tools/executors/pyautogui.py +621 -621
  93. hud/tools/executors/tests/__init__.py +1 -1
  94. hud/tools/executors/tests/test_base_executor.py +338 -338
  95. hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
  96. hud/tools/executors/xdo.py +511 -511
  97. hud/tools/playwright.py +412 -412
  98. hud/tools/tests/__init__.py +3 -3
  99. hud/tools/tests/test_base.py +282 -282
  100. hud/tools/tests/test_bash.py +158 -158
  101. hud/tools/tests/test_bash_extended.py +197 -197
  102. hud/tools/tests/test_computer.py +425 -425
  103. hud/tools/tests/test_computer_actions.py +34 -34
  104. hud/tools/tests/test_edit.py +259 -259
  105. hud/tools/tests/test_init.py +27 -27
  106. hud/tools/tests/test_playwright_tool.py +183 -183
  107. hud/tools/tests/test_tools.py +145 -145
  108. hud/tools/tests/test_utils.py +156 -156
  109. hud/tools/types.py +72 -72
  110. hud/tools/utils.py +50 -50
  111. hud/types.py +136 -136
  112. hud/utils/__init__.py +10 -10
  113. hud/utils/async_utils.py +65 -65
  114. hud/utils/design.py +236 -168
  115. hud/utils/mcp.py +55 -55
  116. hud/utils/progress.py +149 -149
  117. hud/utils/telemetry.py +66 -66
  118. hud/utils/tests/test_async_utils.py +173 -173
  119. hud/utils/tests/test_init.py +17 -17
  120. hud/utils/tests/test_progress.py +261 -261
  121. hud/utils/tests/test_telemetry.py +82 -82
  122. hud/utils/tests/test_version.py +8 -8
  123. hud/version.py +7 -7
  124. {hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/METADATA +10 -8
  125. hud_python-0.4.3.dist-info/RECORD +131 -0
  126. {hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/licenses/LICENSE +21 -21
  127. hud/agents/art.py +0 -101
  128. hud_python-0.4.1.dist-info/RECORD +0 -132
  129. {hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/WHEEL +0 -0
  130. {hud_python-0.4.1.dist-info → hud_python-0.4.3.dist-info}/entry_points.txt +0 -0
hud/agents/langchain.py CHANGED
@@ -1,250 +1,261 @@
-"""LangChain MCP Agent implementation."""
-
-from __future__ import annotations
-
-import logging
-from typing import TYPE_CHECKING, Any, ClassVar
-
-import mcp.types as types
-from langchain.agents import AgentExecutor, create_tool_calling_agent
-from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
-from langchain.schema import AIMessage, BaseMessage, HumanMessage, SystemMessage
-from mcp_use.adapters.langchain_adapter import LangChainAdapter
-
-import hud
-
-if TYPE_CHECKING:
-    from langchain.schema.language_model import BaseLanguageModel
-    from langchain_core.tools import BaseTool
-
-from hud.types import AgentResponse, MCPToolCall, MCPToolResult
-
-from .base import MCPAgent
-
-logger = logging.getLogger(__name__)
-
-
-class LangChainAgent(MCPAgent):
-    """
-    LangChain agent that uses MCP servers for tool execution.
-
-    This agent wraps any LangChain-compatible LLM and provides
-    access to MCP tools through LangChain's tool-calling interface.
-    """
-
-    metadata: ClassVar[dict[str, Any]] = {
-        "display_width": 1920,
-        "display_height": 1080,
-    }
-
-    def __init__(
-        self,
-        llm: BaseLanguageModel,
-        **kwargs: Any,
-    ) -> None:
-        """
-        Initialize LangChain MCP agent.
-
-        Args:
-            llm: Any LangChain-compatible language model
-            **kwargs: Additional arguments passed to BaseMCPAgent
-        """
-        super().__init__(**kwargs)
-
-        self.llm = llm
-        self.adapter = LangChainAdapter(disallowed_tools=self.disallowed_tools)
-        self._langchain_tools: list[BaseTool] | None = None
-
-        self.model_name = (
-            "langchain-" + self.llm.model_name  # type: ignore
-            if hasattr(self.llm, "model_name")
-            else "unknown"
-        )
-
-    def _get_langchain_tools(self) -> list[BaseTool]:
-        """Get or create LangChain tools from MCP tools."""
-        if self._langchain_tools is not None:
-            return self._langchain_tools
-
-        # Create LangChain tools from MCP tools using the adapter
-        self._langchain_tools = []
-
-        # Convert available tools using the adapter; no server grouping
-        langchain_tools = self.adapter._convert_tools(self._available_tools, "default")  # type: ignore[reportAttributeAccessIssue]
-        self._langchain_tools.extend(langchain_tools)
-
-        logger.info("Created %s LangChain tools from MCP tools", len(self._langchain_tools))
-        return self._langchain_tools
-
-    async def get_system_messages(self) -> list[BaseMessage]:
-        """Get system messages for LangChain."""
-        return [SystemMessage(content=self.system_prompt)]
-
-    async def format_blocks(self, blocks: list[types.ContentBlock]) -> list[BaseMessage]:
-        """Create initial messages for LangChain."""
-        messages = []
-        for block in blocks:
-            if isinstance(block, types.TextContent):
-                messages.append(HumanMessage(content=block.text))
-            elif isinstance(block, types.ImageContent):
-                messages.append(HumanMessage(content=block.data))
-        return messages
-
-    @hud.instrument(
-        span_type="agent",
-        record_args=False,  # Messages can be large
-        record_result=True,
-    )
-    async def get_response(self, messages: list[BaseMessage]) -> AgentResponse:
-        """Get response from LangChain model including any tool calls."""
-        # Get LangChain tools (created lazily)
-        langchain_tools = self._get_langchain_tools()
-
-        # Create a prompt template from current messages
-        # Extract system message if present
-        system_content = "You are a helpful assistant"
-        non_system_messages = []
-
-        for msg in messages:
-            if isinstance(msg, SystemMessage):
-                system_content = str(msg.content)
-            else:
-                non_system_messages.append(msg)
-
-        # Create prompt with placeholders
-        prompt = ChatPromptTemplate.from_messages(
-            [
-                ("system", system_content),
-                MessagesPlaceholder(variable_name="chat_history"),
-                MessagesPlaceholder(variable_name="agent_scratchpad"),
-            ]
-        )
-
-        # Create agent with tools
-        agent = create_tool_calling_agent(
-            llm=self.llm,
-            tools=langchain_tools,
-            prompt=prompt,
-        )
-
-        # Create executor
-        executor = AgentExecutor(
-            agent=agent,
-            tools=langchain_tools,
-            verbose=False,
-        )
-
-        # Format the last user message as input
-        last_user_msg = None
-        for msg in reversed(non_system_messages):
-            if isinstance(msg, HumanMessage):
-                last_user_msg = msg
-                break
-
-        if not last_user_msg:
-            return AgentResponse(content="No user message found", tool_calls=[], done=True)
-
-        # Extract text from message content
-        input_text = ""
-        if isinstance(last_user_msg.content, str):
-            input_text = last_user_msg.content
-        elif isinstance(last_user_msg.content, list):
-            # Extract text from multimodal content
-            for item in last_user_msg.content:
-                if isinstance(item, dict) and item.get("type") == "text":
-                    input_text = item.get("text", "")
-                    break
-
-        # Build chat history (exclude last user message and system)
-        chat_history = []
-        for _, msg in enumerate(non_system_messages[:-1]):
-            if isinstance(msg, HumanMessage | AIMessage):
-                chat_history.append(msg)
-
-        # Execute the agent
-        try:
-            result = await executor.ainvoke(
-                {
-                    "input": input_text,
-                    "chat_history": chat_history,
-                }
-            )
-
-            # Process the result
-            output = result.get("output", "")
-
-            # Check if tools were called
-            if result.get("intermediate_steps"):
-                # Tools were called
-                tool_calls = []
-                for action, _ in result["intermediate_steps"]:
-                    if hasattr(action, "tool") and hasattr(action, "tool_input"):
-                        tool_calls.append(
-                            MCPToolCall(
-                                name=action.tool,
-                                arguments=action.tool_input,
-                            )
-                        )
-
-                return AgentResponse(content=output, tool_calls=tool_calls, done=False)
-            else:
-                # No tools called, just text response
-                return AgentResponse(content=output, tool_calls=[], done=True)
-
-        except Exception as e:
-            logger.error("Agent execution failed: %s", e)
-            return AgentResponse(content=f"Error: {e!s}", tool_calls=[], done=True)
-
-    async def format_tool_results(
-        self, tool_calls: list[MCPToolCall], tool_results: list[MCPToolResult]
-    ) -> list[BaseMessage]:
-        """Format tool results into LangChain messages."""
-        # Create an AI message with the tool calls and results
-        messages = []
-
-        # First add an AI message indicating tools were called
-        tool_names = [tc.name for tc in tool_calls]
-        ai_content = f"I'll use the following tools: {', '.join(tool_names)}"
-        messages.append(AIMessage(content=ai_content))
-
-        # Build result text from tool results
-        text_parts = []
-        latest_screenshot = None
-
-        for tool_call, result in zip(tool_calls, tool_results, strict=False):
-            if result.isError:
-                error_text = "Tool execution failed"
-                for content in result.content:
-                    if isinstance(content, types.TextContent):
-                        error_text = content.text
-                        break
-                text_parts.append(f"Error - {tool_call.name}: {error_text}")
-            else:
-                # Process success content
-                tool_output = []
-                for content in result.content:
-                    if isinstance(content, types.TextContent):
-                        tool_output.append(content.text)
-                    elif isinstance(content, types.ImageContent):
-                        latest_screenshot = content.data
-
-                if tool_output:
-                    text_parts.append(f"{tool_call.name}: " + " ".join(tool_output))
-
-        result_text = "\n".join(text_parts) if text_parts else "No output from tools"
-
-        # Then add a human message with the tool results
-        if latest_screenshot:
-            # Include screenshot in multimodal format
-            content = [
-                {"type": "text", "text": f"Tool results:\n{result_text}"},
-                {
-                    "type": "image_url",
-                    "image_url": {"url": f"data:image/png;base64,{latest_screenshot}"},
-                },
-            ]
-            messages.append(HumanMessage(content=content))
-        else:
-            messages.append(HumanMessage(content=f"Tool results:\n{result_text}"))
-
-        return messages
+"""LangChain MCP Agent implementation."""
+
+from __future__ import annotations
+
+import logging
+from typing import TYPE_CHECKING, Any, ClassVar
+
+import mcp.types as types
+from langchain.agents import AgentExecutor, create_tool_calling_agent
+from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
+from langchain.schema import AIMessage, BaseMessage, HumanMessage, SystemMessage
+
+import hud
+
+if TYPE_CHECKING:
+    from langchain.schema.language_model import BaseLanguageModel
+    from langchain_core.tools import BaseTool
+    from mcp_use.adapters.langchain_adapter import LangChainAdapter
+
+try:
+    from mcp_use.adapters.langchain_adapter import LangChainAdapter
+except ImportError:
+    LangChainAdapter = None  # type: ignore[misc, assignment]
+
+from hud.types import AgentResponse, MCPToolCall, MCPToolResult
+
+from .base import MCPAgent
+
+logger = logging.getLogger(__name__)
+
+
+class LangChainAgent(MCPAgent):
+    """
+    LangChain agent that uses MCP servers for tool execution.
+
+    This agent wraps any LangChain-compatible LLM and provides
+    access to MCP tools through LangChain's tool-calling interface.
+    """
+
+    metadata: ClassVar[dict[str, Any]] = {
+        "display_width": 1920,
+        "display_height": 1080,
+    }
+
+    def __init__(
+        self,
+        llm: BaseLanguageModel,
+        **kwargs: Any,
+    ) -> None:
+        """
+        Initialize LangChain MCP agent.
+
+        Args:
+            llm: Any LangChain-compatible language model
+            **kwargs: Additional arguments passed to BaseMCPAgent
+        """
+        super().__init__(**kwargs)
+
+        if LangChainAdapter is None:
+            raise ImportError(
+                "LangChainAdapter is not available. "
+                "Please install the optional agent dependencies: pip install 'hud-python[agent]'"
+            )
+
+        self.llm = llm
+        self.adapter = LangChainAdapter(disallowed_tools=self.disallowed_tools)
+        self._langchain_tools: list[BaseTool] | None = None
+
+        self.model_name = (
+            "langchain-" + self.llm.model_name  # type: ignore
+            if hasattr(self.llm, "model_name")
+            else "unknown"
+        )
+
+    def _get_langchain_tools(self) -> list[BaseTool]:
+        """Get or create LangChain tools from MCP tools."""
+        if self._langchain_tools is not None:
+            return self._langchain_tools
+
+        # Create LangChain tools from MCP tools using the adapter
+        self._langchain_tools = []
+
+        # Convert available tools using the adapter; no server grouping
+        langchain_tools = self.adapter._convert_tools(self._available_tools, "default")  # type: ignore[reportAttributeAccessIssue]
+        self._langchain_tools.extend(langchain_tools)
+
+        logger.info("Created %s LangChain tools from MCP tools", len(self._langchain_tools))
+        return self._langchain_tools
+
+    async def get_system_messages(self) -> list[BaseMessage]:
+        """Get system messages for LangChain."""
+        return [SystemMessage(content=self.system_prompt)]
+
+    async def format_blocks(self, blocks: list[types.ContentBlock]) -> list[BaseMessage]:
+        """Create initial messages for LangChain."""
+        messages = []
+        for block in blocks:
+            if isinstance(block, types.TextContent):
+                messages.append(HumanMessage(content=block.text))
+            elif isinstance(block, types.ImageContent):
+                messages.append(HumanMessage(content=block.data))
+        return messages
+
+    @hud.instrument(
+        span_type="agent",
+        record_args=False,  # Messages can be large
+        record_result=True,
+    )
+    async def get_response(self, messages: list[BaseMessage]) -> AgentResponse:
+        """Get response from LangChain model including any tool calls."""
+        # Get LangChain tools (created lazily)
+        langchain_tools = self._get_langchain_tools()
+
+        # Create a prompt template from current messages
+        # Extract system message if present
+        system_content = "You are a helpful assistant"
+        non_system_messages = []
+
+        for msg in messages:
+            if isinstance(msg, SystemMessage):
+                system_content = str(msg.content)
+            else:
+                non_system_messages.append(msg)
+
+        # Create prompt with placeholders
+        prompt = ChatPromptTemplate.from_messages(
+            [
+                ("system", system_content),
+                MessagesPlaceholder(variable_name="chat_history"),
+                MessagesPlaceholder(variable_name="agent_scratchpad"),
+            ]
+        )
+
+        # Create agent with tools
+        agent = create_tool_calling_agent(
+            llm=self.llm,
+            tools=langchain_tools,
+            prompt=prompt,
+        )
+
+        # Create executor
+        executor = AgentExecutor(
+            agent=agent,
+            tools=langchain_tools,
+            verbose=False,
+        )
+
+        # Format the last user message as input
+        last_user_msg = None
+        for msg in reversed(non_system_messages):
+            if isinstance(msg, HumanMessage):
+                last_user_msg = msg
+                break
+
+        if not last_user_msg:
+            return AgentResponse(content="No user message found", tool_calls=[], done=True)
+
+        # Extract text from message content
+        input_text = ""
+        if isinstance(last_user_msg.content, str):
+            input_text = last_user_msg.content
+        elif isinstance(last_user_msg.content, list):
+            # Extract text from multimodal content
+            for item in last_user_msg.content:
+                if isinstance(item, dict) and item.get("type") == "text":
+                    input_text = item.get("text", "")
+                    break
+
+        # Build chat history (exclude last user message and system)
+        chat_history = []
+        for _, msg in enumerate(non_system_messages[:-1]):
+            if isinstance(msg, HumanMessage | AIMessage):
+                chat_history.append(msg)
+
+        # Execute the agent
+        try:
+            result = await executor.ainvoke(
+                {
+                    "input": input_text,
+                    "chat_history": chat_history,
+                }
+            )
+
+            # Process the result
+            output = result.get("output", "")
+
+            # Check if tools were called
+            if result.get("intermediate_steps"):
+                # Tools were called
+                tool_calls = []
+                for action, _ in result["intermediate_steps"]:
+                    if hasattr(action, "tool") and hasattr(action, "tool_input"):
+                        tool_calls.append(
+                            MCPToolCall(
+                                name=action.tool,
+                                arguments=action.tool_input,
+                            )
+                        )
+
+                return AgentResponse(content=output, tool_calls=tool_calls, done=False)
+            else:
+                # No tools called, just text response
+                return AgentResponse(content=output, tool_calls=[], done=True)
+
+        except Exception as e:
+            logger.error("Agent execution failed: %s", e)
+            return AgentResponse(content=f"Error: {e!s}", tool_calls=[], done=True)
+
+    async def format_tool_results(
+        self, tool_calls: list[MCPToolCall], tool_results: list[MCPToolResult]
+    ) -> list[BaseMessage]:
+        """Format tool results into LangChain messages."""
+        # Create an AI message with the tool calls and results
+        messages = []
+
+        # First add an AI message indicating tools were called
+        tool_names = [tc.name for tc in tool_calls]
+        ai_content = f"I'll use the following tools: {', '.join(tool_names)}"
+        messages.append(AIMessage(content=ai_content))
+
+        # Build result text from tool results
+        text_parts = []
+        latest_screenshot = None
+
+        for tool_call, result in zip(tool_calls, tool_results, strict=False):
+            if result.isError:
+                error_text = "Tool execution failed"
+                for content in result.content:
+                    if isinstance(content, types.TextContent):
+                        error_text = content.text
+                        break
+                text_parts.append(f"Error - {tool_call.name}: {error_text}")
+            else:
+                # Process success content
+                tool_output = []
+                for content in result.content:
+                    if isinstance(content, types.TextContent):
+                        tool_output.append(content.text)
+                    elif isinstance(content, types.ImageContent):
+                        latest_screenshot = content.data
+
+                if tool_output:
+                    text_parts.append(f"{tool_call.name}: " + " ".join(tool_output))
+
+        result_text = "\n".join(text_parts) if text_parts else "No output from tools"
+
+        # Then add a human message with the tool results
+        if latest_screenshot:
+            # Include screenshot in multimodal format
+            content = [
+                {"type": "text", "text": f"Tool results:\n{result_text}"},
+                {
+                    "type": "image_url",
+                    "image_url": {"url": f"data:image/png;base64,{latest_screenshot}"},
+                },
+            ]
+            messages.append(HumanMessage(content=content))
+        else:
+            messages.append(HumanMessage(content=f"Tool results:\n{result_text}"))
+
+        return messages
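The net effect of the change above is that mcp_use becomes an optional dependency: importing hud.agents.langchain no longer fails when the adapter package is absent, and the failure is deferred to LangChainAgent construction, where the error message points at the hud-python[agent] extra. A minimal sketch of that behavior from user code, assuming langchain_openai.ChatOpenAI as the wrapped model (the model choice and the langchain_openai dependency are illustrative assumptions, not part of this diff):

from langchain_openai import ChatOpenAI  # assumed chat model; any LangChain BaseLanguageModel works

from hud.agents.langchain import LangChainAgent

llm = ChatOpenAI(model="gpt-4o-mini")  # hypothetical model name

try:
    # In 0.4.3 the ImportError is raised here, at construction time,
    # rather than when hud.agents.langchain is first imported.
    agent = LangChainAgent(llm=llm)
except ImportError:
    # The error message added in this release suggests:
    #   pip install 'hud-python[agent]'
    raise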
hud/agents/misc/__init__.py CHANGED
@@ -1,7 +1,7 @@
-"""Miscellaneous agents."""
-
-from __future__ import annotations
-
-from .response_agent import ResponseAgent
-
-__all__ = ["ResponseAgent"]
+"""Miscellaneous agents."""
+
+from __future__ import annotations
+
+from .response_agent import ResponseAgent
+
+__all__ = ["ResponseAgent"]
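For reference, the re-export above (unchanged in content between versions) is what keeps the short import path working alongside the module path listed in the files table; a minimal sketch:

# Both paths resolve to the same class thanks to the __all__ re-export
# in hud/agents/misc/__init__.py:
from hud.agents.misc import ResponseAgent
from hud.agents.misc.response_agent import ResponseAgent as ResponseAgentDirect

assert ResponseAgent is ResponseAgentDirect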