hud-python 0.3.4__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of hud-python might be problematic. Click here for more details.

Files changed (192) hide show
  1. hud/__init__.py +22 -89
  2. hud/agents/__init__.py +17 -0
  3. hud/agents/art.py +101 -0
  4. hud/agents/base.py +599 -0
  5. hud/{mcp → agents}/claude.py +373 -321
  6. hud/{mcp → agents}/langchain.py +250 -250
  7. hud/agents/misc/__init__.py +7 -0
  8. hud/{agent → agents}/misc/response_agent.py +80 -80
  9. hud/{mcp → agents}/openai.py +352 -334
  10. hud/agents/openai_chat_generic.py +154 -0
  11. hud/{mcp → agents}/tests/__init__.py +1 -1
  12. hud/agents/tests/test_base.py +742 -0
  13. hud/agents/tests/test_claude.py +324 -0
  14. hud/{mcp → agents}/tests/test_client.py +363 -324
  15. hud/{mcp → agents}/tests/test_openai.py +237 -238
  16. hud/cli/__init__.py +617 -0
  17. hud/cli/__main__.py +8 -0
  18. hud/cli/analyze.py +371 -0
  19. hud/cli/analyze_metadata.py +230 -0
  20. hud/cli/build.py +427 -0
  21. hud/cli/clone.py +185 -0
  22. hud/cli/cursor.py +92 -0
  23. hud/cli/debug.py +392 -0
  24. hud/cli/docker_utils.py +83 -0
  25. hud/cli/init.py +281 -0
  26. hud/cli/interactive.py +353 -0
  27. hud/cli/mcp_server.py +756 -0
  28. hud/cli/pull.py +336 -0
  29. hud/cli/push.py +379 -0
  30. hud/cli/remote_runner.py +311 -0
  31. hud/cli/runner.py +160 -0
  32. hud/cli/tests/__init__.py +3 -0
  33. hud/cli/tests/test_analyze.py +284 -0
  34. hud/cli/tests/test_cli_init.py +265 -0
  35. hud/cli/tests/test_cli_main.py +27 -0
  36. hud/cli/tests/test_clone.py +142 -0
  37. hud/cli/tests/test_cursor.py +253 -0
  38. hud/cli/tests/test_debug.py +453 -0
  39. hud/cli/tests/test_mcp_server.py +139 -0
  40. hud/cli/tests/test_utils.py +388 -0
  41. hud/cli/utils.py +263 -0
  42. hud/clients/README.md +143 -0
  43. hud/clients/__init__.py +16 -0
  44. hud/clients/base.py +354 -0
  45. hud/clients/fastmcp.py +202 -0
  46. hud/clients/mcp_use.py +278 -0
  47. hud/clients/tests/__init__.py +1 -0
  48. hud/clients/tests/test_client_integration.py +111 -0
  49. hud/clients/tests/test_fastmcp.py +342 -0
  50. hud/clients/tests/test_protocol.py +188 -0
  51. hud/clients/utils/__init__.py +1 -0
  52. hud/clients/utils/retry_transport.py +160 -0
  53. hud/datasets.py +322 -192
  54. hud/misc/__init__.py +1 -0
  55. hud/{agent → misc}/claude_plays_pokemon.py +292 -283
  56. hud/otel/__init__.py +35 -0
  57. hud/otel/collector.py +142 -0
  58. hud/otel/config.py +164 -0
  59. hud/otel/context.py +536 -0
  60. hud/otel/exporters.py +366 -0
  61. hud/otel/instrumentation.py +97 -0
  62. hud/otel/processors.py +118 -0
  63. hud/otel/tests/__init__.py +1 -0
  64. hud/otel/tests/test_processors.py +197 -0
  65. hud/server/__init__.py +5 -5
  66. hud/server/context.py +114 -0
  67. hud/server/helper/__init__.py +5 -0
  68. hud/server/low_level.py +132 -0
  69. hud/server/server.py +166 -0
  70. hud/server/tests/__init__.py +3 -0
  71. hud/settings.py +73 -79
  72. hud/shared/__init__.py +5 -0
  73. hud/{exceptions.py → shared/exceptions.py} +180 -180
  74. hud/{server → shared}/requests.py +264 -264
  75. hud/shared/tests/test_exceptions.py +157 -0
  76. hud/{server → shared}/tests/test_requests.py +275 -275
  77. hud/telemetry/__init__.py +25 -30
  78. hud/telemetry/instrument.py +379 -0
  79. hud/telemetry/job.py +309 -141
  80. hud/telemetry/replay.py +74 -0
  81. hud/telemetry/trace.py +83 -0
  82. hud/tools/__init__.py +33 -34
  83. hud/tools/base.py +365 -65
  84. hud/tools/bash.py +161 -137
  85. hud/tools/computer/__init__.py +15 -13
  86. hud/tools/computer/anthropic.py +437 -414
  87. hud/tools/computer/hud.py +376 -328
  88. hud/tools/computer/openai.py +295 -286
  89. hud/tools/computer/settings.py +82 -0
  90. hud/tools/edit.py +314 -290
  91. hud/tools/executors/__init__.py +30 -30
  92. hud/tools/executors/base.py +539 -532
  93. hud/tools/executors/pyautogui.py +621 -619
  94. hud/tools/executors/tests/__init__.py +1 -1
  95. hud/tools/executors/tests/test_base_executor.py +338 -338
  96. hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
  97. hud/tools/executors/xdo.py +511 -503
  98. hud/tools/{playwright_tool.py → playwright.py} +412 -379
  99. hud/tools/tests/__init__.py +3 -3
  100. hud/tools/tests/test_base.py +282 -0
  101. hud/tools/tests/test_bash.py +158 -152
  102. hud/tools/tests/test_bash_extended.py +197 -0
  103. hud/tools/tests/test_computer.py +425 -52
  104. hud/tools/tests/test_computer_actions.py +34 -34
  105. hud/tools/tests/test_edit.py +259 -240
  106. hud/tools/tests/test_init.py +27 -27
  107. hud/tools/tests/test_playwright_tool.py +183 -183
  108. hud/tools/tests/test_tools.py +145 -157
  109. hud/tools/tests/test_utils.py +156 -156
  110. hud/tools/types.py +72 -0
  111. hud/tools/utils.py +50 -50
  112. hud/types.py +136 -89
  113. hud/utils/__init__.py +10 -16
  114. hud/utils/async_utils.py +65 -0
  115. hud/utils/design.py +168 -0
  116. hud/utils/mcp.py +55 -0
  117. hud/utils/progress.py +149 -149
  118. hud/utils/telemetry.py +66 -66
  119. hud/utils/tests/test_async_utils.py +173 -0
  120. hud/utils/tests/test_init.py +17 -21
  121. hud/utils/tests/test_progress.py +261 -225
  122. hud/utils/tests/test_telemetry.py +82 -37
  123. hud/utils/tests/test_version.py +8 -8
  124. hud/version.py +7 -7
  125. hud_python-0.4.0.dist-info/METADATA +474 -0
  126. hud_python-0.4.0.dist-info/RECORD +132 -0
  127. hud_python-0.4.0.dist-info/entry_points.txt +3 -0
  128. {hud_python-0.3.4.dist-info → hud_python-0.4.0.dist-info}/licenses/LICENSE +21 -21
  129. hud/adapters/__init__.py +0 -8
  130. hud/adapters/claude/__init__.py +0 -5
  131. hud/adapters/claude/adapter.py +0 -180
  132. hud/adapters/claude/tests/__init__.py +0 -1
  133. hud/adapters/claude/tests/test_adapter.py +0 -519
  134. hud/adapters/common/__init__.py +0 -6
  135. hud/adapters/common/adapter.py +0 -178
  136. hud/adapters/common/tests/test_adapter.py +0 -289
  137. hud/adapters/common/types.py +0 -446
  138. hud/adapters/operator/__init__.py +0 -5
  139. hud/adapters/operator/adapter.py +0 -108
  140. hud/adapters/operator/tests/__init__.py +0 -1
  141. hud/adapters/operator/tests/test_adapter.py +0 -370
  142. hud/agent/__init__.py +0 -19
  143. hud/agent/base.py +0 -126
  144. hud/agent/claude.py +0 -271
  145. hud/agent/langchain.py +0 -215
  146. hud/agent/misc/__init__.py +0 -3
  147. hud/agent/operator.py +0 -268
  148. hud/agent/tests/__init__.py +0 -1
  149. hud/agent/tests/test_base.py +0 -202
  150. hud/env/__init__.py +0 -11
  151. hud/env/client.py +0 -35
  152. hud/env/docker_client.py +0 -349
  153. hud/env/environment.py +0 -446
  154. hud/env/local_docker_client.py +0 -358
  155. hud/env/remote_client.py +0 -212
  156. hud/env/remote_docker_client.py +0 -292
  157. hud/gym.py +0 -130
  158. hud/job.py +0 -773
  159. hud/mcp/__init__.py +0 -17
  160. hud/mcp/base.py +0 -631
  161. hud/mcp/client.py +0 -312
  162. hud/mcp/tests/test_base.py +0 -512
  163. hud/mcp/tests/test_claude.py +0 -294
  164. hud/task.py +0 -149
  165. hud/taskset.py +0 -237
  166. hud/telemetry/_trace.py +0 -347
  167. hud/telemetry/context.py +0 -230
  168. hud/telemetry/exporter.py +0 -575
  169. hud/telemetry/instrumentation/__init__.py +0 -3
  170. hud/telemetry/instrumentation/mcp.py +0 -259
  171. hud/telemetry/instrumentation/registry.py +0 -59
  172. hud/telemetry/mcp_models.py +0 -270
  173. hud/telemetry/tests/__init__.py +0 -1
  174. hud/telemetry/tests/test_context.py +0 -210
  175. hud/telemetry/tests/test_trace.py +0 -312
  176. hud/tools/helper/README.md +0 -56
  177. hud/tools/helper/__init__.py +0 -9
  178. hud/tools/helper/mcp_server.py +0 -78
  179. hud/tools/helper/server_initialization.py +0 -115
  180. hud/tools/helper/utils.py +0 -58
  181. hud/trajectory.py +0 -94
  182. hud/utils/agent.py +0 -37
  183. hud/utils/common.py +0 -256
  184. hud/utils/config.py +0 -120
  185. hud/utils/deprecation.py +0 -115
  186. hud/utils/misc.py +0 -53
  187. hud/utils/tests/test_common.py +0 -277
  188. hud/utils/tests/test_config.py +0 -129
  189. hud_python-0.3.4.dist-info/METADATA +0 -284
  190. hud_python-0.3.4.dist-info/RECORD +0 -120
  191. /hud/{adapters/common → shared}/tests/__init__.py +0 -0
  192. {hud_python-0.3.4.dist-info → hud_python-0.4.0.dist-info}/WHEEL +0 -0
@@ -0,0 +1,154 @@
1
+ """Generic OpenAI chat-completions agent.
2
+
3
+ This class provides the minimal glue required to connect any endpoint that
4
+ implements the OpenAI compatible *chat.completions* API with MCP tool calling
5
+ through the existing :class:`hud.agents.base.MCPAgent` scaffolding.
6
+
7
+ Key points:
8
+ - Stateless, no special server-side conversation state is assumed.
9
+ - Accepts an :class:`openai.AsyncOpenAI` client, caller can supply their own
10
+ base_url / api_key (e.g. ART, llama.cpp, together.ai, …)
11
+ - All HUD features (step_count, OTel spans, tool filtering, screenshots, …)
12
+ come from the ``MCPAgent`` base class; we only implement the
13
+ provider-specific formatting and request methods
14
+ """
15
+
16
+ from __future__ import annotations
17
+
18
+ import json
19
+ import logging
20
+ from typing import TYPE_CHECKING, Any, cast
21
+
22
+ import mcp.types as types
23
+
24
+ from hud.types import AgentResponse, MCPToolCall, MCPToolResult
25
+
26
+ from .base import MCPAgent
27
+
28
+ if TYPE_CHECKING:
29
+ from openai import AsyncOpenAI
30
+ from openai.types.chat import ChatCompletionToolParam
31
+
32
+ from hud.clients import AgentMCPClient
33
+
34
+ logger = logging.getLogger(__name__)
35
+
36
+
class GenericOpenAIChatAgent(MCPAgent):
    """MCP-enabled agent that speaks the OpenAI *chat.completions* protocol.

    The agent translates between the MCP tool-calling types used by
    ``MCPAgent`` and the message / tool formats of an OpenAI-compatible
    chat-completions endpoint.
    """

    def __init__(
        self,
        mcp_client: AgentMCPClient,
        *,
        openai_client: AsyncOpenAI,
        model_name: str = "gpt-4o-mini",
        parallel_tool_calls: bool = False,
        logprobs: bool = False,
        **agent_kwargs: Any,
    ) -> None:
        """Create the agent.

        Args:
            mcp_client: MCP client forwarded to ``MCPAgent.__init__``.
            openai_client: Async client used for ``chat.completions.create``.
            model_name: Model identifier sent with every request.
            parallel_tool_calls: When ``False`` only the first usable tool
                call of each response is kept.
            logprobs: Forwarded as the ``logprobs`` request parameter.
            **agent_kwargs: Extra keyword arguments forwarded unchanged to
                ``MCPAgent.__init__``.
        """
        super().__init__(mcp_client=mcp_client, **agent_kwargs)
        self.oai = openai_client
        self.model_name = model_name
        self.parallel_tool_calls = parallel_tool_calls
        self.logprobs = logprobs

    @staticmethod
    def _oai_to_mcp(tool_call: Any) -> MCPToolCall:  # type: ignore[valid-type]
        """Convert an OpenAI ``tool_call`` to :class:`MCPToolCall`.

        The ``arguments`` field is model-generated text, so it may be empty,
        malformed JSON, or valid JSON that is not an object. In all of those
        cases the call is converted with empty arguments (and a warning is
        logged) instead of raising.
        """
        raw_arguments = tool_call.function.arguments or "{}"
        try:
            arguments = json.loads(raw_arguments)
        except json.JSONDecodeError:
            logger.warning(
                "Tool call %s (%s) has malformed JSON arguments; using {}: %r",
                tool_call.id,
                tool_call.function.name,
                raw_arguments,
            )
            arguments = {}

        if not isinstance(arguments, dict):
            # e.g. "null", a bare string or a list: not usable as keyword arguments.
            logger.warning(
                "Tool call %s (%s) arguments are not a JSON object; using {}: %r",
                tool_call.id,
                tool_call.function.name,
                raw_arguments,
            )
            arguments = {}

        return MCPToolCall(
            id=tool_call.id,
            name=tool_call.function.name,
            arguments=arguments,
        )

    async def get_system_messages(self) -> list[Any]:
        """Return the system prompt as a single ``role=system`` message."""
        return [
            {"role": "system", "content": self.system_prompt},
        ]

    async def format_blocks(self, blocks: list[types.ContentBlock]) -> list[Any]:
        """Wrap MCP content blocks in a single ``role=user`` message.

        Only ``TextContent`` blocks are forwarded; every other block type is
        dropped.
        """
        text_parts = [
            {"type": "text", "text": block.text}
            for block in blocks
            if isinstance(block, types.TextContent)
        ]
        return [{"role": "user", "content": text_parts}]

    def get_tool_schemas(self) -> list[dict]:
        """Return the base-class tool schemas in OpenAI ``function`` tool format.

        A schema without ``description`` gets an empty string; a schema without
        ``parameters`` gets an empty object schema.
        """
        return [
            {
                "type": "function",
                "function": {
                    "name": schema["name"],
                    "description": schema.get("description", ""),
                    "parameters": schema.get(
                        "parameters", {"type": "object", "properties": {}}
                    ),
                },
            }
            for schema in super().get_tool_schemas()
        ]

    async def get_response(self, messages: list[Any]) -> AgentResponse:
        """Send chat request to OpenAI and convert the response.

        Args:
            messages: Conversation in OpenAI chat-message format.

        Returns:
            An ``AgentResponse`` carrying the message text, the converted tool
            calls, ``done=True`` only when ``finish_reason == "stop"``, and the
            raw completion in ``raw``.
        """
        tool_schemas = self.get_tool_schemas()

        request: dict[str, Any] = {
            "model": self.model_name,
            "messages": messages,
            "logprobs": self.logprobs,
        }
        # The API rejects an empty ``tools`` array and only accepts
        # ``parallel_tool_calls`` alongside tools, so send both only when
        # there is at least one tool to offer.
        if tool_schemas:
            request["tools"] = cast("list[ChatCompletionToolParam]", tool_schemas)
            request["parallel_tool_calls"] = self.parallel_tool_calls

        response = await self.oai.chat.completions.create(**request)

        choice = response.choices[0]
        msg = choice.message

        tool_calls = []
        for tc in msg.tool_calls or []:
            if tc.function.name is None:  # type: ignore
                continue
            tool_calls.append(self._oai_to_mcp(tc))
            if not self.parallel_tool_calls:
                # Sequential mode: keep only the first usable call.
                break

        return AgentResponse(
            content=msg.content or "",
            tool_calls=tool_calls,
            done=choice.finish_reason == "stop",
            raw=response,  # Include raw response for access to Choice objects
        )

    async def format_tool_results(
        self,
        tool_calls: list[MCPToolCall],
        tool_results: list[MCPToolResult],
    ) -> list[Any]:
        """Render MCP tool results as OpenAI ``role=tool`` messages.

        Calls and results are paired positionally. Structured content, when
        present, is sent as JSON; otherwise the ``text`` of every content item
        that has one is concatenated.

        Args:
            tool_calls: The calls that were executed.
            tool_results: Their results, in the same order.

        Returns:
            One ``role=tool`` message per (call, result) pair.
        """
        if len(tool_calls) != len(tool_results):
            # Pairing below stops at the shorter list; make the loss visible.
            logger.warning(
                "Got %d tool calls but %d tool results; unmatched entries are dropped",
                len(tool_calls),
                len(tool_results),
            )

        rendered: list[dict[str, Any]] = []
        for call, res in zip(tool_calls, tool_results, strict=False):
            if res.structuredContent:
                content = json.dumps(res.structuredContent)
            else:
                # Concatenate any TextContent blocks
                content = "".join(
                    c.text  # type: ignore[attr-defined]
                    for c in res.content
                    if hasattr(c, "text")
                )
            rendered.append(
                {
                    "role": "tool",
                    "tool_call_id": call.id,
                    "content": content or "",  # Ensure content is never None
                }
            )
        return rendered
@@ -1 +1 @@
1
- """Tests for MCP Agent module."""
1
+ """Tests for MCP Agent module."""