hud-python 0.3.4__tar.gz → 0.3.5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of hud-python might be problematic. Click here for more details.

Files changed (266)
  1. {hud_python-0.3.4 → hud_python-0.3.5}/PKG-INFO +1 -1
  2. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/simple_task_example.py +1 -1
  3. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/gmail_local.py +18 -8
  4. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/gmail_remote.py +1 -1
  5. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/anthropic.py +6 -0
  6. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/hud.py +18 -12
  7. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/openai.py +6 -0
  8. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_version.py +1 -1
  9. {hud_python-0.3.4 → hud_python-0.3.5}/hud/version.py +1 -1
  10. {hud_python-0.3.4 → hud_python-0.3.5}/pyproject.toml +1 -1
  11. {hud_python-0.3.4 → hud_python-0.3.5}/.env.example +0 -0
  12. {hud_python-0.3.4 → hud_python-0.3.5}/.github/workflows/ci.yml +0 -0
  13. {hud_python-0.3.4 → hud_python-0.3.5}/.github/workflows/release.yml +0 -0
  14. {hud_python-0.3.4 → hud_python-0.3.5}/.gitignore +0 -0
  15. {hud_python-0.3.4 → hud_python-0.3.5}/LICENSE +0 -0
  16. {hud_python-0.3.4 → hud_python-0.3.5}/MANIFEST.in +0 -0
  17. {hud_python-0.3.4 → hud_python-0.3.5}/README.md +0 -0
  18. {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/cla-details.mdx +0 -0
  19. {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/environment-control.mdx +0 -0
  20. {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/tracing.mdx +0 -0
  21. {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/uploading.mdx +0 -0
  22. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/adapters.mdx +0 -0
  23. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/env.mdx +0 -0
  24. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/gym.mdx +0 -0
  25. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/job.mdx +0 -0
  26. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/task.mdx +0 -0
  27. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/taskset.mdx +0 -0
  28. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/telemetry.mdx +0 -0
  29. {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/trajectory.mdx +0 -0
  30. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/adapter.mdx +0 -0
  31. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/agent.mdx +0 -0
  32. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/environment.mdx +0 -0
  33. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/job.mdx +0 -0
  34. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/task.mdx +0 -0
  35. {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/trajectory.mdx +0 -0
  36. {hud_python-0.3.4 → hud_python-0.3.5}/docs/docs.json +0 -0
  37. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environment-creation.mdx +0 -0
  38. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/browser.mdx +0 -0
  39. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/custom-environments.mdx +0 -0
  40. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/custom.mdx +0 -0
  41. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/osworld-ubuntu.mdx +0 -0
  42. {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/qa.mdx +0 -0
  43. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/alignment-evaluation.mdx +0 -0
  44. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/benchmarking-agents.mdx +0 -0
  45. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/custom-os-env.mdx +0 -0
  46. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/mcp-agent-tracing.mdx +0 -0
  47. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/web-app-testing.mdx +0 -0
  48. {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/web-mocks.mdx +0 -0
  49. {hud_python-0.3.4 → hud_python-0.3.5}/docs/favicon.png +0 -0
  50. {hud_python-0.3.4 → hud_python-0.3.5}/docs/logo/hud_logo.svg +0 -0
  51. {hud_python-0.3.4 → hud_python-0.3.5}/docs/logo/hud_logo_dark.svg +0 -0
  52. {hud_python-0.3.4 → hud_python-0.3.5}/docs/quickstart.mdx +0 -0
  53. {hud_python-0.3.4 → hud_python-0.3.5}/docs/running-your-agent.mdx +0 -0
  54. {hud_python-0.3.4 → hud_python-0.3.5}/docs/task-creation.mdx +0 -0
  55. {hud_python-0.3.4 → hud_python-0.3.5}/environments/README.md +0 -0
  56. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/.dockerignore +0 -0
  57. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/.gitignore +0 -0
  58. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/Dockerfile +0 -0
  59. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/README.md +0 -0
  60. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/README.md +0 -0
  61. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/README.md +0 -0
  62. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/backend/main.py +0 -0
  63. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/backend/pyproject.toml +0 -0
  64. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/globals.css +0 -0
  65. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/layout.tsx +0 -0
  66. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/page.tsx +0 -0
  67. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/next.config.js +0 -0
  68. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/package-lock.json +0 -0
  69. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/package.json +0 -0
  70. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/postcss.config.js +0 -0
  71. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/tailwind.config.js +0 -0
  72. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/tsconfig.json +0 -0
  73. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/launch.py +0 -0
  74. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/pyproject.toml +0 -0
  75. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/README.md +0 -0
  76. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/__init__.py +0 -0
  77. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/__main__.py +0 -0
  78. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/__init__.py +0 -0
  79. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/context.py +0 -0
  80. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/registry.py +0 -0
  81. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/todo.py +0 -0
  82. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/__init__.py +0 -0
  83. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/registry.py +0 -0
  84. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/todo.py +0 -0
  85. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/runtime.py +0 -0
  86. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/server.py +0 -0
  87. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/services.py +0 -0
  88. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/__init__.py +0 -0
  89. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/registry.py +0 -0
  90. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/todo.py +0 -0
  91. {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/start.sh +0 -0
  92. {hud_python-0.3.4 → hud_python-0.3.5}/environments/docker_debug.py +0 -0
  93. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/.gitignore +0 -0
  94. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/Dockerfile +0 -0
  95. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/README.md +0 -0
  96. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/pyproject.toml +0 -0
  97. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__init__.py +0 -0
  98. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__main__.py +0 -0
  99. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/browser_executor.py +0 -0
  100. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/__init__.py +0 -0
  101. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/context.py +0 -0
  102. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/cookie_exists.py +0 -0
  103. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/cookie_match.py +0 -0
  104. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/history_length.py +0 -0
  105. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/page_contains.py +0 -0
  106. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/raw_last_action_is.py +0 -0
  107. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/registry.py +0 -0
  108. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/selector_history.py +0 -0
  109. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/sheet_contains.py +0 -0
  110. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/sheets_cell_values.py +0 -0
  111. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/url_match.py +0 -0
  112. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/verify_type_action.py +0 -0
  113. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/playwright_with_memory.py +0 -0
  114. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/__init__.py +0 -0
  115. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/element_interaction.py +0 -0
  116. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/form_interaction.py +0 -0
  117. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/navigate_and_verify.py +0 -0
  118. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/registry.py +0 -0
  119. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/search_interaction.py +0 -0
  120. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/README.md +0 -0
  121. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/__init__.py +0 -0
  122. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/anchorbrowser.py +0 -0
  123. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/base.py +0 -0
  124. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/browserbase.py +0 -0
  125. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/hyperbrowser.py +0 -0
  126. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/kernel.py +0 -0
  127. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/steel.py +0 -0
  128. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/runtime.py +0 -0
  129. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/server.py +0 -0
  130. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/__init__.py +0 -0
  131. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/cookies.py +0 -0
  132. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/interact.py +0 -0
  133. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/load_html.py +0 -0
  134. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/navigate.py +0 -0
  135. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/registry.py +0 -0
  136. {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/sheets.py +0 -0
  137. {hud_python-0.3.4 → hud_python-0.3.5}/examples/README.md +0 -0
  138. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/browser_use.ipynb +0 -0
  139. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_claude_agent.py +0 -0
  140. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_openai_agent.py +0 -0
  141. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_test.ipynb +0 -0
  142. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_use_agent.py +0 -0
  143. {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/sensitive_data.ipynb +0 -0
  144. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/pokemon_local.ipynb +0 -0
  145. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/pokemon_remote.ipynb +0 -0
  146. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/remote.ipynb +0 -0
  147. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/resources_example.py +0 -0
  148. {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/simple_browser_example.py +0 -0
  149. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/eval.py +0 -0
  150. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/osworld.ipynb +0 -0
  151. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/sheetbench_direct_example.ipynb +0 -0
  152. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/tasks.ipynb +0 -0
  153. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/telemetry_and_datasets.ipynb +0 -0
  154. {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/wordle_example.ipynb +0 -0
  155. {hud_python-0.3.4 → hud_python-0.3.5}/examples/sheets_bench_cua_example.ipynb +0 -0
  156. {hud_python-0.3.4 → hud_python-0.3.5}/hud/__init__.py +0 -0
  157. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/__init__.py +0 -0
  158. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/__init__.py +0 -0
  159. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/adapter.py +0 -0
  160. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/tests/__init__.py +0 -0
  161. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/tests/test_adapter.py +0 -0
  162. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/__init__.py +0 -0
  163. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/adapter.py +0 -0
  164. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/tests/__init__.py +0 -0
  165. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/tests/test_adapter.py +0 -0
  166. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/types.py +0 -0
  167. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/__init__.py +0 -0
  168. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/adapter.py +0 -0
  169. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/tests/__init__.py +0 -0
  170. {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/tests/test_adapter.py +0 -0
  171. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/__init__.py +0 -0
  172. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/base.py +0 -0
  173. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/claude.py +0 -0
  174. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/claude_plays_pokemon.py +0 -0
  175. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/langchain.py +0 -0
  176. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/misc/__init__.py +0 -0
  177. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/misc/response_agent.py +0 -0
  178. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/operator.py +0 -0
  179. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/tests/__init__.py +0 -0
  180. {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/tests/test_base.py +0 -0
  181. {hud_python-0.3.4 → hud_python-0.3.5}/hud/datasets.py +0 -0
  182. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/__init__.py +0 -0
  183. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/client.py +0 -0
  184. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/docker_client.py +0 -0
  185. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/environment.py +0 -0
  186. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/local_docker_client.py +0 -0
  187. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/remote_client.py +0 -0
  188. {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/remote_docker_client.py +0 -0
  189. {hud_python-0.3.4 → hud_python-0.3.5}/hud/exceptions.py +0 -0
  190. {hud_python-0.3.4 → hud_python-0.3.5}/hud/gym.py +0 -0
  191. {hud_python-0.3.4 → hud_python-0.3.5}/hud/job.py +0 -0
  192. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/__init__.py +0 -0
  193. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/base.py +0 -0
  194. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/claude.py +0 -0
  195. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/client.py +0 -0
  196. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/langchain.py +0 -0
  197. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/openai.py +0 -0
  198. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/__init__.py +0 -0
  199. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_base.py +0 -0
  200. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_claude.py +0 -0
  201. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_client.py +0 -0
  202. {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_openai.py +0 -0
  203. {hud_python-0.3.4 → hud_python-0.3.5}/hud/py.typed +0 -0
  204. {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/__init__.py +0 -0
  205. {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/requests.py +0 -0
  206. {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/tests/__init__.py +0 -0
  207. {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/tests/test_requests.py +0 -0
  208. {hud_python-0.3.4 → hud_python-0.3.5}/hud/settings.py +0 -0
  209. {hud_python-0.3.4 → hud_python-0.3.5}/hud/task.py +0 -0
  210. {hud_python-0.3.4 → hud_python-0.3.5}/hud/taskset.py +0 -0
  211. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/__init__.py +0 -0
  212. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/_trace.py +0 -0
  213. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/context.py +0 -0
  214. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/exporter.py +0 -0
  215. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/__init__.py +0 -0
  216. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/mcp.py +0 -0
  217. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/registry.py +0 -0
  218. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/job.py +0 -0
  219. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/mcp_models.py +0 -0
  220. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/__init__.py +0 -0
  221. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/test_context.py +0 -0
  222. {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/test_trace.py +0 -0
  223. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/__init__.py +0 -0
  224. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/base.py +0 -0
  225. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/bash.py +0 -0
  226. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/__init__.py +0 -0
  227. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/edit.py +0 -0
  228. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/__init__.py +0 -0
  229. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/base.py +0 -0
  230. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/pyautogui.py +0 -0
  231. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/__init__.py +0 -0
  232. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/test_base_executor.py +0 -0
  233. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/test_pyautogui_executor.py +0 -0
  234. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/xdo.py +0 -0
  235. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/README.md +0 -0
  236. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/__init__.py +0 -0
  237. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/mcp_server.py +0 -0
  238. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/server_initialization.py +0 -0
  239. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/utils.py +0 -0
  240. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/playwright_tool.py +0 -0
  241. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/__init__.py +0 -0
  242. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_bash.py +0 -0
  243. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_computer.py +0 -0
  244. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_computer_actions.py +0 -0
  245. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_edit.py +0 -0
  246. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_init.py +0 -0
  247. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_playwright_tool.py +0 -0
  248. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_tools.py +0 -0
  249. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_utils.py +0 -0
  250. {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/utils.py +0 -0
  251. {hud_python-0.3.4 → hud_python-0.3.5}/hud/trajectory.py +0 -0
  252. {hud_python-0.3.4 → hud_python-0.3.5}/hud/types.py +0 -0
  253. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/__init__.py +0 -0
  254. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/agent.py +0 -0
  255. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/common.py +0 -0
  256. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/config.py +0 -0
  257. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/deprecation.py +0 -0
  258. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/misc.py +0 -0
  259. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/progress.py +0 -0
  260. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/telemetry.py +0 -0
  261. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/__init__.py +0 -0
  262. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_common.py +0 -0
  263. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_config.py +0 -0
  264. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_init.py +0 -0
  265. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_progress.py +0 -0
  266. {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_telemetry.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: hud-python
3
- Version: 0.3.4
3
+ Version: 0.3.5
4
4
  Summary: SDK for the HUD platform.
5
5
  Project-URL: Homepage, https://github.com/hud-evals/hud-python
6
6
  Project-URL: Bug Tracker, https://github.com/hud-evals/hud-python/issues
@@ -18,7 +18,7 @@ Usage:
18
18
  import asyncio
19
19
  import logging
20
20
  from hud.mcp import ClaudeMCPAgent
21
- from hud.task import TaskConfig
21
+ from hud.datasets import TaskConfig
22
22
  from mcp.types import CallToolRequestParams as MCPToolCall
23
23
  from mcp_use import MCPClient
24
24
 
@@ -1,8 +1,12 @@
1
1
  import asyncio
2
2
  import hud
3
- from hud.mcp import ClaudeMCPAgent, OpenAIMCPAgent
4
- from hud.task import TaskConfig
5
- from mcp_use import MCPClient
3
+ from hud.datasets import TaskConfig
4
+ from hud.mcp import ClaudeMCPAgent, OpenAIMCPAgent, MCPClient
5
+ from hud.mcp.base import AgentResult
6
+
7
+ import logging
8
+
9
+ logging.basicConfig(level=logging.INFO)
6
10
 
7
11
 
8
12
  async def main():
@@ -36,18 +40,24 @@ async def main():
36
40
  },
37
41
  "metadata": {"id": "forward-series-b-deck-to-billgates"},
38
42
  }
43
+ # Update the prompt to give a disclaimer that this is a testing environment (anthropic doesn't like doing some actions)
44
+ task_dict["prompt"] = (
45
+ task_dict["prompt"]
46
+ + "\n\nThis is a mock sandbox environment for evaluations, so feel free to execute any actions you want and do not ask me for confirmation before executing actions."
47
+ )
39
48
 
40
49
  # Create TaskConfig from dict
41
50
  task = TaskConfig(**task_dict)
42
51
 
43
52
  print("📡 Defining the environment...")
44
53
  print("🔴 See the agent live at http://localhost:6080/vnc.html")
45
- client = MCPClient.from_dict({"mcp_config": task.mcp_config})
54
+ client = MCPClient(mcp_config=task.mcp_config)
46
55
 
47
56
  agent = ClaudeMCPAgent( # or OpenAIMCPAgent
48
57
  mcp_client=client,
49
58
  model="claude-3-7-sonnet-20250219",
50
- allowed_tools=["computer"],
59
+ # Allowing anthropic_computer tool to be used because we're using ClaudeMCPAgent
60
+ allowed_tools=["anthropic_computer"],
51
61
  initial_screenshot=True,
52
62
  )
53
63
 
@@ -57,16 +67,16 @@ async def main():
57
67
 
58
68
  # Run the task
59
69
  print("🚀 Running the task...")
60
- eval_result = await agent.run(task, max_steps=10)
70
+ eval_result: AgentResult = await agent.run(task, max_steps=30)
61
71
  print(f"🎉 Task Result: {eval_result}")
62
72
 
63
73
  # Show formatted results
64
- reward = eval_result.get("reward", 0.0)
74
+ reward = eval_result.reward
65
75
  print(f" 🏆 Reward: {reward}")
66
76
 
67
77
  # Clean up
68
78
  print("\n🧹 Cleaning up...")
69
- await client.close_all_sessions()
79
+ await client.close()
70
80
  print("✅ Done!")
71
81
 
72
82
 
@@ -1,7 +1,7 @@
1
1
  import asyncio
2
2
  import hud
3
3
  from hud.mcp import ClaudeMCPAgent, OpenAIMCPAgent
4
- from hud.task import TaskConfig
4
+ from hud.datasets import TaskConfig
5
5
  from mcp_use import MCPClient
6
6
 
7
7
 
@@ -68,6 +68,8 @@ class AnthropicComputerTool(HudComputerTool):
68
68
  self,
69
69
  width: int = 1400,
70
70
  height: int = 850,
71
+ environment_width: int = 1920,
72
+ environment_height: int = 1080,
71
73
  display_num: int | None = None,
72
74
  platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
73
75
  rescale_images: bool = False,
@@ -79,6 +81,8 @@ class AnthropicComputerTool(HudComputerTool):
79
81
  Args:
80
82
  width: Target width for rescaling (default: 1400 for Anthropic)
81
83
  height: Target height for rescaling (default: 850 for Anthropic)
84
+ environment_width: Environment screen width (default: 1920)
85
+ environment_height: Environment screen height (default: 1080)
82
86
  display_num: X display number
83
87
  platform_type: Which executor to use:
84
88
  - "auto": Automatically detect based on platform
@@ -91,6 +95,8 @@ class AnthropicComputerTool(HudComputerTool):
91
95
  width=width,
92
96
  height=height,
93
97
  display_num=display_num,
98
+ environment_width=environment_width,
99
+ environment_height=environment_height,
94
100
  platform_type=platform_type,
95
101
  rescale_images=rescale_images,
96
102
  **kwargs,
@@ -16,9 +16,6 @@ from hud.tools.executors.xdo import XDOExecutor
16
16
 
17
17
  logger = logging.getLogger(__name__)
18
18
 
19
- BASE_SCREEN_WIDTH = 1920
20
- BASE_SCREEN_HEIGHT = 1080
21
-
22
19
 
23
20
  class HudComputerTool:
24
21
  """
@@ -29,6 +26,8 @@ class HudComputerTool:
29
26
  self,
30
27
  width: int | None = None,
31
28
  height: int | None = None,
29
+ environment_width: int = 1920,
30
+ environment_height: int = 1080,
32
31
  display_num: int | None = None,
33
32
  platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
34
33
  custom_executor: BaseExecutor | None = None,
@@ -38,8 +37,10 @@ class HudComputerTool:
38
37
  Initialize the HUD computer tool.
39
38
 
40
39
  Args:
41
- width: Target width for rescaling (None = use actual screen width)
42
- height: Target height for rescaling (None = use actual screen height)
40
+ width: Target width for rescaling (None = use environment width)
41
+ height: Target height for rescaling (None = use environment height)
42
+ environment_width: Base screen width
43
+ environment_height: Base screen height
43
44
  display_num: X display number
44
45
  platform_type: Which executor to use:
45
46
  - "auto": Automatically detect based on platform
@@ -49,20 +50,25 @@ class HudComputerTool:
49
50
  rescale_images: If True, rescale screenshots. If False, only rescale action coordinates
50
51
  """
51
52
  # Use provided dimensions or defaults
52
- self.width = width or BASE_SCREEN_WIDTH
53
- self.height = height or BASE_SCREEN_HEIGHT
53
+ self.width = width or environment_width
54
+ self.environment_width = environment_width
55
+
56
+ self.height = height or environment_height
57
+ self.environment_height = environment_height
58
+
54
59
  self.rescale_images = rescale_images
55
60
 
56
61
  logger.info("Width: %s, Height: %s", self.width, self.height)
57
62
  logger.info(
58
- "Base Screen Width: %s, Base Screen Height: %s",
59
- BASE_SCREEN_WIDTH,
60
- BASE_SCREEN_HEIGHT,
63
+ "Environment Screen Width: %s, Environment Screen Height: %s",
64
+ self.environment_width,
65
+ self.environment_height,
61
66
  )
62
67
 
63
68
  # Calculate scaling factors from base screen size to target size
64
- self.scale_x = self.width / BASE_SCREEN_WIDTH
65
- self.scale_y = self.height / BASE_SCREEN_HEIGHT
69
+ self.scale_x = self.width / self.environment_width
70
+
71
+ self.scale_y = self.height / self.environment_height
66
72
 
67
73
  logger.info("Scale X: %s, Scale Y: %s", self.scale_x, self.scale_y)
68
74
  self.scale = min(self.scale_x, self.scale_y)
@@ -51,6 +51,8 @@ class OpenAIComputerTool(HudComputerTool):
51
51
  self,
52
52
  width: int = 1024,
53
53
  height: int = 768,
54
+ environment_width: int = 1920,
55
+ environment_height: int = 1080,
54
56
  display_num: int | None = None,
55
57
  platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
56
58
  rescale_images: bool = False,
@@ -62,6 +64,8 @@ class OpenAIComputerTool(HudComputerTool):
62
64
  Args:
63
65
  width: Target width for rescaling (default: 1024 for OpenAI)
64
66
  height: Target height for rescaling (default: 768 for OpenAI)
67
+ environment_width: Environment screen width (default: 1920)
68
+ environment_height: Environment screen height (default: 1080)
65
69
  display_num: X display number
66
70
  platform_type: Which executor to use:
67
71
  - "auto": Automatically detect based on platform
@@ -73,6 +77,8 @@ class OpenAIComputerTool(HudComputerTool):
73
77
  super().__init__(
74
78
  width=width,
75
79
  height=height,
80
+ environment_width=environment_width,
81
+ environment_height=environment_height,
76
82
  display_num=display_num,
77
83
  platform_type=platform_type,
78
84
  rescale_images=rescale_images,
@@ -5,4 +5,4 @@ def test_import():
5
5
  """Test that the package can be imported."""
6
6
  import hud
7
7
 
8
- assert hud.__version__ == "0.3.4"
8
+ assert hud.__version__ == "0.3.5"
@@ -4,4 +4,4 @@ Version information for the HUD SDK.
4
4
 
5
5
  from __future__ import annotations
6
6
 
7
- __version__ = "0.3.4"
7
+ __version__ = "0.3.5"
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "hud-python"
3
- version = "0.3.4"
3
+ version = "0.3.5"
4
4
  description = "SDK for the HUD platform."
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.11, <3.14"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes