hud-python 0.3.4__tar.gz → 0.3.5__tar.gz
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of hud-python might be problematic. Click here for more details.
- {hud_python-0.3.4 → hud_python-0.3.5}/PKG-INFO +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/simple_task_example.py +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/gmail_local.py +18 -8
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/gmail_remote.py +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/anthropic.py +6 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/hud.py +18 -12
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/openai.py +6 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_version.py +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/version.py +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/pyproject.toml +1 -1
- {hud_python-0.3.4 → hud_python-0.3.5}/.env.example +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/.github/workflows/ci.yml +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/.github/workflows/release.yml +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/.gitignore +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/LICENSE +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/MANIFEST.in +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/cla-details.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/environment-control.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/tracing.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/advanced/uploading.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/adapters.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/env.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/gym.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/job.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/task.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/taskset.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/telemetry.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/api-reference/trajectory.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/adapter.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/agent.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/environment.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/job.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/task.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/concepts/trajectory.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/docs.json +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environment-creation.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/browser.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/custom-environments.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/custom.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/osworld-ubuntu.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/environments/qa.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/alignment-evaluation.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/benchmarking-agents.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/custom-os-env.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/mcp-agent-tracing.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/web-app-testing.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/examples/web-mocks.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/favicon.png +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/logo/hud_logo.svg +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/logo/hud_logo_dark.svg +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/quickstart.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/running-your-agent.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/docs/task-creation.mdx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/.dockerignore +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/.gitignore +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/Dockerfile +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/backend/main.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/backend/pyproject.toml +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/globals.css +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/layout.tsx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/page.tsx +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/next.config.js +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/package-lock.json +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/package.json +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/postcss.config.js +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/tailwind.config.js +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/tsconfig.json +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/launch.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/pyproject.toml +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/__main__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/context.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/todo.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/todo.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/runtime.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/server.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/services.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/todo.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/start.sh +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/docker_debug.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/.gitignore +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/Dockerfile +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/pyproject.toml +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__main__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/browser_executor.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/context.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/cookie_exists.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/cookie_match.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/history_length.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/page_contains.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/raw_last_action_is.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/selector_history.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/sheet_contains.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/sheets_cell_values.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/url_match.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/evaluators/verify_type_action.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/playwright_with_memory.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/element_interaction.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/form_interaction.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/navigate_and_verify.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/problems/search_interaction.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/anchorbrowser.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/browserbase.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/hyperbrowser.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/kernel.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/providers/steel.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/runtime.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/server.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/cookies.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/interact.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/load_html.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/navigate.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/sheets.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/browser_use.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_claude_agent.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_openai_agent.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_test.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/mcp_use_agent.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/agents_tools/sensitive_data.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/pokemon_local.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/pokemon_remote.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/remote.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/resources_example.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/environments/simple_browser_example.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/eval.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/osworld.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/sheetbench_direct_example.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/tasks.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/telemetry_and_datasets.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/evaluations/wordle_example.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/examples/sheets_bench_cua_example.ipynb +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/claude/tests/test_adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/tests/test_adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/common/types.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/adapters/operator/tests/test_adapter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/claude.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/claude_plays_pokemon.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/langchain.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/misc/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/misc/response_agent.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/operator.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/agent/tests/test_base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/datasets.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/docker_client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/environment.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/local_docker_client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/remote_client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/env/remote_docker_client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/exceptions.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/gym.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/job.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/claude.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/langchain.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/openai.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_claude.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_client.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/mcp/tests/test_openai.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/py.typed +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/requests.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/server/tests/test_requests.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/settings.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/task.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/taskset.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/_trace.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/context.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/exporter.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/mcp.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/instrumentation/registry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/job.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/mcp_models.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/test_context.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/telemetry/tests/test_trace.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/bash.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/computer/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/edit.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/base.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/pyautogui.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/test_base_executor.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/tests/test_pyautogui_executor.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/executors/xdo.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/README.md +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/mcp_server.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/server_initialization.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/helper/utils.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/playwright_tool.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_bash.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_computer.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_computer_actions.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_edit.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_init.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_playwright_tool.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_tools.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/tests/test_utils.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/tools/utils.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/trajectory.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/types.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/agent.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/common.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/config.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/deprecation.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/misc.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/progress.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/telemetry.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/__init__.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_common.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_config.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_init.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_progress.py +0 -0
- {hud_python-0.3.4 → hud_python-0.3.5}/hud/utils/tests/test_telemetry.py +0 -0
|
@@ -1,8 +1,12 @@
|
|
|
1
1
|
import asyncio
|
|
2
2
|
import hud
|
|
3
|
-
from hud.
|
|
4
|
-
from hud.
|
|
5
|
-
from
|
|
3
|
+
from hud.datasets import TaskConfig
|
|
4
|
+
from hud.mcp import ClaudeMCPAgent, OpenAIMCPAgent, MCPClient
|
|
5
|
+
from hud.mcp.base import AgentResult
|
|
6
|
+
|
|
7
|
+
import logging
|
|
8
|
+
|
|
9
|
+
logging.basicConfig(level=logging.INFO)
|
|
6
10
|
|
|
7
11
|
|
|
8
12
|
async def main():
|
|
@@ -36,18 +40,24 @@ async def main():
|
|
|
36
40
|
},
|
|
37
41
|
"metadata": {"id": "forward-series-b-deck-to-billgates"},
|
|
38
42
|
}
|
|
43
|
+
# Update the prompt to give a disclaimer that this is a testing environment (anthropic doesn't like doing some actions)
|
|
44
|
+
task_dict["prompt"] = (
|
|
45
|
+
task_dict["prompt"]
|
|
46
|
+
+ "\n\nThis is a mock sandbox environment for evaluations, so feel free to execute any actions you want and do not ask me for confirmation before executing actions."
|
|
47
|
+
)
|
|
39
48
|
|
|
40
49
|
# Create TaskConfig from dict
|
|
41
50
|
task = TaskConfig(**task_dict)
|
|
42
51
|
|
|
43
52
|
print("📡 Defining the environment...")
|
|
44
53
|
print("🔴 See the agent live at http://localhost:6080/vnc.html")
|
|
45
|
-
client = MCPClient
|
|
54
|
+
client = MCPClient(mcp_config=task.mcp_config)
|
|
46
55
|
|
|
47
56
|
agent = ClaudeMCPAgent( # or OpenAIMCPAgent
|
|
48
57
|
mcp_client=client,
|
|
49
58
|
model="claude-3-7-sonnet-20250219",
|
|
50
|
-
|
|
59
|
+
# Allowing anthropic_computer tool to be used because we're using ClaudeMCPAgent
|
|
60
|
+
allowed_tools=["anthropic_computer"],
|
|
51
61
|
initial_screenshot=True,
|
|
52
62
|
)
|
|
53
63
|
|
|
@@ -57,16 +67,16 @@ async def main():
|
|
|
57
67
|
|
|
58
68
|
# Run the task
|
|
59
69
|
print("🚀 Running the task...")
|
|
60
|
-
eval_result = await agent.run(task, max_steps=
|
|
70
|
+
eval_result: AgentResult = await agent.run(task, max_steps=30)
|
|
61
71
|
print(f"🎉 Task Result: {eval_result}")
|
|
62
72
|
|
|
63
73
|
# Show formatted results
|
|
64
|
-
reward = eval_result.
|
|
74
|
+
reward = eval_result.reward
|
|
65
75
|
print(f" 🏆 Reward: {reward}")
|
|
66
76
|
|
|
67
77
|
# Clean up
|
|
68
78
|
print("\n🧹 Cleaning up...")
|
|
69
|
-
await client.
|
|
79
|
+
await client.close()
|
|
70
80
|
print("✅ Done!")
|
|
71
81
|
|
|
72
82
|
|
|
@@ -68,6 +68,8 @@ class AnthropicComputerTool(HudComputerTool):
|
|
|
68
68
|
self,
|
|
69
69
|
width: int = 1400,
|
|
70
70
|
height: int = 850,
|
|
71
|
+
environment_width: int = 1920,
|
|
72
|
+
environment_height: int = 1080,
|
|
71
73
|
display_num: int | None = None,
|
|
72
74
|
platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
|
|
73
75
|
rescale_images: bool = False,
|
|
@@ -79,6 +81,8 @@ class AnthropicComputerTool(HudComputerTool):
|
|
|
79
81
|
Args:
|
|
80
82
|
width: Target width for rescaling (default: 1400 for Anthropic)
|
|
81
83
|
height: Target height for rescaling (default: 850 for Anthropic)
|
|
84
|
+
environment_width: Environment screen width (default: 1920)
|
|
85
|
+
environment_height: Environment screen height (default: 1080)
|
|
82
86
|
display_num: X display number
|
|
83
87
|
platform_type: Which executor to use:
|
|
84
88
|
- "auto": Automatically detect based on platform
|
|
@@ -91,6 +95,8 @@ class AnthropicComputerTool(HudComputerTool):
|
|
|
91
95
|
width=width,
|
|
92
96
|
height=height,
|
|
93
97
|
display_num=display_num,
|
|
98
|
+
environment_width=environment_width,
|
|
99
|
+
environment_height=environment_height,
|
|
94
100
|
platform_type=platform_type,
|
|
95
101
|
rescale_images=rescale_images,
|
|
96
102
|
**kwargs,
|
|
@@ -16,9 +16,6 @@ from hud.tools.executors.xdo import XDOExecutor
|
|
|
16
16
|
|
|
17
17
|
logger = logging.getLogger(__name__)
|
|
18
18
|
|
|
19
|
-
BASE_SCREEN_WIDTH = 1920
|
|
20
|
-
BASE_SCREEN_HEIGHT = 1080
|
|
21
|
-
|
|
22
19
|
|
|
23
20
|
class HudComputerTool:
|
|
24
21
|
"""
|
|
@@ -29,6 +26,8 @@ class HudComputerTool:
|
|
|
29
26
|
self,
|
|
30
27
|
width: int | None = None,
|
|
31
28
|
height: int | None = None,
|
|
29
|
+
environment_width: int = 1920,
|
|
30
|
+
environment_height: int = 1080,
|
|
32
31
|
display_num: int | None = None,
|
|
33
32
|
platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
|
|
34
33
|
custom_executor: BaseExecutor | None = None,
|
|
@@ -38,8 +37,10 @@ class HudComputerTool:
|
|
|
38
37
|
Initialize the HUD computer tool.
|
|
39
38
|
|
|
40
39
|
Args:
|
|
41
|
-
width: Target width for rescaling (None = use
|
|
42
|
-
height: Target height for rescaling (None = use
|
|
40
|
+
width: Target width for rescaling (None = use environment width)
|
|
41
|
+
height: Target height for rescaling (None = use environment height)
|
|
42
|
+
environment_width: Base screen width
|
|
43
|
+
environment_height: Base screen height
|
|
43
44
|
display_num: X display number
|
|
44
45
|
platform_type: Which executor to use:
|
|
45
46
|
- "auto": Automatically detect based on platform
|
|
@@ -49,20 +50,25 @@ class HudComputerTool:
|
|
|
49
50
|
rescale_images: If True, rescale screenshots. If False, only rescale action coordinates
|
|
50
51
|
"""
|
|
51
52
|
# Use provided dimensions or defaults
|
|
52
|
-
self.width = width or
|
|
53
|
-
self.
|
|
53
|
+
self.width = width or environment_width
|
|
54
|
+
self.environment_width = environment_width
|
|
55
|
+
|
|
56
|
+
self.height = height or environment_height
|
|
57
|
+
self.environment_height = environment_height
|
|
58
|
+
|
|
54
59
|
self.rescale_images = rescale_images
|
|
55
60
|
|
|
56
61
|
logger.info("Width: %s, Height: %s", self.width, self.height)
|
|
57
62
|
logger.info(
|
|
58
|
-
"
|
|
59
|
-
|
|
60
|
-
|
|
63
|
+
"Environment Screen Width: %s, Environment Screen Height: %s",
|
|
64
|
+
self.environment_width,
|
|
65
|
+
self.environment_height,
|
|
61
66
|
)
|
|
62
67
|
|
|
63
68
|
# Calculate scaling factors from base screen size to target size
|
|
64
|
-
self.scale_x = self.width /
|
|
65
|
-
|
|
69
|
+
self.scale_x = self.width / self.environment_width
|
|
70
|
+
|
|
71
|
+
self.scale_y = self.height / self.environment_height
|
|
66
72
|
|
|
67
73
|
logger.info("Scale X: %s, Scale Y: %s", self.scale_x, self.scale_y)
|
|
68
74
|
self.scale = min(self.scale_x, self.scale_y)
|
|
@@ -51,6 +51,8 @@ class OpenAIComputerTool(HudComputerTool):
|
|
|
51
51
|
self,
|
|
52
52
|
width: int = 1024,
|
|
53
53
|
height: int = 768,
|
|
54
|
+
environment_width: int = 1920,
|
|
55
|
+
environment_height: int = 1080,
|
|
54
56
|
display_num: int | None = None,
|
|
55
57
|
platform_type: Literal["auto", "xdo", "pyautogui"] = "auto",
|
|
56
58
|
rescale_images: bool = False,
|
|
@@ -62,6 +64,8 @@ class OpenAIComputerTool(HudComputerTool):
|
|
|
62
64
|
Args:
|
|
63
65
|
width: Target width for rescaling (default: 1024 for OpenAI)
|
|
64
66
|
height: Target height for rescaling (default: 768 for OpenAI)
|
|
67
|
+
environment_width: Environment screen width (default: 1920)
|
|
68
|
+
environment_height: Environment screen height (default: 1080)
|
|
65
69
|
display_num: X display number
|
|
66
70
|
platform_type: Which executor to use:
|
|
67
71
|
- "auto": Automatically detect based on platform
|
|
@@ -73,6 +77,8 @@ class OpenAIComputerTool(HudComputerTool):
|
|
|
73
77
|
super().__init__(
|
|
74
78
|
width=width,
|
|
75
79
|
height=height,
|
|
80
|
+
environment_width=environment_width,
|
|
81
|
+
environment_height=environment_height,
|
|
76
82
|
display_num=display_num,
|
|
77
83
|
platform_type=platform_type,
|
|
78
84
|
rescale_images=rescale_images,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/globals.css
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/app/layout.tsx
RENAMED
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/next.config.js
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/package-lock.json
RENAMED
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/postcss.config.js
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/apps/todo/frontend/tailwind.config.js
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/__init__.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/context.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/registry.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/evaluators/todo.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/__init__.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/registry.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/problems/todo.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/__init__.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/browser/src/hud_controller/setup/registry.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__init__.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/__main__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/runtime.py
RENAMED
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/server.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hud_python-0.3.4 → hud_python-0.3.5}/environments/remote_browser/src/hud_controller/setup/sheets.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|