PyPI - hud-python - Versions diffs - 0.4.34__py3-none-any.whl → 0.4.36__py3-none-any.whl - Mend

hud-python 0.4.34__py3-none-any.whl → 0.4.36__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (40) hide show

hud/agents/claude.py +9 -1
hud/agents/openai.py +9 -1
hud/agents/tests/test_claude.py +32 -7
hud/agents/tests/test_openai.py +29 -6
hud/cli/__init__.py +209 -75
hud/cli/build.py +10 -5
hud/cli/dev.py +20 -39
hud/cli/eval.py +4 -3
hud/cli/flows/tasks.py +1 -0
hud/cli/init.py +222 -629
hud/cli/pull.py +6 -0
hud/cli/push.py +2 -1
hud/cli/rl/remote_runner.py +3 -1
hud/cli/tests/test_build.py +3 -27
hud/cli/tests/test_mcp_server.py +1 -12
hud/cli/utils/config.py +85 -0
hud/cli/utils/docker.py +21 -39
hud/cli/utils/environment.py +4 -3
hud/cli/utils/interactive.py +2 -1
hud/cli/utils/local_runner.py +204 -0
hud/cli/utils/metadata.py +3 -1
hud/cli/utils/package_runner.py +292 -0
hud/cli/utils/remote_runner.py +4 -1
hud/clients/mcp_use.py +30 -7
hud/datasets/parallel.py +3 -1
hud/datasets/runner.py +5 -2
hud/otel/context.py +38 -4
hud/rl/buffer.py +3 -0
hud/rl/tests/test_learner.py +1 -1
hud/server/server.py +157 -1
hud/settings.py +38 -0
hud/shared/hints.py +1 -1
hud/utils/tests/test_version.py +1 -1
hud/utils/tool_shorthand.py +7 -4
hud/version.py +1 -1
{hud_python-0.4.34.dist-info → hud_python-0.4.36.dist-info}/METADATA +30 -12
{hud_python-0.4.34.dist-info → hud_python-0.4.36.dist-info}/RECORD +40 -37
{hud_python-0.4.34.dist-info → hud_python-0.4.36.dist-info}/WHEEL +0 -0
{hud_python-0.4.34.dist-info → hud_python-0.4.36.dist-info}/entry_points.txt +0 -0
{hud_python-0.4.34.dist-info → hud_python-0.4.36.dist-info}/licenses/LICENSE +0 -0

hud/agents/claude.py CHANGED Viewed

@@ -6,7 +6,7 @@ import copy
 import logging
 from typing import TYPE_CHECKING, Any, ClassVar, cast
-from anthropic import AsyncAnthropic, BadRequestError
+from anthropic import Anthropic, AsyncAnthropic, BadRequestError
 from anthropic.types.beta import BetaContentBlockParam, BetaImageBlockParam, BetaTextBlockParam
 import hud
@@ -54,6 +54,7 @@ class ClaudeAgent(MCPAgent):
         model: str = "claude-sonnet-4-20250514",
         max_tokens: int = 4096,
         use_computer_beta: bool = True,
+        validate_api_key: bool = True,
         **kwargs: Any,
     ) -> None:
         """
@@ -75,6 +76,13 @@ class ClaudeAgent(MCPAgent):
                 raise ValueError("Anthropic API key not found. Set ANTHROPIC_API_KEY.")
             model_client = AsyncAnthropic(api_key=api_key)
+        # validate api key if requested
+        if validate_api_key:
+            try:
+                Anthropic(api_key=model_client.api_key).models.list()
+            except Exception as e:
+                raise ValueError(f"Anthropic API key is invalid: {e}") from e
         self.anthropic_client = model_client
         self.model = model
         self.max_tokens = max_tokens

hud/agents/openai.py CHANGED Viewed

@@ -6,7 +6,7 @@ import logging
 from typing import Any, ClassVar, Literal
 import mcp.types as types
-from openai import AsyncOpenAI
+from openai import AsyncOpenAI, OpenAI
 from openai.types.responses import (
     ResponseComputerToolCall,
     ResponseInputMessageContentListParam,
@@ -45,6 +45,7 @@ class OperatorAgent(MCPAgent):
         model_client: AsyncOpenAI | None = None,
         model: str = "computer-use-preview",
         environment: Literal["windows", "mac", "linux", "browser"] = "linux",
+        validate_api_key: bool = True,
         **kwargs: Any,
     ) -> None:
         """
@@ -76,6 +77,13 @@ class OperatorAgent(MCPAgent):
         self.pending_call_id: str | None = None
         self.pending_safety_checks: list[Any] = []
+        # validate api key if requested
+        if validate_api_key:
+            try:
+                OpenAI(api_key=self.openai_client.api_key).models.list()
+            except Exception as e:
+                raise ValueError(f"OpenAI API key is invalid: {e}") from e
         self.model_name = "openai-" + self.model
         # Append OpenAI-specific instructions to the base system prompt

hud/agents/tests/test_claude.py CHANGED Viewed

@@ -86,6 +86,7 @@ class TestClaudeAgent:
             model_client=mock_model_client,
             model="claude-3-opus-20240229",
             max_tokens=1000,
+            validate_api_key=False,  # Skip validation in tests
         )
         assert agent.model_name == "claude-3-opus-20240229"
@@ -93,10 +94,14 @@ class TestClaudeAgent:
         assert agent.anthropic_client == mock_model_client
     @pytest.mark.asyncio
-    async def test_init_without_model_client(self, mock_mcp_client):
+    async def test_init_without_model_client(self, mock_mcp_client, mock_anthropic):
         """Test agent initialization without model client."""
         with patch("hud.settings.settings.anthropic_api_key", "test_key"):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model="claude-3-opus-20240229")
+            agent = ClaudeAgent(
+                mcp_client=mock_mcp_client,
+                model="claude-3-opus-20240229",
+                validate_api_key=False,  # Skip validation in tests
+            )
             assert agent.model_name == "claude-3-opus-20240229"
             assert agent.anthropic_client is not None
@@ -105,7 +110,11 @@ class TestClaudeAgent:
     async def test_format_blocks(self, mock_mcp_client):
         """Test formatting content blocks into Claude messages."""
         mock_model_client = MagicMock()
-        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
+        agent = ClaudeAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_model_client,
+            validate_api_key=False,  # Skip validation in tests
+        )
         # Test with text only
         text_blocks: list[types.ContentBlock] = [
@@ -141,7 +150,11 @@ class TestClaudeAgent:
     async def test_format_tool_results_method(self, mock_mcp_client):
         """Test the agent's format_tool_results method."""
         mock_model_client = MagicMock()
-        agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
+        agent = ClaudeAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_model_client,
+            validate_api_key=False,  # Skip validation in tests
+        )
         tool_calls = [
             MCPToolCall(name="test_tool", arguments={}, id="id1"),
@@ -171,7 +184,11 @@ class TestClaudeAgent:
         """Test getting model response from Claude API."""
         # Disable telemetry for this test to avoid backend configuration issues
         with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            agent = ClaudeAgent(
+                mcp_client=mock_mcp_client,
+                model_client=mock_anthropic,
+                validate_api_key=False,  # Skip validation in tests
+            )
             # Mock the API response
             mock_response = MagicMock()
@@ -215,7 +232,11 @@ class TestClaudeAgent:
         """Test getting text-only response."""
         # Disable telemetry for this test to avoid backend configuration issues
         with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            agent = ClaudeAgent(
+                mcp_client=mock_mcp_client,
+                model_client=mock_anthropic,
+                validate_api_key=False,  # Skip validation in tests
+            )
             mock_response = MagicMock()
             # Create text block
@@ -242,7 +263,11 @@ class TestClaudeAgent:
         """Test handling API errors."""
         # Disable telemetry for this test to avoid backend configuration issues
         with patch("hud.settings.settings.telemetry_enabled", False):
-            agent = ClaudeAgent(mcp_client=mock_mcp_client, model_client=mock_anthropic)
+            agent = ClaudeAgent(
+                mcp_client=mock_mcp_client,
+                model_client=mock_anthropic,
+                validate_api_key=False,  # Skip validation in tests
+            )
             # Mock API error
             mock_anthropic.beta.messages.create = AsyncMock(

hud/agents/tests/test_openai.py CHANGED Viewed

@@ -44,7 +44,10 @@ class TestOperatorAgent:
         """Test agent initialization."""
         mock_model_client = MagicMock()
         agent = OperatorAgent(
-            mcp_client=mock_mcp_client, model_client=mock_model_client, model="gpt-4"
+            mcp_client=mock_mcp_client,
+            model_client=mock_model_client,
+            model="gpt-4",
+            validate_api_key=False,  # Skip validation in tests
         )
         assert agent.model_name == "openai-gpt-4"
@@ -55,7 +58,11 @@ class TestOperatorAgent:
     async def test_format_blocks(self, mock_mcp_client):
         """Test formatting content blocks."""
         mock_model_client = MagicMock()
-        agent = OperatorAgent(mcp_client=mock_mcp_client, model_client=mock_model_client)
+        agent = OperatorAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_model_client,
+            validate_api_key=False,  # Skip validation in tests
+        )
         # Test with text blocks
         blocks: list[types.ContentBlock] = [
@@ -85,7 +92,11 @@ class TestOperatorAgent:
     @pytest.mark.asyncio
     async def test_format_tool_results(self, mock_mcp_client, mock_openai):
         """Test formatting tool results."""
-        agent = OperatorAgent(mcp_client=mock_mcp_client, model_client=mock_openai)
+        agent = OperatorAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_openai,
+            validate_api_key=False,  # Skip validation in tests
+        )
         tool_calls = [
             MCPToolCall(name="test_tool", arguments={}, id="call_123"),  # type: ignore
@@ -111,7 +122,11 @@ class TestOperatorAgent:
     @pytest.mark.asyncio
     async def test_format_tool_results_with_error(self, mock_mcp_client, mock_openai):
         """Test formatting tool results with errors."""
-        agent = OperatorAgent(mcp_client=mock_mcp_client, model_client=mock_openai)
+        agent = OperatorAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_openai,
+            validate_api_key=False,  # Skip validation in tests
+        )
         tool_calls = [
             MCPToolCall(name="failing_tool", arguments={}, id="call_error"),  # type: ignore
@@ -131,7 +146,11 @@ class TestOperatorAgent:
     @pytest.mark.asyncio
     async def test_get_model_response(self, mock_mcp_client, mock_openai):
         """Test getting model response from OpenAI API."""
-        agent = OperatorAgent(mcp_client=mock_mcp_client, model_client=mock_openai)
+        agent = OperatorAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_openai,
+            validate_api_key=False,  # Skip validation in tests
+        )
         # Set up available tools so agent doesn't return "No computer use tools available"
         agent._available_tools = [
@@ -162,7 +181,11 @@ class TestOperatorAgent:
     @pytest.mark.asyncio
     async def test_handle_empty_response(self, mock_mcp_client, mock_openai):
         """Test handling empty response from API."""
-        agent = OperatorAgent(mcp_client=mock_mcp_client, model_client=mock_openai)
+        agent = OperatorAgent(
+            mcp_client=mock_mcp_client,
+            model_client=mock_openai,
+            validate_api_key=False,  # Skip validation in tests
+        )
         # Set up available tools
         agent._available_tools = [

hud/cli/__init__.py CHANGED Viewed

@@ -3,6 +3,7 @@
 from __future__ import annotations
 import asyncio
+import contextlib
 import json
 import sys
 from pathlib import Path
@@ -28,6 +29,7 @@ from .init import create_environment
 from .pull import pull_command
 from .push import push_command
 from .remove import remove_command
+from .utils.config import set_env_values
 from .utils.cursor import get_cursor_config_path, list_cursor_servers, parse_cursor_config
 from .utils.logging import CaptureLogger
@@ -116,7 +118,9 @@ def analyze(
         image, *docker_args = params
         if live or docker_args:  # If docker args provided, assume live mode
             # Build Docker command from image and args
-            docker_cmd = ["docker", "run", "--rm", "-i", *docker_args, image]
+            from .utils.docker import build_run_command
+            docker_cmd = build_run_command(image, docker_args)
             asyncio.run(analyze_environment(docker_cmd, output_format, verbose))
         else:
             # Fast mode - analyze from metadata
@@ -239,11 +243,15 @@ def debug(
                     raise typer.Exit(1)
             # Build Docker command
-            command = ["docker", "run", "--rm", "-i", *docker_args, image_name]
+            from .utils.docker import build_run_command
+            command = build_run_command(image_name, docker_args)
         else:
             # Assume it's an image name
             image = first_param
-            command = ["docker", "run", "--rm", "-i", *docker_args, image]
+            from .utils.docker import build_run_command
+            command = build_run_command(image, docker_args)
     else:
         console.print(
             "[red]Error: Must specify a directory, Docker image, --config, or --cursor[/red]"
@@ -370,12 +378,10 @@ def dev(
         False, "--interactive", help="Launch interactive testing mode (HTTP mode only)"
     ),
 ) -> None:
-    """🔥 Development mode with hot-reload.
-    Runs your MCP environment in Docker with automatic restart on file changes.
+    """🔥 Development mode - interactive MCP environment.
-    The container's last command (typically the MCP server) will be wrapped
-    with watchfiles for hot-reload functionality.
+    Runs your MCP environment in Docker with mounted source for development.
+    The container's CMD determines reload behavior.
     Examples:
         hud dev                      # Auto-detect in current directory
@@ -388,13 +394,12 @@ def dev(
         hud dev . --inspector        # Launch MCP Inspector (HTTP mode only)
         hud dev . --interactive      # Launch interactive testing mode (HTTP mode only)
         hud dev . --no-logs          # Disable Docker log streaming
-        hud dev . --full-reload      # Restart entire container on file changes (instead of just server)
         # With Docker arguments (after all options):
         hud dev . -e BROWSER_PROVIDER=anchorbrowser -e ANCHOR_API_KEY=xxx
         hud dev . -e API_KEY=secret -v /tmp/data:/data --network host
         hud dev . --build -e DEBUG=true --memory 2g
-    """  # noqa: E501
+    """
     # Parse directory and Docker arguments
     if params:
         directory = params[0]
@@ -424,7 +429,7 @@ def dev(
 def run(
     params: list[str] = typer.Argument(  # type: ignore[arg-type]  # noqa: B008
         None,
-        help="Docker image followed by optional arguments (e.g., 'hud-image:latest -e KEY=value')",
+        help="Python file/module/package or Docker image followed by optional arguments",
     ),
     local: bool = typer.Option(
         False,
@@ -474,32 +479,152 @@ def run(
         "--interactive",
         help="Launch interactive testing mode (HTTP transport only)",
     ),
+    reload: bool = typer.Option(
+        False,
+        "--reload",
+        help="Enable auto-reload on file changes (local Python files only)",
+    ),
+    watch: list[str] = typer.Option(  # noqa: B008
+        None,
+        "--watch",
+        help="Directories to watch for changes (can be used multiple times). Defaults to current directory.",  # noqa: E501
+    ),
+    cmd: str | None = typer.Option(
+        None,
+        "--cmd",
+        help="Command to run as MCP server (e.g., 'python -m controller')",
+    ),
 ) -> None:
-    """🚀 Run MCP server locally or remotely.
+    """🚀 Run MCP server.
-    By default, runs remotely via mcp.hud.so. Use --local for Docker.
+    Modes:
+    - Python (decorator-based): pass a dotted module path. Example: hud run controller
+      The module is imported, decorators register implicitly, and the server runs.
+      Use --reload to watch the module/package directory.
-    Remote Examples:
-        hud run hud-text-2048:latest
-        hud run my-server:v1 -e API_KEY=xxx -h Run-Id:abc123
-        hud run my-server:v1 --transport http --port 9000
+    - Command: use --cmd to run any command as an MCP server. Example: hud run --cmd "python -m controller"
+      Works with Docker, binaries, or any executable. Supports --reload.
-    Local Examples:
-        hud run --local hud-text-2048:latest
-        hud run --local my-server:v1 -e API_KEY=xxx
-        hud run --local my-server:v1 --transport http
-    Interactive Testing (local only):
-        hud run --local --interactive --transport http hud-text-2048:latest
-        hud run --local --interactive --transport http --port 9000 my-server:v1
-    """
-    if not params:
-        typer.echo("❌ Docker image is required")
+    - Docker image: pass a Docker image name (optionally with --local to run locally).
+    """  # noqa: E501
+    if not params and not cmd:
+        typer.echo("❌ Dotted module path, Docker image, or --cmd is required")
         raise typer.Exit(1)
-    # Parse image and args
-    image = params[0]
-    docker_args = params[1:] if len(params) > 1 else []
+    # Handle --cmd mode
+    if cmd:
+        import asyncio
+        from .utils.package_runner import run_package_as_mcp
+        asyncio.run(
+            run_package_as_mcp(
+                cmd,  # Pass command string
+                transport=transport,
+                port=port,
+                verbose=verbose,
+                reload=reload,
+                watch_paths=watch if watch else None,
+            )
+        )
+        return
+    first_param = params[0]
+    extra_args = params[1:] if len(params) > 1 else []
+    # Guard: strip accidental nested 'run' token from positional args,
+    # which can happen with nested invocations or reload wrappers.
+    if first_param == "run" and extra_args:
+        first_param, extra_args = extra_args[0], extra_args[1:]
+    # Try to interpret first_param as module[:attr] or file[:attr]
+    target = first_param
+    server_attr = "mcp"
+    if ":" in target:
+        target, server_attr = target.split(":", 1)
+    # Only allow dotted import paths or python files for Python mode
+    import importlib.util as _importlib_util
+    # Ensure current working directory is importable for local packages like 'controller'
+    try:
+        import sys as _sys
+        from pathlib import Path as _Path
+        cwd_str = str(_Path.cwd())
+        if cwd_str not in _sys.path:
+            _sys.path.insert(0, cwd_str)
+    except Exception:  # noqa: S110
+        pass
+    try:
+        # If given a file path, detect and import via file spec
+        from pathlib import Path as _Path
+        if target.endswith(".py") and _Path(target).exists():
+            spec = _importlib_util.spec_from_file_location("_hud_module", target)
+        else:
+            spec = _importlib_util.find_spec(target)
+    except Exception:
+        spec = None
+    # Fallback: treat a local package directory (e.g. 'controller') as a module target
+    from pathlib import Path as _Path
+    pkg_dir = _Path(target)
+    is_pkg_dir = pkg_dir.is_dir() and (pkg_dir / "__init__.py").exists()
+    is_python_target = (spec is not None) or is_pkg_dir
+    if is_python_target and not (local or remote):
+        # Python file/package mode - use implicit MCP server
+        import asyncio
+        from .utils.package_runner import run_package_as_mcp, run_with_reload
+        if reload:
+            # Run with watchfiles reload
+            # Use user-provided watch paths or compute from module
+            if watch:
+                watch_paths = watch
+            else:
+                # Compute a watch path that works for dotted modules as well
+                watch_paths = [target]
+                if spec is not None:
+                    origin = getattr(spec, "origin", None)
+                    sublocs = getattr(spec, "submodule_search_locations", None)
+                    if origin:
+                        p = _Path(origin)
+                        # If package __init__.py, watch the package directory
+                        watch_paths = [str(p.parent if p.name == "__init__.py" else p)]
+                    elif sublocs:
+                        with contextlib.suppress(Exception):
+                            watch_paths = [next(iter(sublocs))]
+            # Always run as subprocess when using reload to enable proper file watching
+            # This ensures the parent process can watch files while the child runs the server
+            run_with_reload(
+                None,  # This forces subprocess mode for both stdio and http
+                watch_paths,
+                verbose=verbose,
+            )
+        else:
+            # Run normally (but still pass reload=False for consistency)
+            asyncio.run(
+                run_package_as_mcp(
+                    target,
+                    transport=transport,
+                    port=port,
+                    verbose=verbose,
+                    server_attr=server_attr,
+                    reload=False,  # Explicitly pass reload state
+                    watch_paths=None,
+                )
+            )
+        return
+    # Docker image mode
+    image = first_param
+    docker_args = extra_args
     # Handle conflicting flags
     if local and remote:
@@ -741,6 +866,12 @@ def remove(
 @app.command()
 def init(
     name: str = typer.Argument(None, help="Environment name (default: current directory name)"),
+    preset: str | None = typer.Option(
+        None,
+        "--preset",
+        "-p",
+        help="Preset to use: blank, deep-research, browser. If omitted, you'll choose interactively.",  # noqa: E501
+    ),
     directory: str = typer.Option(".", "--dir", "-d", help="Target directory"),
     force: bool = typer.Option(False, "--force", "-f", help="Overwrite existing files"),
 ) -> None:
@@ -757,7 +888,7 @@ def init(
         hud init my-env             # Create in ./my-env/
         hud init my-env --dir /tmp  # Create in /tmp/my-env/
     """
-    create_environment(name, directory, force)
+    create_environment(name, directory, force, preset)
 @app.command()
@@ -774,7 +905,7 @@ def eval(
     source: str | None = typer.Argument(
         None,
         help=(
-            "HuggingFace dataset identifier (e.g. 'hud-evals/SheetBench-50') or task JSON file. "
+            "HuggingFace dataset (e.g. 'hud-evals/SheetBench-50') or task JSON file. "
             "If not provided, looks for task.json in current directory."
         ),
     ),
@@ -846,54 +977,21 @@ def eval(
     hud_console = HUDConsole()
-    # If no source provided, look for task/eval JSON files in current directory
+    # If no source provided, reuse RL helper to find a tasks file interactively
     if source is None:
-        # Search for JSON files with "task" or "eval" in the name (case-insensitive)
-        json_files = []
-        patterns = [
-            "*task*.json",
-            "*eval*.json",
-            "*Task*.json",
-            "*Eval*.json",
-            "*TASK*.json",
-            "*EVAL*.json",
-        ]
-        # First check current directory
-        for pattern in patterns:
-            json_files.extend(Path(".").glob(pattern))
-        # If no files found, search recursively (but limit depth to avoid deep searches)
-        if not json_files:
-            for pattern in patterns:
-                # Search up to 2 levels deep
-                json_files.extend(Path(".").glob(f"*/{pattern}"))
-                json_files.extend(Path(".").glob(f"*/*/{pattern}"))
-        # Remove duplicates and sort
-        json_files = sorted(set(json_files))
-        if not json_files:
+        try:
+            from hud.cli.utils.tasks import find_tasks_file
+            source = find_tasks_file(None, msg="Select a tasks file to run")
+            hud_console.success(f"Selected: {source}")
+        except Exception as e:
             hud_console.error(
                 "No source provided and no task/eval JSON files found in current directory"
             )
             hud_console.info(
-                "Usage: hud eval <source> or create a task JSON file "
-                "(e.g., task.json, eval_config.json)"
-            )
-            raise typer.Exit(1)
-        elif len(json_files) == 1:
-            source = str(json_files[0])
-            hud_console.info(f"Found task file: {source}")
-        else:
-            # Multiple files found, let user choose
-            hud_console.info("Multiple task files found:")
-            file_choice = hud_console.select(
-                "Select a task file to run:",
-                choices=[str(f) for f in json_files],
+                "Usage: hud eval <source> or create a task JSON file (e.g., task.json, tasks.jsonl)"
             )
-            source = file_choice
-            hud_console.success(f"Selected: {source}")
+            raise typer.Exit(1) from e
     # Import eval_command lazily to avoid importing agent dependencies
     try:
@@ -1085,6 +1183,42 @@ def rl(
     )
+@app.command()
+def set(
+    assignments: list[str] = typer.Argument(  # type: ignore[arg-type]  # noqa: B008
+        ..., help="One or more KEY=VALUE pairs to persist in ~/.hud/.env"
+    ),
+) -> None:
+    """Persist API keys or other variables for HUD to use by default.
+    Examples:
+        hud set ANTHROPIC_API_KEY=sk-... OPENAI_API_KEY=sk-...
+    Values are stored in ~/.hud/.env and are loaded by hud.settings with
+    the lowest precedence (overridden by process env and project .env).
+    """
+    from hud.utils.hud_console import HUDConsole
+    hud_console = HUDConsole()
+    updates: dict[str, str] = {}
+    for item in assignments:
+        if "=" not in item:
+            hud_console.error(f"Invalid assignment (expected KEY=VALUE): {item}")
+            raise typer.Exit(1)
+        key, value = item.split("=", 1)
+        key = key.strip()
+        value = value.strip()
+        if not key:
+            hud_console.error(f"Invalid key in assignment: {item}")
+            raise typer.Exit(1)
+        updates[key] = value
+    path = set_env_values(updates)
+    hud_console.success("Saved credentials to user config")
+    hud_console.info(f"Location: {path}")
 def main() -> None:
     """Main entry point for the CLI."""
     # Handle --version flag before Typer parses args

hud/cli/build.py CHANGED Viewed

@@ -236,10 +236,13 @@ def build_docker_image(
         hud_console.error(f"No Dockerfile found in {directory}")
         return False
+    # Default platform to match RL pipeline unless explicitly overridden
+    effective_platform = platform if platform is not None else "linux/amd64"
     # Build command
     cmd = ["docker", "build"]
-    if platform:
-        cmd.extend(["--platform", platform])
+    if effective_platform:
+        cmd.extend(["--platform", effective_platform])
     cmd.extend(["-t", tag])
     if no_cache:
         cmd.append("--no-cache")
@@ -437,8 +440,10 @@ def build_environment(
     version_tag = f"{base_name}:{new_version}"
     label_cmd = ["docker", "build"]
-    if platform is not None:
-        label_cmd.extend(["--platform", platform])
+    # Use same defaulting for the second build step
+    label_platform = platform if platform is not None else "linux/amd64"
+    if label_platform:
+        label_cmd.extend(["--platform", label_platform])
     label_cmd.extend(
         [
             "--label",
@@ -489,7 +494,7 @@ def build_environment(
         hud_console.warning("Could not retrieve image ID for lock file")
     # Remove temp image after we're done
-    subprocess.run(["docker", "rmi", temp_tag], capture_output=True)  # noqa: S603, S607
+    subprocess.run(["docker", "rmi", "-f", temp_tag], capture_output=True)  # noqa: S603, S607
     # Add to local registry
     if image_id:

hud-python 0.4.34__py3-none-any.whl → 0.4.36__py3-none-any.whl

Potentially problematic release.

hud-python 0.4.34__py3-none-any.whl → 0.4.36__py3-none-any.whl