PyPI - hud-python - Versions diffs - 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl - Mend

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (282)

hud/__init__.py +27 -7
hud/agents/__init__.py +70 -5
hud/agents/base.py +238 -500
hud/agents/claude.py +236 -247
hud/agents/gateway.py +42 -0
hud/agents/gemini.py +264 -0
hud/agents/gemini_cua.py +324 -0
hud/agents/grounded_openai.py +98 -100
hud/agents/misc/integration_test_agent.py +51 -20
hud/agents/misc/response_agent.py +48 -36
hud/agents/openai.py +282 -296
hud/agents/{openai_chat_generic.py → openai_chat.py} +63 -33
hud/agents/operator.py +199 -0
hud/agents/resolver.py +70 -0
hud/agents/tests/conftest.py +133 -0
hud/agents/tests/test_base.py +300 -622
hud/agents/tests/test_base_runtime.py +233 -0
hud/agents/tests/test_claude.py +381 -214
hud/agents/tests/test_client.py +9 -10
hud/agents/tests/test_gemini.py +369 -0
hud/agents/tests/test_grounded_openai_agent.py +65 -50
hud/agents/tests/test_openai.py +377 -140
hud/agents/tests/test_operator.py +362 -0
hud/agents/tests/test_resolver.py +192 -0
hud/agents/tests/test_run_eval.py +179 -0
hud/agents/types.py +148 -0
hud/cli/__init__.py +493 -546
hud/cli/analyze.py +43 -5
hud/cli/build.py +699 -113
hud/cli/debug.py +8 -5
hud/cli/dev.py +889 -732
hud/cli/eval.py +793 -667
hud/cli/flows/dev.py +167 -0
hud/cli/flows/init.py +191 -0
hud/cli/flows/tasks.py +153 -56
hud/cli/flows/templates.py +151 -0
hud/cli/flows/tests/__init__.py +1 -0
hud/cli/flows/tests/test_dev.py +126 -0
hud/cli/init.py +60 -58
hud/cli/pull.py +1 -1
hud/cli/push.py +38 -13
hud/cli/rft.py +311 -0
hud/cli/rft_status.py +145 -0
hud/cli/tests/test_analyze.py +5 -5
hud/cli/tests/test_analyze_metadata.py +3 -2
hud/cli/tests/test_analyze_module.py +120 -0
hud/cli/tests/test_build.py +110 -8
hud/cli/tests/test_build_failure.py +41 -0
hud/cli/tests/test_build_module.py +50 -0
hud/cli/tests/test_cli_init.py +6 -1
hud/cli/tests/test_cli_more_wrappers.py +30 -0
hud/cli/tests/test_cli_root.py +140 -0
hud/cli/tests/test_convert.py +361 -0
hud/cli/tests/test_debug.py +12 -10
hud/cli/tests/test_dev.py +197 -0
hud/cli/tests/test_eval.py +251 -0
hud/cli/tests/test_eval_bedrock.py +51 -0
hud/cli/tests/test_init.py +124 -0
hud/cli/tests/test_main_module.py +11 -5
hud/cli/tests/test_mcp_server.py +12 -100
hud/cli/tests/test_push.py +1 -1
hud/cli/tests/test_push_happy.py +74 -0
hud/cli/tests/test_push_wrapper.py +23 -0
hud/cli/tests/test_registry.py +1 -1
hud/cli/tests/test_utils.py +1 -1
hud/cli/{rl → utils}/celebrate.py +14 -12
hud/cli/utils/config.py +18 -1
hud/cli/utils/docker.py +130 -4
hud/cli/utils/env_check.py +9 -9
hud/cli/utils/git.py +136 -0
hud/cli/utils/interactive.py +39 -5
hud/cli/utils/metadata.py +70 -1
hud/cli/utils/runner.py +1 -1
hud/cli/utils/server.py +2 -2
hud/cli/utils/source_hash.py +3 -3
hud/cli/utils/tasks.py +4 -1
hud/cli/utils/tests/__init__.py +0 -0
hud/cli/utils/tests/test_config.py +58 -0
hud/cli/utils/tests/test_docker.py +93 -0
hud/cli/utils/tests/test_docker_hints.py +71 -0
hud/cli/utils/tests/test_env_check.py +74 -0
hud/cli/utils/tests/test_environment.py +42 -0
hud/cli/utils/tests/test_git.py +142 -0
hud/cli/utils/tests/test_interactive_module.py +60 -0
hud/cli/utils/tests/test_local_runner.py +50 -0
hud/cli/utils/tests/test_logging_utils.py +23 -0
hud/cli/utils/tests/test_metadata.py +49 -0
hud/cli/utils/tests/test_package_runner.py +35 -0
hud/cli/utils/tests/test_registry_utils.py +49 -0
hud/cli/utils/tests/test_remote_runner.py +25 -0
hud/cli/utils/tests/test_runner_modules.py +52 -0
hud/cli/utils/tests/test_source_hash.py +36 -0
hud/cli/utils/tests/test_tasks.py +80 -0
hud/cli/utils/version_check.py +258 -0
hud/cli/{rl → utils}/viewer.py +2 -2
hud/clients/README.md +12 -11
hud/clients/__init__.py +4 -3
hud/clients/base.py +166 -26
hud/clients/environment.py +51 -0
hud/clients/fastmcp.py +13 -6
hud/clients/mcp_use.py +45 -15
hud/clients/tests/test_analyze_scenarios.py +206 -0
hud/clients/tests/test_protocol.py +9 -3
hud/datasets/__init__.py +23 -20
hud/datasets/loader.py +326 -0
hud/datasets/runner.py +198 -105
hud/datasets/tests/__init__.py +0 -0
hud/datasets/tests/test_loader.py +221 -0
hud/datasets/tests/test_utils.py +315 -0
hud/datasets/utils.py +270 -90
hud/environment/__init__.py +52 -0
hud/environment/connection.py +258 -0
hud/environment/connectors/__init__.py +33 -0
hud/environment/connectors/base.py +68 -0
hud/environment/connectors/local.py +177 -0
hud/environment/connectors/mcp_config.py +137 -0
hud/environment/connectors/openai.py +101 -0
hud/environment/connectors/remote.py +172 -0
hud/environment/environment.py +835 -0
hud/environment/integrations/__init__.py +45 -0
hud/environment/integrations/adk.py +67 -0
hud/environment/integrations/anthropic.py +196 -0
hud/environment/integrations/gemini.py +92 -0
hud/environment/integrations/langchain.py +82 -0
hud/environment/integrations/llamaindex.py +68 -0
hud/environment/integrations/openai.py +238 -0
hud/environment/mock.py +306 -0
hud/environment/router.py +263 -0
hud/environment/scenarios.py +620 -0
hud/environment/tests/__init__.py +1 -0
hud/environment/tests/test_connection.py +317 -0
hud/environment/tests/test_connectors.py +205 -0
hud/environment/tests/test_environment.py +593 -0
hud/environment/tests/test_integrations.py +257 -0
hud/environment/tests/test_local_connectors.py +242 -0
hud/environment/tests/test_scenarios.py +1086 -0
hud/environment/tests/test_tools.py +208 -0
hud/environment/types.py +23 -0
hud/environment/utils/__init__.py +35 -0
hud/environment/utils/formats.py +215 -0
hud/environment/utils/schema.py +171 -0
hud/environment/utils/tool_wrappers.py +113 -0
hud/eval/__init__.py +67 -0
hud/eval/context.py +727 -0
hud/eval/display.py +299 -0
hud/eval/instrument.py +187 -0
hud/eval/manager.py +533 -0
hud/eval/parallel.py +268 -0
hud/eval/task.py +372 -0
hud/eval/tests/__init__.py +1 -0
hud/eval/tests/test_context.py +178 -0
hud/eval/tests/test_eval.py +210 -0
hud/eval/tests/test_manager.py +152 -0
hud/eval/tests/test_parallel.py +168 -0
hud/eval/tests/test_task.py +291 -0
hud/eval/types.py +65 -0
hud/eval/utils.py +194 -0
hud/patches/__init__.py +19 -0
hud/patches/mcp_patches.py +308 -0
hud/patches/warnings.py +54 -0
hud/samples/browser.py +4 -4
hud/server/__init__.py +2 -1
hud/server/low_level.py +2 -1
hud/server/router.py +164 -0
hud/server/server.py +567 -80
hud/server/tests/test_mcp_server_integration.py +11 -11
hud/server/tests/test_mcp_server_more.py +1 -1
hud/server/tests/test_server_extra.py +2 -0
hud/settings.py +45 -3
hud/shared/exceptions.py +36 -10
hud/shared/hints.py +26 -1
hud/shared/requests.py +15 -3
hud/shared/tests/test_exceptions.py +40 -31
hud/shared/tests/test_hints.py +167 -0
hud/telemetry/__init__.py +20 -19
hud/telemetry/exporter.py +201 -0
hud/telemetry/instrument.py +165 -253
hud/telemetry/tests/test_eval_telemetry.py +356 -0
hud/telemetry/tests/test_exporter.py +258 -0
hud/telemetry/tests/test_instrument.py +401 -0
hud/tools/__init__.py +18 -2
hud/tools/agent.py +223 -0
hud/tools/apply_patch.py +639 -0
hud/tools/base.py +54 -4
hud/tools/bash.py +2 -2
hud/tools/computer/__init__.py +36 -3
hud/tools/computer/anthropic.py +2 -2
hud/tools/computer/gemini.py +385 -0
hud/tools/computer/hud.py +23 -6
hud/tools/computer/openai.py +20 -21
hud/tools/computer/qwen.py +434 -0
hud/tools/computer/settings.py +37 -0
hud/tools/edit.py +3 -7
hud/tools/executors/base.py +4 -2
hud/tools/executors/pyautogui.py +1 -1
hud/tools/grounding/grounded_tool.py +13 -18
hud/tools/grounding/grounder.py +10 -31
hud/tools/grounding/tests/test_grounded_tool.py +26 -44
hud/tools/jupyter.py +330 -0
hud/tools/playwright.py +18 -3
hud/tools/shell.py +308 -0
hud/tools/tests/test_agent_tool.py +355 -0
hud/tools/tests/test_apply_patch.py +718 -0
hud/tools/tests/test_computer.py +4 -9
hud/tools/tests/test_computer_actions.py +24 -2
hud/tools/tests/test_jupyter_tool.py +181 -0
hud/tools/tests/test_shell.py +596 -0
hud/tools/tests/test_submit.py +85 -0
hud/tools/tests/test_types.py +193 -0
hud/tools/types.py +21 -1
hud/types.py +194 -56
hud/utils/__init__.py +2 -0
hud/utils/env.py +67 -0
hud/utils/hud_console.py +89 -18
hud/utils/mcp.py +15 -58
hud/utils/strict_schema.py +162 -0
hud/utils/tests/test_init.py +1 -2
hud/utils/tests/test_mcp.py +1 -28
hud/utils/tests/test_pretty_errors.py +186 -0
hud/utils/tests/test_tool_shorthand.py +154 -0
hud/utils/tests/test_version.py +1 -1
hud/utils/types.py +20 -0
hud/version.py +1 -1
hud_python-0.5.13.dist-info/METADATA +264 -0
hud_python-0.5.13.dist-info/RECORD +305 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/WHEEL +1 -1
hud/agents/langchain.py +0 -261
hud/agents/lite_llm.py +0 -72
hud/cli/rl/__init__.py +0 -180
hud/cli/rl/config.py +0 -101
hud/cli/rl/display.py +0 -133
hud/cli/rl/gpu.py +0 -63
hud/cli/rl/gpu_utils.py +0 -321
hud/cli/rl/local_runner.py +0 -595
hud/cli/rl/presets.py +0 -96
hud/cli/rl/remote_runner.py +0 -463
hud/cli/rl/rl_api.py +0 -150
hud/cli/rl/vllm.py +0 -177
hud/cli/rl/wait_utils.py +0 -89
hud/datasets/parallel.py +0 -687
hud/misc/__init__.py +0 -1
hud/misc/claude_plays_pokemon.py +0 -292
hud/otel/__init__.py +0 -35
hud/otel/collector.py +0 -142
hud/otel/config.py +0 -181
hud/otel/context.py +0 -570
hud/otel/exporters.py +0 -369
hud/otel/instrumentation.py +0 -135
hud/otel/processors.py +0 -121
hud/otel/tests/__init__.py +0 -1
hud/otel/tests/test_processors.py +0 -197
hud/rl/README.md +0 -30
hud/rl/__init__.py +0 -1
hud/rl/actor.py +0 -176
hud/rl/buffer.py +0 -405
hud/rl/chat_template.jinja +0 -101
hud/rl/config.py +0 -192
hud/rl/distributed.py +0 -132
hud/rl/learner.py +0 -637
hud/rl/tests/__init__.py +0 -1
hud/rl/tests/test_learner.py +0 -186
hud/rl/train.py +0 -382
hud/rl/types.py +0 -101
hud/rl/utils/start_vllm_server.sh +0 -30
hud/rl/utils.py +0 -524
hud/rl/vllm_adapter.py +0 -143
hud/telemetry/job.py +0 -352
hud/telemetry/replay.py +0 -74
hud/telemetry/tests/test_replay.py +0 -40
hud/telemetry/tests/test_trace.py +0 -63
hud/telemetry/trace.py +0 -158
hud/utils/agent_factories.py +0 -86
hud/utils/async_utils.py +0 -65
hud/utils/group_eval.py +0 -223
hud/utils/progress.py +0 -149
hud/utils/tasks.py +0 -127
hud/utils/tests/test_async_utils.py +0 -173
hud/utils/tests/test_progress.py +0 -261
hud_python-0.4.45.dist-info/METADATA +0 -552
hud_python-0.4.45.dist-info/RECORD +0 -228
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/entry_points.txt +0 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/licenses/LICENSE +0 -0

hud/tools/playwright.py CHANGED Viewed

@@ -84,6 +84,9 @@ class PlaywrightTool(BaseTool):
                             code=INVALID_PARAMS, message="url parameter is required for navigate"
                         )
                     )
+                # Guard against pydantic FieldInfo default leaking through
+                if not isinstance(wait_for_load_state, str):
+                    wait_for_load_state = None
                 result = await self.navigate(url, wait_for_load_state or "networkidle")
             elif action == "screenshot":
@@ -179,11 +182,16 @@ class PlaywrightTool(BaseTool):
                 if self._browser is None:
                     raise RuntimeError("Failed to connect to remote browser")
-                # Use existing context or create new one
+                # Reuse existing context and page where possible to avoid spawning new windows
                 contexts = self._browser.contexts
                 if contexts:
                     self._browser_context = contexts[0]
+                    # Prefer the first existing page to keep using the already visible window/tab
+                    existing_pages = self._browser_context.pages
+                    if existing_pages:
+                        self.page = existing_pages[0]
                 else:
+                    # As a fallback, create a new context
                     self._browser_context = await self._browser.new_context(
                         viewport={"width": 1920, "height": 1080},
                         ignore_https_errors=True,
@@ -225,7 +233,14 @@ class PlaywrightTool(BaseTool):
             if self._browser_context is None:
                 raise RuntimeError("Browser context failed to initialize")
-            self.page = await self._browser_context.new_page()
+            # Reuse existing page if available (for CDP connections), otherwise create new one
+            pages = self._browser_context.pages
+            if pages:
+                self.page = pages[0]
+                logger.info("Reusing existing browser page")
+            else:
+                self.page = await self._browser_context.new_page()
+                logger.info("Created new browser page")
             logger.info("Playwright browser launched successfully")
     async def navigate(
@@ -280,7 +295,7 @@ class PlaywrightTool(BaseTool):
         try:
             # Always return base64 encoded screenshot as ToolResult
-            screenshot_bytes = await self.page.screenshot(full_page=True)
+            screenshot_bytes = await self.page.screenshot(full_page=False)
             import base64
             screenshot_b64 = base64.b64encode(screenshot_bytes).decode()

hud/tools/shell.py ADDED Viewed

@@ -0,0 +1,308 @@
+"""
+Shell tool implementation conforming to OpenAI's shell tool specification.
+https://platform.openai.com/docs/guides/tools-shell
+Key features:
+- Auto-restart on error (no manual restart command)
+- Dynamic timeout via timeout_ms from agent
+- Dynamic max_output_length from agent (passed back, not truncated locally)
+- Output conforms to shell_call_output format
+"""
+import asyncio
+import os
+import sys
+from dataclasses import dataclass
+from typing import Any, Literal
+from .types import ToolError
+@dataclass
+class ShellCallOutcome:
+    """Outcome of a shell command execution."""
+    type: Literal["exit", "timeout"]
+    exit_code: int | None = None
+    def to_dict(self) -> dict:
+        if self.type == "timeout":
+            return {"type": "timeout"}
+        return {"type": "exit", "exit_code": self.exit_code}
+@dataclass
+class ShellCommandOutput:
+    """Output of a single shell command execution."""
+    stdout: str
+    stderr: str
+    outcome: ShellCallOutcome
+    def to_dict(self) -> dict:
+        return {
+            "stdout": self.stdout,
+            "stderr": self.stderr,
+            "outcome": self.outcome.to_dict(),
+        }
+@dataclass
+class ShellResult:
+    """Result of shell tool execution, conforming to shell_call_output format."""
+    output: list[ShellCommandOutput]
+    max_output_length: int | None = None
+    def to_dict(self) -> dict:
+        result: dict[str, Any] = {
+            "output": [o.to_dict() for o in self.output],
+        }
+        if self.max_output_length is not None:
+            result["max_output_length"] = self.max_output_length
+        return result
+class _BashSession:
+    """A session of a bash shell."""
+    _started: bool
+    _process: asyncio.subprocess.Process
+    command: str = "/bin/bash"
+    _output_delay: float = 0.2  # seconds
+    _sentinel: str = "<<exit>>"
+    def __init__(self) -> None:
+        self._started = False
+        self._timed_out = False
+    async def start(self) -> None:
+        if self._started:
+            await asyncio.sleep(0)
+            return
+        # preexec_fn and user demotion only available on Unix when running as root
+        preexec_fn = None
+        if sys.platform != "win32" and os.getuid() == 0:
+            # Only demote when running as root (e.g., inside Docker containers)
+            def demote() -> None:
+                # This only runs in the child process (Unix only)
+                os.setsid()  # type: ignore[attr-defined]
+                os.setgid(1000)  # type: ignore[attr-defined]
+                os.setuid(1000)  # type: ignore[attr-defined]
+            preexec_fn = demote
+        self._process = await asyncio.create_subprocess_shell(  # noqa: S604
+            self.command,
+            preexec_fn=preexec_fn,
+            shell=True,
+            bufsize=0,
+            stdin=asyncio.subprocess.PIPE,
+            stdout=asyncio.subprocess.PIPE,
+            stderr=asyncio.subprocess.PIPE,
+        )
+        self._started = True
+        self._timed_out = False
+    def stop(self) -> None:
+        """Terminate the bash shell."""
+        if not self._started:
+            return
+        if self._process.returncode is not None:
+            return
+        self._process.terminate()
+    def is_alive(self) -> bool:
+        """Check if the session is alive and usable."""
+        return self._started and self._process.returncode is None and not self._timed_out
+    async def run(self, command: str, timeout_ms: int | None = None) -> ShellCommandOutput:
+        """Execute a command in the bash shell."""
+        if not self._started:
+            raise ToolError("Session has not started.")
+        # Convert timeout from ms to seconds, default to 120 seconds
+        timeout_sec = (timeout_ms / 1000.0) if timeout_ms else 120.0
+        # we know these are not None because we created the process with PIPEs
+        assert self._process.stdin
+        assert self._process.stdout
+        assert self._process.stderr
+        # send command to the process
+        self._process.stdin.write(command.encode() + f"; echo '{self._sentinel}'$?\n".encode())
+        await self._process.stdin.drain()
+        output = ""
+        error = ""
+        exit_code = None
+        # read output from the process, until the sentinel is found
+        try:
+            async with asyncio.timeout(timeout_sec):
+                while True:
+                    await asyncio.sleep(self._output_delay)
+                    # if we read directly from stdout/stderr, it will wait forever for
+                    # EOF. use the StreamReader buffer directly instead.
+                    output = self._process.stdout._buffer.decode()  # pyright: ignore[reportAttributeAccessIssue]
+                    error = self._process.stderr._buffer.decode()  # pyright: ignore[reportAttributeAccessIssue]
+                    if self._sentinel in output:
+                        # Extract exit code from sentinel line
+                        sentinel_idx = output.index(self._sentinel)
+                        # Find the exit code after the sentinel
+                        after_sentinel = output[sentinel_idx + len(self._sentinel) :]
+                        newline_idx = after_sentinel.find("\n")
+                        if newline_idx != -1:
+                            exit_code_str = after_sentinel[:newline_idx].strip()
+                        else:
+                            exit_code_str = after_sentinel.strip()
+                        try:
+                            exit_code = int(exit_code_str)
+                        except ValueError:
+                            exit_code = 0
+                        # strip the sentinel and exit code from output
+                        output = output[:sentinel_idx]
+                        break
+        except TimeoutError:
+            self._timed_out = True
+            # clear the buffers
+            self._process.stdout._buffer.clear()  # pyright: ignore[reportAttributeAccessIssue]
+            self._process.stderr._buffer.clear()  # pyright: ignore[reportAttributeAccessIssue]
+            return ShellCommandOutput(
+                stdout=output,
+                stderr=error,
+                outcome=ShellCallOutcome(type="timeout"),
+            )
+        if output.endswith("\n"):
+            output = output[:-1]
+        if error.endswith("\n"):
+            error = error[:-1]
+        # clear the buffers so that the next output can be read correctly
+        self._process.stdout._buffer.clear()  # pyright: ignore[reportAttributeAccessIssue]
+        self._process.stderr._buffer.clear()  # pyright: ignore[reportAttributeAccessIssue]
+        return ShellCommandOutput(
+            stdout=output,
+            stderr=error,
+            outcome=ShellCallOutcome(type="exit", exit_code=exit_code),
+        )
+class ShellTool:
+    """
+    A tool that allows the agent to run shell commands.
+    Conforms to OpenAI's shell tool specification.
+    Features:
+    - Auto-restart on error (session automatically restarts if needed)
+    - Dynamic timeout via timeout_ms parameter
+    - Dynamic max_output_length (passed back to API, no local truncation)
+    - Supports concurrent command execution
+    """
+    _session: _BashSession | None
+    def __init__(self) -> None:
+        self._session = None
+    async def _ensure_session(self) -> tuple[_BashSession, str | None]:
+        """Ensure a working session exists, auto-restarting if needed.
+        Returns:
+            Tuple of (session, restart_message) where restart_message is set
+            if the session was restarted due to an error.
+        """
+        restart_message = None
+        if self._session is not None and not self._session.is_alive():
+            # Session exists but is dead - auto-restart
+            old_session = self._session
+            if old_session._timed_out:
+                restart_message = "Previous session timed out. Session auto-restarted."
+            elif old_session._process.returncode is not None:
+                restart_message = (
+                    f"Previous session exited with code {old_session._process.returncode}. "
+                    "Session auto-restarted."
+                )
+            else:
+                restart_message = "Previous session was not usable. Session auto-restarted."
+            old_session.stop()
+            self._session = None
+        if self._session is None:
+            self._session = _BashSession()
+            await self._session.start()
+            if restart_message is None:
+                # First start, no message needed
+                pass
+        return self._session, restart_message
+    async def __call__(
+        self,
+        commands: list[str] | None = None,
+        timeout_ms: int | None = None,
+        max_output_length: int | None = None,
+        **kwargs: object,
+    ) -> ShellResult:
+        """
+        Execute shell commands.
+        Args:
+            commands: List of shell commands to execute (can run concurrently).
+            timeout_ms: Optional timeout in milliseconds for each command.
+            max_output_length: Optional max output length (passed back to API).
+        Returns:
+            ShellResult conforming to shell_call_output format.
+        """
+        if not commands:
+            raise ToolError("No commands provided.")
+        session, restart_message = await self._ensure_session()
+        outputs: list[ShellCommandOutput] = []
+        # Execute commands - can be done concurrently
+        # Note: OpenAI docs say commands can be executed concurrently,
+        # but for a single bash session, we run them sequentially.
+        # For true concurrency, you'd need multiple sessions or subprocess per command.
+        for command in commands:
+            # Check if session is still alive before each command
+            if not session.is_alive():
+                session, new_restart_msg = await self._ensure_session()
+                if new_restart_msg:
+                    restart_message = new_restart_msg
+            try:
+                result = await session.run(command, timeout_ms)
+                # If we had a restart message, prepend it to the first output's stderr
+                if restart_message:
+                    if result.stderr:
+                        result.stderr = f"[SYSTEM: {restart_message}]\n{result.stderr}"
+                    else:
+                        result.stderr = f"[SYSTEM: {restart_message}]"
+                    restart_message = None  # Only add once
+                outputs.append(result)
+            except Exception as e:
+                # Command execution failed, add error output
+                outputs.append(
+                    ShellCommandOutput(
+                        stdout="",
+                        stderr=str(e),
+                        outcome=ShellCallOutcome(type="exit", exit_code=1),
+                    )
+                )
+        return ShellResult(
+            output=outputs,
+            max_output_length=max_output_length,
+        )

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl