PyPI - hud-python - Versions diffs - 0.3.5__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

hud-python 0.3.5__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of hud-python might be problematic. Click here for more details.

Files changed (192) hide show

hud/__init__.py +22 -89
hud/agents/__init__.py +17 -0
hud/agents/art.py +101 -0
hud/agents/base.py +599 -0
hud/{mcp → agents}/claude.py +373 -321
hud/{mcp → agents}/langchain.py +250 -250
hud/agents/misc/__init__.py +7 -0
hud/{agent → agents}/misc/response_agent.py +80 -80
hud/{mcp → agents}/openai.py +352 -334
hud/agents/openai_chat_generic.py +154 -0
hud/{mcp → agents}/tests/__init__.py +1 -1
hud/agents/tests/test_base.py +742 -0
hud/agents/tests/test_claude.py +324 -0
hud/{mcp → agents}/tests/test_client.py +363 -324
hud/{mcp → agents}/tests/test_openai.py +237 -238
hud/cli/__init__.py +617 -0
hud/cli/__main__.py +8 -0
hud/cli/analyze.py +371 -0
hud/cli/analyze_metadata.py +230 -0
hud/cli/build.py +427 -0
hud/cli/clone.py +185 -0
hud/cli/cursor.py +92 -0
hud/cli/debug.py +392 -0
hud/cli/docker_utils.py +83 -0
hud/cli/init.py +281 -0
hud/cli/interactive.py +353 -0
hud/cli/mcp_server.py +756 -0
hud/cli/pull.py +336 -0
hud/cli/push.py +379 -0
hud/cli/remote_runner.py +311 -0
hud/cli/runner.py +160 -0
hud/cli/tests/__init__.py +3 -0
hud/cli/tests/test_analyze.py +284 -0
hud/cli/tests/test_cli_init.py +265 -0
hud/cli/tests/test_cli_main.py +27 -0
hud/cli/tests/test_clone.py +142 -0
hud/cli/tests/test_cursor.py +253 -0
hud/cli/tests/test_debug.py +453 -0
hud/cli/tests/test_mcp_server.py +139 -0
hud/cli/tests/test_utils.py +388 -0
hud/cli/utils.py +263 -0
hud/clients/README.md +143 -0
hud/clients/__init__.py +16 -0
hud/clients/base.py +354 -0
hud/clients/fastmcp.py +202 -0
hud/clients/mcp_use.py +278 -0
hud/clients/tests/__init__.py +1 -0
hud/clients/tests/test_client_integration.py +111 -0
hud/clients/tests/test_fastmcp.py +342 -0
hud/clients/tests/test_protocol.py +188 -0
hud/clients/utils/__init__.py +1 -0
hud/clients/utils/retry_transport.py +160 -0
hud/datasets.py +322 -192
hud/misc/__init__.py +1 -0
hud/{agent → misc}/claude_plays_pokemon.py +292 -283
hud/otel/__init__.py +35 -0
hud/otel/collector.py +142 -0
hud/otel/config.py +164 -0
hud/otel/context.py +536 -0
hud/otel/exporters.py +366 -0
hud/otel/instrumentation.py +97 -0
hud/otel/processors.py +118 -0
hud/otel/tests/__init__.py +1 -0
hud/otel/tests/test_processors.py +197 -0
hud/server/__init__.py +5 -5
hud/server/context.py +114 -0
hud/server/helper/__init__.py +5 -0
hud/server/low_level.py +132 -0
hud/server/server.py +166 -0
hud/server/tests/__init__.py +3 -0
hud/settings.py +73 -79
hud/shared/__init__.py +5 -0
hud/{exceptions.py → shared/exceptions.py} +180 -180
hud/{server → shared}/requests.py +264 -264
hud/shared/tests/test_exceptions.py +157 -0
hud/{server → shared}/tests/test_requests.py +275 -275
hud/telemetry/__init__.py +25 -30
hud/telemetry/instrument.py +379 -0
hud/telemetry/job.py +309 -141
hud/telemetry/replay.py +74 -0
hud/telemetry/trace.py +83 -0
hud/tools/__init__.py +33 -34
hud/tools/base.py +365 -65
hud/tools/bash.py +161 -137
hud/tools/computer/__init__.py +15 -13
hud/tools/computer/anthropic.py +437 -420
hud/tools/computer/hud.py +376 -334
hud/tools/computer/openai.py +295 -292
hud/tools/computer/settings.py +82 -0
hud/tools/edit.py +314 -290
hud/tools/executors/__init__.py +30 -30
hud/tools/executors/base.py +539 -532
hud/tools/executors/pyautogui.py +621 -619
hud/tools/executors/tests/__init__.py +1 -1
hud/tools/executors/tests/test_base_executor.py +338 -338
hud/tools/executors/tests/test_pyautogui_executor.py +165 -165
hud/tools/executors/xdo.py +511 -503
hud/tools/{playwright_tool.py → playwright.py} +412 -379
hud/tools/tests/__init__.py +3 -3
hud/tools/tests/test_base.py +282 -0
hud/tools/tests/test_bash.py +158 -152
hud/tools/tests/test_bash_extended.py +197 -0
hud/tools/tests/test_computer.py +425 -52
hud/tools/tests/test_computer_actions.py +34 -34
hud/tools/tests/test_edit.py +259 -240
hud/tools/tests/test_init.py +27 -27
hud/tools/tests/test_playwright_tool.py +183 -183
hud/tools/tests/test_tools.py +145 -157
hud/tools/tests/test_utils.py +156 -156
hud/tools/types.py +72 -0
hud/tools/utils.py +50 -50
hud/types.py +136 -89
hud/utils/__init__.py +10 -16
hud/utils/async_utils.py +65 -0
hud/utils/design.py +168 -0
hud/utils/mcp.py +55 -0
hud/utils/progress.py +149 -149
hud/utils/telemetry.py +66 -66
hud/utils/tests/test_async_utils.py +173 -0
hud/utils/tests/test_init.py +17 -21
hud/utils/tests/test_progress.py +261 -225
hud/utils/tests/test_telemetry.py +82 -37
hud/utils/tests/test_version.py +8 -8
hud/version.py +7 -7
hud_python-0.4.0.dist-info/METADATA +474 -0
hud_python-0.4.0.dist-info/RECORD +132 -0
hud_python-0.4.0.dist-info/entry_points.txt +3 -0
{hud_python-0.3.5.dist-info → hud_python-0.4.0.dist-info}/licenses/LICENSE +21 -21
hud/adapters/__init__.py +0 -8
hud/adapters/claude/__init__.py +0 -5
hud/adapters/claude/adapter.py +0 -180
hud/adapters/claude/tests/__init__.py +0 -1
hud/adapters/claude/tests/test_adapter.py +0 -519
hud/adapters/common/__init__.py +0 -6
hud/adapters/common/adapter.py +0 -178
hud/adapters/common/tests/test_adapter.py +0 -289
hud/adapters/common/types.py +0 -446
hud/adapters/operator/__init__.py +0 -5
hud/adapters/operator/adapter.py +0 -108
hud/adapters/operator/tests/__init__.py +0 -1
hud/adapters/operator/tests/test_adapter.py +0 -370
hud/agent/__init__.py +0 -19
hud/agent/base.py +0 -126
hud/agent/claude.py +0 -271
hud/agent/langchain.py +0 -215
hud/agent/misc/__init__.py +0 -3
hud/agent/operator.py +0 -268
hud/agent/tests/__init__.py +0 -1
hud/agent/tests/test_base.py +0 -202
hud/env/__init__.py +0 -11
hud/env/client.py +0 -35
hud/env/docker_client.py +0 -349
hud/env/environment.py +0 -446
hud/env/local_docker_client.py +0 -358
hud/env/remote_client.py +0 -212
hud/env/remote_docker_client.py +0 -292
hud/gym.py +0 -130
hud/job.py +0 -773
hud/mcp/__init__.py +0 -17
hud/mcp/base.py +0 -631
hud/mcp/client.py +0 -312
hud/mcp/tests/test_base.py +0 -512
hud/mcp/tests/test_claude.py +0 -294
hud/task.py +0 -149
hud/taskset.py +0 -237
hud/telemetry/_trace.py +0 -347
hud/telemetry/context.py +0 -230
hud/telemetry/exporter.py +0 -575
hud/telemetry/instrumentation/__init__.py +0 -3
hud/telemetry/instrumentation/mcp.py +0 -259
hud/telemetry/instrumentation/registry.py +0 -59
hud/telemetry/mcp_models.py +0 -270
hud/telemetry/tests/__init__.py +0 -1
hud/telemetry/tests/test_context.py +0 -210
hud/telemetry/tests/test_trace.py +0 -312
hud/tools/helper/README.md +0 -56
hud/tools/helper/__init__.py +0 -9
hud/tools/helper/mcp_server.py +0 -78
hud/tools/helper/server_initialization.py +0 -115
hud/tools/helper/utils.py +0 -58
hud/trajectory.py +0 -94
hud/utils/agent.py +0 -37
hud/utils/common.py +0 -256
hud/utils/config.py +0 -120
hud/utils/deprecation.py +0 -115
hud/utils/misc.py +0 -53
hud/utils/tests/test_common.py +0 -277
hud/utils/tests/test_config.py +0 -129
hud_python-0.3.5.dist-info/METADATA +0 -284
hud_python-0.3.5.dist-info/RECORD +0 -120
/hud/{adapters/common → shared}/tests/__init__.py +0 -0
{hud_python-0.3.5.dist-info → hud_python-0.4.0.dist-info}/WHEEL +0 -0

hud/telemetry/job.py CHANGED Viewed

@@ -1,141 +1,309 @@
-"""Job context manager for grouping related traces."""
-from __future__ import annotations
-import logging
-import sys
-import uuid
-from contextlib import contextmanager
-from contextvars import ContextVar
-from typing import TYPE_CHECKING, Any
-from hud.telemetry.exporter import JobStatus, submit_to_worker_loop, update_job_status
-if TYPE_CHECKING:
-    from collections.abc import Generator
-    from typing import Self
-logger = logging.getLogger("hud.telemetry")
-# Context variables for current job
-current_job_id: ContextVar[str | None] = ContextVar("current_job_id", default=None)
-current_job_name: ContextVar[str | None] = ContextVar("current_job_name", default=None)
-class JobContext:
-    """Context manager for grouping traces under a job."""
-    def __init__(
-        self, name: str, taskset_name: str | None = None, metadata: dict[str, Any] | None = None
-    ) -> None:
-        self.id = str(uuid.uuid4())
-        self.name = name
-        self.metadata = metadata or {}
-        self.taskset_name: str | None = taskset_name
-    def __enter__(self) -> Self:
-        # Auto-detect dataset
-        if self.taskset_name is None:
-            self._detect_dataset()
-        # Set context variables
-        current_job_id.set(self.id)
-        current_job_name.set(self.name)
-        # Send initial status
-        job_metadata = {**self.metadata}
-        coro = update_job_status(
-            self.id, JobStatus.RUNNING, metadata=job_metadata, taskset_name=self.taskset_name
-        )
-        submit_to_worker_loop(coro)
-        logger.info("Started job %s (ID: %s)", self.name, self.id)
-        return self
-    def __exit__(
-        self, exc_type: type[BaseException] | None, exc_val: BaseException | None, exc_tb: object
-    ) -> None:
-        # Determine final status
-        if exc_type is not None:
-            # Job failed with exception
-            error_msg = f"{exc_type.__name__}: {exc_val}"
-            coro = update_job_status(
-                self.id, JobStatus.ERROR, error_message=error_msg, taskset_name=self.taskset_name
-            )
-        else:
-            # Job completed successfully
-            coro = update_job_status(self.id, JobStatus.COMPLETED, taskset_name=self.taskset_name)
-        submit_to_worker_loop(coro)
-        # Clear context
-        current_job_id.set(None)
-        current_job_name.set(None)
-        status = "failed" if exc_type else "completed"
-        logger.info("Job %s %s", self.name, status)
-    def _detect_dataset(self) -> None:
-        """Auto-detect HuggingFace dataset in parent scope."""
-        try:
-            # Check frames 2 and 3 (with statement and parent scope)
-            for frame_depth in [2, 3]:
-                try:
-                    frame = sys._getframe(frame_depth)
-                    # Search for Dataset objects
-                    for var_value in frame.f_locals.values():
-                        if hasattr(var_value, "info") and hasattr(var_value.info, "builder_name"):
-                            self.taskset_name = var_value.info.builder_name
-                            logger.debug(
-                                "Auto-detected dataset at frame %d: %s",
-                                frame_depth,
-                                self.taskset_name,
-                            )
-                            return
-                        elif hasattr(var_value, "builder_name"):
-                            # Older dataset format
-                            self.taskset_name = var_value.builder_name
-                            logger.debug(
-                                "Auto-detected dataset at frame %d: %s",
-                                frame_depth,
-                                self.taskset_name,
-                            )
-                            return
-                except ValueError:
-                    # Frame doesn't exist
-                    continue
-        except Exception as e:
-            logger.debug("Dataset auto-detection failed: %s", e)
-@contextmanager
-def job(
-    name: str, taskset_name: str | None = None, metadata: dict[str, Any] | None = None
-) -> Generator[JobContext, None, None]:
-    """
-    Create a job context for grouping related traces.
-    Args:
-        name: Name for the job
-        metadata: Optional metadata to include with the job
-    Example:
-        with hud.job("evaluation_run") as job:
-            for task in tasks:
-                with hud.trace(f"task_{task.id}"):
-                    # Trace automatically includes job_id
-                    result = await agent.run(task)
-    """
-    with JobContext(name, taskset_name, metadata) as ctx:
-        yield ctx
-def get_current_job_id() -> str | None:
-    """Get the current job ID if inside a job context."""
-    return current_job_id.get()
-def get_current_job_name() -> str | None:
-    """Get the current job name if inside a job context."""
-    return current_job_name.get()
+"""Job management for HUD SDK.
+This module provides APIs for managing jobs - logical groupings of related tasks.
+Jobs can be used to track experiments, batch processing, training runs, etc.
+"""
+from __future__ import annotations
+import asyncio
+import logging
+import uuid
+from contextlib import contextmanager
+from datetime import UTC, datetime
+from functools import wraps
+from typing import TYPE_CHECKING, Any
+from hud.settings import settings
+from hud.shared import make_request, make_request_sync
+if TYPE_CHECKING:
+    from collections.abc import Callable, Generator
+logger = logging.getLogger(__name__)
+class Job:
+    """A named collection of related tasks tracked under a single job ID.
+    Attributes:
+        id: Job identifier; also used in the status endpoint URL.
+        name: Human-readable job name.
+        metadata: Metadata dictionary sent with every status update.
+        dataset_link: Optional dataset identifier, sent only when set.
+        status: Last status recorded locally; starts as "created".
+        created_at: Timezone-aware UTC timestamp taken at construction.
+        tasks: Task IDs registered through :meth:`add_task`.
+    """
+    def __init__(
+        self,
+        job_id: str,
+        name: str,
+        metadata: dict[str, Any] | None = None,
+        dataset_link: str | None = None,
+    ) -> None:
+        self.id = job_id
+        self.name = name
+        self.metadata = metadata or {}
+        self.dataset_link = dataset_link
+        self.status = "created"
+        self.created_at = datetime.now(UTC)
+        self.tasks: list[str] = []
+    def add_task(self, task_id: str) -> None:
+        """Associate a task with this job."""
+        self.tasks.append(task_id)
+    def _status_url(self) -> str:
+        """Return the telemetry endpoint that receives this job's status."""
+        return f"{settings.hud_telemetry_url}/jobs/{self.id}/status"
+    def _status_payload(self, status: str) -> dict[str, Any]:
+        """Build the JSON body shared by the async and sync status updates."""
+        payload: dict[str, Any] = {
+            "name": self.name,
+            "status": status,
+            "metadata": self.metadata,
+        }
+        # dataset_link is optional and only included when it is set
+        if self.dataset_link:
+            payload["dataset_link"] = self.dataset_link
+        return payload
+    async def update_status(self, status: str) -> None:
+        """Record ``status`` locally and POST it to the server.
+        The request is skipped when telemetry is disabled. Any failure while
+        building or sending the request is logged as a warning, never raised.
+        Args:
+            status: New status string for the job
+        """
+        self.status = status
+        if not settings.telemetry_enabled:
+            return
+        try:
+            await make_request(
+                method="POST",
+                url=self._status_url(),
+                json=self._status_payload(status),
+                api_key=settings.api_key,
+            )
+        except Exception as e:
+            logger.warning("Failed to update job status: %s", e)
+    def update_status_sync(self, status: str) -> None:
+        """Synchronous counterpart of :meth:`update_status`.
+        Same payload, endpoint and best-effort error handling, but sent with the
+        blocking request helper.
+        Args:
+            status: New status string for the job
+        """
+        self.status = status
+        if not settings.telemetry_enabled:
+            return
+        try:
+            make_request_sync(
+                method="POST",
+                url=self._status_url(),
+                json=self._status_payload(status),
+                api_key=settings.api_key,
+            )
+        except Exception as e:
+            logger.warning("Failed to update job status: %s", e)
+    def __repr__(self) -> str:
+        return f"Job(id={self.id!r}, name={self.name!r}, status={self.status!r})"
+# Job currently active in this process: job() installs it on entry and restores
+# the previous value on exit; get_current_job() returns it.
+_current_job: Job | None = None
+def _print_job_url(job_id: str, job_name: str) -> None:
+    """Print a boxed banner announcing the job together with its HUD URL.
+    Nothing is printed unless telemetry is enabled and an API key is configured.
+    Args:
+        job_id: Job identifier appended to the HUD jobs URL
+        job_name: Job name shown in the banner header
+    """
+    if not settings.telemetry_enabled or not settings.api_key:
+        return
+    # ANSI escape sequences
+    reset, bold = "\033[0m", "\033[1m"
+    gray, gold = "\033[90m", "\033[33m"
+    url = f"https://app.hud.so/jobs/{job_id}"
+    header = f"🚀 Job '{job_name}' started:"
+    # Width between the two vertical borders, sized to the longest line
+    inner = max(len(url), len(header)) + 4
+    header_left = (inner - len(header)) // 2
+    # NOTE(review): the header row is padded one column short of the URL row,
+    # presumably because the emoji renders two columns wide - confirm.
+    header_right = inner - len(header) - header_left - 1
+    url_left = (inner - len(url)) // 2
+    url_right = inner - len(url) - url_left
+    edge = f"{gray}║{reset}"
+    print(f"\n{gray}╔{'═' * inner}╗{reset}")  # noqa: T201
+    print(f"{edge}{' ' * header_left}{header}{' ' * header_right}{edge}")  # noqa: T201
+    print(f"{gray}╟{'─' * inner}╢{reset}")  # noqa: T201
+    print(f"{edge}{' ' * url_left}{bold}{gold}{url}{reset}{' ' * url_right}{edge}")  # noqa: T201
+    print(f"{gray}╚{'═' * inner}╝{reset}\n")  # noqa: T201
+def _print_job_complete_url(job_id: str, job_name: str, error_occurred: bool = False) -> None:
+    """Print a one-line success or failure notice with the job's HUD URL.
+    Nothing is printed unless telemetry is enabled and an API key is configured.
+    Args:
+        job_id: Job identifier appended to the HUD jobs URL
+        job_name: Job name shown in the message
+        error_occurred: Selects the red failure wording instead of the green one
+    """
+    if not settings.telemetry_enabled or not settings.api_key:
+        return
+    # ANSI escape sequences
+    reset, bold, dim = "\033[0m", "\033[1m", "\033[2m"
+    green, red, gold = "\033[92m", "\033[91m", "\033[33m"
+    if error_occurred:
+        headline = f"{red}✗ Job '{job_name}' failed!{reset}"
+        prompt = "View details at:"
+    else:
+        headline = f"{green}✓ Job '{job_name}' complete!{reset}"
+        prompt = "View all results at:"
+    link = f"{bold}{gold}https://app.hud.so/jobs/{job_id}{reset}"
+    print(f"\n{headline} {dim}{prompt}{reset} {link}\n")  # noqa: T201
+def get_current_job() -> Job | None:
+    """Return the job installed by the innermost active job() block, or None.
+    Reads the module-level ``_current_job``; it never creates a job.
+    """
+    return _current_job
+@contextmanager
+def job(
+    name: str,
+    metadata: dict[str, Any] | None = None,
+    job_id: str | None = None,
+    dataset_link: str | None = None,
+) -> Generator[Job, None, None]:
+    """Context manager for job tracking.
+    Groups related tasks together under a single job for tracking and organization.
+    The job is reported as "running" on entry and as "completed" or "failed" on
+    exit; the updates are synchronous so they finish before the process can exit.
+    While the block runs the job is returned by get_current_job(); the previously
+    active job (if any) is restored afterwards, so job blocks can be nested.
+    Args:
+        name: Human-readable job name
+        metadata: Optional metadata dictionary
+        job_id: Optional job ID (auto-generated if not provided)
+        dataset_link: Optional HuggingFace dataset identifier (e.g. "hud-evals/SheetBench-50")
+    Yields:
+        Job: The job object
+    Raises:
+        BaseException: Whatever the managed block raises is re-raised unchanged
+            after the job has been marked "failed".
+    Example:
+        with hud.job("training_run", {"model": "gpt-4"}) as job:
+            for epoch in range(10):
+                with hud.trace(f"epoch_{epoch}", job_id=job.id):
+                    train_epoch()
+    """
+    global _current_job
+    job_obj = Job(job_id or str(uuid.uuid4()), name, metadata, dataset_link)
+    # Set as current job, remembering the previous one so nested jobs unwind correctly
+    old_job = _current_job
+    _current_job = job_obj
+    try:
+        # Update status to running synchronously to ensure job is registered before tasks start
+        job_obj.update_status_sync("running")
+        # Print the nice job URL box
+        _print_job_url(job_obj.id, job_obj.name)
+        yield job_obj
+    except BaseException:
+        # BaseException rather than Exception: asyncio cancellation and Ctrl-C must
+        # also close the job out, otherwise it would stay "running" on the server.
+        job_obj.update_status_sync("failed")
+        _print_job_complete_url(job_obj.id, job_obj.name, error_occurred=True)
+        raise
+    else:
+        # Success reporting lives in ``else`` so that an error raised while printing
+        # the completion message cannot flip an already-completed job to "failed".
+        job_obj.update_status_sync("completed")
+        _print_job_complete_url(job_obj.id, job_obj.name, error_occurred=False)
+    finally:
+        _current_job = old_job
+def create_job(
+    name: str, metadata: dict[str, Any] | None = None, dataset_link: str | None = None
+) -> Job:
+    """Build a Job with a freshly generated UUID, without a context manager.
+    Use this when the job lifecycle must be driven explicitly. The returned job
+    starts in status "created"; no status is sent until one of its update
+    methods is called.
+    Args:
+        name: Human-readable job name
+        metadata: Optional metadata dictionary
+        dataset_link: Optional HuggingFace dataset identifier (e.g. "hud-evals/SheetBench-50")
+    Returns:
+        Job: The created job object
+    Example:
+        job = hud.create_job("data_processing")
+        try:
+            for item in items:
+                with hud.trace(f"process_{item.id}", job_id=job.id):
+                    process(item)
+        finally:
+            job.update_status_sync("completed")
+    """
+    return Job(str(uuid.uuid4()), name, metadata, dataset_link)
+def job_decorator(name: str | None = None, **metadata: Any) -> Callable:
+    """Decorator for functions that should be tracked as jobs.
+    Every call of the decorated function runs inside its own job() block. Both
+    plain and coroutine functions are supported. While a call is in progress the
+    job ID is exposed as ``func._current_job_id`` on the undecorated function.
+    Args:
+        name: Job name (defaults to function name)
+        **metadata: Additional metadata for the job
+    Returns:
+        Callable: A decorator that wraps the function in a job
+    Example:
+        @hud.job_decorator("model_training", model="gpt-4", dataset="v2")
+        async def train_model(config):
+            # This entire function execution is tracked as a job
+            await model.train(config)
+            return model.evaluate()
+    """
+    def decorator(func: Callable) -> Callable:
+        job_name = name or func.__name__
+        @contextmanager
+        def tracked_call() -> Generator[None, None, None]:
+            """Run one invocation inside a job and expose its ID on ``func``."""
+            # Each job gets its own copy so mutating one job's metadata cannot
+            # leak into later invocations of the decorated function.
+            with job(job_name, dict(metadata)) as job_obj:
+                # Store job ID in function for access
+                func._current_job_id = job_obj.id
+                try:
+                    yield
+                finally:
+                    # Tolerant removal: an overlapping call may already have
+                    # deleted the attribute, and delattr() would then raise
+                    # AttributeError and turn a successful call into a failure.
+                    vars(func).pop("_current_job_id", None)
+        @wraps(func)
+        async def async_wrapper(*args: Any, **kwargs: Any) -> Any:
+            with tracked_call():
+                return await func(*args, **kwargs)
+        @wraps(func)
+        def sync_wrapper(*args: Any, **kwargs: Any) -> Any:
+            with tracked_call():
+                return func(*args, **kwargs)
+        # Return appropriate wrapper based on function type
+        return async_wrapper if asyncio.iscoroutinefunction(func) else sync_wrapper
+    return decorator
+# Public API of this module
+__all__ = [
+    "Job",
+    "create_job",
+    "get_current_job",
+    "job",
+    "job_decorator",
+]

hud/telemetry/replay.py ADDED Viewed

@@ -0,0 +1,74 @@
+"""Trace retrieval and replay functionality.
+This module provides APIs to retrieve collected traces for analysis,
+debugging, and replay purposes.
+"""
+from __future__ import annotations
+from typing import TYPE_CHECKING
+from hud.otel.collector import clear_trace as _clear_trace
+from hud.otel.collector import get_trace as _get_trace
+if TYPE_CHECKING:
+    from hud.types import Trace
+__all__ = ["clear_trace", "get_trace"]
+def get_trace(task_run_id: str) -> Trace | None:
+    """Retrieve the collected trace for a task run.
+    Thin wrapper that delegates to hud.otel.collector.get_trace.
+    Returns None if trace collection was disabled or the trace doesn't exist.
+    Args:
+        task_run_id: The task run ID to retrieve the trace for
+    Returns:
+        Trace object containing all collected steps, or None if not found
+    Usage:
+        import hud
+        # Run agent with tracing
+        with hud.trace() as task_run_id:
+            agent = MyAgent()
+            result = await agent.run("solve task")
+        # Get the trace for analysis
+        trace = hud.get_trace(task_run_id)
+        if trace:
+            print(f"Collected {len(trace.trace)} steps")
+            # Analyze agent vs MCP steps
+            agent_steps = [s for s in trace.trace if s.category == "agent"]
+            mcp_steps = [s for s in trace.trace if s.category == "mcp"]
+            print(f"Agent steps: {len(agent_steps)}")
+            print(f"MCP steps: {len(mcp_steps)}")
+            # Replay or analyze individual steps
+            for step in trace.trace:
+                if step.category == "agent" and step.result:
+                    print(f"Agent: {step.result.get('content') if isinstance(step.result, dict) else step.result}")
+                if step.category == "mcp" and step.request:
+                    print(f"MCP: {step.request.method if hasattr(step.request, 'method') else step.request}")
+    """  # noqa: E501
+    return _get_trace(task_run_id)
+def clear_trace(task_run_id: str) -> None:
+    """Clear the collected trace for a task run ID.
+    Thin wrapper that delegates to hud.otel.collector.clear_trace.
+    Useful for cleaning up memory after processing large traces.
+    Args:
+        task_run_id: The task run ID to clear the trace for
+    Usage:
+        trace = hud.get_trace(task_run_id)
+        # Process trace...
+        hud.clear_trace(task_run_id)  # Free memory
+    """
+    _clear_trace(task_run_id)

hud/telemetry/trace.py ADDED Viewed

@@ -0,0 +1,83 @@
+"""User-facing trace context manager for HUD telemetry.
+This module provides the simple trace() API that users interact with.
+The actual OpenTelemetry implementation is in hud.otel.
+"""
+from __future__ import annotations
+import uuid
+from contextlib import contextmanager
+from typing import TYPE_CHECKING, Any
+from hud.otel import configure_telemetry
+from hud.otel import trace as OtelTrace
+if TYPE_CHECKING:
+    from collections.abc import Generator
+__all__ = ["trace"]
+@contextmanager
+def trace(
+    name: str = "Test task from hud",
+    *,
+    root: bool = True,
+    attrs: dict[str, Any] | None = None,
+    job_id: str | None = None,
+    task_id: str | None = None,
+) -> Generator[str, None, None]:
+    """Open a HUD trace context around a block of code.
+    When telemetry is enabled and an API key is set, a fresh UUID is generated as
+    the task run ID; otherwise the fixed placeholder "custom-otlp-trace" is used.
+    Args:
+        name: Descriptive name for this trace/task (passed on as the span name)
+        root: Whether this is a root trace (updates task status)
+        attrs: Additional attributes to attach to the trace
+        job_id: Optional job ID to associate with this trace
+        task_id: Optional task ID, forwarded unchanged to the OpenTelemetry trace
+    Yields:
+        str: The task run ID reported by the underlying OpenTelemetry trace
+    Usage:
+        import hud
+        with hud.trace("My Task") as task_run_id:
+            # Your code here
+            print(f"Running task: {task_run_id}")
+        # Or with default name:
+        with hud.trace() as task_run_id:
+            pass
+        # Or with job_id:
+        with hud.trace("My Task", job_id="550e8400-e29b-41d4-a716-446655440000") as task_run_id:
+            pass
+    """
+    # Ensure telemetry is configured
+    configure_telemetry()
+    # Settings are looked up at call time through a function-scope import
+    from hud.settings import get_settings
+    cfg = get_settings()
+    # A real run ID is only needed for the HUD backend; custom OTLP backends
+    # get a placeholder instead
+    uses_hud_backend = cfg.telemetry_enabled and cfg.api_key
+    task_run_id = str(uuid.uuid4()) if uses_hud_backend else "custom-otlp-trace"
+    span_attrs = attrs or {}
+    # Delegate to OpenTelemetry implementation
+    with OtelTrace(
+        task_run_id,
+        is_root=root,
+        span_name=name,
+        attributes=span_attrs,
+        job_id=job_id,
+        task_id=task_id,
+    ) as active_run_id:
+        yield active_run_id

hud-python 0.3.5__py3-none-any.whl → 0.4.0__py3-none-any.whl

Potentially problematic release.

hud-python 0.3.5__py3-none-any.whl → 0.4.0__py3-none-any.whl