PyPI - hud-python - Versions diffs - 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl - Mend

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (282) hide show

hud/__init__.py +27 -7
hud/agents/__init__.py +70 -5
hud/agents/base.py +238 -500
hud/agents/claude.py +236 -247
hud/agents/gateway.py +42 -0
hud/agents/gemini.py +264 -0
hud/agents/gemini_cua.py +324 -0
hud/agents/grounded_openai.py +98 -100
hud/agents/misc/integration_test_agent.py +51 -20
hud/agents/misc/response_agent.py +48 -36
hud/agents/openai.py +282 -296
hud/agents/{openai_chat_generic.py → openai_chat.py} +63 -33
hud/agents/operator.py +199 -0
hud/agents/resolver.py +70 -0
hud/agents/tests/conftest.py +133 -0
hud/agents/tests/test_base.py +300 -622
hud/agents/tests/test_base_runtime.py +233 -0
hud/agents/tests/test_claude.py +381 -214
hud/agents/tests/test_client.py +9 -10
hud/agents/tests/test_gemini.py +369 -0
hud/agents/tests/test_grounded_openai_agent.py +65 -50
hud/agents/tests/test_openai.py +377 -140
hud/agents/tests/test_operator.py +362 -0
hud/agents/tests/test_resolver.py +192 -0
hud/agents/tests/test_run_eval.py +179 -0
hud/agents/types.py +148 -0
hud/cli/__init__.py +493 -546
hud/cli/analyze.py +43 -5
hud/cli/build.py +699 -113
hud/cli/debug.py +8 -5
hud/cli/dev.py +889 -732
hud/cli/eval.py +793 -667
hud/cli/flows/dev.py +167 -0
hud/cli/flows/init.py +191 -0
hud/cli/flows/tasks.py +153 -56
hud/cli/flows/templates.py +151 -0
hud/cli/flows/tests/__init__.py +1 -0
hud/cli/flows/tests/test_dev.py +126 -0
hud/cli/init.py +60 -58
hud/cli/pull.py +1 -1
hud/cli/push.py +38 -13
hud/cli/rft.py +311 -0
hud/cli/rft_status.py +145 -0
hud/cli/tests/test_analyze.py +5 -5
hud/cli/tests/test_analyze_metadata.py +3 -2
hud/cli/tests/test_analyze_module.py +120 -0
hud/cli/tests/test_build.py +110 -8
hud/cli/tests/test_build_failure.py +41 -0
hud/cli/tests/test_build_module.py +50 -0
hud/cli/tests/test_cli_init.py +6 -1
hud/cli/tests/test_cli_more_wrappers.py +30 -0
hud/cli/tests/test_cli_root.py +140 -0
hud/cli/tests/test_convert.py +361 -0
hud/cli/tests/test_debug.py +12 -10
hud/cli/tests/test_dev.py +197 -0
hud/cli/tests/test_eval.py +251 -0
hud/cli/tests/test_eval_bedrock.py +51 -0
hud/cli/tests/test_init.py +124 -0
hud/cli/tests/test_main_module.py +11 -5
hud/cli/tests/test_mcp_server.py +12 -100
hud/cli/tests/test_push.py +1 -1
hud/cli/tests/test_push_happy.py +74 -0
hud/cli/tests/test_push_wrapper.py +23 -0
hud/cli/tests/test_registry.py +1 -1
hud/cli/tests/test_utils.py +1 -1
hud/cli/{rl → utils}/celebrate.py +14 -12
hud/cli/utils/config.py +18 -1
hud/cli/utils/docker.py +130 -4
hud/cli/utils/env_check.py +9 -9
hud/cli/utils/git.py +136 -0
hud/cli/utils/interactive.py +39 -5
hud/cli/utils/metadata.py +70 -1
hud/cli/utils/runner.py +1 -1
hud/cli/utils/server.py +2 -2
hud/cli/utils/source_hash.py +3 -3
hud/cli/utils/tasks.py +4 -1
hud/cli/utils/tests/__init__.py +0 -0
hud/cli/utils/tests/test_config.py +58 -0
hud/cli/utils/tests/test_docker.py +93 -0
hud/cli/utils/tests/test_docker_hints.py +71 -0
hud/cli/utils/tests/test_env_check.py +74 -0
hud/cli/utils/tests/test_environment.py +42 -0
hud/cli/utils/tests/test_git.py +142 -0
hud/cli/utils/tests/test_interactive_module.py +60 -0
hud/cli/utils/tests/test_local_runner.py +50 -0
hud/cli/utils/tests/test_logging_utils.py +23 -0
hud/cli/utils/tests/test_metadata.py +49 -0
hud/cli/utils/tests/test_package_runner.py +35 -0
hud/cli/utils/tests/test_registry_utils.py +49 -0
hud/cli/utils/tests/test_remote_runner.py +25 -0
hud/cli/utils/tests/test_runner_modules.py +52 -0
hud/cli/utils/tests/test_source_hash.py +36 -0
hud/cli/utils/tests/test_tasks.py +80 -0
hud/cli/utils/version_check.py +258 -0
hud/cli/{rl → utils}/viewer.py +2 -2
hud/clients/README.md +12 -11
hud/clients/__init__.py +4 -3
hud/clients/base.py +166 -26
hud/clients/environment.py +51 -0
hud/clients/fastmcp.py +13 -6
hud/clients/mcp_use.py +45 -15
hud/clients/tests/test_analyze_scenarios.py +206 -0
hud/clients/tests/test_protocol.py +9 -3
hud/datasets/__init__.py +23 -20
hud/datasets/loader.py +326 -0
hud/datasets/runner.py +198 -105
hud/datasets/tests/__init__.py +0 -0
hud/datasets/tests/test_loader.py +221 -0
hud/datasets/tests/test_utils.py +315 -0
hud/datasets/utils.py +270 -90
hud/environment/__init__.py +52 -0
hud/environment/connection.py +258 -0
hud/environment/connectors/__init__.py +33 -0
hud/environment/connectors/base.py +68 -0
hud/environment/connectors/local.py +177 -0
hud/environment/connectors/mcp_config.py +137 -0
hud/environment/connectors/openai.py +101 -0
hud/environment/connectors/remote.py +172 -0
hud/environment/environment.py +835 -0
hud/environment/integrations/__init__.py +45 -0
hud/environment/integrations/adk.py +67 -0
hud/environment/integrations/anthropic.py +196 -0
hud/environment/integrations/gemini.py +92 -0
hud/environment/integrations/langchain.py +82 -0
hud/environment/integrations/llamaindex.py +68 -0
hud/environment/integrations/openai.py +238 -0
hud/environment/mock.py +306 -0
hud/environment/router.py +263 -0
hud/environment/scenarios.py +620 -0
hud/environment/tests/__init__.py +1 -0
hud/environment/tests/test_connection.py +317 -0
hud/environment/tests/test_connectors.py +205 -0
hud/environment/tests/test_environment.py +593 -0
hud/environment/tests/test_integrations.py +257 -0
hud/environment/tests/test_local_connectors.py +242 -0
hud/environment/tests/test_scenarios.py +1086 -0
hud/environment/tests/test_tools.py +208 -0
hud/environment/types.py +23 -0
hud/environment/utils/__init__.py +35 -0
hud/environment/utils/formats.py +215 -0
hud/environment/utils/schema.py +171 -0
hud/environment/utils/tool_wrappers.py +113 -0
hud/eval/__init__.py +67 -0
hud/eval/context.py +727 -0
hud/eval/display.py +299 -0
hud/eval/instrument.py +187 -0
hud/eval/manager.py +533 -0
hud/eval/parallel.py +268 -0
hud/eval/task.py +372 -0
hud/eval/tests/__init__.py +1 -0
hud/eval/tests/test_context.py +178 -0
hud/eval/tests/test_eval.py +210 -0
hud/eval/tests/test_manager.py +152 -0
hud/eval/tests/test_parallel.py +168 -0
hud/eval/tests/test_task.py +291 -0
hud/eval/types.py +65 -0
hud/eval/utils.py +194 -0
hud/patches/__init__.py +19 -0
hud/patches/mcp_patches.py +308 -0
hud/patches/warnings.py +54 -0
hud/samples/browser.py +4 -4
hud/server/__init__.py +2 -1
hud/server/low_level.py +2 -1
hud/server/router.py +164 -0
hud/server/server.py +567 -80
hud/server/tests/test_mcp_server_integration.py +11 -11
hud/server/tests/test_mcp_server_more.py +1 -1
hud/server/tests/test_server_extra.py +2 -0
hud/settings.py +45 -3
hud/shared/exceptions.py +36 -10
hud/shared/hints.py +26 -1
hud/shared/requests.py +15 -3
hud/shared/tests/test_exceptions.py +40 -31
hud/shared/tests/test_hints.py +167 -0
hud/telemetry/__init__.py +20 -19
hud/telemetry/exporter.py +201 -0
hud/telemetry/instrument.py +165 -253
hud/telemetry/tests/test_eval_telemetry.py +356 -0
hud/telemetry/tests/test_exporter.py +258 -0
hud/telemetry/tests/test_instrument.py +401 -0
hud/tools/__init__.py +18 -2
hud/tools/agent.py +223 -0
hud/tools/apply_patch.py +639 -0
hud/tools/base.py +54 -4
hud/tools/bash.py +2 -2
hud/tools/computer/__init__.py +36 -3
hud/tools/computer/anthropic.py +2 -2
hud/tools/computer/gemini.py +385 -0
hud/tools/computer/hud.py +23 -6
hud/tools/computer/openai.py +20 -21
hud/tools/computer/qwen.py +434 -0
hud/tools/computer/settings.py +37 -0
hud/tools/edit.py +3 -7
hud/tools/executors/base.py +4 -2
hud/tools/executors/pyautogui.py +1 -1
hud/tools/grounding/grounded_tool.py +13 -18
hud/tools/grounding/grounder.py +10 -31
hud/tools/grounding/tests/test_grounded_tool.py +26 -44
hud/tools/jupyter.py +330 -0
hud/tools/playwright.py +18 -3
hud/tools/shell.py +308 -0
hud/tools/tests/test_agent_tool.py +355 -0
hud/tools/tests/test_apply_patch.py +718 -0
hud/tools/tests/test_computer.py +4 -9
hud/tools/tests/test_computer_actions.py +24 -2
hud/tools/tests/test_jupyter_tool.py +181 -0
hud/tools/tests/test_shell.py +596 -0
hud/tools/tests/test_submit.py +85 -0
hud/tools/tests/test_types.py +193 -0
hud/tools/types.py +21 -1
hud/types.py +194 -56
hud/utils/__init__.py +2 -0
hud/utils/env.py +67 -0
hud/utils/hud_console.py +89 -18
hud/utils/mcp.py +15 -58
hud/utils/strict_schema.py +162 -0
hud/utils/tests/test_init.py +1 -2
hud/utils/tests/test_mcp.py +1 -28
hud/utils/tests/test_pretty_errors.py +186 -0
hud/utils/tests/test_tool_shorthand.py +154 -0
hud/utils/tests/test_version.py +1 -1
hud/utils/types.py +20 -0
hud/version.py +1 -1
hud_python-0.5.13.dist-info/METADATA +264 -0
hud_python-0.5.13.dist-info/RECORD +305 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/WHEEL +1 -1
hud/agents/langchain.py +0 -261
hud/agents/lite_llm.py +0 -72
hud/cli/rl/__init__.py +0 -180
hud/cli/rl/config.py +0 -101
hud/cli/rl/display.py +0 -133
hud/cli/rl/gpu.py +0 -63
hud/cli/rl/gpu_utils.py +0 -321
hud/cli/rl/local_runner.py +0 -595
hud/cli/rl/presets.py +0 -96
hud/cli/rl/remote_runner.py +0 -463
hud/cli/rl/rl_api.py +0 -150
hud/cli/rl/vllm.py +0 -177
hud/cli/rl/wait_utils.py +0 -89
hud/datasets/parallel.py +0 -687
hud/misc/__init__.py +0 -1
hud/misc/claude_plays_pokemon.py +0 -292
hud/otel/__init__.py +0 -35
hud/otel/collector.py +0 -142
hud/otel/config.py +0 -181
hud/otel/context.py +0 -570
hud/otel/exporters.py +0 -369
hud/otel/instrumentation.py +0 -135
hud/otel/processors.py +0 -121
hud/otel/tests/__init__.py +0 -1
hud/otel/tests/test_processors.py +0 -197
hud/rl/README.md +0 -30
hud/rl/__init__.py +0 -1
hud/rl/actor.py +0 -176
hud/rl/buffer.py +0 -405
hud/rl/chat_template.jinja +0 -101
hud/rl/config.py +0 -192
hud/rl/distributed.py +0 -132
hud/rl/learner.py +0 -637
hud/rl/tests/__init__.py +0 -1
hud/rl/tests/test_learner.py +0 -186
hud/rl/train.py +0 -382
hud/rl/types.py +0 -101
hud/rl/utils/start_vllm_server.sh +0 -30
hud/rl/utils.py +0 -524
hud/rl/vllm_adapter.py +0 -143
hud/telemetry/job.py +0 -352
hud/telemetry/replay.py +0 -74
hud/telemetry/tests/test_replay.py +0 -40
hud/telemetry/tests/test_trace.py +0 -63
hud/telemetry/trace.py +0 -158
hud/utils/agent_factories.py +0 -86
hud/utils/async_utils.py +0 -65
hud/utils/group_eval.py +0 -223
hud/utils/progress.py +0 -149
hud/utils/tasks.py +0 -127
hud/utils/tests/test_async_utils.py +0 -173
hud/utils/tests/test_progress.py +0 -261
hud_python-0.4.45.dist-info/METADATA +0 -552
hud_python-0.4.45.dist-info/RECORD +0 -228
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/entry_points.txt +0 -0
{hud_python-0.4.45.dist-info → hud_python-0.5.13.dist-info}/licenses/LICENSE +0 -0

hud/telemetry/job.py DELETED Viewed

@@ -1,352 +0,0 @@
-"""Job management for HUD SDK.
-This module provides APIs for managing jobs - logical groupings of related tasks.
-Jobs can be used to track experiments, batch processing, training runs, etc.
-"""
-from __future__ import annotations
-import asyncio
-import logging
-import uuid
-from contextlib import contextmanager
-from datetime import UTC, datetime
-from functools import wraps
-from typing import TYPE_CHECKING, Any
-from hud.settings import settings
-from hud.shared import make_request, make_request_sync
-if TYPE_CHECKING:
-    from collections.abc import Callable, Generator
-logger = logging.getLogger(__name__)
-class Job:
-    """A job represents a collection of related tasks."""
-    def __init__(
-        self,
-        job_id: str,
-        name: str,
-        metadata: dict[str, Any] | None = None,
-        dataset_link: str | None = None,
-    ) -> None:
-        self.id = job_id
-        self.name = name
-        self.metadata = metadata or {}
-        self.dataset_link = dataset_link
-        self.status = "created"
-        self.created_at = datetime.now(UTC)
-        self.tasks: list[str] = []
-    def add_task(self, task_id: str) -> None:
-        """Associate a task with this job."""
-        self.tasks.append(task_id)
-    async def update_status(self, status: str) -> None:
-        """Update job status on the server."""
-        self.status = status
-        if settings.telemetry_enabled:
-            try:
-                payload = {
-                    "name": self.name,
-                    "status": status,
-                    "metadata": self.metadata,
-                }
-                if self.dataset_link:
-                    payload["dataset_link"] = self.dataset_link
-                await make_request(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/jobs/{self.id}/status",
-                    json=payload,
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to update job status: %s", e)
-    def update_status_sync(self, status: str) -> None:
-        """Synchronously update job status on the server."""
-        self.status = status
-        if settings.telemetry_enabled:
-            try:
-                payload = {
-                    "name": self.name,
-                    "status": status,
-                    "metadata": self.metadata,
-                }
-                if self.dataset_link:
-                    payload["dataset_link"] = self.dataset_link
-                make_request_sync(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/jobs/{self.id}/status",
-                    json=payload,
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to update job status: %s", e)
-    async def log(self, metrics: dict[str, Any]) -> None:
-        """Log metrics to the job.
-        Args:
-            metrics: Dictionary of metric name to value pairs
-        Example:
-            await job.log({"loss": 0.5, "accuracy": 0.95, "epoch": 1})
-        """
-        if settings.telemetry_enabled:
-            try:
-                await make_request(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/jobs/{self.id}/log",
-                    json={"metrics": metrics, "timestamp": datetime.now(UTC).isoformat()},
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to log metrics to job: %s", e)
-    def log_sync(self, metrics: dict[str, Any]) -> None:
-        """Synchronously log metrics to the job.
-        Args:
-            metrics: Dictionary of metric name to value pairs
-        Example:
-            job.log_sync({"loss": 0.5, "accuracy": 0.95, "epoch": 1})
-        """
-        if settings.telemetry_enabled:
-            try:
-                make_request_sync(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/jobs/{self.id}/log",
-                    json={"metrics": metrics, "timestamp": datetime.now(UTC).isoformat()},
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to log metrics to job: %s", e)
-    def __repr__(self) -> str:
-        return f"Job(id={self.id!r}, name={self.name!r}, status={self.status!r})"
-# Global job registry for the decorator pattern
-_current_job: Job | None = None
-def _print_job_url(job_id: str, job_name: str) -> None:
-    """Print the job URL in a colorful box."""
-    # Only print HUD URL if HUD telemetry is enabled and has API key
-    if not (settings.telemetry_enabled and settings.api_key):
-        return
-    url = f"https://hud.so/jobs/{job_id}"
-    header = f"🚀 Job '{job_name}' started:"
-    # ANSI color codes
-    DIM = "\033[90m"  # Dim/Gray for border
-    GOLD = "\033[33m"  # Gold/Yellow for URL
-    RESET = "\033[0m"
-    BOLD = "\033[1m"
-    # Calculate box width based on the longest line
-    box_width = max(len(url), len(header)) + 6
-    # Box drawing characters
-    top_border = "╔" + "═" * (box_width - 2) + "╗"
-    bottom_border = "╚" + "═" * (box_width - 2) + "╝"
-    divider = "╟" + "─" * (box_width - 2) + "╢"
-    # Center the content
-    header_padding = (box_width - len(header) - 2) // 2
-    url_padding = (box_width - len(url) - 2) // 2
-    # Print the box
-    print(f"\n{DIM}{top_border}{RESET}")  # noqa: T201
-    print(  # noqa: T201
-        f"{DIM}║{RESET}{' ' * header_padding}{header}{' ' * (box_width - len(header) - header_padding - 3)}{DIM}║{RESET}"  # noqa: E501
-    )
-    print(f"{DIM}{divider}{RESET}")  # noqa: T201
-    print(  # noqa: T201
-        f"{DIM}║{RESET}{' ' * url_padding}{BOLD}{GOLD}{url}{RESET}{' ' * (box_width - len(url) - url_padding - 2)}{DIM}║{RESET}"  # noqa: E501
-    )
-    print(f"{DIM}{bottom_border}{RESET}\n")  # noqa: T201
-def _print_job_complete_url(job_id: str, job_name: str, error_occurred: bool = False) -> None:
-    """Print the job completion URL with appropriate messaging."""
-    # Only print HUD URL if HUD telemetry is enabled and has API key
-    if not (settings.telemetry_enabled and settings.api_key):
-        return
-    url = f"https://hud.so/jobs/{job_id}"
-    # ANSI color codes
-    GREEN = "\033[92m"
-    RED = "\033[91m"
-    GOLD = "\033[33m"
-    RESET = "\033[0m"
-    DIM = "\033[2m"
-    BOLD = "\033[1m"
-    if error_occurred:
-        print(  # noqa: T201
-            f"\n{RED}✗ Job '{job_name}' failed!{RESET} {DIM}View details at:{RESET} {BOLD}{GOLD}{url}{RESET}\n"  # noqa: E501
-        )
-    else:
-        print(  # noqa: T201
-            f"\n{GREEN}✓ Job '{job_name}' complete!{RESET} {DIM}View all results at:{RESET} {BOLD}{GOLD}{url}{RESET}\n"  # noqa: E501
-        )
-def get_current_job() -> Job | None:
-    """Get the currently active job, if any."""
-    return _current_job
-@contextmanager
-def job(
-    name: str,
-    metadata: dict[str, Any] | None = None,
-    job_id: str | None = None,
-    dataset_link: str | None = None,
-) -> Generator[Job, None, None]:
-    """Context manager for job tracking.
-    Groups related tasks together under a single job for tracking and organization.
-    Args:
-        name: Human-readable job name
-        metadata: Optional metadata dictionary
-        job_id: Optional job ID (auto-generated if not provided)
-        dataset_link: Optional HuggingFace dataset identifier (e.g. "hud-evals/SheetBench-50")
-    Yields:
-        Job: The job object
-    Example:
-        with hud.job("training_run", {"model": "gpt-4"}) as job:
-            for epoch in range(10):
-                with hud.trace(f"epoch_{epoch}", job_id=job.id):
-                    train_epoch()
-    """
-    global _current_job
-    if not job_id:
-        job_id = str(uuid.uuid4())
-    job_obj = Job(job_id, name, metadata, dataset_link)
-    # Set as current job
-    old_job = _current_job
-    _current_job = job_obj
-    try:
-        # Update status to running synchronously to ensure job is registered before tasks start
-        job_obj.update_status_sync("running")
-        # Print the nice job URL box
-        _print_job_url(job_obj.id, job_obj.name)
-        yield job_obj
-        # Update status to completed synchronously to ensure it completes before process exit
-        job_obj.update_status_sync("completed")
-        # Print job completion message
-        _print_job_complete_url(job_obj.id, job_obj.name, error_occurred=False)
-    except Exception:
-        # Update status to failed synchronously to ensure it completes before process exit
-        job_obj.update_status_sync("failed")
-        # Print job failure message
-        _print_job_complete_url(job_obj.id, job_obj.name, error_occurred=True)
-        raise
-    finally:
-        _current_job = old_job
-def create_job(
-    name: str,
-    metadata: dict[str, Any] | None = None,
-    dataset_link: str | None = None,
-    job_id: str | None = None,
-) -> Job:
-    """Create a job without using context manager.
-    Useful when you need explicit control over job lifecycle.
-    Args:
-        name: Human-readable job name
-        metadata: Optional metadata dictionary
-        dataset_link: Optional HuggingFace dataset identifier (e.g. "hud-evals/SheetBench-50")
-        job_id: Optional job ID (auto-generated if not provided)
-    Returns:
-        Job: The created job object
-    Example:
-        job = hud.create_job("data_processing")
-        try:
-            for item in items:
-                with hud.trace(f"process_{item.id}", job_id=job.id):
-                    process(item)
-        finally:
-            await job.update_status("completed")
-    """
-    job_id = job_id or str(uuid.uuid4())
-    return Job(job_id, name, metadata, dataset_link)
-def job_decorator(name: str | None = None, **metadata: Any) -> Callable:
-    """Decorator for functions that should be tracked as jobs.
-    Args:
-        name: Job name (defaults to function name)
-        **metadata: Additional metadata for the job
-    Example:
-        @hud.job_decorator("model_training", model="gpt-4", dataset="v2")
-        async def train_model(config):
-            # This entire function execution is tracked as a job
-            await model.train(config)
-            return model.evaluate()
-    """
-    def decorator(func: Callable) -> Callable:
-        job_name = name or func.__name__
-        @wraps(func)
-        async def async_wrapper(*args: Any, **kwargs: Any) -> Any:
-            with job(job_name, metadata) as job_obj:
-                # Store job ID in function for access
-                func._current_job_id = job_obj.id
-                try:
-                    return await func(*args, **kwargs)
-                finally:
-                    delattr(func, "_current_job_id")
-        @wraps(func)
-        def sync_wrapper(*args: Any, **kwargs: Any) -> Any:
-            with job(job_name, metadata) as job_obj:
-                # Store job ID in function for access
-                func._current_job_id = job_obj.id
-                try:
-                    return func(*args, **kwargs)
-                finally:
-                    delattr(func, "_current_job_id")
-        # Return appropriate wrapper based on function type
-        if asyncio.iscoroutinefunction(func):
-            return async_wrapper
-        else:
-            return sync_wrapper
-    return decorator
-# Convenience exports
-__all__ = [
-    "Job",
-    "create_job",
-    "get_current_job",
-    "job",
-    "job_decorator",
-]

hud/telemetry/replay.py DELETED Viewed

@@ -1,74 +0,0 @@
-"""Trace retrieval and replay functionality.
-This module provides APIs to retrieve collected traces for analysis,
-debugging, and replay purposes.
-"""
-from __future__ import annotations
-from typing import TYPE_CHECKING
-from hud.otel.collector import clear_trace as _clear_trace
-from hud.otel.collector import get_trace as _get_trace
-if TYPE_CHECKING:
-    from hud.types import Trace
-__all__ = ["clear_trace", "get_trace"]
-def get_trace(task_run_id: str) -> Trace | None:
-    """Retrieve the collected trace for a task run.
-    Returns None if trace collection was disabled or the trace doesn't exist.
-    Args:
-        task_run_id: The task run ID to retrieve the trace for
-    Returns:
-        Trace object containing all collected steps, or None if not found
-    Usage:
-        import hud
-        # Run agent with tracing
-        with hud.trace() as task_run_id:
-            agent = MyAgent()
-            result = await agent.run("solve task")
-        # Get the trace for analysis
-        trace = hud.get_trace(task_run_id)
-        if trace:
-            print(f"Collected {len(trace.trace)} steps")
-            # Analyze agent vs MCP steps
-            agent_steps = [s for s in trace.trace if s.category == "agent"]
-            mcp_steps = [s for s in trace.trace if s.category == "mcp"]
-            print(f"Agent steps: {len(agent_steps)}")
-            print(f"MCP steps: {len(mcp_steps)}")
-            # Replay or analyze individual steps
-            for step in trace.trace:
-                if step.category == "agent" and step.result:
-                    print(f"Agent: {step.result.get('content') if isinstance(step.result, dict) else step.result}")
-                if step.category == "mcp" and step.request:
-                    print(f"MCP: {step.request.method if hasattr(step.request, 'method') else step.request}")
-    """  # noqa: E501
-    return _get_trace(task_run_id)
-def clear_trace(task_run_id: str) -> None:
-    """Clear the collected trace for a task run ID.
-    Useful for cleaning up memory after processing large traces.
-    Args:
-        task_run_id: The task run ID to clear the trace for
-    Usage:
-        trace = hud.get_trace(task_run_id)
-        # Process trace...
-        hud.clear_trace(task_run_id)  # Free memory
-    """
-    _clear_trace(task_run_id)

hud/telemetry/tests/test_replay.py DELETED Viewed

@@ -1,40 +0,0 @@
-"""Tests for telemetry replay functionality."""
-from __future__ import annotations
-from unittest.mock import patch
-from hud.telemetry.replay import clear_trace, get_trace
-class TestReplayAPI:
-    """Tests for replay API functions."""
-    def test_get_trace_calls_internal(self):
-        """Test that get_trace calls the internal _get_trace function."""
-        with patch("hud.telemetry.replay._get_trace") as mock_get:
-            mock_get.return_value = None
-            result = get_trace("test-task-id")
-            mock_get.assert_called_once_with("test-task-id")
-            assert result is None
-    def test_clear_trace_calls_internal(self):
-        """Test that clear_trace calls the internal _clear_trace function."""
-        with patch("hud.telemetry.replay._clear_trace") as mock_clear:
-            clear_trace("test-task-id")
-            mock_clear.assert_called_once_with("test-task-id")
-    def test_get_trace_with_data(self):
-        """Test get_trace with mock data."""
-        mock_trace = {"trace": [{"step": 1}], "task_run_id": "test-123"}
-        with patch("hud.telemetry.replay._get_trace") as mock_get:
-            mock_get.return_value = mock_trace
-            result = get_trace("test-123")
-            assert result == mock_trace
-            mock_get.assert_called_once_with("test-123")

hud/telemetry/tests/test_trace.py DELETED Viewed

@@ -1,63 +0,0 @@
-"""Tests for telemetry trace functionality."""
-from __future__ import annotations
-from unittest.mock import patch
-from hud.telemetry.trace import trace
-class TestTraceAPI:
-    """Tests for trace API function."""
-    def test_trace_with_disabled_telemetry_and_no_api_key(self):
-        """Test trace behavior when telemetry is disabled and no API key."""
-        # Mock settings to disable telemetry and remove API key
-        mock_settings = type("Settings", (), {"telemetry_enabled": False, "api_key": None})()
-        with (
-            patch("hud.settings.get_settings", return_value=mock_settings),
-            patch("hud.telemetry.trace.OtelTrace") as mock_otel_trace,
-        ):
-            mock_otel_trace.return_value.__enter__.return_value = "custom-otlp-trace"
-            with trace("test-trace") as task_run_id:
-                # Should use placeholder ID for custom backends
-                assert task_run_id.id == "custom-otlp-trace"
-    def test_trace_with_enabled_telemetry_and_api_key(self):
-        """Test trace behavior when telemetry is enabled with API key."""
-        mock_settings = type("Settings", (), {"telemetry_enabled": True, "api_key": "test-key"})()
-        with (
-            patch("hud.settings.get_settings", return_value=mock_settings),
-            patch("hud.telemetry.trace.OtelTrace") as mock_otel_trace,
-            patch("hud.telemetry.trace.uuid.uuid4") as mock_uuid,
-        ):
-            mock_uuid.return_value = "mock-uuid-123"
-            mock_otel_trace.return_value.__enter__.return_value = "mock-uuid-123"
-            with trace("test-trace") as task_run_id:
-                # Should use generated UUID
-                assert task_run_id.id == "mock-uuid-123"
-    def test_trace_with_no_api_key(self):
-        """Test trace behavior with no API key (custom backend scenario)."""
-        mock_settings = type(
-            "Settings",
-            (),
-            {
-                "telemetry_enabled": True,  # Enabled but no API key
-                "api_key": None,
-            },
-        )()
-        with (
-            patch("hud.settings.get_settings", return_value=mock_settings),
-            patch("hud.telemetry.trace.OtelTrace") as mock_otel_trace,
-        ):
-            mock_otel_trace.return_value.__enter__.return_value = "custom-otlp-trace"
-            with trace("test-trace") as task_run_id:
-                # Should use custom backend placeholder
-                assert task_run_id.id == "custom-otlp-trace"

hud/telemetry/trace.py DELETED Viewed

@@ -1,158 +0,0 @@
-"""User-facing trace context manager for HUD telemetry.
-This module provides the simple trace() API that users interact with.
-The actual OpenTelemetry implementation is in hud.otel.
-"""
-from __future__ import annotations
-import logging
-import uuid
-from contextlib import contextmanager
-from datetime import UTC, datetime
-from typing import TYPE_CHECKING, Any
-from hud.otel import configure_telemetry
-from hud.otel import trace as OtelTrace
-from hud.settings import settings
-from hud.shared import make_request, make_request_sync
-if TYPE_CHECKING:
-    from collections.abc import Generator
-logger = logging.getLogger(__name__)
-__all__ = ["Trace", "trace"]
-class Trace:
-    """A trace represents a single task execution with telemetry."""
-    def __init__(
-        self,
-        trace_id: str,
-        name: str,
-        job_id: str | None = None,
-        task_id: str | None = None,
-    ) -> None:
-        self.id = trace_id
-        self.name = name
-        self.job_id = job_id
-        self.task_id = task_id
-        self.created_at = datetime.now(UTC)
-    async def log(self, metrics: dict[str, Any]) -> None:
-        """Log metrics to this trace.
-        Args:
-            metrics: Dictionary of metric name to value pairs
-        Example:
-            await trace.log({"step": 1, "loss": 0.5, "accuracy": 0.92})
-        """
-        if settings.telemetry_enabled:
-            try:
-                await make_request(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/traces/{self.id}/log",
-                    json={"metrics": metrics, "timestamp": datetime.now(UTC).isoformat()},
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to log metrics to trace: %s", e)
-    def log_sync(self, metrics: dict[str, Any]) -> None:
-        """Synchronously log metrics to this trace.
-        Args:
-            metrics: Dictionary of metric name to value pairs
-        Example:
-            trace.log_sync({"step": 1, "loss": 0.5, "accuracy": 0.92})
-        """
-        if settings.telemetry_enabled:
-            try:
-                make_request_sync(
-                    method="POST",
-                    url=f"{settings.hud_telemetry_url}/traces/{self.id}/log",
-                    json={"metrics": metrics, "timestamp": datetime.now(UTC).isoformat()},
-                    api_key=settings.api_key,
-                )
-            except Exception as e:
-                logger.warning("Failed to log metrics to trace: %s", e)
-    def __repr__(self) -> str:
-        return f"Trace(id={self.id!r}, name={self.name!r})"
-@contextmanager
-def trace(
-    name: str = "Test task from hud",
-    *,
-    root: bool = True,
-    attrs: dict[str, Any] | None = None,
-    job_id: str | None = None,
-    task_id: str | None = None,
-) -> Generator[Trace, None, None]:
-    """Start a HUD trace context.
-    A unique task_run_id is automatically generated for each trace.
-    Args:
-        name: Descriptive name for this trace/task
-        root: Whether this is a root trace (updates task status)
-        attrs: Additional attributes to attach to the trace
-        job_id: Optional job ID to associate with this trace
-        task_id: Optional task ID (for custom task identifiers)
-    Yields:
-        Trace: The trace object with logging capabilities
-    Usage:
-        import hud
-        # Basic usage
-        with hud.trace("My Task") as trace:
-            # Your code here
-            trace.log_sync({"step": 1, "progress": 0.5})
-        # Async logging
-        async with hud.trace("Async Task") as trace:
-            await trace.log({"loss": 0.23, "accuracy": 0.95})
-        # With job association
-        with hud.job("Training Run") as job:
-            with hud.trace("Epoch 1", job_id=job.id) as trace:
-                trace.log_sync({"epoch": 1, "loss": 0.5})
-    """
-    # Ensure telemetry is configured
-    configure_telemetry()
-    # Only generate task_run_id if using HUD backend
-    # For custom OTLP backends, we don't need it
-    from hud.settings import get_settings
-    settings = get_settings()
-    if settings.telemetry_enabled and settings.api_key:
-        task_run_id = str(uuid.uuid4())
-    else:
-        # Use a placeholder for custom backends
-        logger.warning(
-            "HUD API key is not set, using a placeholder for the task run ID. If this looks wrong, check your API key." # noqa: E501
-        )
-        task_run_id = str(uuid.uuid4())
-    # Create trace object
-    trace_obj = Trace(task_run_id, name, job_id, task_id)
-    # Delegate to OpenTelemetry implementation
-    with OtelTrace(
-        task_run_id,
-        is_root=root,
-        span_name=name,
-        attributes=attrs or {},
-        job_id=job_id,
-        task_id=task_id,
-    ):
-        yield trace_obj

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl

hud-python 0.4.45__py3-none-any.whl → 0.5.13__py3-none-any.whl