humalab 0.0.5__py3-none-any.whl → 0.0.7__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of humalab might be problematic.
- humalab/__init__.py +25 -0
- humalab/assets/__init__.py +8 -2
- humalab/assets/files/resource_file.py +96 -6
- humalab/assets/files/urdf_file.py +49 -11
- humalab/assets/resource_operator.py +139 -0
- humalab/constants.py +48 -5
- humalab/dists/__init__.py +7 -0
- humalab/dists/bernoulli.py +26 -1
- humalab/dists/categorical.py +25 -0
- humalab/dists/discrete.py +27 -2
- humalab/dists/distribution.py +11 -0
- humalab/dists/gaussian.py +27 -2
- humalab/dists/log_uniform.py +29 -3
- humalab/dists/truncated_gaussian.py +33 -4
- humalab/dists/uniform.py +24 -0
- humalab/episode.py +291 -11
- humalab/humalab.py +93 -38
- humalab/humalab_api_client.py +297 -95
- humalab/humalab_config.py +49 -0
- humalab/humalab_test.py +46 -17
- humalab/metrics/__init__.py +11 -5
- humalab/metrics/code.py +59 -0
- humalab/metrics/metric.py +69 -102
- humalab/metrics/scenario_stats.py +163 -0
- humalab/metrics/summary.py +45 -24
- humalab/run.py +224 -101
- humalab/scenarios/__init__.py +11 -0
- humalab/{scenario.py → scenarios/scenario.py} +130 -136
- humalab/scenarios/scenario_operator.py +114 -0
- humalab/{scenario_test.py → scenarios/scenario_test.py} +150 -269
- humalab/utils.py +37 -0
- {humalab-0.0.5.dist-info → humalab-0.0.7.dist-info}/METADATA +1 -1
- humalab-0.0.7.dist-info/RECORD +39 -0
- humalab/assets/resource_manager.py +0 -58
- humalab/evaluators/__init__.py +0 -16
- humalab/humalab_main.py +0 -119
- humalab/metrics/dist_metric.py +0 -22
- humalab-0.0.5.dist-info/RECORD +0 -37
- {humalab-0.0.5.dist-info → humalab-0.0.7.dist-info}/WHEEL +0 -0
- {humalab-0.0.5.dist-info → humalab-0.0.7.dist-info}/entry_points.txt +0 -0
- {humalab-0.0.5.dist-info → humalab-0.0.7.dist-info}/licenses/LICENSE +0 -0
- {humalab-0.0.5.dist-info → humalab-0.0.7.dist-info}/top_level.txt +0 -0
humalab/metrics/scenario_stats.py
ADDED
@@ -0,0 +1,163 @@
+from humalab.metrics.metric import Metrics
+from humalab.constants import ArtifactType, GraphType, MetricDimType
+from humalab.humalab_api_client import EpisodeStatus
+from typing import Any
+
+
+SCENARIO_STATS_NEED_FLATTEN = {
+    "uniform_1d",
+    "bernoulli_1d",
+    "categorical_1d",
+    "discrete_1d",
+    "log_uniform_1d",
+    "gaussian_1d",
+    "truncated_gaussian_1d"
+}
+
+
+DISTRIBUTION_GRAPH_TYPE = {
+    # 0D distributions
+    "uniform": GraphType.HISTOGRAM,
+    "bernoulli": GraphType.BAR,
+    "categorical": GraphType.BAR,
+    "discrete": GraphType.BAR,
+    "log_uniform": GraphType.HISTOGRAM,
+    "gaussian": GraphType.GAUSSIAN,
+    "truncated_gaussian": GraphType.GAUSSIAN,
+
+    # 1D distributions
+    "uniform_1d": GraphType.HISTOGRAM,
+    "bernoulli_1d": GraphType.BAR,
+    "categorical_1d": GraphType.BAR,
+    "discrete_1d": GraphType.BAR,
+    "log_uniform_1d": GraphType.HISTOGRAM,
+    "gaussian_1d": GraphType.GAUSSIAN,
+    "truncated_gaussian_1d": GraphType.GAUSSIAN,
+
+    # 2D distributions
+    "uniform_2d": GraphType.SCATTER,
+    "gaussian_2d": GraphType.HEATMAP,
+    "truncated_gaussian_2d": GraphType.HEATMAP,
+
+    # 3D distributions
+    "uniform_3d": GraphType.THREE_D_MAP,
+    "gaussian_3d": GraphType.THREE_D_MAP,
+    "truncated_gaussian_3d": GraphType.THREE_D_MAP,
+}
+
+class ScenarioStats(Metrics):
+    """Metric to track scenario statistics across episodes.
+
+    This class logs sampled values from scenario distributions and tracks episode
+    statuses. It supports various distribution types and automatically handles
+    flattening for 1D distributions.
+
+    Attributes:
+        name (str): The name of the scenario statistic.
+        distribution_type (str): The type of distribution (e.g., 'uniform', 'gaussian').
+        artifact_type (ArtifactType): The artifact type, always SCENARIO_STATS.
+    """
+
+    def __init__(self,
+                 name: str,
+                 distribution_type: str,
+                 ) -> None:
+        super().__init__(
+            graph_type=DISTRIBUTION_GRAPH_TYPE[distribution_type]
+        )
+        self._name = name
+        self._distribution_type = distribution_type
+        self._artifact_type = ArtifactType.SCENARIO_STATS
+        self._values = {}
+        self._results = {}
+
+    @property
+    def name(self) -> str:
+        """The name of the scenario statistic.
+
+        Returns:
+            str: The statistic name.
+        """
+        return self._name
+
+    @property
+    def distribution_type(self) -> str:
+        """The type of distribution used for this statistic.
+
+        Returns:
+            str: The distribution type (e.g., 'uniform', 'gaussian').
+        """
+        return self._distribution_type
+
+    @property
+    def artifact_type(self) -> ArtifactType:
+        """The artifact type, always SCENARIO_STATS.
+
+        Returns:
+            ArtifactType: The artifact type.
+        """
+        return self._artifact_type
+
+    def log(self, data: Any, x: Any = None, replace: bool = False) -> None:
+        """Log a sampled value from the scenario distribution.
+
+        Args:
+            data (Any): The sampled value to log.
+            x (Any | None): The key/identifier for this sample (typically episode_id).
+                If None, auto-incrementing step is used.
+            replace (bool): Whether to replace an existing value. Defaults to False.
+
+        Raises:
+            ValueError: If data for the given x already exists and replace is False.
+        """
+        if x in self._values:
+            if replace:
+                if self._distribution_type in SCENARIO_STATS_NEED_FLATTEN:
+                    data = data[0]
+                self._values[x] = data
+            else:
+                raise ValueError(f"Data for episode_id {x} already exists. Use replace=True to overwrite.")
+        else:
+            if self._distribution_type in SCENARIO_STATS_NEED_FLATTEN:
+                data = data[0]
+            self._values[x] = data
+
+    def log_status(self,
+                   episode_id: str,
+                   episode_status: EpisodeStatus,
+                   replace: bool = False) -> None:
+        """Log the status of an episode.
+
+        Args:
+            episode_id (str): The unique identifier of the episode.
+            episode_status (EpisodeStatus): The status of the episode.
+            replace (bool): Whether to replace an existing status for this episode.
+                Defaults to False.
+
+        Raises:
+            ValueError: If status for the episode_id already exists and replace is False.
+        """
+        if episode_id in self._results:
+            if replace:
+                self._results[episode_id] = episode_status.value
+            else:
+                raise ValueError(f"Data for episode_id {episode_id} already exists. Use replace=True to overwrite.")
+        else:
+            self._results[episode_id] = episode_status.value
+
+    def _finalize(self) -> dict:
+        """Finalize and return all collected scenario statistics.
+
+        Returns:
+            dict: Dictionary containing values, results, and distribution type.
+        """
+        ret_val = {
+            "values": self._values,
+            "results": self._results,
+            "distribution_type": self._distribution_type,
+        }
+        self._values = {}
+        self._results = {}
+        return ret_val
+
+
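For orientation, here is a small usage sketch of the new ScenarioStats metric. It is not an official example: it assumes humalab 0.0.7 is installed, that the Metrics base class exposes a public finalize() wrapper around _finalize() (run.py below calls value.finalize()), and it uses one of the only two EpisodeStatus members visible in this diff.

```python
# Hypothetical usage sketch of ScenarioStats, under the assumptions stated above.
from humalab.metrics.scenario_stats import ScenarioStats
from humalab.humalab_api_client import EpisodeStatus

# A "*_1d" distribution sample arrives as a one-element sequence and is
# flattened to its scalar on log().
stat = ScenarioStats(name="table_height", distribution_type="uniform_1d")
stat.log(data=[0.72], x="episode-001")
stat.log(data=[0.68], x="episode-002")

# Logging the same x again requires replace=True, otherwise ValueError is raised.
stat.log(data=[0.70], x="episode-001", replace=True)

# Episode outcomes are tracked separately; only CANCELED and ERRORED appear in
# this diff, so CANCELED is used purely for illustration.
stat.log_status(episode_id="episode-002", episode_status=EpisodeStatus.CANCELED)

# finalize() (assumed public wrapper on the Metrics base class) returns
# {"values": {...}, "results": {...}, "distribution_type": "uniform_1d"}
# and resets the internal buffers.
payload = stat.finalize()
```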
humalab/metrics/summary.py
CHANGED
@@ -1,47 +1,65 @@
 
-from humalab.metrics.metric import
-from humalab.constants import
+from humalab.metrics.metric import Metrics
+from humalab.constants import MetricDimType, GraphType
 
 
 class Summary(Metrics):
-
-
+    """A metric that aggregates logged values into a single summary statistic.
+
+    Summary metrics collect values throughout a run or episode and compute a single
+    aggregated result. Supported aggregation methods include min, max, mean, first,
+    last, and none (no aggregation).
+
+    Attributes:
+        summary (str): The aggregation method used.
+    """
+    def __init__(self,
                  summary: str,
-                 episode_id: str,
-                 run_id: str,
-                 granularity: MetricGranularity = MetricGranularity.RUN,
                  ) -> None:
         """
         A summary metric that captures a single value per episode or run.
 
         Args:
-
-            summary (str | None): Specify aggregate metrics added to summary.
+            summary (str): Specify the aggregation method for the summary.
                 Supported aggregations include "min", "max", "mean", "last",
-                "first", and "none". "none" prevents a summary
-                from being generated.
-            granularity (MetricGranularity): The granularity of the metric.
+                "first", and "none". "none" prevents a summary from being generated.
         """
-        if granularity == MetricGranularity.RUN:
-            raise ValueError("Summary metrics cannot have RUN granularity.")
         if summary not in {"min", "max", "mean", "last", "first", "none"}:
             raise ValueError(f"Unsupported summary type: {summary}. Supported types are 'min', 'max', 'mean', 'last', 'first', and 'none'.")
-        super().__init__(
-        self.
+        super().__init__(graph_type=GraphType.NUMERIC)
+        self._summary = summary
+
+    @property
+    def summary(self) -> str:
+        """The aggregation method for this summary metric.
+
+        Returns:
+            str: The summary type (e.g., 'min', 'max', 'mean').
+        """
+        return self._summary
+
+    def _finalize(self) -> dict:
+        """Compute the final aggregated value.
 
-
+        Returns:
+            dict: Dictionary containing the aggregated value and summary type.
+        """
         if not self._values:
-            return
+            return {
+                "value": None,
+                "summary": self.summary
+            }
+        final_val = None
         # For summary metrics, we only keep the latest value
         if self.summary == "last":
-
+            final_val = self._values[-1]
         elif self.summary == "first":
-
+            final_val = self._values[0]
         elif self.summary == "none":
-
+            final_val = None
         elif self.summary in {"min", "max", "mean"}:
             if not self._values:
-
+                final_val = None
             else:
                 if self.summary == "min":
                     agg_value = min(self._values)
@@ -49,6 +67,9 @@ class Summary(Metrics):
                     agg_value = max(self._values)
                 elif self.summary == "mean":
                     agg_value = sum(self._values) / len(self._values)
-
+                final_val = agg_value
 
-
+        return {
+            "value": final_val,
+            "summary": self.summary
+        }
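A minimal sketch of the reworked Summary metric follows. It assumes the Metrics base class accumulates logged values in self._values and exposes log() and a public finalize(), which is inferred from the run.py diff below rather than shown here; episode_id, run_id, and granularity are no longer accepted by the constructor.

```python
# Hedged sketch of the new Summary constructor and aggregation, assuming the
# Metrics base class provides log() and a public finalize() wrapper.
from humalab.metrics.summary import Summary

loss = Summary(summary="mean")   # only the aggregation method is passed now
loss.log(0.91)
loss.log(0.85)
loss.log(0.80)

result = loss.finalize()
# -> {"value": 0.8533..., "summary": "mean"}

# Unsupported aggregation names fail fast in __init__:
# Summary(summary="median")  # raises ValueError
```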
humalab/run.py
CHANGED
@@ -1,19 +1,51 @@
 import uuid
-
-
-
+import traceback
+import pickle
+import base64
 
+from humalab.metrics.code import Code
 from humalab.metrics.summary import Summary
-
+
+from humalab.constants import DEFAULT_PROJECT, RESERVED_NAMES, ArtifactType
+from humalab.metrics.scenario_stats import ScenarioStats
+from humalab.humalab_api_client import EpisodeStatus, HumaLabApiClient, RunStatus
+from humalab.metrics.metric import Metrics
+from humalab.episode import Episode
+from humalab.utils import is_standard_type
+
+from humalab.scenarios.scenario import Scenario
 
 class Run:
+    """Represents a run containing multiple episodes for a scenario.
+
+    A Run is a context manager that tracks experiments or evaluations using a specific
+    scenario. It manages episode creation, metric logging, and code artifacts. The run
+    can contain multiple episodes, each representing a single execution instance.
+
+    Use as a context manager to automatically handle run lifecycle:
+        with Run(scenario=my_scenario) as run:
+            # Your code here
+            pass
+
+    Attributes:
+        project (str): The project name under which the run is created.
+        id (str): The unique identifier for the run.
+        name (str): The name of the run.
+        description (str): A description of the run.
+        tags (list[str]): A list of tags associated with the run.
+        scenario (Scenario): The scenario associated with the run.
+    """
     def __init__(self,
-                 project: str,
                  scenario: Scenario,
+                 project: str = DEFAULT_PROJECT,
                  name: str | None = None,
                  description: str | None = None,
                  id: str | None = None,
                  tags: list[str] | None = None,
+
+                 base_url: str | None = None,
+                 api_key: str | None = None,
+                 timeout: float | None = None,
                  ) -> None:
         """
         Initialize a new Run instance.
@@ -31,13 +63,16 @@ class Run:
         self._name = name or ""
         self._description = description or ""
         self._tags = tags or []
-        self._finished = False
-
-        self._episode = str(uuid.uuid4())
 
         self._scenario = scenario
+        self._logs = {}
+        self._episodes = {}
+        self._is_finished = False
+
+        self._api_client = HumaLabApiClient(base_url=base_url,
+                                            api_key=api_key,
+                                            timeout=timeout)
 
-        self._metrics = {}
 
     @property
     def project(self) -> str:
@@ -84,15 +119,6 @@ class Run:
         """
         return self._tags
 
-    @property
-    def episode(self) -> str:
-        """The episode ID for the run.
-
-        Returns:
-            str: The episode ID.
-        """
-        return self._episode
-
     @property
     def scenario(self) -> Scenario:
         """The scenario associated with the run.
@@ -101,102 +127,199 @@
             Scenario: The scenario instance.
         """
         return self._scenario
+
+    def __enter__(self):
+        """Enter the run context."""
+        return self
 
-    def
-
-
-
+    def __exit__(self, exception_type, exception_value, exception_traceback):
+        """Exit the run context and finalize the run."""
+        if self._is_finished:
+            return
+        if exception_type is not None:
+            err_msg = "".join(traceback.format_exception(exception_type, exception_value, exception_traceback))
+            self.finish(status=RunStatus.ERRORED, err_msg=err_msg)
+        else:
+            self.finish()
+
+    def create_episode(self, episode_id: str | None = None) -> Episode:
+        """Create a new episode for this run.
 
         Args:
-
-
+            episode_id (str | None): Optional unique identifier for the episode.
+                If None, a UUID is generated automatically.
+
+        Returns:
+            Episode: The newly created episode instance.
         """
-
-
-
-
+        episode = None
+        episode_id = episode_id or str(uuid.uuid4())
+        cur_scenario, episode_vals = self._scenario.resolve()
+        episode = Episode(run_id=self._id,
+                          episode_id=episode_id,
+                          scenario_conf=cur_scenario,
+                          episode_vals=episode_vals)
+        self._handle_scenario_stats(episode, episode_vals)
+
+        return episode
+
+    def _handle_scenario_stats(self, episode: Episode, episode_vals: dict) -> None:
+        for metric_name, value in episode_vals.items():
+            if metric_name not in self._logs:
+                stat = ScenarioStats(name=metric_name,
+                                     distribution_type=value["distribution"])
+                self._logs[metric_name] = stat
+            self._logs[metric_name].log(data=value["value"],
+                                        x=episode.episode_id)
+        self._episodes[episode.episode_id] = episode
 
-    def
-
-            step: int | None = None,
-            commit: bool = True,
-            ) -> None:
-        """Log metrics for the run.
+    def add_metric(self, name: str, metric: Metrics) -> None:
+        """Add a metric to track for this run.
 
         Args:
-
-
-
+            name (str): The name of the metric.
+            metric (Metrics): The metric instance to add.
+
+        Raises:
+            ValueError: If the name is already used.
         """
-
-
-
-            metric.log(value, step=step, commit=commit)
-        else:
-            self._metrics[key] = Metrics(key,
-                                         metric_type=MetricType.DEFAULT,
-                                         run_id=self._id,
-                                         granularity=MetricGranularity.EPISODE,
-                                         episode_id=self._episode)
-            self._metrics[key].log(value, step=step, commit=commit)
+        if name in self._logs:
+            raise ValueError(f"{name} is a reserved name and is not allowed.")
+        self._logs[name] = metric
 
-    def
-        """
+    def log_code(self, key: str, code_content: str) -> None:
+        """Log code content as an artifact.
 
         Args:
-
+            key (str): The key for the code artifact.
+            code_content (str): The code content to log.
         """
-
-
-        self.
-
-
-
-
-
-        # TODO: Implement submission of episode status
-        pass
-
-    def define_metric(self,
-                      name: str,
-                      metric_type: MetricType = MetricType.DEFAULT,
-                      granularity: MetricGranularity = MetricGranularity.RUN,
-                      distribution_type: str | None = None,
-                      summary: str | None = None,
-                      replace: bool = False) -> None:
-        """Define a new metric for the run.
+        if key in RESERVED_NAMES:
+            raise ValueError(f"{key} is a reserved name and is not allowed.")
+        self._logs[key] = Code(
+            run_id=self._id,
+            key=key,
+            code_content=code_content,
+        )
+
 
+    def log(self, data: dict, x: dict | None = None, replace: bool = False) -> None:
+        """Log data points or values for the run.
+
         Args:
-
-
-
-
-
-
-                "first", and "none". "none" prevents a summary
-                from being generated.
-            replace (bool): Whether to replace the metric if it already exists.
+            data (dict): Dictionary of key-value pairs to log.
+            x (dict | None): Optional dictionary of x-axis values for each key.
+            replace (bool): Whether to replace existing values. Defaults to False.
+
+        Raises:
+            ValueError: If a key is reserved or logging fails.
         """
-
-        if
-
-
-        self.
-                      distribution_type=distribution_type,
-                      run_id=self._id,
-                      episode_id=self._episode,
-                      granularity=granularity)
-        elif summary is not None:
-            self._metrics[name] = Summary(name=name,
-                                          summary=summary,
-                                          run_id=self._id,
-                                          episode_id=self._episode,
-                                          granularity=granularity)
+        for key, value in data.items():
+            if key in RESERVED_NAMES:
+                raise ValueError(f"{key} is a reserved name and is not allowed.")
+            if key not in self._logs:
+                self._logs[key] = value
             else:
-                self.
-
-
-
-
-
+                cur_val = self._logs[key]
+                if isinstance(cur_val, Metrics):
+                    cur_x = x.get(key) if x is not None else None
+                    cur_val.log(value, x=cur_x, replace=replace)
+                else:
+                    if replace:
+                        self._logs[key] = value
+                    else:
+                        raise ValueError(f"Cannot log value for key '{key}' as there is already a value logged.")
+    def _finish_episodes(self,
+                         status: RunStatus,
+                         err_msg: str | None = None) -> None:
+        for episode in self._episodes.values():
+            if not episode.is_finished:
+                if status == RunStatus.FINISHED:
+                    episode.finish(status=EpisodeStatus.CANCELED, err_msg=err_msg)
+                elif status == RunStatus.ERRORED:
+                    episode.finish(status=EpisodeStatus.ERRORED, err_msg=err_msg)
+                elif status == RunStatus.CANCELED:
+                    episode.finish(status=EpisodeStatus.CANCELED, err_msg=err_msg)
+
+
+    def finish(self,
+               status: RunStatus = RunStatus.FINISHED,
+               err_msg: str | None = None) -> None:
+        """Finish the run and submit final metrics.
+
+        Args:
+            status (RunStatus): The final status of the run.
+            err_msg (str | None): An optional error message.
+        """
+        if self._is_finished:
+            return
+        self._is_finished = True
+        self._finish_episodes(status=status, err_msg=err_msg)
+
+        self._api_client.upload_code(
+            artifact_key="scenario",
+            run_id=self._id,
+            code_content=self.scenario.yaml
+        )
+
+        self._api_client.upload_python(
+            artifact_key="seed",
+            run_id=self._id,
+            pickled_bytes=pickle.dumps(self.scenario.seed)
+        )
+        # TODO: submit final metrics
+        for key, value in self._logs.items():
+            if isinstance(value, ScenarioStats):
+                for episode_id, episode in self._episodes.items():
+                    episode_status = episode.status
+                    value.log_status(
+                        episode_id=episode_id,
+                        episode_status=episode_status
+                    )
+                metric_val = value.finalize()
+                pickled = pickle.dumps(metric_val)
+                self._api_client.upload_scenario_stats_artifact(
+                    artifact_key=key,
+                    run_id=self._id,
+                    pickled_bytes=pickled,
+                    graph_type=value.graph_type.value,
+                )
+            elif isinstance(value, Summary):
+                metric_val = value.finalize()
+                pickled = pickle.dumps(metric_val["value"])
+                self._api_client.upload_python(
+                    artifact_key=key,
+                    run_id=self._id,
+                    pickled_bytes=pickled
+                )
+            elif isinstance(value, Metrics):
+                metric_val = value.finalize()
+                pickled = pickle.dumps(metric_val)
+                self._api_client.upload_metrics(
+                    artifact_key=key,
+                    run_id=self._id,
+                    pickled_bytes=pickled,
+                    graph_type=value.graph_type.value,
+                )
+            elif isinstance(value, Code):
+                self._api_client.upload_code(
+                    artifact_key=value.key,
+                    run_id=value.run_id,
+                    episode_id=value.episode_id,
+                    code_content=value.code_content
+                )
+            else:
+                if not is_standard_type(value):
+                    raise ValueError(f"Value for key '{key}' is not a standard type.")
+                pickled = pickle.dumps(value)
+                self._api_client.upload_python(
+                    artifact_key=key,
+                    run_id=self._id,
+                    pickled_bytes=pickled
+                )
+
+        self._api_client.update_run(
+            run_id=self._id,
+            status=status,
+            err_msg=err_msg
+        )
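To show how the pieces fit together, here is a hedged end-to-end sketch of the new Run lifecycle. It assumes humalab 0.0.7 with a reachable HumaLab backend; the get_scenario() call and the no-argument Episode.finish() default are assumptions, since neither is fully specified in this diff.

```python
# Illustrative sketch only; scenario and episode details beyond this diff are assumed.
from humalab.run import Run
from humalab.scenarios import get_scenario

# get_scenario() is exported by the new scenarios package; its exact signature
# is not shown in this diff, so a name-based lookup is assumed here.
scenario = get_scenario("pick_and_place")

with Run(scenario=scenario, name="nightly-eval", tags=["ci"]) as run:
    # Arbitrary code artifacts are stored via log_code() and uploaded on finish().
    run.log_code("policy", open("policy.py").read())

    for _ in range(3):
        # create_episode() resolves the scenario, records the sampled values as
        # ScenarioStats, and registers the episode with the run.
        episode = run.create_episode()
        # ... execute the episode here ...
        episode.finish()  # assumed to default to a successful status

    # Plain values land in the run's logs and are pickled and uploaded on finish().
    run.log({"success_rate": 2 / 3})
# Leaving the context calls finish(): unfinished episodes are closed, artifacts
# (scenario YAML, seed, metrics, code) are uploaded, and the run status is updated.
```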
humalab/scenarios/__init__.py
ADDED
@@ -0,0 +1,11 @@
+"""Scenario management and configuration.
+
+This module provides the Scenario class and related utilities for managing scenario
+configurations with probabilistic distributions, supporting randomized scenario generation
+for robotics experiments.
+"""
+
+from .scenario import Scenario
+from .scenario_operator import list_scenarios, get_scenario
+
+__all__ = ["Scenario", "list_scenarios", "get_scenario"]
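Since humalab/scenario.py moved into the new scenarios package, imports change accordingly. The sketch below assumes list_scenarios() takes no required arguments and get_scenario() accepts a scenario identifier; neither signature is shown in this diff.

```python
# Hypothetical import-update sketch for the relocated scenario module.
from humalab.scenarios import Scenario, list_scenarios, get_scenario

# Old (0.0.5) style, now gone:
#   from humalab.scenario import Scenario

available = list(list_scenarios())   # assumed to return an iterable of identifiers
print(available)

if available:
    scenario = get_scenario(available[0])
    assert isinstance(scenario, Scenario)
```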