opentau-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108)
  1. opentau/__init__.py +179 -0
  2. opentau/__version__.py +24 -0
  3. opentau/configs/__init__.py +19 -0
  4. opentau/configs/default.py +297 -0
  5. opentau/configs/libero.py +113 -0
  6. opentau/configs/parser.py +393 -0
  7. opentau/configs/policies.py +297 -0
  8. opentau/configs/reward.py +42 -0
  9. opentau/configs/train.py +370 -0
  10. opentau/configs/types.py +76 -0
  11. opentau/constants.py +52 -0
  12. opentau/datasets/__init__.py +84 -0
  13. opentau/datasets/backward_compatibility.py +78 -0
  14. opentau/datasets/compute_stats.py +333 -0
  15. opentau/datasets/dataset_mixture.py +460 -0
  16. opentau/datasets/factory.py +232 -0
  17. opentau/datasets/grounding/__init__.py +67 -0
  18. opentau/datasets/grounding/base.py +154 -0
  19. opentau/datasets/grounding/clevr.py +110 -0
  20. opentau/datasets/grounding/cocoqa.py +130 -0
  21. opentau/datasets/grounding/dummy.py +101 -0
  22. opentau/datasets/grounding/pixmo.py +177 -0
  23. opentau/datasets/grounding/vsr.py +141 -0
  24. opentau/datasets/image_writer.py +304 -0
  25. opentau/datasets/lerobot_dataset.py +1910 -0
  26. opentau/datasets/online_buffer.py +442 -0
  27. opentau/datasets/push_dataset_to_hub/utils.py +132 -0
  28. opentau/datasets/sampler.py +99 -0
  29. opentau/datasets/standard_data_format_mapping.py +278 -0
  30. opentau/datasets/transforms.py +330 -0
  31. opentau/datasets/utils.py +1243 -0
  32. opentau/datasets/v2/batch_convert_dataset_v1_to_v2.py +887 -0
  33. opentau/datasets/v2/convert_dataset_v1_to_v2.py +829 -0
  34. opentau/datasets/v21/_remove_language_instruction.py +109 -0
  35. opentau/datasets/v21/batch_convert_dataset_v20_to_v21.py +60 -0
  36. opentau/datasets/v21/convert_dataset_v20_to_v21.py +183 -0
  37. opentau/datasets/v21/convert_stats.py +150 -0
  38. opentau/datasets/video_utils.py +597 -0
  39. opentau/envs/__init__.py +18 -0
  40. opentau/envs/configs.py +178 -0
  41. opentau/envs/factory.py +99 -0
  42. opentau/envs/libero.py +439 -0
  43. opentau/envs/utils.py +204 -0
  44. opentau/optim/__init__.py +16 -0
  45. opentau/optim/factory.py +43 -0
  46. opentau/optim/optimizers.py +121 -0
  47. opentau/optim/schedulers.py +140 -0
  48. opentau/planner/__init__.py +82 -0
  49. opentau/planner/high_level_planner.py +366 -0
  50. opentau/planner/utils/memory.py +64 -0
  51. opentau/planner/utils/utils.py +65 -0
  52. opentau/policies/__init__.py +24 -0
  53. opentau/policies/factory.py +172 -0
  54. opentau/policies/normalize.py +315 -0
  55. opentau/policies/pi0/__init__.py +19 -0
  56. opentau/policies/pi0/configuration_pi0.py +250 -0
  57. opentau/policies/pi0/modeling_pi0.py +994 -0
  58. opentau/policies/pi0/paligemma_with_expert.py +516 -0
  59. opentau/policies/pi05/__init__.py +20 -0
  60. opentau/policies/pi05/configuration_pi05.py +231 -0
  61. opentau/policies/pi05/modeling_pi05.py +1257 -0
  62. opentau/policies/pi05/paligemma_with_expert.py +572 -0
  63. opentau/policies/pretrained.py +315 -0
  64. opentau/policies/utils.py +123 -0
  65. opentau/policies/value/__init__.py +18 -0
  66. opentau/policies/value/configuration_value.py +170 -0
  67. opentau/policies/value/modeling_value.py +512 -0
  68. opentau/policies/value/reward.py +87 -0
  69. opentau/policies/value/siglip_gemma.py +221 -0
  70. opentau/scripts/actions_mse_loss.py +89 -0
  71. opentau/scripts/bin_to_safetensors.py +116 -0
  72. opentau/scripts/compute_max_token_length.py +111 -0
  73. opentau/scripts/display_sys_info.py +90 -0
  74. opentau/scripts/download_libero_benchmarks.py +54 -0
  75. opentau/scripts/eval.py +877 -0
  76. opentau/scripts/export_to_onnx.py +180 -0
  77. opentau/scripts/fake_tensor_training.py +87 -0
  78. opentau/scripts/get_advantage_and_percentiles.py +220 -0
  79. opentau/scripts/high_level_planner_inference.py +114 -0
  80. opentau/scripts/inference.py +70 -0
  81. opentau/scripts/launch_train.py +63 -0
  82. opentau/scripts/libero_simulation_parallel.py +356 -0
  83. opentau/scripts/libero_simulation_sequential.py +122 -0
  84. opentau/scripts/nav_high_level_planner_inference.py +61 -0
  85. opentau/scripts/train.py +379 -0
  86. opentau/scripts/visualize_dataset.py +294 -0
  87. opentau/scripts/visualize_dataset_html.py +507 -0
  88. opentau/scripts/zero_to_fp32.py +760 -0
  89. opentau/utils/__init__.py +20 -0
  90. opentau/utils/accelerate_utils.py +79 -0
  91. opentau/utils/benchmark.py +98 -0
  92. opentau/utils/fake_tensor.py +81 -0
  93. opentau/utils/hub.py +209 -0
  94. opentau/utils/import_utils.py +79 -0
  95. opentau/utils/io_utils.py +137 -0
  96. opentau/utils/libero.py +214 -0
  97. opentau/utils/libero_dataset_recorder.py +460 -0
  98. opentau/utils/logging_utils.py +180 -0
  99. opentau/utils/monkey_patch.py +278 -0
  100. opentau/utils/random_utils.py +244 -0
  101. opentau/utils/train_utils.py +198 -0
  102. opentau/utils/utils.py +471 -0
  103. opentau-0.1.0.dist-info/METADATA +161 -0
  104. opentau-0.1.0.dist-info/RECORD +108 -0
  105. opentau-0.1.0.dist-info/WHEEL +5 -0
  106. opentau-0.1.0.dist-info/entry_points.txt +2 -0
  107. opentau-0.1.0.dist-info/licenses/LICENSE +508 -0
  108. opentau-0.1.0.dist-info/top_level.txt +1 -0
opentau/__init__.py ADDED
@@ -0,0 +1,179 @@
+ #!/usr/bin/env python
+
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ """OpenTau package initialization and registry.
+
+ This module provides lightweight access to available environments, datasets, and policies
+ without importing heavy dependencies. It serves as the main entry point for discovering
+ what components are available in the OpenTau library.
+
+ The module maintains several key registries:
+ - `available_envs`: List of supported environment types (e.g., "aloha", "pusht")
+ - `available_tasks_per_env`: Mapping of environments to their available tasks
+ - `available_datasets_per_env`: Mapping of environments to their compatible datasets
+ - `available_real_world_datasets`: List of real-world robot datasets
+ - `available_grounding_datasets`: Registry for grounding datasets (populated via decorator)
+ - `available_policies`: List of available policy types (e.g., "pi0", "pi05", "value")
+ - `available_policies_per_env`: Mapping of environments to their compatible policies
+
+ Example:
+     ```python
+     import opentau
+     print(opentau.available_envs)
+     print(opentau.available_tasks_per_env)
+     print(opentau.available_datasets)
+     print(opentau.available_datasets_per_env)
+     print(opentau.available_real_world_datasets)
+     print(opentau.available_policies)
+     print(opentau.available_policies_per_env)
+     ```
+
+ When implementing a new dataset, follow these steps:
+ - Update `available_datasets_per_env` in `src/opentau/__init__.py`
+
+ When implementing a new environment (e.g., `gym_aloha`), follow these steps:
+ - Update `available_tasks_per_env` and `available_datasets_per_env` in `src/opentau/__init__.py`
+
+ When implementing a new policy class (e.g., `DiffusionPolicy`), follow these steps:
+ - Update `available_policies` and `available_policies_per_env` in `src/opentau/__init__.py`
+ - Set the required `name` class attribute
+ - Update variables in `tests/test_available.py` by importing your new Policy class
+ """
+
+ import itertools
+
+ from opentau.__version__ import __version__  # noqa: F401
+
+ # TODO(rcadene): Improve policies and envs. As of now, an item in `available_policies`
+ # refers to a yaml file AND a modeling name. Same for `available_envs` which refers to
+ # a yaml file AND an environment name. The difference should be more obvious.
+ available_tasks_per_env = {}
+ available_envs = list(available_tasks_per_env.keys())
+
+ available_datasets_per_env = {}
+
+ available_real_world_datasets = [
+     "lerobot/aloha_mobile_cabinet",
+     "lerobot/aloha_mobile_chair",
+     "lerobot/aloha_mobile_elevator",
+     "lerobot/aloha_mobile_shrimp",
+     "lerobot/aloha_mobile_wash_pan",
+     "lerobot/aloha_mobile_wipe_wine",
+     "lerobot/aloha_static_battery",
+     "lerobot/aloha_static_candy",
+     "lerobot/aloha_static_coffee",
+     "lerobot/aloha_static_coffee_new",
+     "lerobot/aloha_static_cups_open",
+     "lerobot/aloha_static_fork_pick_up",
+     "lerobot/aloha_static_pingpong_test",
+     "lerobot/aloha_static_pro_pencil",
+     "lerobot/aloha_static_screw_driver",
+     "lerobot/aloha_static_tape",
+     "lerobot/aloha_static_thread_velcro",
+     "lerobot/aloha_static_towel",
+     "lerobot/aloha_static_vinh_cup",
+     "lerobot/aloha_static_vinh_cup_left",
+     "lerobot/aloha_static_ziploc_slide",
+     "lerobot/umi_cup_in_the_wild",
+     "lerobot/unitreeh1_fold_clothes",
+     "lerobot/unitreeh1_rearrange_objects",
+     "lerobot/unitreeh1_two_robot_greeting",
+     "lerobot/unitreeh1_warehouse",
+     "lerobot/nyu_rot_dataset",
+     "lerobot/utokyo_saytap",
+     "lerobot/imperialcollege_sawyer_wrist_cam",
+     "lerobot/utokyo_xarm_bimanual",
+     "lerobot/tokyo_u_lsmo",
+     "lerobot/utokyo_pr2_opening_fridge",
+     "lerobot/cmu_franka_exploration_dataset",
+     "lerobot/cmu_stretch",
+     "lerobot/asu_table_top",
+     "lerobot/utokyo_pr2_tabletop_manipulation",
+     "lerobot/utokyo_xarm_pick_and_place",
+     "lerobot/ucsd_kitchen_dataset",
+     "lerobot/austin_buds_dataset",
+     "lerobot/dlr_sara_grid_clamp",
+     "lerobot/conq_hose_manipulation",
+     "lerobot/columbia_cairlab_pusht_real",
+     "lerobot/dlr_sara_pour",
+     "lerobot/dlr_edan_shared_control",
+     "lerobot/ucsd_pick_and_place_dataset",
+     "lerobot/berkeley_cable_routing",
+     "lerobot/nyu_franka_play_dataset",
+     "lerobot/austin_sirius_dataset",
+     "lerobot/cmu_play_fusion",
+     "lerobot/berkeley_gnm_sac_son",
+     "lerobot/nyu_door_opening_surprising_effectiveness",
+     "lerobot/berkeley_fanuc_manipulation",
+     "lerobot/jaco_play",
+     "lerobot/viola",
+     "lerobot/kaist_nonprehensile",
+     "lerobot/berkeley_mvp",
+     "lerobot/uiuc_d3field",
+     "lerobot/berkeley_gnm_recon",
+     "lerobot/austin_sailor_dataset",
+     "lerobot/utaustin_mutex",
+     "lerobot/roboturk",
+     "lerobot/stanford_hydra_dataset",
+     "lerobot/berkeley_autolab_ur5",
+     "lerobot/stanford_robocook",
+     "lerobot/toto",
+     "lerobot/fmb",
+     "lerobot/droid_100",
+     "lerobot/berkeley_rpt",
+     "lerobot/stanford_kuka_multimodal_dataset",
+     "lerobot/iamlab_cmu_pickup_insert",
+     "lerobot/taco_play",
+     "lerobot/berkeley_gnm_cory_hall",
+     "lerobot/usc_cloth_sim",
+ ]
+
+ available_grounding_datasets = {}
+
+ available_datasets = sorted(
+     set(itertools.chain(*available_datasets_per_env.values(), available_real_world_datasets))
+ )
+
+ # lists all available policies from `src/opentau/policies`
+ available_policies = ["pi0", "pi05", "value"]
+
+ # keys and values refer to yaml files
+ available_policies_per_env = {}
+
+ env_task_pairs = [(env, task) for env, tasks in available_tasks_per_env.items() for task in tasks]
+ env_dataset_pairs = [
+     (env, dataset) for env, datasets in available_datasets_per_env.items() for dataset in datasets
+ ]
+ env_dataset_policy_triplets = [
+     (env, dataset, policy)
+     for env, datasets in available_datasets_per_env.items()
+     for dataset in datasets
+     for policy in available_policies_per_env[env]
+ ]
+
+
+ def registry_factory(global_dict):
+     def register(name):
+         def decorator(cls):
+             global_dict[name] = cls
+             return cls
+
+         return decorator
+
+     return register
+
+
+ register_grounding_dataset = registry_factory(available_grounding_datasets)
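
The `registry_factory` helper above is a standard decorator-registry pattern. A minimal sketch of how a grounding dataset might register itself; the `MyGroundingDataset` class and the "my_grounding" key are hypothetical and only illustrate the mechanism (real grounding datasets live under `opentau/datasets/grounding/`):

```python
from opentau import available_grounding_datasets, register_grounding_dataset


# Hypothetical class used only to illustrate decorator-based registration.
@register_grounding_dataset("my_grounding")
class MyGroundingDataset:
    """Placeholder grounding dataset."""


# The decorator stored the class in the registry under the chosen name.
print(available_grounding_datasets)  # {'my_grounding': <class '...MyGroundingDataset'>}
```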
opentau/__version__.py ADDED
@@ -0,0 +1,24 @@
+ #!/usr/bin/env python
+
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ """To enable `opentau.__version__`"""
+
+ from importlib.metadata import PackageNotFoundError, version
+
+ try:
+     __version__ = version("opentau")
+ except PackageNotFoundError:
+     __version__ = "unknown"
opentau/configs/__init__.py ADDED
@@ -0,0 +1,19 @@
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
+ """Configuration module for OpenTau.
+
+ This module provides configuration classes and utilities for training pipelines,
+ datasets, policies, environments, and evaluation settings.
+ """
opentau/configs/default.py ADDED
@@ -0,0 +1,297 @@
+ #!/usr/bin/env python
+
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ """Default configuration classes for datasets, evaluation, and logging.
+
+ This module provides default configuration classes for:
+ - Dataset configuration and dataset mixtures
+ - Weights & Biases (wandb) logging configuration
+ - Evaluation settings and parameters
+ """
+
+ from dataclasses import dataclass, field
+
+ import draccus
+ import numpy as np
+ from draccus.parsers.encoding import encode_dataclass
+
+ from opentau import (
+     policies,  # noqa: F401
+ )
+ from opentau.datasets.standard_data_format_mapping import DATA_FEATURES_NAME_MAPPING, LOSS_TYPE_MAPPING
+ from opentau.datasets.transforms import ImageTransformsConfig
+ from opentau.datasets.video_utils import get_safe_default_codec
+
+ # --- Custom NumPy encoder registration ---
+ # For decoding from cmd/yaml
+ draccus.decode.register(np.ndarray, np.asarray)
+ # For encoding to yaml
+ draccus.encode.register(np.ndarray, lambda x: x.tolist())
+
+
+ @dataclass
+ class DatasetConfig:
+     """Configuration for a dataset.
+
+     You may provide a list of datasets here. `train.py` creates them all and
+     concatenates them. Note: only data keys common between the datasets are kept.
+     Each dataset gets an additional transform that inserts the "dataset_index"
+     into the returned item. The index mapping is made according to the order in
+     which the datasets are provided.
+
+     Args:
+         repo_id: HuggingFace repository ID for the dataset. Exactly one of
+             `repo_id` or `grounding` must be set.
+         grounding: Grounding dataset identifier. Exactly one of `repo_id` or
+             `grounding` must be set.
+         root: Root directory where the dataset will be stored (e.g. 'dataset/path').
+             Defaults to None.
+         episodes: List of episode indices to use from the dataset. If None, all
+             episodes are used. Defaults to None.
+         image_transforms: Configuration for image transformations. Defaults to
+             ImageTransformsConfig().
+         revision: Git revision of the dataset repository to use. Defaults to None.
+         use_imagenet_stats: Whether to use ImageNet statistics for normalization.
+             Defaults to True.
+         video_backend: Video codec backend to use. Defaults to a safe default codec.
+         stats: Dictionary of statistics for normalization, keyed by feature name.
+             Each value is a dictionary with 'mean' and 'std' arrays. Defaults to None.
+         data_features_name_mapping: Optional mapping from dataset feature names to
+             standard feature names. Must be provided together with `loss_type_mapping`.
+             Defaults to None.
+         loss_type_mapping: Optional loss type mapping for the dataset. Must be
+             provided together with `data_features_name_mapping`. Defaults to None.
+
+     Raises:
+         ValueError: If both or neither of `repo_id` and `grounding` are set, or
+             if only one of `data_features_name_mapping` and `loss_type_mapping`
+             is provided.
+     """
+
+     repo_id: str | None = None
+     grounding: str | None = None
+     # Root directory where the dataset will be stored (e.g. 'dataset/path').
+     root: str | None = None
+     episodes: list[int] | None = None
+     image_transforms: ImageTransformsConfig = field(default_factory=ImageTransformsConfig)
+     revision: str | None = None
+     use_imagenet_stats: bool = True
+     video_backend: str = field(default_factory=get_safe_default_codec)
+     stats: dict[str, dict[str, np.ndarray]] | None = None
+
+     # optional standard data format mapping for the dataset if mapping is not already in standard_data_format_mapping.py
+     data_features_name_mapping: dict[str, str] | None = None
+     loss_type_mapping: str | None = None
+
+     def __post_init__(self):
+         """Validate dataset configuration and register custom mappings if provided."""
+         if (self.repo_id is None) == (self.grounding is None):
+             raise ValueError("Exactly one of `repo_id` or `grounding` for Dataset config should be set.")
+
+         # data_features_name_mapping and loss_type_mapping have to be provided together
+         if (self.data_features_name_mapping is None) != (self.loss_type_mapping is None):
+             raise ValueError(
+                 "`data_features_name_mapping` and `loss_type_mapping` have to be provided together."
+             )
+
+         # add data_features_name_mapping and loss_type_mapping to standard_data_format_mapping.py if they are provided
+         if self.data_features_name_mapping is not None and self.loss_type_mapping is not None:
+             DATA_FEATURES_NAME_MAPPING[self.repo_id] = self.data_features_name_mapping
+             LOSS_TYPE_MAPPING[self.repo_id] = self.loss_type_mapping
+
+
+ @dataclass
+ class DatasetMixtureConfig:
+     """Configuration for a mixture of multiple datasets.
+
+     This configuration allows combining multiple datasets with specified weights
+     for training. The datasets are sampled according to their weights during
+     training, and features are resampled to a common action frequency.
+
+     Args:
+         datasets: List of dataset configs to be used in the mixture.
+         weights: List of weights for each dataset in the mixture. Must be the
+             same length as `datasets`. Defaults to empty list.
+         action_freq: Frequency at which actions from the dataset mixture are
+             resampled, in Hz. Defaults to 30.0.
+         image_resample_strategy: Resample strategy for image features. Must be
+             one of 'linear' or 'nearest'. Defaults to 'nearest'.
+         vector_resample_strategy: Resample strategy for non-image features, such
+             as action or state. Must be one of 'linear' or 'nearest'.
+             Defaults to 'nearest'.
+
+     Raises:
+         ValueError: If the length of `weights` doesn't match `datasets`, if
+             `action_freq` is not positive, or if resample strategies are invalid.
+     """
+
+     # List of dataset configs to be used in the mixture.
+     datasets: list[DatasetConfig] = field(default_factory=list)
+     # List of weights for each dataset in the mixture. Must be the same length as `datasets`.
+     weights: list[float] = field(default_factory=list)
+     # Frequency at which actions from the dataset mixture are resampled, in Hz.
+     action_freq: float = 30.0
+     # Resample strategy for image features
+     image_resample_strategy: str = "nearest"
+     # Resample strategy for non-image features, such as action or state
+     vector_resample_strategy: str = "nearest"
+
+     def __post_init__(self):
+         """Validate dataset mixture configuration."""
+         if len(self.datasets) != len(self.weights):
+             raise ValueError("The length of `weights` must match the length of `datasets`.")
+         if self.action_freq <= 0:
+             raise ValueError(f"`action_freq` must be a positive number, got {self.action_freq}.")
+         if self.image_resample_strategy not in ["linear", "nearest"]:
+             raise ValueError(
+                 f"`image_resample_strategy` must be one of ['linear', 'nearest'], got {self.image_resample_strategy}."
+             )
+         if self.vector_resample_strategy not in ["linear", "nearest"]:
+             raise ValueError(
+                 f"`vector_resample_strategy` must be one of ['linear', 'nearest'], got {self.vector_resample_strategy}."
+             )
+
+
+ @dataclass
+ class WandBConfig:
+     """Configuration for Weights & Biases (wandb) logging.
+
+     Args:
+         enable: Enable Weights & Biases logging. Defaults to False.
+         entity: The entity name in Weights & Biases, e.g. your username or your
+             team name. Defaults to None.
+         project: The project name in Weights & Biases, e.g. "pi0". Defaults to "opentau".
+         run_id: If provided, the run will be forked from this run ID. Defaults to None.
+         name: Name of the run, shown in the UI. Defaults to None.
+         notes: Description of the run, shown in the UI. If None and `enable` is True,
+             will prompt the user for input. Defaults to None.
+         tags: Tags to be added to the run in the UI, e.g. ["robot", "v1.0"].
+             Defaults to empty list.
+         group: Used to group runs in the UI, e.g. "experiment_1", "experiment_2".
+             Defaults to None.
+         job_type: Used to group runs in the UI, e.g. "train", "eval", "test".
+             Defaults to None.
+         mode: Allowed values: 'online', 'offline', 'disabled'. Defaults to None
+             (which uses 'online').
+         allow_resume: If True, resume the run from the last checkpoint when
+             `run_id` is provided. Defaults to True.
+         disable_artifact: Set to True to disable saving an artifact despite
+             `training.save_checkpoint=True`. Defaults to False.
+     """
+
+     enable: bool = False  # Enable Weights & Biases logging.
+     entity: str | None = None  # The entity name in Weights & Biases, e.g. your username or your team name
+     project: str = "opentau"  # The project name in Weights & Biases, e.g. "pi0"
+     run_id: str | None = None  # If provided, the run will be forked from this run ID.
+     name: str | None = None  # Name of the run, shown in the UI
+     notes: str | None = None  # Description of the run, shown in the UI
+     tags: list[str] = field(
+         default_factory=list
+     )  # Tags to be added to the run in the UI, e.g. ["robot", "v1.0"]
+     group: str | None = None  # Used to group runs in the UI, e.g. "experiment_1", "experiment_2"
+     job_type: str | None = None  # Used to group runs in the UI, e.g. "train", "eval", "test"
+     mode: str | None = None  # Allowed values: 'online', 'offline', 'disabled'. Defaults to 'online'
+     allow_resume: bool | None = True  # If True, resume the run from the last checkpoint.
+     # Set to True to disable saving an artifact despite training.save_checkpoint=True
+     disable_artifact: bool = False
+
+     def __post_init__(self):
+         """Prompt user for wandb notes if enabled and notes are not provided."""
+         if not self.enable or self.notes is not None:
+             return
+
+         confirm = False
+         while not confirm:
+             self.notes = input("Please enter a description for wandb logging:\n")
+             confirm = input("Confirm (y/N): ").strip().lower() == "y"
+
+     def to_wandb_kwargs(self, step=None):
+         """Convert configuration to keyword arguments for wandb.init().
+
+         Args:
+             step: Optional training step number. If provided along with `run_id`,
+                 used for resuming or forking runs. Defaults to None.
+
+         Returns:
+             Dictionary of keyword arguments suitable for passing to wandb.init().
+         """
+         kwargs = encode_dataclass(self)
+         excluded_keys = ["enable", "disable_artifact", "project"]
+         for ek in excluded_keys:
+             kwargs.pop(ek)
+
+         allow_resume = kwargs.pop("allow_resume")
+         run_id = kwargs.pop("run_id", None)
+
+         # If both `run_id` and `step` are provided, we handle the resuming or forking logic.
+         if run_id is not None and step is not None:
+             if allow_resume:
+                 # if `allow_resume`, we resume from the `run_id` if provided.
+                 kwargs["id"] = run_id
+                 kwargs["resume"] = "allow"
+             else:
+                 # Without `allow_resume`, we create a new run,
+                 # and add information about the forked run in the notes.
+                 # TODO request `kwargs[fork_from]=f"{run_id}?_step={step}"` feature from wandb
+                 kwargs["notes"] += f"\nForked from run {run_id} at step {step}."
+
+         return kwargs
+
+
+ @dataclass
+ class EvalConfig:
+     """Configuration for evaluation settings.
+
+     Args:
+         n_episodes: Number of episodes to run during evaluation. Defaults to 16.
+         batch_size: Number of environments to use in a gym.vector.VectorEnv.
+             Only used for environments that are not already vectorized.
+             Defaults to 16.
+         use_async_envs: Whether to use asynchronous environments (multiprocessing).
+             Defaults to True.
+         max_episodes_rendered: Maximum number of episodes to render as videos.
+             Defaults to 16.
+         grid_size: Grid dimensions for video summary (rows, cols). If None, will
+             be auto-calculated as a square grid. Defaults to None.
+         recording_root: Root directory for saving evaluation recordings.
+             Defaults to None.
+
+     Raises:
+         ValueError: If `batch_size` is greater than `n_episodes`.
+     """
+
+     n_episodes: int = 16
+     # `batch_size` specifies the number of environments to use in a gym.vector.VectorEnv. (Only used for environments that are not already vectorized.)
+     batch_size: int = 16
+     # `use_async_envs` specifies whether to use asynchronous environments (multiprocessing).
+     use_async_envs: bool = True
+     max_episodes_rendered: int = 16
+     # Grid dimensions for video summary (rows, cols). If None, will be auto-calculated as square grid.
+     grid_size: tuple[int, int] | None = None
+
+     recording_root: str | None = None
+
+     def __post_init__(self):
+         """Validate evaluation configuration."""
+         if self.batch_size > self.n_episodes:
+             raise ValueError(
+                 "The eval batch size is greater than the number of eval episodes "
+                 f"({self.batch_size} > {self.n_episodes}). As a result, {self.batch_size} "
+                 f"eval environments will be instantiated, but only {self.n_episodes} will be used. "
+                 "This might significantly slow down evaluation. To fix this, you should update your command "
+                 f"to increase the number of episodes to match the batch size (e.g. `eval.n_episodes={self.batch_size}`), "
+                 f"or lower the batch size (e.g. `eval.batch_size={self.n_episodes}`)."
+             )
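
As a rough usage sketch, the config classes above could be composed as follows. The repo ID, grounding key, and weights are illustrative values chosen for this example, not defaults shipped with the package, and the imports assume the package's optional dependencies are installed:

```python
from opentau.configs.default import DatasetConfig, DatasetMixtureConfig, EvalConfig, WandBConfig

# Illustrative mixture: one Hub dataset plus one grounding dataset (names are examples only).
mixture = DatasetMixtureConfig(
    datasets=[
        DatasetConfig(repo_id="lerobot/aloha_static_coffee"),
        DatasetConfig(grounding="cocoqa"),
    ],
    weights=[0.8, 0.2],                 # must have the same length as `datasets`
    action_freq=30.0,                   # Hz, must be positive
    image_resample_strategy="nearest",
    vector_resample_strategy="linear",
)

# batch_size may not exceed n_episodes, otherwise __post_init__ raises ValueError.
eval_cfg = EvalConfig(n_episodes=32, batch_size=16)

# wandb stays disabled here, so __post_init__ does not prompt for run notes.
wandb_cfg = WandBConfig(enable=False)
```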
opentau/configs/libero.py ADDED
@@ -0,0 +1,113 @@
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ """LIBERO environment configuration module.
+
+ This module provides configuration classes for LIBERO benchmark evaluation,
+ which is a benchmark suite for learning manipulation tasks. It extends the
+ base training pipeline configuration with LIBERO-specific evaluation parameters.
+ """
+
+ import os
+ from dataclasses import dataclass
+
+ from libero.libero import benchmark, get_libero_path
+
+ from opentau.configs.train import TrainPipelineConfig
+ from opentau.utils.monkey_patch import torch_load_patch
+
+ LIBERO_BENCHMARK_DICT = benchmark.get_benchmark_dict()
+
+
+ @dataclass
+ class LiberoEnvConfig:
+     """Configuration for LIBERO environment evaluation.
+
+     LIBERO is a benchmark suite for learning manipulation tasks. This configuration
+     specifies which task suite and task to run, along with evaluation parameters.
+
+     Args:
+         suite: Task suite to run. Must be 'spatial', 'object', 'goal', or '100'.
+         id: Index of the task in the suite to run.
+         max_steps: Maximum number of steps to run for each task. Defaults to 1000.
+         chunk_usage: Number of actions to perform in each chunk before getting a
+             new observation. If None, will be set from the training config's
+             `action_chunk`. Defaults to None.
+         n_simulations: Number of simulations to run for each task. Defaults to 100.
+         video_dir: Directory to save videos of the task execution. Defaults to None.
+
+     Raises:
+         ValueError: If the suite name is invalid or if the task id is out of range
+             for the specified suite.
+     """
+
+     suite: str  # Task suite to run. Must be 'spatial', 'object', 'goal', or '100'.
+     id: int  # index of the task in the suite to run.
+     max_steps: int = 1000  # maximum number of steps to run for each task.
+     chunk_usage: int | None = (
+         None  # number of actions to perform in each chunk before getting a new observation.
+     )
+     n_simulations: int = 100  # number of simulations to run for each task.
+     video_dir: str | None = None  # directory to save videos of the task execution.
+
+     def __post_init__(self):
+         """Validate LIBERO configuration and initialize task-specific attributes."""
+         torch_load_patch()
+         suite = f"libero_{self.suite}".lower()
+         if suite not in LIBERO_BENCHMARK_DICT:
+             raise ValueError(
+                 f"Invalid suite: '{self.suite}'. "
+                 f"Available suites are: {[k.replace('libero_', '') for k in LIBERO_BENCHMARK_DICT]}"
+             )
+         suite = LIBERO_BENCHMARK_DICT[suite]()
+         try:
+             task = suite.get_task(self.id)
+         except IndexError as e:
+             raise ValueError(
+                 f"Invalid task id: {self.id} for suite: {self.suite}. "
+                 f"Available ids must be from 0 to {len(suite.tasks) - 1}."
+             ) from e
+
+         self.bddl_file = os.path.join(get_libero_path("bddl_files"), task.problem_folder, task.bddl_file)
+         self.init_states = suite.get_task_init_states(self.id)
+         self.task = task
+
+
+ @dataclass
+ class TrainConfigWithLiberoEval(TrainPipelineConfig):
+     """Training configuration extended with LIBERO evaluation settings.
+
+     This configuration extends the base training pipeline configuration with
+     LIBERO-specific evaluation parameters.
+
+     Args:
+         libero: Configuration for LIBERO environment evaluation. Must be provided.
+             Defaults to None.
+
+     Raises:
+         ValueError: If `libero` is None or if `chunk_usage` is not within valid
+             range (1 to action_chunk).
+     """
+
+     libero: LiberoEnvConfig | None = None
+
+     def __post_init__(self):
+         """Validate LIBERO configuration and set default chunk_usage if needed."""
+         super().__post_init__()
+         if self.libero is None:
+             raise ValueError("Libero config must be provided.")
+         if self.libero.chunk_usage is None:
+             self.libero.chunk_usage = self.action_chunk
+         assert 1 <= self.libero.chunk_usage <= self.action_chunk, (
+             f"Chunk usage must be between 1 and {self.action_chunk=}, got {self.libero.chunk_usage=}."
+         )
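
For reference, a minimal sketch of instantiating `LiberoEnvConfig` on its own. It assumes the `libero` package and its benchmark assets are installed locally; the suite name, task id, and output path are illustrative values only:

```python
from opentau.configs.libero import LiberoEnvConfig

# Illustrative values; __post_init__ validates the suite name and task id
# against the installed LIBERO benchmark and resolves the task metadata.
cfg = LiberoEnvConfig(
    suite="spatial",                    # one of 'spatial', 'object', 'goal', '100'
    id=0,                               # task index within the suite
    max_steps=500,
    n_simulations=10,
    video_dir="outputs/libero_videos",  # hypothetical output path
)

print(cfg.bddl_file)     # path to the task's BDDL file, resolved from the LIBERO install
print(cfg.task)          # task metadata object returned by the benchmark suite
```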