opentau 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108) hide show
  1. opentau/__init__.py +179 -0
  2. opentau/__version__.py +24 -0
  3. opentau/configs/__init__.py +19 -0
  4. opentau/configs/default.py +297 -0
  5. opentau/configs/libero.py +113 -0
  6. opentau/configs/parser.py +393 -0
  7. opentau/configs/policies.py +297 -0
  8. opentau/configs/reward.py +42 -0
  9. opentau/configs/train.py +370 -0
  10. opentau/configs/types.py +76 -0
  11. opentau/constants.py +52 -0
  12. opentau/datasets/__init__.py +84 -0
  13. opentau/datasets/backward_compatibility.py +78 -0
  14. opentau/datasets/compute_stats.py +333 -0
  15. opentau/datasets/dataset_mixture.py +460 -0
  16. opentau/datasets/factory.py +232 -0
  17. opentau/datasets/grounding/__init__.py +67 -0
  18. opentau/datasets/grounding/base.py +154 -0
  19. opentau/datasets/grounding/clevr.py +110 -0
  20. opentau/datasets/grounding/cocoqa.py +130 -0
  21. opentau/datasets/grounding/dummy.py +101 -0
  22. opentau/datasets/grounding/pixmo.py +177 -0
  23. opentau/datasets/grounding/vsr.py +141 -0
  24. opentau/datasets/image_writer.py +304 -0
  25. opentau/datasets/lerobot_dataset.py +1910 -0
  26. opentau/datasets/online_buffer.py +442 -0
  27. opentau/datasets/push_dataset_to_hub/utils.py +132 -0
  28. opentau/datasets/sampler.py +99 -0
  29. opentau/datasets/standard_data_format_mapping.py +278 -0
  30. opentau/datasets/transforms.py +330 -0
  31. opentau/datasets/utils.py +1243 -0
  32. opentau/datasets/v2/batch_convert_dataset_v1_to_v2.py +887 -0
  33. opentau/datasets/v2/convert_dataset_v1_to_v2.py +829 -0
  34. opentau/datasets/v21/_remove_language_instruction.py +109 -0
  35. opentau/datasets/v21/batch_convert_dataset_v20_to_v21.py +60 -0
  36. opentau/datasets/v21/convert_dataset_v20_to_v21.py +183 -0
  37. opentau/datasets/v21/convert_stats.py +150 -0
  38. opentau/datasets/video_utils.py +597 -0
  39. opentau/envs/__init__.py +18 -0
  40. opentau/envs/configs.py +178 -0
  41. opentau/envs/factory.py +99 -0
  42. opentau/envs/libero.py +439 -0
  43. opentau/envs/utils.py +204 -0
  44. opentau/optim/__init__.py +16 -0
  45. opentau/optim/factory.py +43 -0
  46. opentau/optim/optimizers.py +121 -0
  47. opentau/optim/schedulers.py +140 -0
  48. opentau/planner/__init__.py +82 -0
  49. opentau/planner/high_level_planner.py +366 -0
  50. opentau/planner/utils/memory.py +64 -0
  51. opentau/planner/utils/utils.py +65 -0
  52. opentau/policies/__init__.py +24 -0
  53. opentau/policies/factory.py +172 -0
  54. opentau/policies/normalize.py +315 -0
  55. opentau/policies/pi0/__init__.py +19 -0
  56. opentau/policies/pi0/configuration_pi0.py +250 -0
  57. opentau/policies/pi0/modeling_pi0.py +994 -0
  58. opentau/policies/pi0/paligemma_with_expert.py +516 -0
  59. opentau/policies/pi05/__init__.py +20 -0
  60. opentau/policies/pi05/configuration_pi05.py +231 -0
  61. opentau/policies/pi05/modeling_pi05.py +1257 -0
  62. opentau/policies/pi05/paligemma_with_expert.py +572 -0
  63. opentau/policies/pretrained.py +315 -0
  64. opentau/policies/utils.py +123 -0
  65. opentau/policies/value/__init__.py +18 -0
  66. opentau/policies/value/configuration_value.py +170 -0
  67. opentau/policies/value/modeling_value.py +512 -0
  68. opentau/policies/value/reward.py +87 -0
  69. opentau/policies/value/siglip_gemma.py +221 -0
  70. opentau/scripts/actions_mse_loss.py +89 -0
  71. opentau/scripts/bin_to_safetensors.py +116 -0
  72. opentau/scripts/compute_max_token_length.py +111 -0
  73. opentau/scripts/display_sys_info.py +90 -0
  74. opentau/scripts/download_libero_benchmarks.py +54 -0
  75. opentau/scripts/eval.py +877 -0
  76. opentau/scripts/export_to_onnx.py +180 -0
  77. opentau/scripts/fake_tensor_training.py +87 -0
  78. opentau/scripts/get_advantage_and_percentiles.py +220 -0
  79. opentau/scripts/high_level_planner_inference.py +114 -0
  80. opentau/scripts/inference.py +70 -0
  81. opentau/scripts/launch_train.py +63 -0
  82. opentau/scripts/libero_simulation_parallel.py +356 -0
  83. opentau/scripts/libero_simulation_sequential.py +122 -0
  84. opentau/scripts/nav_high_level_planner_inference.py +61 -0
  85. opentau/scripts/train.py +379 -0
  86. opentau/scripts/visualize_dataset.py +294 -0
  87. opentau/scripts/visualize_dataset_html.py +507 -0
  88. opentau/scripts/zero_to_fp32.py +760 -0
  89. opentau/utils/__init__.py +20 -0
  90. opentau/utils/accelerate_utils.py +79 -0
  91. opentau/utils/benchmark.py +98 -0
  92. opentau/utils/fake_tensor.py +81 -0
  93. opentau/utils/hub.py +209 -0
  94. opentau/utils/import_utils.py +79 -0
  95. opentau/utils/io_utils.py +137 -0
  96. opentau/utils/libero.py +214 -0
  97. opentau/utils/libero_dataset_recorder.py +460 -0
  98. opentau/utils/logging_utils.py +180 -0
  99. opentau/utils/monkey_patch.py +278 -0
  100. opentau/utils/random_utils.py +244 -0
  101. opentau/utils/train_utils.py +198 -0
  102. opentau/utils/utils.py +471 -0
  103. opentau-0.1.0.dist-info/METADATA +161 -0
  104. opentau-0.1.0.dist-info/RECORD +108 -0
  105. opentau-0.1.0.dist-info/WHEEL +5 -0
  106. opentau-0.1.0.dist-info/entry_points.txt +2 -0
  107. opentau-0.1.0.dist-info/licenses/LICENSE +508 -0
  108. opentau-0.1.0.dist-info/top_level.txt +1 -0
@@ -0,0 +1,137 @@
1
+ #!/usr/bin/env python
2
+
3
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
4
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
5
+ #
6
+ # Licensed under the Apache License, Version 2.0 (the "License");
7
+ # you may not use this file except in compliance with the License.
8
+ # You may obtain a copy of the License at
9
+ #
10
+ # http://www.apache.org/licenses/LICENSE-2.0
11
+ #
12
+ # Unless required by applicable law or agreed to in writing, software
13
+ # distributed under the License is distributed on an "AS IS" BASIS,
14
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ # See the License for the specific language governing permissions and
16
+ # limitations under the License.
17
+ """Utilities for file I/O operations.
18
+
19
+ This module provides functions for reading and writing JSON files, saving videos,
20
+ and deserializing JSON data into structured objects with type checking.
21
+ """
22
+
23
+ import json
24
+ import warnings
25
+ from pathlib import Path
26
+ from typing import TypeVar
27
+
28
+ import imageio
29
+
30
+ JsonLike = str | int | float | bool | None | list["JsonLike"] | dict[str, "JsonLike"] | tuple["JsonLike", ...]  # recursive alias: any JSON-serializable value
31
+ T = TypeVar("T", bound=JsonLike)  # template type used by deserialize_json_into_object
32
+
33
+
34
def write_video(video_path: str | Path, stacked_frames: list, fps: float) -> None:
    """Encode a sequence of frames into a video file on disk.

    Args:
        video_path: Destination path of the video file.
        stacked_frames: Ordered image frames to encode.
        fps: Playback frame rate of the resulting video.
    """
    with warnings.catch_warnings():
        # imageio's plugin machinery can import pkg_resources, which emits a
        # DeprecationWarning; silence only that specific message while encoding.
        warnings.filterwarnings(
            "ignore",
            "pkg_resources is deprecated as an API",
            category=DeprecationWarning,
        )
        imageio.mimsave(video_path, stacked_frames, fps=fps)
48
+
49
+
50
+ def deserialize_json_into_object(fpath: Path, obj: T) -> T:
51
+ """Load JSON data and recursively fill an object with matching structure.
52
+
53
+ Loads the JSON data from fpath and recursively fills obj with the
54
+ corresponding values (strictly matching structure and types).
55
+ Tuples in obj are expected to be lists in the JSON data, which will be
56
+ converted back into tuples.
57
+
58
+ Args:
59
+ fpath: Path to the JSON file to load.
60
+ obj: Template object with the desired structure and types.
61
+
62
+ Returns:
63
+ Object with the same structure as obj, filled with values from the JSON file.
64
+
65
+ Raises:
66
+ TypeError: If structure or types don't match between JSON and obj.
67
+ ValueError: If dictionary keys or list/tuple lengths don't match.
68
+ """
69
+ with open(fpath, encoding="utf-8") as f:
70
+ data = json.load(f)
71
+
72
+ def _deserialize(target, source):
73
+ """
74
+ Recursively overwrite the structure in `target` with data from `source`,
75
+ performing strict checks on structure and type.
76
+ Returns the updated version of `target` (especially important for tuples).
77
+ """
78
+
79
+ # If the target is a dictionary, source must be a dictionary as well.
80
+ if isinstance(target, dict):
81
+ if not isinstance(source, dict):
82
+ raise TypeError(f"Type mismatch: expected dict, got {type(source)}")
83
+
84
+ # Check that they have exactly the same set of keys.
85
+ if target.keys() != source.keys():
86
+ raise ValueError(
87
+ f"Dictionary keys do not match.\nExpected: {target.keys()}, got: {source.keys()}"
88
+ )
89
+
90
+ # Recursively update each key.
91
+ for k in target:
92
+ target[k] = _deserialize(target[k], source[k])
93
+
94
+ return target
95
+
96
+ # If the target is a list, source must be a list as well.
97
+ elif isinstance(target, list):
98
+ if not isinstance(source, list):
99
+ raise TypeError(f"Type mismatch: expected list, got {type(source)}")
100
+
101
+ # Check length
102
+ if len(target) != len(source):
103
+ raise ValueError(f"List length mismatch: expected {len(target)}, got {len(source)}")
104
+
105
+ # Recursively update each element.
106
+ for i in range(len(target)):
107
+ target[i] = _deserialize(target[i], source[i])
108
+
109
+ return target
110
+
111
+ # If the target is a tuple, the source must be a list in JSON,
112
+ # which we'll convert back to a tuple.
113
+ elif isinstance(target, tuple):
114
+ if not isinstance(source, list):
115
+ raise TypeError(f"Type mismatch: expected list (for tuple), got {type(source)}")
116
+
117
+ if len(target) != len(source):
118
+ raise ValueError(f"Tuple length mismatch: expected {len(target)}, got {len(source)}")
119
+
120
+ # Convert each element, forming a new tuple.
121
+ converted_items = []
122
+ for t_item, s_item in zip(target, source, strict=False):
123
+ converted_items.append(_deserialize(t_item, s_item))
124
+
125
+ # Return a brand new tuple (tuples are immutable in Python).
126
+ return tuple(converted_items)
127
+
128
+ # Otherwise, we're dealing with a "primitive" (int, float, str, bool, None).
129
+ else:
130
+ # Check the exact type. If these must match 1:1, do:
131
+ if type(target) is not type(source):
132
+ raise TypeError(f"Type mismatch: expected {type(target)}, got {type(source)}")
133
+ return source
134
+
135
+ # Perform the in-place/recursive deserialization
136
+ updated_obj = _deserialize(obj, data)
137
+ return updated_obj
@@ -0,0 +1,214 @@
1
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ """Utilities for working with the LIBERO robotics environment.
16
+
17
+ This module provides functions for converting LIBERO observations to PyTorch tensors,
18
+ summarizing LIBERO evaluation results, and recording observations from LIBERO environments.
19
+ """
20
+
21
+ import logging
22
+ from pathlib import Path
23
+
24
+ import imageio
25
+ import numpy as np
26
+ import torch
27
+ from einops import rearrange
28
+ from robosuite.utils.transform_utils import quat2axisangle
29
+
30
+
31
def rotate_numpy_image(image: np.ndarray) -> np.ndarray:
    """Rotate an image by 180 degrees and normalize it.

    Args:
        image: Input image in HWC layout with values in [0, 255].

    Returns:
        The image rotated 180 degrees, scaled to [0, 1] (float64), in CHW layout.
    """
    # Scale pixel values from [0, 255] into [0, 1].
    normalized = image.astype(float) / 255.0
    # Two successive 90-degree rotations == a 180-degree rotation.
    rotated = np.rot90(normalized, 2)
    # HWC -> CHW via plain numpy; equivalent to einops rearrange("H W C -> C H W")
    # but avoids the extra third-party dependency for a one-line transpose.
    return np.transpose(rotated, (2, 0, 1))
43
+
44
+
45
def _libero2np(obs: dict[str, np.ndarray], cfg) -> dict[str, str | np.ndarray]:
    """Build the numpy-format model input from a raw LIBERO observation.

    Args:
        obs: Raw LIBERO observation with robot proprioception and camera images.
        cfg: Config supplying the task language, max_state_dim, num_cams and
            action_chunk (project type — structure assumed from usage here).

    Returns:
        Dict with rotated camera images, zero-padded state vector, language
        prompt, and all-False image/action padding masks.
    """
    # Proprioceptive state: EE position, EE orientation as axis-angle, gripper.
    state_vec = np.hstack(
        (
            obs["robot0_eef_pos"],
            quat2axisangle(obs["robot0_eef_quat"]),
            obs["robot0_gripper_qpos"],
        )
    )
    # Right-pad the state with zeros up to the model's fixed state dimension.
    pad_amount = cfg.max_state_dim - len(state_vec)

    return {
        "camera0": rotate_numpy_image(obs["agentview_image"]),
        "camera1": rotate_numpy_image(obs["robot0_eye_in_hand_image"]),
        "prompt": cfg.libero.task.language,
        "state": np.pad(state_vec, (0, pad_amount)),
        "img_is_pad": np.zeros(cfg.num_cams, dtype=bool),
        "action_is_pad": np.zeros(cfg.action_chunk, dtype=bool),
    }
73
+
74
+
75
+ def _np2torch(
76
+ np_input: dict[str, str | np.ndarray], device: str, dtype: torch.dtype
77
+ ) -> dict[str, str | torch.Tensor]:
78
+ """Convert numpy arrays in dictionary to PyTorch tensors.
79
+
80
+ Args:
81
+ np_input: Dictionary containing numpy arrays and strings.
82
+ device: Target device for tensors (e.g., 'cuda', 'cpu').
83
+ dtype: Target dtype for floating point tensors.
84
+
85
+ Returns:
86
+ Dictionary with numpy arrays converted to PyTorch tensors on the
87
+ specified device. String values are preserved as-is.
88
+
89
+ Raises:
90
+ TypeError: If a value type is not supported (not str or np.ndarray).
91
+ """
92
+ torch_input = {}
93
+ for k, v in np_input.items():
94
+ if isinstance(v, str):
95
+ torch_input[k] = v
96
+ elif isinstance(v, np.ndarray):
97
+ # .copy() ensures the array is contiguous for PyTorch to use it
98
+ tensor = torch.tensor(v.copy())
99
+ if tensor.dtype.is_floating_point:
100
+ tensor = tensor.to(dtype=dtype)
101
+ torch_input[k] = tensor.to(device)
102
+ else:
103
+ raise TypeError(f"Unsupported type {type(v)} for key {k}.")
104
+ return torch_input
105
+
106
+
107
def libero2torch(
    obs: dict[str, np.ndarray], cfg, device: str, dtype: torch.dtype
) -> dict[str, str | torch.Tensor]:
    """Convert a raw LIBERO observation into model-ready torch inputs.

    Thin composition of ``_libero2np`` (numpy preprocessing: images, state,
    prompt, padding masks) followed by ``_np2torch`` (tensor conversion and
    device placement).

    Args:
        obs: Raw LIBERO observation with robot state and camera images.
        cfg: Config providing task language, state dimensions, camera count, etc.
        device: Target device string for the tensors.
        dtype: Floating-point dtype for float tensors.

    Returns:
        Dict of strings and tensors on ``device``, ready for the policy.
    """
    return _np2torch(_libero2np(obs, cfg), device, dtype)
125
+
126
+
127
def summarize_libero_results(results: list[int]) -> dict:
    """Aggregate per-episode LIBERO outcome codes into summary statistics.

    Each entry encodes one episode: a non-negative value is a success (the
    number of steps taken), -1 is a failure, and -2 is a crash. Other negative
    codes, if present, fall into no bucket.

    Args:
        results: Per-episode outcome codes as described above.

    Returns:
        Summary dict with counts, indices, rates, the raw results list, and
        the mean steps of successful episodes (None when there are none), or
        a placeholder message dict when ``results`` is empty.
    """
    if not results:
        return {"message": "No results to summarize."}

    total = len(results)

    # Single pass classifying each episode index into its outcome bucket.
    successes: list[int] = []
    failures: list[int] = []
    crashes: list[int] = []
    for idx, outcome in enumerate(results):
        if outcome >= 0:
            successes.append(idx)
        elif outcome == -1:
            failures.append(idx)
        elif outcome == -2:
            crashes.append(idx)

    mean_steps = float(np.mean([r for r in results if r >= 0])) if successes else None

    return {
        "total_simulations": total,
        "success_indices": successes,
        "failure_indices": failures,
        "crashed_indices": crashes,
        "success_count": len(successes),
        "failure_count": len(failures),
        "crashed_count": len(crashes),
        "success_rate": len(successes) / total,
        "failure_rate": len(failures) / total,
        "crashed_rate": len(crashes) / total,
        "steps_taken": results,
        "avg_steps_taken_until_success": mean_steps,
    }
167
+
168
+
169
+ class LiberoObservationRecorder:
170
+ """Context manager for recording LIBERO observations to video files.
171
+
172
+ This class is not multi-processing safe. Each process should use a different
173
+ (folder, camera_name) pair.
174
+
175
+ Args:
176
+ folder: Directory path where video files will be saved. If None, recording
177
+ is disabled.
178
+ camera_names: List of camera names to record. If None, no cameras are recorded.
179
+ fps: Frames per second for the output videos. Defaults to 10.
180
+ extension: Video file extension. Defaults to "mp4".
181
+ """
182
+
183
+ def __init__(self, folder, camera_names=None, fps=10, extension="mp4"):
184
+ if folder is None:
185
+ logging.debug("No folder specified for video recording. Skipping.")
186
+ self.writers = []
187
+ self.camera_names = []
188
+ return
189
+
190
+ self.camera_names = camera_names or []
191
+ folder = Path(folder)
192
+ Path(folder).mkdir(parents=True, exist_ok=True)
193
+ video_files = [folder / f"{cam}.{extension}" for cam in self.camera_names]
194
+ logging.debug("Creating video files: %s", video_files)
195
+ self.writers = [imageio.get_writer(vf, fps=fps) for vf in video_files]
196
+
197
+ def __enter__(self):
198
+ return self
199
+
200
+ def record(self, obs):
201
+ """Record a single observation frame.
202
+
203
+ Args:
204
+ obs: Observation dictionary containing camera images keyed by camera name.
205
+ """
206
+ for writer, camera in zip(self.writers, self.camera_names, strict=True):
207
+ writer.append_data(np.rot90(obs[camera], k=2))
208
+
209
+ def __exit__(self, exc_type, exc_val, exc_tb):
210
+ logging.debug("Closing video writers.")
211
+ for writer in self.writers:
212
+ writer.close()
213
+ logging.debug("Video writers closed.")
214
+ return False