opentau 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108) hide show
  1. opentau/__init__.py +179 -0
  2. opentau/__version__.py +24 -0
  3. opentau/configs/__init__.py +19 -0
  4. opentau/configs/default.py +297 -0
  5. opentau/configs/libero.py +113 -0
  6. opentau/configs/parser.py +393 -0
  7. opentau/configs/policies.py +297 -0
  8. opentau/configs/reward.py +42 -0
  9. opentau/configs/train.py +370 -0
  10. opentau/configs/types.py +76 -0
  11. opentau/constants.py +52 -0
  12. opentau/datasets/__init__.py +84 -0
  13. opentau/datasets/backward_compatibility.py +78 -0
  14. opentau/datasets/compute_stats.py +333 -0
  15. opentau/datasets/dataset_mixture.py +460 -0
  16. opentau/datasets/factory.py +232 -0
  17. opentau/datasets/grounding/__init__.py +67 -0
  18. opentau/datasets/grounding/base.py +154 -0
  19. opentau/datasets/grounding/clevr.py +110 -0
  20. opentau/datasets/grounding/cocoqa.py +130 -0
  21. opentau/datasets/grounding/dummy.py +101 -0
  22. opentau/datasets/grounding/pixmo.py +177 -0
  23. opentau/datasets/grounding/vsr.py +141 -0
  24. opentau/datasets/image_writer.py +304 -0
  25. opentau/datasets/lerobot_dataset.py +1910 -0
  26. opentau/datasets/online_buffer.py +442 -0
  27. opentau/datasets/push_dataset_to_hub/utils.py +132 -0
  28. opentau/datasets/sampler.py +99 -0
  29. opentau/datasets/standard_data_format_mapping.py +278 -0
  30. opentau/datasets/transforms.py +330 -0
  31. opentau/datasets/utils.py +1243 -0
  32. opentau/datasets/v2/batch_convert_dataset_v1_to_v2.py +887 -0
  33. opentau/datasets/v2/convert_dataset_v1_to_v2.py +829 -0
  34. opentau/datasets/v21/_remove_language_instruction.py +109 -0
  35. opentau/datasets/v21/batch_convert_dataset_v20_to_v21.py +60 -0
  36. opentau/datasets/v21/convert_dataset_v20_to_v21.py +183 -0
  37. opentau/datasets/v21/convert_stats.py +150 -0
  38. opentau/datasets/video_utils.py +597 -0
  39. opentau/envs/__init__.py +18 -0
  40. opentau/envs/configs.py +178 -0
  41. opentau/envs/factory.py +99 -0
  42. opentau/envs/libero.py +439 -0
  43. opentau/envs/utils.py +204 -0
  44. opentau/optim/__init__.py +16 -0
  45. opentau/optim/factory.py +43 -0
  46. opentau/optim/optimizers.py +121 -0
  47. opentau/optim/schedulers.py +140 -0
  48. opentau/planner/__init__.py +82 -0
  49. opentau/planner/high_level_planner.py +366 -0
  50. opentau/planner/utils/memory.py +64 -0
  51. opentau/planner/utils/utils.py +65 -0
  52. opentau/policies/__init__.py +24 -0
  53. opentau/policies/factory.py +172 -0
  54. opentau/policies/normalize.py +315 -0
  55. opentau/policies/pi0/__init__.py +19 -0
  56. opentau/policies/pi0/configuration_pi0.py +250 -0
  57. opentau/policies/pi0/modeling_pi0.py +994 -0
  58. opentau/policies/pi0/paligemma_with_expert.py +516 -0
  59. opentau/policies/pi05/__init__.py +20 -0
  60. opentau/policies/pi05/configuration_pi05.py +231 -0
  61. opentau/policies/pi05/modeling_pi05.py +1257 -0
  62. opentau/policies/pi05/paligemma_with_expert.py +572 -0
  63. opentau/policies/pretrained.py +315 -0
  64. opentau/policies/utils.py +123 -0
  65. opentau/policies/value/__init__.py +18 -0
  66. opentau/policies/value/configuration_value.py +170 -0
  67. opentau/policies/value/modeling_value.py +512 -0
  68. opentau/policies/value/reward.py +87 -0
  69. opentau/policies/value/siglip_gemma.py +221 -0
  70. opentau/scripts/actions_mse_loss.py +89 -0
  71. opentau/scripts/bin_to_safetensors.py +116 -0
  72. opentau/scripts/compute_max_token_length.py +111 -0
  73. opentau/scripts/display_sys_info.py +90 -0
  74. opentau/scripts/download_libero_benchmarks.py +54 -0
  75. opentau/scripts/eval.py +877 -0
  76. opentau/scripts/export_to_onnx.py +180 -0
  77. opentau/scripts/fake_tensor_training.py +87 -0
  78. opentau/scripts/get_advantage_and_percentiles.py +220 -0
  79. opentau/scripts/high_level_planner_inference.py +114 -0
  80. opentau/scripts/inference.py +70 -0
  81. opentau/scripts/launch_train.py +63 -0
  82. opentau/scripts/libero_simulation_parallel.py +356 -0
  83. opentau/scripts/libero_simulation_sequential.py +122 -0
  84. opentau/scripts/nav_high_level_planner_inference.py +61 -0
  85. opentau/scripts/train.py +379 -0
  86. opentau/scripts/visualize_dataset.py +294 -0
  87. opentau/scripts/visualize_dataset_html.py +507 -0
  88. opentau/scripts/zero_to_fp32.py +760 -0
  89. opentau/utils/__init__.py +20 -0
  90. opentau/utils/accelerate_utils.py +79 -0
  91. opentau/utils/benchmark.py +98 -0
  92. opentau/utils/fake_tensor.py +81 -0
  93. opentau/utils/hub.py +209 -0
  94. opentau/utils/import_utils.py +79 -0
  95. opentau/utils/io_utils.py +137 -0
  96. opentau/utils/libero.py +214 -0
  97. opentau/utils/libero_dataset_recorder.py +460 -0
  98. opentau/utils/logging_utils.py +180 -0
  99. opentau/utils/monkey_patch.py +278 -0
  100. opentau/utils/random_utils.py +244 -0
  101. opentau/utils/train_utils.py +198 -0
  102. opentau/utils/utils.py +471 -0
  103. opentau-0.1.0.dist-info/METADATA +161 -0
  104. opentau-0.1.0.dist-info/RECORD +108 -0
  105. opentau-0.1.0.dist-info/WHEEL +5 -0
  106. opentau-0.1.0.dist-info/entry_points.txt +2 -0
  107. opentau-0.1.0.dist-info/licenses/LICENSE +508 -0
  108. opentau-0.1.0.dist-info/top_level.txt +1 -0
@@ -0,0 +1,231 @@
1
+ # Copyright 2024 The HuggingFace Inc. team. All rights reserved.
2
+ # Copyright 2026 Tensor Auto Inc. All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Configuration module for the PI05 Policy.
17
+
18
+ This module defines the `PI05Config` class, which handles the configuration parameters
19
+ for the PI05 Vision-Language-Action Flow Model. It includes settings for the model architecture,
20
+ optimization, scheduling, and data processing.
21
+ """
22
+
23
+ import logging
24
+ from dataclasses import dataclass, field
25
+ from typing import Literal
26
+
27
+ from opentau.configs.policies import PreTrainedConfig
28
+ from opentau.configs.types import FeatureType, NormalizationMode, PolicyFeature
29
+ from opentau.optim.optimizers import AdamWConfig
30
+ from opentau.optim.schedulers import (
31
+ CosineDecayWithWarmupSchedulerConfig,
32
+ LRSchedulerConfig,
33
+ )
34
+
35
+
36
@PreTrainedConfig.register_subclass("pi05")
@dataclass
class PI05Config(PreTrainedConfig):
    """Configuration class for the PI05 Policy.

    This class defines the configuration parameters for the PI05 model, including
    input/output structure, model architecture, training settings, and preprocessing.

    Args:
        n_obs_steps: Number of observation steps to use. Defaults to 1.
        chunk_size: Size of the action chunk. The upper bound for n_action_steps. Defaults to 50.
        n_action_steps: Number of action steps to predict. Defaults to 50.
        normalization_mapping: Mapping of feature names to normalization modes.
            Defaults to identity for visual features and mean-std for state and action.
        max_state_dim: Maximum dimension for state vectors. Shorter vectors are padded. Defaults to 32.
        max_action_dim: Maximum dimension for action vectors. Shorter vectors are padded. Defaults to 32.
        resize_imgs_with_padding: Target size (height, width) for image resizing with padding.
            Defaults to (224, 224).
        empty_cameras: Number of empty camera inputs to add. Used for specific adaptations like
            Aloha simulation. Defaults to 0.
        tokenizer_max_length: Maximum length for tokenizer. Defaults to 256.
        discrete_action_max_length: Maximum length for discrete action tokens. Defaults to 32.
        proj_width: Width of the projection layer. Defaults to 1024.
        dropout: Dropout rate. Defaults to 0.1.
        num_steps: Number of flow matching steps for decoding. Defaults to 10.
        init_strategy: Initialization strategy. One of "no_init", "full_he_init", "expert_only_he_init".
            Defaults to "full_he_init".
        use_cache: Whether to use KV cache during inference. Defaults to True.
        attention_implementation: Attention implementation to use ("eager" or "fa2"). Defaults to "eager".
        freeze_vision_encoder: Whether to freeze the vision encoder during fine-tuning. Defaults to True.
        train_expert_only: Whether to train only the expert module. Defaults to False.
        optimizer_lr: Learning rate for the optimizer. Defaults to 2.5e-5.
        optimizer_betas: Beta parameters for AdamW optimizer. Defaults to (0.9, 0.95).
        optimizer_eps: Epsilon parameter for AdamW optimizer. Defaults to 1e-8.
        optimizer_weight_decay: Weight decay for AdamW optimizer. Defaults to 1e-10.
        scheduler_warmup_steps: Number of warmup steps for the scheduler. Defaults to 1_000.
        scheduler_decay_steps: Number of decay steps for the scheduler. Defaults to 30_000.
        scheduler_decay_lr: Target learning rate after decay. Defaults to 2.5e-6.
    """

    # Input / output structure.
    n_obs_steps: int = 1
    chunk_size: int = 50
    n_action_steps: int = 50

    normalization_mapping: dict[str, NormalizationMode] = field(
        default_factory=lambda: {
            "VISUAL": NormalizationMode.IDENTITY,
            "STATE": NormalizationMode.MEAN_STD,
            "ACTION": NormalizationMode.MEAN_STD,
        }
    )

    # Shorter state and action vectors will be padded
    max_state_dim: int = 32
    max_action_dim: int = 32

    # Image preprocessing
    resize_imgs_with_padding: tuple[int, int] = (224, 224)

    # Add empty images. Used by pi05_aloha_sim which adds the empty
    # left and right wrist cameras in addition to the top camera.
    empty_cameras: int = 0

    # Tokenizer
    tokenizer_max_length: int = 256

    # Maximum length of the action tokens
    discrete_action_max_length: int = 32

    # Projector
    proj_width: int = 1024

    # Dropout
    dropout: float = 0.1

    # Decoding
    num_steps: int = 10

    # Initialization strategy
    init_strategy: Literal["no_init", "full_he_init", "expert_only_he_init"] = "full_he_init"

    # Attention utils
    use_cache: bool = True
    attention_implementation: str = "eager"  # or fa2

    # Finetuning settings
    freeze_vision_encoder: bool = True
    train_expert_only: bool = False

    # Training presets
    optimizer_lr: float = 2.5e-5
    optimizer_betas: tuple[float, float] = (0.9, 0.95)
    optimizer_eps: float = 1e-8
    optimizer_weight_decay: float = 1e-10

    scheduler_warmup_steps: int = 1_000
    scheduler_decay_steps: int = 30_000
    scheduler_decay_lr: float = 2.5e-6

    def __post_init__(self):
        """Validate the configuration after dataclass initialization.

        Raises:
            ValueError: If `n_action_steps` exceeds `chunk_size`, if `n_obs_steps`
                is not 1, if `init_strategy` is not one of the supported values, or
                if the pretrained PI05 checkpoint is combined with the
                'expert_only_he_init' strategy.
        """
        super().__post_init__()

        # TODO(Steven): Validate device and amp? in all policy configs?
        # Input validation (not exhaustive).
        if self.n_action_steps > self.chunk_size:
            raise ValueError(
                f"The chunk size is the upper bound for the number of action steps per model invocation. Got "
                f"{self.n_action_steps} for `n_action_steps` and {self.chunk_size} for `chunk_size`."
            )
        if self.n_obs_steps != 1:
            # Fixed message typo: previously printed `nobs_steps=...`.
            raise ValueError(
                f"Multiple observation steps not handled yet. Got `n_obs_steps={self.n_obs_steps}`"
            )

        # Explicit raise instead of `assert` so this validation survives `python -O`,
        # and to match the ValueError style of the other checks in this method.
        valid_init_strategies = ("no_init", "full_he_init", "expert_only_he_init")
        if self.init_strategy not in valid_init_strategies:
            raise ValueError(
                f"Invalid init strategy: {self.init_strategy} must be one of {list(valid_init_strategies)}"
            )

        if self.init_strategy == "expert_only_he_init" and self.pretrained_path == "lerobot/pi05":
            # Message fixed to reference PI05: the guarded checkpoint path is 'lerobot/pi05'.
            raise ValueError(
                "You cannot load the pretrained PI05 model when init_strategy is 'expert_only_he_init' due to differences in PaliGemma tokenizer vocab sizes."
            )

        if self.pretrained_path is not None and self.pretrained_path != "lerobot/pi05":
            logging.info("Setting init_strategy to 'no_init' because we are resuming from a checkpoint.")
            self.init_strategy = "no_init"

    def validate_features(self) -> None:
        """Adds empty camera inputs to the input features if configured.

        Dynamically adds `empty_cameras` placeholder visual features (3x480x640)
        to `self.input_features`, keyed `observation.images.empty_camera_{i}`.
        Used e.g. by the Aloha simulation adaptation.
        """
        for i in range(self.empty_cameras):
            key = f"observation.images.empty_camera_{i}"
            self.input_features[key] = PolicyFeature(
                type=FeatureType.VISUAL,
                shape=(3, 480, 640),
            )

    def get_optimizer_preset(self) -> AdamWConfig:
        """Returns the default optimizer configuration.

        Returns:
            AdamWConfig: The optimizer configuration built from the
            `optimizer_*` fields of this config.
        """
        return AdamWConfig(
            lr=self.optimizer_lr,
            betas=self.optimizer_betas,
            eps=self.optimizer_eps,
            weight_decay=self.optimizer_weight_decay,
        )

    def get_scheduler_preset(self) -> LRSchedulerConfig:
        """Returns the default scheduler configuration.

        Returns:
            CosineDecayWithWarmupSchedulerConfig: The scheduler configuration
            built from the `scheduler_*` fields, warming up to `optimizer_lr`
            and decaying to `scheduler_decay_lr`.
        """
        return CosineDecayWithWarmupSchedulerConfig(
            peak_lr=self.optimizer_lr,
            decay_lr=self.scheduler_decay_lr,
            num_warmup_steps=self.scheduler_warmup_steps,
            num_decay_steps=self.scheduler_decay_steps,
        )

    @property
    def observation_delta_indices(self) -> None:
        """Indices for observation deltas.

        Returns:
            None: As observation deltas are not used.
        """
        return None

    @property
    def action_delta_indices(self) -> list[int]:
        """Indices for action deltas.

        Returns:
            list[int]: A list of indices corresponding to the chunk size.
        """
        return list(range(self.chunk_size))

    @property
    def reward_delta_indices(self) -> None:
        """Indices for reward deltas.

        Returns:
            None: As reward deltas are not used.
        """
        return None