PyPI - roboreason - Versions diffs - 0.1.0__tar.gz - Mend

roboreason 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (135) hide show

roboreason-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,305 @@
+Metadata-Version: 2.4
+Name: roboreason
+Version: 0.1.0
+Summary: Roboreason package
+Author: Philip
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+Requires-Dist: transformers==4.57.3
+Requires-Dist: vllm==0.12.0
+Requires-Dist: wandb>=0.19.1
+Requires-Dist: pillow
+Requires-Dist: accelerate>=1.2.1
+Requires-Dist: qwen_vl_utils
+Requires-Dist: datasets>=3.2.0
+Requires-Dist: trl
+Requires-Dist: imageio
+Requires-Dist: matplotlib
+Requires-Dist: av>=16.0.0
+Requires-Dist: openai
+Requires-Dist: google-genai
+Provides-Extra: robometer
+Requires-Dist: omegaconf>=2.3.0; extra == "robometer"
+Requires-Dist: hydra-core; extra == "robometer"
+Requires-Dist: tensorboard; extra == "robometer"
+Requires-Dist: peft; extra == "robometer"
+Requires-Dist: codetiming>=1.4.0; extra == "robometer"
+Requires-Dist: unsloth>=2025.10; extra == "robometer"
+Requires-Dist: sentence-transformers>=2.0.0; extra == "robometer"
+Requires-Dist: decord>=0.6.0; extra == "robometer"
+Provides-Extra: lerobot
+Requires-Dist: lerobot; extra == "lerobot"
+Provides-Extra: all
+Requires-Dist: omegaconf>=2.3.0; extra == "all"
+Requires-Dist: hydra-core; extra == "all"
+Requires-Dist: tensorboard; extra == "all"
+Requires-Dist: peft; extra == "all"
+Requires-Dist: codetiming>=1.4.0; extra == "all"
+Requires-Dist: unsloth>=2025.10; extra == "all"
+Requires-Dist: sentence-transformers>=2.0.0; extra == "all"
+Requires-Dist: decord>=0.6.0; extra == "all"
+Requires-Dist: lerobot; extra == "all"
+<div align="center">
+# RoboReason
+**RoboReason** is a python package that makes it easy to apply any ***reward model*** or ***video-language reasoning model*** to your robot videos.
+</div>
+## Supported Models
+- Robometer (https://robometer.github.io)
+- TOPReward (https://topreward.github.io/webpage/)
+- RoboReward (https://arxiv.org/abs/2601.00675)
+- SOLE-R1 (https://philipmit.github.io/sole-r1/)
+- OpenAI models (e.g., `"gpt-5"`)
+- Google models (e.g., `"gemini-3-pro-preview"`)
+## ToDos
+- [ ] Enable fine-tuning of reward models on custom datasets
+## 📦 File Structure
+```
+roboreason/
+├── roboreason/         # Main package
+│   ├── robometer/         # Robometer code
+│   ├── sole.py            # SOLE-R1 code
+│   ├── roboreward.py      # RoboReward code
+│   ├── topreward.py       # TOPReward code
+│   └── api_models.py      # OpenAI and Gemini APIs
+├── test_videos/        # Example videos to test
+├── model_outputs/      # Videos showing model outputs
+└── pyproject.toml      # Dependencies (uv)
+```
+## Install
+### Option 1: quick pip install
+```bash
+pip install -U roboreason
+```
+### Option 2: use [uv](https://github.com/astral-sh/uv) for dependency management
+#### 1. Clone the repository:
+```bash
+git clone https://github.com/philipmit/roboreason
+```
+#### 2. Install `uv`
+```bash
+pip install uv
+```
+#### 3. Sync environment
+```bash
+uv sync
+```
+#### 4. Activate environment
+```bash
+source .venv/bin/activate
+```
+---
+## Download model checkpoints
+```bash
+# SOLE-R1 (8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('sole')"
+# Robometer (4B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('robometer')"
+# TOPReward (based on Qwen3-VL-8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('topreward')"
+# RoboReward (8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('roboreward')"
+```
+---
+## Quick start: Example reward generation and plotting
+```python
+# pip install -U roboreason
+import roboreason as rr
+video_paths = ['../test_videos/robosuite/robosuite_lift_example_00.mp4']
+task_description="Pick up the cube from the table."
+# Robometer
+rewards, success_probs = rr.generate(model="robometer",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external'])
+output_robometer = {"model": "robometer", "rewards": rewards[0]}
+# SOLE-R1
+rewards, reasoning_traces = rr.generate(model="sole-r1",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external and wrist'])
+output_sole = {"model": "sole-r1", "rewards": rewards[0], "reasoning_traces": reasoning_traces[0]}
+rr.video_plot(outputs=[output_sole, output_robometer], plot_save_path='../model_outputs/combined/robosuite_lift_example_00.mp4', video_path = video_paths[0])
+```
+---
+## Examples for generating across all models
+### Robometer
+```python
+import roboreason as rr
+rewards, success_probs = rr.generate(
+    model="robometer",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### SOLE-R1
+```python
+import roboreason as rr
+rewards, reasoning_traces = rr.generate(
+    model="sole-r1",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external and wrist']
+)
+```
+### TOPReward
+```python
+import roboreason as rr
+rewards = rr.generate(
+    model="topreward",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### RoboReward
+```python
+import roboreason as rr
+rewards = rr.generate(
+    model="roboreward",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### GPT-5 (and other OpenAI models)
+```python
+import roboreason as rr
+# requires OpenAI API key: https://developers.openai.com/api/docs/quickstart
+API_KEY = "..."
+rewards, reasoning_traces = rr.generate(
+    model="gpt-5",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external'],
+    key=API_KEY
+)
+```
+### Gemini-3-Pro (and other Google models)
+```python
+import roboreason as rr
+# requires Gemini API key: https://ai.google.dev/gemini-api/docs/api-key
+API_KEY = "..."
+rewards, reasoning_traces = rr.generate(
+    model="gemini-3-pro-preview",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external'],
+    key=API_KEY
+)
+```
+## Video plotting
+```python
+import roboreason as rr
+# Robometer
+rewards, success_probs = rr.generate(model="robometer",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external'])
+output_robometer = {"model": "robometer", "rewards": rewards[0]}
+# SOLE-R1
+rewards, reasoning_traces = rr.generate(model="sole-r1",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external and wrist'])
+output_sole = {"model": "sole-r1", "rewards": rewards[0], "reasoning_traces": reasoning_traces[0]}
+rr.video_plot(
+    outputs=[output_sole, output_robometer],
+    plot_save_path='../model_outputs/combined/robosuite_lift_example_00.mp4',
+    video_path = '../test_videos/robosuite/robosuite_lift_example_00.mp4'
+)
+```
+---
+## rr.generate
+| Argument              | Type        | Required | Description                                                                                                                                    |
+| --------------------- | ----------- | -------- | ---------------------------------------------------------------------------------------------------------------------------------------------- |
+| `model`               | `str`       | ✅        | Name of the model to use. Options include: `"robometer"`, `"sole-r1"`, `"topreward"`, `"roboreward"`, OpenAI models (e.g.`"gpt-5"`), Google models (e.g., `"gemini-3-pro-preview"`) |
+| `task_description`    | `str`       | ✅        | Natural language description of the task the robot is performing.                                                                              |
+| `video_paths`         | `List[str]` | ✅        | List of paths to input video files.                                                                                                            |
+| `view_type_per_video` | `List[str]` | ✅        | List specifying the camera view(s) used for reward reasoning for each video (e.g., `"external"`, `"wrist"`, or `"external and wrist"`).                                  |
+| `key`                 | `str`       | ❌        | API key required for external models (e.g., OpenAI or Gemini). Not needed for local models.                                                    |
+| Model Type             | Return Values               |
+| ---------------------- | --------------------------- |
+| SOLE-R1 / GPT / Gemini | `rewards, reasoning_traces` |
+| Robometer              | `rewards, success_probs`    |
+| TOPReward / RoboReward | `rewards`                   |
+## rr.video_plot
+| Argument                | Type         | Required | Description                                                                               |
+| ----------------------- | ------------ | -------- | ----------------------------------------------------------------------------------------- |
+| `outputs`               | `List[dict]` | ❌*       | List of model outputs (e.g., from `rr.generate`) to visualize together.                   |
+| `plot_save_path`        | `str`        | ❌        | Path where the output video with overlays will be saved.                                  |
+| `video_path`            | `str`        | ❌        | Path to the original video file being visualized.                                         |
+| `view_type`             | `str`        | ❌        | View type used for visualization (e.g., `"external"`, `"wrist"`, `"external and wrist"`). |
+| `show_reasoning_traces` | `bool`       | ❌        | Whether to overlay reasoning traces on the video. Default: `False`.                       |
+| `show_all_frames`       | `bool`       | ❌        | Whether to render all frames instead of sampled frames. Default: `False`.                 |
+| `model`                 | `str`        | ❌**      | Model name (used when calling `video_plot` directly instead of passing `outputs`).        |
+| `task_description`      | `str`        | ❌**      | Task description (used in direct-call mode).                                              |
+| `video_paths`           | `List[str]`  | ❌**      | Input videos (used in direct-call mode).                                                  |
+| `view_type_per_video`   | `List[str]`  | ❌**      | View types per video (used in direct-call mode).                                          |
+| `key`                   | `str`        | ❌**      | API key (if required for model).                                                          |

roboreason-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,263 @@
+<div align="center">
+# RoboReason
+**RoboReason** is a python package that makes it easy to apply any ***reward model*** or ***video-language reasoning model*** to your robot videos.
+</div>
+## Supported Models
+- Robometer (https://robometer.github.io)
+- TOPReward (https://topreward.github.io/webpage/)
+- RoboReward (https://arxiv.org/abs/2601.00675)
+- SOLE-R1 (https://philipmit.github.io/sole-r1/)
+- OpenAI models (e.g., `"gpt-5"`)
+- Google models (e.g., `"gemini-3-pro-preview"`)
+## ToDos
+- [ ] Enable fine-tuning of reward models on custom datasets
+## 📦 File Structure
+```
+roboreason/
+├── roboreason/         # Main package
+│   ├── robometer/         # Robometer code
+│   ├── sole.py            # SOLE-R1 code
+│   ├── roboreward.py      # RoboReward code
+│   ├── topreward.py       # TOPReward code
+│   └── api_models.py      # OpenAI and Gemini APIs
+├── test_videos/        # Example videos to test
+├── model_outputs/      # Videos showing model outputs
+└── pyproject.toml      # Dependencies (uv)
+```
+## Install
+### Option 1: quick pip install
+```bash
+pip install -U roboreason
+```
+### Option 2: use [uv](https://github.com/astral-sh/uv) for dependency management
+#### 1. Clone the repository:
+```bash
+git clone https://github.com/philipmit/roboreason
+```
+#### 2. Install `uv`
+```bash
+pip install uv
+```
+#### 3. Sync environment
+```bash
+uv sync
+```
+#### 4. Activate environment
+```bash
+source .venv/bin/activate
+```
+---
+## Download model checkpoints
+```bash
+# SOLE-R1 (8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('sole')"
+# Robometer (4B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('robometer')"
+# TOPReward (based on Qwen3-VL-8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('topreward')"
+# RoboReward (8B)
+python -c "from roboreason.utils.model_utils import get_model_dir; get_model_dir('roboreward')"
+```
+---
+## Quick start: Example reward generation and plotting
+```python
+# pip install -U roboreason
+import roboreason as rr
+video_paths = ['../test_videos/robosuite/robosuite_lift_example_00.mp4']
+task_description="Pick up the cube from the table."
+# Robometer
+rewards, success_probs = rr.generate(model="robometer",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external'])
+output_robometer = {"model": "robometer", "rewards": rewards[0]}
+# SOLE-R1
+rewards, reasoning_traces = rr.generate(model="sole-r1",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external and wrist'])
+output_sole = {"model": "sole-r1", "rewards": rewards[0], "reasoning_traces": reasoning_traces[0]}
+rr.video_plot(outputs=[output_sole, output_robometer], plot_save_path='../model_outputs/combined/robosuite_lift_example_00.mp4', video_path = video_paths[0])
+```
+---
+## Examples for generating across all models
+### Robometer
+```python
+import roboreason as rr
+rewards, success_probs = rr.generate(
+    model="robometer",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### SOLE-R1
+```python
+import roboreason as rr
+rewards, reasoning_traces = rr.generate(
+    model="sole-r1",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external and wrist']
+)
+```
+### TOPReward
+```python
+import roboreason as rr
+rewards = rr.generate(
+    model="topreward",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### RoboReward
+```python
+import roboreason as rr
+rewards = rr.generate(
+    model="roboreward",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external']
+)
+```
+### GPT-5 (and other OpenAI models)
+```python
+import roboreason as rr
+# requires OpenAI API key: https://developers.openai.com/api/docs/quickstart
+API_KEY = "..."
+rewards, reasoning_traces = rr.generate(
+    model="gpt-5",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external'],
+    key=API_KEY
+)
+```
+### Gemini-3-Pro (and other Google models)
+```python
+import roboreason as rr
+# requires Gemini API key: https://ai.google.dev/gemini-api/docs/api-key
+API_KEY = "..."
+rewards, reasoning_traces = rr.generate(
+    model="gemini-3-pro-preview",
+    task_description="Pick up the cube from the table.",
+    video_paths=['../test_videos/robosuite/robosuite_lift_example_00.mp4'],
+    view_type_per_video=['external'],
+    key=API_KEY
+)
+```
+## Video plotting
+```python
+import roboreason as rr
+# Robometer
+rewards, success_probs = rr.generate(model="robometer",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external'])
+output_robometer = {"model": "robometer", "rewards": rewards[0]}
+# SOLE-R1
+rewards, reasoning_traces = rr.generate(model="sole-r1",  task_description=task_description, video_paths=video_paths, view_type_per_video=['external and wrist'])
+output_sole = {"model": "sole-r1", "rewards": rewards[0], "reasoning_traces": reasoning_traces[0]}
+rr.video_plot(
+    outputs=[output_sole, output_robometer],
+    plot_save_path='../model_outputs/combined/robosuite_lift_example_00.mp4',
+    video_path = '../test_videos/robosuite/robosuite_lift_example_00.mp4'
+)
+```
+---
+## rr.generate
+| Argument              | Type        | Required | Description                                                                                                                                    |
+| --------------------- | ----------- | -------- | ---------------------------------------------------------------------------------------------------------------------------------------------- |
+| `model`               | `str`       | ✅        | Name of the model to use. Options include: `"robometer"`, `"sole-r1"`, `"topreward"`, `"roboreward"`, OpenAI models (e.g.`"gpt-5"`), Google models (e.g., `"gemini-3-pro-preview"`) |
+| `task_description`    | `str`       | ✅        | Natural language description of the task the robot is performing.                                                                              |
+| `video_paths`         | `List[str]` | ✅        | List of paths to input video files.                                                                                                            |
+| `view_type_per_video` | `List[str]` | ✅        | List specifying the camera view(s) used for reward reasoning for each video (e.g., `"external"`, `"wrist"`, or `"external and wrist"`).                                  |
+| `key`                 | `str`       | ❌        | API key required for external models (e.g., OpenAI or Gemini). Not needed for local models.                                                    |
+| Model Type             | Return Values               |
+| ---------------------- | --------------------------- |
+| SOLE-R1 / GPT / Gemini | `rewards, reasoning_traces` |
+| Robometer              | `rewards, success_probs`    |
+| TOPReward / RoboReward | `rewards`                   |
+## rr.video_plot
+| Argument                | Type         | Required | Description                                                                               |
+| ----------------------- | ------------ | -------- | ----------------------------------------------------------------------------------------- |
+| `outputs`               | `List[dict]` | ❌*       | List of model outputs (e.g., from `rr.generate`) to visualize together.                   |
+| `plot_save_path`        | `str`        | ❌        | Path where the output video with overlays will be saved.                                  |
+| `video_path`            | `str`        | ❌        | Path to the original video file being visualized.                                         |
+| `view_type`             | `str`        | ❌        | View type used for visualization (e.g., `"external"`, `"wrist"`, `"external and wrist"`). |
+| `show_reasoning_traces` | `bool`       | ❌        | Whether to overlay reasoning traces on the video. Default: `False`.                       |
+| `show_all_frames`       | `bool`       | ❌        | Whether to render all frames instead of sampled frames. Default: `False`.                 |
+| `model`                 | `str`        | ❌**      | Model name (used when calling `video_plot` directly instead of passing `outputs`).        |
+| `task_description`      | `str`        | ❌**      | Task description (used in direct-call mode).                                              |
+| `video_paths`           | `List[str]`  | ❌**      | Input videos (used in direct-call mode).                                                  |
+| `view_type_per_video`   | `List[str]`  | ❌**      | View types per video (used in direct-call mode).                                          |
+| `key`                   | `str`        | ❌**      | API key (if required for model).                                                          |

roboreason-0.1.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,81 @@
+[build-system]
+requires = ["setuptools>=61"]
+build-backend = "setuptools.build_meta"
+[project]
+name = "roboreason"
+version = "0.1.0"
+description = "Roboreason package"
+readme = "README.md"
+requires-python = ">=3.8"
+authors = [
+    { name = "Philip" }
+]
+dependencies = [
+    # Core ML stack
+    "transformers==4.57.3",
+    "vllm==0.12.0",
+    "wandb>=0.19.1",
+    "pillow",
+    "accelerate>=1.2.1",
+    "qwen_vl_utils",
+    "datasets>=3.2.0",
+    "trl",
+    "imageio",
+    "matplotlib",
+    "av>=16.0.0",
+    # General utilities
+    "openai",
+    "google-genai",
+]
+# Optional dependency groups
+[project.optional-dependencies]
+robometer = [
+    "omegaconf>=2.3.0",
+    "hydra-core",
+    "tensorboard",
+    "peft",
+    "codetiming>=1.4.0",
+    "unsloth>=2025.10",
+    "sentence-transformers>=2.0.0",
+    "decord>=0.6.0",
+]
+lerobot = [
+    "lerobot",
+]
+all = [
+    "omegaconf>=2.3.0",
+    "hydra-core",
+    "tensorboard",
+    "peft",
+    "codetiming>=1.4.0",
+    "unsloth>=2025.10",
+    "sentence-transformers>=2.0.0",
+    "decord>=0.6.0",
+    "lerobot",
+]
+# -------------------------
+# setuptools config
+# -------------------------
+[tool.setuptools.packages.find]
+where = ["."]
+include = ["roboreason*"]
+# -------------------------
+# UV-specific config
+# -------------------------
+[tool.uv]
+# This allows PyTorch CUDA wheels
+extra-index-url = [
+    "https://download.pytorch.org/whl/cu116"
+]

roboreason-0.1.0/roboreason/__init__.py ADDED Viewed

@@ -0,0 +1,8 @@
+from .core import *
+from .api_models import *
+from .roboreward import *
+from .sole import *
+from .topreward import *
+__all__ = []