rlinf 0.2.0.dev1__tar.gz → 0.2.0.dev2__tar.gz
This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- {rlinf-0.2.0.dev1/rlinf.egg-info → rlinf-0.2.0.dev2}/PKG-INFO +23 -26
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/README.md +3 -3
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/pyproject.toml +26 -23
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/__init__.py +7 -2
- rlinf-0.2.0.dev2/rlinf/envs/maniskill/maniskill_offload_env.py +449 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/utils.py +30 -5
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/utils.py +24 -1
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/world_model_opensora_env.py +116 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/base_policy.py +25 -2
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/cnn_policy/cnn_policy.py +185 -22
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/mlp_policy/mlp_policy.py +132 -17
- rlinf-0.2.0.dev2/rlinf/utils/cuda_graph.py +274 -0
- rlinf-0.2.0.dev2/rlinf/utils/pytree.py +60 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/fsdp_actor_worker.py +1 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/env_worker.py +9 -5
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/huggingface_worker.py +24 -3
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/sft/fsdp_sft_worker.py +7 -3
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2/rlinf.egg-info}/PKG-INFO +23 -26
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/SOURCES.txt +3 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/requires.txt +13 -24
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/LICENSE +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/fake_tool_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/mcp_agent_loop.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/mcp_filesystem_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/tool_agent_loop.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/search_tool_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/searchr1_agent_loop.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/advantages.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/losses.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/registry.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/code_verifier/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/code_verifier/verify.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/parser.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/verify.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/searchr1/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/format_rewards.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/qa_rewards.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/config.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/item.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/math.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/vlm.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/world_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/embodied_io_struct.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/io_struct.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/replay_buffer.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tokenizers.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tool_call/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tool_call/tool_io_struct.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/action_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/behavior/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/behavior/behavior_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/calvin_gym_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/frankasim/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/frankasim/frankasim_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/config/vlnce_r2r.yaml +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/maps.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/habitat_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/isaaclab_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/tasks/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/tasks/stack_cube.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/libero_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/maniskill_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/put_carrot_on_plate.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/put_on_in_scene_multi.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_carrot.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_ee_pose.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_image.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_instruct.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_multi_carrot.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_multi_plate.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_plate.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_position.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_position_change.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_single.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_image.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_texture.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_whole.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/metaworld_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/camera/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/camera/camera.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/keyboard/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/keyboard/keyboard_listener.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/ros/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/ros/ros_controller.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/spacemouse/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/spacemouse/spacemouse_expert.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/video_player/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/video_player/video_player.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/euler_obs.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/gripper_close.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/relative_frame.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/reward_done_wrapper.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/spacemouse_intervention.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_controller.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_robot_state.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/bottle.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/franka_bin_relocation.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/peg_insertion_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/realworld_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/robocasa_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robotwin/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robotwin/robotwin_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/venv/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/venv/venv.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/base_world_env.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/wrappers/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/wrappers/record_video.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/fsdp_model_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/base.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/checkpoint.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/fsdp.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/fsdp2.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/megatron_model_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/detokenizer_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/io_struct.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/sgl_engine.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/sgl_scheduler.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/tokenizer_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/executor.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/weight_loader.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/cnn_policy/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/dexbotic_pi/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/dexbotic_pi/dexbotic_pi_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/flow_policy/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/flow_policy/flow_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/embodiment_tags.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/gr00t_action_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/modality_config.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/simulation_io.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/mlp_policy/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/batch_renorm.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/entropy_tunning.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/explore_noise_net.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/flow_actor.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/mlp.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/q_head.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/resnet_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/value_head.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/behavior_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/calvin_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/franka_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/gsenv_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/libero_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/maniskill_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/metaworld_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/robocasa_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/robotwin_aloha_dataconfig.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/openpi_action_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/aloha_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/behavior_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/calvin_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/franka_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/gsenv_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/libero_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/maniskill_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/metaworld_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/robocasa_policy.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla/openvla_action_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/official/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/official/openvla_oft_action_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/openvla_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/rlinf/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/rlinf/openvla_oft_action_model.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/prismatic/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/prismatic/processing_prismatic.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/agent_eval_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/agent_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/async_embodied_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/coding_online_rl_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/embodied_eval_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/embodied_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/reasoning_eval_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/reasoning_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/sft_runner.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/channel.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/channel_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/cluster.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/config.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/node.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/async_work.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/collective.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/collective_group.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/multi_channel_pg.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/scheduler_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/accelerator.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/amd_gpu.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/ascend_npu.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/intel_gpu.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/musa_gpu.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/nvidia_gpu.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/hardware.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/robots/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/robots/franka.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/coll_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/lock_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/node_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/worker_manager.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/flexible.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/node.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/packed.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/placement.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/lock.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/worker_group.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/convert_openpi_jax_to_python.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/config/fsdp_model_convertor.yaml +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/convert_dcp_to_pt.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/convert_pt_to_hf.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/config.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_hf_to_mg.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_hf_to_middle_file.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_mg_to_middle_file.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_middle_file_to_hf.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_middle_file_to_mg.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/default_args.yaml +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/fp8_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mg_loader.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mg_moe_groupgemm.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mp_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/safetensors_loader.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/tensor_operations.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/convertor/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/convertor/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/data_iter_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/data_process.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/distributed.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/drq.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/flops.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/initialize.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/logging.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/metric_logger.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/metric_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/nested_dict_process.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/omega_resolver.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/patcher.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/placement.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/profiler.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/mcore_weight_reshard.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/reshard_config.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/runner_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/timers.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/torch_functionals.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/train_utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/async_fsdp_sac_policy_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/fsdp_sac_policy_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/megatron_actor_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/agent_loop.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/tool_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/async_env_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/fsdp_inference_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/megatron_inference_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/reward/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/reward/reward_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/async_huggingface_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/online_router_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/server_rollout_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/sglang/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/sglang/sglang_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/utils.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/vllm/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/vllm/vllm_worker.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/sft/__init__.py +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/dependency_links.txt +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/top_level.txt +0 -0
- {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/setup.cfg +0 -0
|
@@ -1,6 +1,8 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: rlinf
|
|
3
|
-
Version: 0.2.0.dev1
|
|
3
|
+
Version: 0.2.0.dev2
|
|
4
|
+
Summary: Reinforcement Learning Infrastructure for Embodied and Agentic AI
|
|
5
|
+
Author: RLinf Contributors
|
|
4
6
|
License: Apache License
|
|
5
7
|
Version 2.0, January 2004
|
|
6
8
|
https://www.apache.org/licenses/
|
|
@@ -202,6 +204,10 @@ License: Apache License
|
|
|
202
204
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
203
205
|
See the License for the specific language governing permissions and
|
|
204
206
|
limitations under the License.
|
|
207
|
+
Project-URL: Homepage, https://github.com/RLinf/RLinf
|
|
208
|
+
Project-URL: Repository, https://github.com/RLinf/RLinf
|
|
209
|
+
Project-URL: Documentation, https://rlinf.readthedocs.io/
|
|
210
|
+
Project-URL: Bug Report, https://github.com/RLinf/RLinf/issues
|
|
205
211
|
Keywords: reinforcement-learning,embodied-intelligence,large-language-models
|
|
206
212
|
Classifier: Development Status :: 2 - Pre-Alpha
|
|
207
213
|
Classifier: Environment :: GPU :: NVIDIA CUDA :: 12 :: 12.4
|
|
@@ -212,10 +218,10 @@ Requires-Python: <=3.11.14,>=3.10
|
|
|
212
218
|
Description-Content-Type: text/markdown
|
|
213
219
|
License-File: LICENSE
|
|
214
220
|
Requires-Dist: ray[default]>=2.47.0
|
|
215
|
-
Requires-Dist: torch
|
|
221
|
+
Requires-Dist: torch<=2.9.0,>=2.5.0
|
|
216
222
|
Requires-Dist: hydra-core
|
|
217
223
|
Requires-Dist: numpy
|
|
218
|
-
Requires-Dist: datasets
|
|
224
|
+
Requires-Dist: datasets
|
|
219
225
|
Requires-Dist: torchdata
|
|
220
226
|
Requires-Dist: scipy
|
|
221
227
|
Requires-Dist: accelerate
|
|
@@ -223,7 +229,7 @@ Requires-Dist: debugpy
|
|
|
223
229
|
Requires-Dist: einops
|
|
224
230
|
Requires-Dist: nvitop
|
|
225
231
|
Requires-Dist: pybind11
|
|
226
|
-
Requires-Dist: setuptools
|
|
232
|
+
Requires-Dist: setuptools
|
|
227
233
|
Requires-Dist: ninja
|
|
228
234
|
Requires-Dist: pytest
|
|
229
235
|
Requires-Dist: gsutil
|
|
@@ -241,44 +247,35 @@ Requires-Dist: tensorboard
|
|
|
241
247
|
Provides-Extra: agentic-sglang
|
|
242
248
|
Requires-Dist: sglang[all]==0.4.6.post5; extra == "agentic-sglang"
|
|
243
249
|
Requires-Dist: torch-memory-saver; extra == "agentic-sglang"
|
|
250
|
+
Requires-Dist: numpy==2.2; extra == "agentic-sglang"
|
|
244
251
|
Requires-Dist: transformers==4.51.1; extra == "agentic-sglang"
|
|
245
252
|
Requires-Dist: uvloop==0.21.0; extra == "agentic-sglang"
|
|
246
253
|
Requires-Dist: hydra-core==1.4.0.dev1; extra == "agentic-sglang"
|
|
254
|
+
Requires-Dist: omegaconf==2.4.0.dev4; extra == "agentic-sglang"
|
|
247
255
|
Requires-Dist: word2number; extra == "agentic-sglang"
|
|
248
256
|
Requires-Dist: regex; extra == "agentic-sglang"
|
|
249
257
|
Requires-Dist: peft==0.11.1; extra == "agentic-sglang"
|
|
250
258
|
Requires-Dist: rlinf_latex2sympy2; extra == "agentic-sglang"
|
|
259
|
+
Requires-Dist: mcp; extra == "agentic-sglang"
|
|
251
260
|
Provides-Extra: agentic-vllm
|
|
252
261
|
Requires-Dist: vllm==0.8.5; extra == "agentic-vllm"
|
|
262
|
+
Requires-Dist: numpy==2.2; extra == "agentic-vllm"
|
|
253
263
|
Requires-Dist: transformers==4.51.1; extra == "agentic-vllm"
|
|
254
264
|
Requires-Dist: uvloop==0.21.0; extra == "agentic-vllm"
|
|
255
265
|
Requires-Dist: hydra-core==1.4.0.dev1; extra == "agentic-vllm"
|
|
266
|
+
Requires-Dist: omegaconf==2.4.0.dev4; extra == "agentic-vllm"
|
|
256
267
|
Requires-Dist: word2number; extra == "agentic-vllm"
|
|
257
268
|
Requires-Dist: regex; extra == "agentic-vllm"
|
|
258
269
|
Requires-Dist: peft==0.11.1; extra == "agentic-vllm"
|
|
259
270
|
Requires-Dist: rlinf_latex2sympy2; extra == "agentic-vllm"
|
|
271
|
+
Requires-Dist: mcp; extra == "agentic-vllm"
|
|
260
272
|
Provides-Extra: embodied
|
|
261
|
-
Requires-Dist: transformers
|
|
262
|
-
Requires-Dist:
|
|
263
|
-
Requires-Dist:
|
|
264
|
-
Requires-Dist: tensorflow; extra == "embodied"
|
|
265
|
-
Requires-Dist: tensorflow_graphics; extra == "embodied"
|
|
266
|
-
Requires-Dist: peft==0.11.1; extra == "embodied"
|
|
267
|
-
Requires-Dist: timm==0.9.10; extra == "embodied"
|
|
268
|
-
Requires-Dist: sapien==3.0.1; platform_system == "Linux" and extra == "embodied"
|
|
269
|
-
Requires-Dist: tensordict; extra == "embodied"
|
|
273
|
+
Requires-Dist: transformers<=4.57.6; extra == "embodied"
|
|
274
|
+
Requires-Dist: peft; extra == "embodied"
|
|
275
|
+
Requires-Dist: timm; extra == "embodied"
|
|
270
276
|
Requires-Dist: imageio[ffmpeg]; extra == "embodied"
|
|
271
|
-
Requires-Dist: robosuite==1.4.1; extra == "embodied"
|
|
272
|
-
Requires-Dist: bddl; extra == "embodied"
|
|
273
|
-
Requires-Dist: easydict; extra == "embodied"
|
|
274
|
-
Requires-Dist: cloudpickle; extra == "embodied"
|
|
275
|
-
Requires-Dist: gym; extra == "embodied"
|
|
276
277
|
Requires-Dist: gymnasium; extra == "embodied"
|
|
277
|
-
Requires-Dist:
|
|
278
|
-
Requires-Dist: open3d; extra == "embodied"
|
|
279
|
-
Requires-Dist: zarr; extra == "embodied"
|
|
280
|
-
Requires-Dist: openai; extra == "embodied"
|
|
281
|
-
Requires-Dist: jax; extra == "embodied"
|
|
278
|
+
Requires-Dist: gym; extra == "embodied"
|
|
282
279
|
Provides-Extra: franka
|
|
283
280
|
Requires-Dist: pyyaml; extra == "franka"
|
|
284
281
|
Requires-Dist: rospkg; extra == "franka"
|
|
@@ -294,7 +291,7 @@ Requires-Dist: pynput; extra == "franka"
|
|
|
294
291
|
Dynamic: license-file
|
|
295
292
|
|
|
296
293
|
<div align="center">
|
|
297
|
-
<img src="
|
|
294
|
+
<img src="https://github.com/RLinf/misc/raw/main/pic/logo_white.svg" alt="RLinf-logo" width="600"/>
|
|
298
295
|
</div>
|
|
299
296
|
|
|
300
297
|
<div align="center">
|
|
@@ -320,7 +317,7 @@ Dynamic: license-file
|
|
|
320
317
|
RLinf is a flexible and scalable open-source RL infrastructure designed for Embodied and Agentic AI. The 'inf' in RLinf stands for `Infrastructure`, highlighting its role as a robust backbone for next-generation training. It also stands for `Infinite`, symbolizing the system’s support for open-ended learning, continuous generalization, and limitless possibilities in intelligence development.
|
|
321
318
|
|
|
322
319
|
<div align="center">
|
|
323
|
-
<img src="
|
|
320
|
+
<img src="https://github.com/RLinf/misc/raw/main/pic/overview.svg" alt="RLinf-overview"/>
|
|
324
321
|
</div>
|
|
325
322
|
|
|
326
323
|
|
|
@@ -417,7 +414,7 @@ Multiple Backend Integrations
|
|
|
417
414
|
</ul>
|
|
418
415
|
<li><b>Custom Models</b></li>
|
|
419
416
|
<ul>
|
|
420
|
-
<li><a href="https://
|
|
417
|
+
<li><a href="https://rlinf.readthedocs.io/en/latest/rst_source/examples/embodied/mlp.html">MLP-Policy</a> ✅</li>
|
|
421
418
|
<li>CNN-Policy ✅</li>
|
|
422
419
|
</ul>
|
|
423
420
|
</ul>
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
<div align="center">
|
|
2
|
-
<img src="
|
|
2
|
+
<img src="https://github.com/RLinf/misc/raw/main/pic/logo_white.svg" alt="RLinf-logo" width="600"/>
|
|
3
3
|
</div>
|
|
4
4
|
|
|
5
5
|
<div align="center">
|
|
@@ -25,7 +25,7 @@
|
|
|
25
25
|
RLinf is a flexible and scalable open-source RL infrastructure designed for Embodied and Agentic AI. The 'inf' in RLinf stands for `Infrastructure`, highlighting its role as a robust backbone for next-generation training. It also stands for `Infinite`, symbolizing the system’s support for open-ended learning, continuous generalization, and limitless possibilities in intelligence development.
|
|
26
26
|
|
|
27
27
|
<div align="center">
|
|
28
|
-
<img src="
|
|
28
|
+
<img src="https://github.com/RLinf/misc/raw/main/pic/overview.svg" alt="RLinf-overview"/>
|
|
29
29
|
</div>
|
|
30
30
|
|
|
31
31
|
|
|
@@ -122,7 +122,7 @@ Multiple Backend Integrations
|
|
|
122
122
|
</ul>
|
|
123
123
|
<li><b>Custom Models</b></li>
|
|
124
124
|
<ul>
|
|
125
|
-
<li><a href="https://
|
|
125
|
+
<li><a href="https://rlinf.readthedocs.io/en/latest/rst_source/examples/embodied/mlp.html">MLP-Policy</a> ✅</li>
|
|
126
126
|
<li>CNN-Policy ✅</li>
|
|
127
127
|
</ul>
|
|
128
128
|
</ul>
|
|
@@ -4,7 +4,9 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "rlinf"
|
|
7
|
-
version = "0.2.0.dev1"
|
|
7
|
+
version = "0.2.0.dev2"
|
|
8
|
+
authors = [{ name = "RLinf Contributors" }]
|
|
9
|
+
description = "Reinforcement Learning Infrastructure for Embodied and Agentic AI"
|
|
8
10
|
readme = {file = "README.md", content-type = "text/markdown"}
|
|
9
11
|
requires-python = ">=3.10,<=3.11.14"
|
|
10
12
|
license = {file = "LICENSE"}
|
|
@@ -25,16 +27,17 @@ classifiers = [
|
|
|
25
27
|
"Programming Language :: Python :: 3.11",
|
|
26
28
|
]
|
|
27
29
|
|
|
30
|
+
|
|
28
31
|
dependencies = [
|
|
29
32
|
# Core System
|
|
30
33
|
# These are the dependencies of the core scheduler
|
|
31
34
|
"ray[default]>=2.47.0",
|
|
32
|
-
"torch
|
|
35
|
+
"torch>=2.5.0,<=2.9.0",
|
|
33
36
|
"hydra-core",
|
|
34
37
|
"numpy",
|
|
35
38
|
|
|
36
39
|
# Data processing
|
|
37
|
-
"datasets
|
|
40
|
+
"datasets",
|
|
38
41
|
"torchdata",
|
|
39
42
|
"scipy",
|
|
40
43
|
|
|
@@ -44,7 +47,7 @@ dependencies = [
|
|
|
44
47
|
"einops",
|
|
45
48
|
"nvitop",
|
|
46
49
|
"pybind11",
|
|
47
|
-
"setuptools
|
|
50
|
+
"setuptools",
|
|
48
51
|
"ninja",
|
|
49
52
|
"pytest",
|
|
50
53
|
"gsutil",
|
|
@@ -63,52 +66,49 @@ dependencies = [
|
|
|
63
66
|
"tensorboard",
|
|
64
67
|
]
|
|
65
68
|
|
|
69
|
+
[project.urls]
|
|
70
|
+
Homepage = "https://github.com/RLinf/RLinf"
|
|
71
|
+
Repository = "https://github.com/RLinf/RLinf"
|
|
72
|
+
Documentation = "https://rlinf.readthedocs.io/"
|
|
73
|
+
"Bug Report" = "https://github.com/RLinf/RLinf/issues"
|
|
74
|
+
|
|
66
75
|
[project.optional-dependencies]
|
|
67
76
|
agentic-sglang = [
|
|
68
77
|
"sglang[all]==0.4.6.post5",
|
|
69
78
|
"torch-memory-saver",
|
|
79
|
+
"numpy==2.2",
|
|
70
80
|
"transformers==4.51.1",
|
|
71
81
|
# uvloop is not compatible with simulators, put it here
|
|
72
82
|
"uvloop==0.21.0",
|
|
73
83
|
"hydra-core==1.4.0.dev1",
|
|
84
|
+
"omegaconf==2.4.0.dev4",
|
|
74
85
|
"word2number",
|
|
75
86
|
"regex",
|
|
76
87
|
"peft==0.11.1",
|
|
77
88
|
"rlinf_latex2sympy2",
|
|
89
|
+
"mcp",
|
|
78
90
|
]
|
|
79
91
|
agentic-vllm = [
|
|
80
92
|
"vllm==0.8.5",
|
|
93
|
+
"numpy==2.2",
|
|
81
94
|
"transformers==4.51.1",
|
|
82
95
|
# uvloop is not compatible with simulators, put it here
|
|
83
96
|
"uvloop==0.21.0",
|
|
84
97
|
"hydra-core==1.4.0.dev1",
|
|
98
|
+
"omegaconf==2.4.0.dev4",
|
|
85
99
|
"word2number",
|
|
86
100
|
"regex",
|
|
87
101
|
"peft==0.11.1",
|
|
88
102
|
"rlinf_latex2sympy2",
|
|
103
|
+
"mcp",
|
|
89
104
|
]
|
|
90
105
|
embodied = [
|
|
91
|
-
"transformers
|
|
92
|
-
"
|
|
93
|
-
"
|
|
94
|
-
"tensorflow",
|
|
95
|
-
"tensorflow_graphics",
|
|
96
|
-
"peft==0.11.1",
|
|
97
|
-
"timm==0.9.10",
|
|
98
|
-
"sapien==3.0.1;platform_system=='Linux'",
|
|
99
|
-
"tensordict",
|
|
106
|
+
"transformers<=4.57.6",
|
|
107
|
+
"peft",
|
|
108
|
+
"timm",
|
|
100
109
|
"imageio[ffmpeg]",
|
|
101
|
-
"robosuite==1.4.1",
|
|
102
|
-
"bddl",
|
|
103
|
-
"easydict",
|
|
104
|
-
"cloudpickle",
|
|
105
|
-
"gym",
|
|
106
110
|
"gymnasium",
|
|
107
|
-
"
|
|
108
|
-
"open3d",
|
|
109
|
-
"zarr",
|
|
110
|
-
"openai",
|
|
111
|
-
"jax",
|
|
111
|
+
"gym",
|
|
112
112
|
]
|
|
113
113
|
franka = [
|
|
114
114
|
"pyyaml",
|
|
@@ -142,6 +142,9 @@ override-dependencies = [
|
|
|
142
142
|
"xgrammar==0.1.19",
|
|
143
143
|
"uvloop==0.21.0",
|
|
144
144
|
"tensorflow-addons==0.23.0",
|
|
145
|
+
"setuptools>=69.5.1,<75.9",
|
|
146
|
+
"datasets==3.6.0",
|
|
147
|
+
"peft==0.11.1",
|
|
145
148
|
]
|
|
146
149
|
|
|
147
150
|
[tool.setuptools]
|
|
@@ -45,9 +45,14 @@ def get_env_cls(env_type: str, env_cfg=None):
|
|
|
45
45
|
env_type = SupportedEnvType(env_type)
|
|
46
46
|
|
|
47
47
|
if env_type == SupportedEnvType.MANISKILL:
|
|
48
|
-
|
|
48
|
+
if env_cfg.get("enable_offload", False):
|
|
49
|
+
from rlinf.envs.maniskill.maniskill_offload_env import ManiskillOffloadEnv
|
|
49
50
|
|
|
50
|
-
|
|
51
|
+
return ManiskillOffloadEnv
|
|
52
|
+
else:
|
|
53
|
+
from rlinf.envs.maniskill.maniskill_env import ManiskillEnv
|
|
54
|
+
|
|
55
|
+
return ManiskillEnv
|
|
51
56
|
elif env_type == SupportedEnvType.LIBERO:
|
|
52
57
|
from rlinf.envs.libero.libero_env import LiberoEnv
|
|
53
58
|
|