rlinf 0.2.0.dev1__tar.gz → 0.2.0.dev2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (364)
  1. {rlinf-0.2.0.dev1/rlinf.egg-info → rlinf-0.2.0.dev2}/PKG-INFO +23 -26
  2. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/README.md +3 -3
  3. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/pyproject.toml +26 -23
  4. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/__init__.py +7 -2
  5. rlinf-0.2.0.dev2/rlinf/envs/maniskill/maniskill_offload_env.py +449 -0
  6. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/utils.py +30 -5
  7. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/utils.py +24 -1
  8. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/world_model_opensora_env.py +116 -0
  9. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/base_policy.py +25 -2
  10. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/cnn_policy/cnn_policy.py +185 -22
  11. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/mlp_policy/mlp_policy.py +132 -17
  12. rlinf-0.2.0.dev2/rlinf/utils/cuda_graph.py +274 -0
  13. rlinf-0.2.0.dev2/rlinf/utils/pytree.py +60 -0
  14. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/fsdp_actor_worker.py +1 -0
  15. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/env_worker.py +9 -5
  16. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/huggingface_worker.py +24 -3
  17. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/sft/fsdp_sft_worker.py +7 -3
  18. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2/rlinf.egg-info}/PKG-INFO +23 -26
  19. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/SOURCES.txt +3 -0
  20. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/requires.txt +13 -24
  21. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/LICENSE +0 -0
  22. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/__init__.py +0 -0
  23. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/__init__.py +0 -0
  24. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/__init__.py +0 -0
  25. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/fake_tool_worker.py +0 -0
  26. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/mcp_agent_loop.py +0 -0
  27. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/mcp_filesystem_worker.py +0 -0
  28. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/multiturn_demo/tool_agent_loop.py +0 -0
  29. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/__init__.py +0 -0
  30. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/search_tool_worker.py +0 -0
  31. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/agents/searchr1/searchr1_agent_loop.py +0 -0
  32. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/__init__.py +0 -0
  33. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/advantages.py +0 -0
  34. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/losses.py +0 -0
  35. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/registry.py +0 -0
  36. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/__init__.py +0 -0
  37. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/__init__.py +0 -0
  38. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/code_verifier/__init__.py +0 -0
  39. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/code/code_verifier/verify.py +0 -0
  40. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/__init__.py +0 -0
  41. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/__init__.py +0 -0
  42. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/parser.py +0 -0
  43. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/math/math_verifier/verify.py +0 -0
  44. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/searchr1/__init__.py +0 -0
  45. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/__init__.py +0 -0
  46. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/format_rewards.py +0 -0
  47. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/rewards/vqa/qa_rewards.py +0 -0
  48. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/algorithms/utils.py +0 -0
  49. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/config.py +0 -0
  50. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/__init__.py +0 -0
  51. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/__init__.py +0 -0
  52. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/item.py +0 -0
  53. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/math.py +0 -0
  54. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/vlm.py +0 -0
  55. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/datasets/world_model.py +0 -0
  56. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/embodied_io_struct.py +0 -0
  57. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/io_struct.py +0 -0
  58. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/replay_buffer.py +0 -0
  59. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tokenizers.py +0 -0
  60. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tool_call/__init__.py +0 -0
  61. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/tool_call/tool_io_struct.py +0 -0
  62. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/data/utils.py +0 -0
  63. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/action_utils.py +0 -0
  64. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/behavior/__init__.py +0 -0
  65. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/behavior/behavior_env.py +0 -0
  66. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/__init__.py +0 -0
  67. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/calvin_gym_env.py +0 -0
  68. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/utils.py +0 -0
  69. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/calvin/venv.py +0 -0
  70. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/frankasim/__init__.py +0 -0
  71. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/frankasim/frankasim_env.py +0 -0
  72. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/__init__.py +0 -0
  73. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/__init__.py +0 -0
  74. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/config/vlnce_r2r.yaml +0 -0
  75. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/maps.py +0 -0
  76. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/extensions/utils.py +0 -0
  77. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/habitat_env.py +0 -0
  78. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/habitat/venv.py +0 -0
  79. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/__init__.py +0 -0
  80. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/isaaclab_env.py +0 -0
  81. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/tasks/__init__.py +0 -0
  82. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/tasks/stack_cube.py +0 -0
  83. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/utils.py +0 -0
  84. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/isaaclab/venv.py +0 -0
  85. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/__init__.py +0 -0
  86. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/libero_env.py +0 -0
  87. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/utils.py +0 -0
  88. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/libero/venv.py +0 -0
  89. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/__init__.py +0 -0
  90. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/maniskill_env.py +0 -0
  91. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/__init__.py +0 -0
  92. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/put_carrot_on_plate.py +0 -0
  93. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/put_on_in_scene_multi.py +0 -0
  94. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/__init__.py +0 -0
  95. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_carrot.py +0 -0
  96. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_ee_pose.py +0 -0
  97. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_image.py +0 -0
  98. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_instruct.py +0 -0
  99. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_multi_carrot.py +0 -0
  100. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_multi_plate.py +0 -0
  101. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_plate.py +0 -0
  102. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_position.py +0 -0
  103. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_position_change.py +0 -0
  104. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_single.py +0 -0
  105. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_image.py +0 -0
  106. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_texture.py +0 -0
  107. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/put_on_plate_25_vision_whole.py +0 -0
  108. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/maniskill/tasks/variants/utils.py +0 -0
  109. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/__init__.py +0 -0
  110. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/metaworld_env.py +0 -0
  111. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/utils.py +0 -0
  112. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/metaworld/venv.py +0 -0
  113. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/__init__.py +0 -0
  114. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/camera/__init__.py +0 -0
  115. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/camera/camera.py +0 -0
  116. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/keyboard/__init__.py +0 -0
  117. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/keyboard/keyboard_listener.py +0 -0
  118. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/ros/__init__.py +0 -0
  119. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/ros/ros_controller.py +0 -0
  120. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/spacemouse/__init__.py +0 -0
  121. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/spacemouse/spacemouse_expert.py +0 -0
  122. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/video_player/__init__.py +0 -0
  123. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/video_player/video_player.py +0 -0
  124. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/__init__.py +0 -0
  125. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/euler_obs.py +0 -0
  126. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/gripper_close.py +0 -0
  127. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/relative_frame.py +0 -0
  128. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/reward_done_wrapper.py +0 -0
  129. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/common/wrappers/spacemouse_intervention.py +0 -0
  130. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/__init__.py +0 -0
  131. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_controller.py +0 -0
  132. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_env.py +0 -0
  133. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/franka_robot_state.py +0 -0
  134. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/__init__.py +0 -0
  135. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/bottle.py +0 -0
  136. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/franka_bin_relocation.py +0 -0
  137. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/tasks/peg_insertion_env.py +0 -0
  138. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/franka/utils.py +0 -0
  139. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/realworld_env.py +0 -0
  140. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/realworld/venv.py +0 -0
  141. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/__init__.py +0 -0
  142. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/robocasa_env.py +0 -0
  143. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/utils.py +0 -0
  144. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robocasa/venv.py +0 -0
  145. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robotwin/__init__.py +0 -0
  146. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/robotwin/robotwin_env.py +0 -0
  147. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/venv/__init__.py +0 -0
  148. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/venv/venv.py +0 -0
  149. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/__init__.py +0 -0
  150. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/world_model/base_world_env.py +0 -0
  151. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/wrappers/__init__.py +0 -0
  152. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/envs/wrappers/record_video.py +0 -0
  153. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/__init__.py +0 -0
  154. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/__init__.py +0 -0
  155. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/fsdp_model_manager.py +0 -0
  156. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/__init__.py +0 -0
  157. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/base.py +0 -0
  158. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/checkpoint.py +0 -0
  159. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/fsdp.py +0 -0
  160. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/strategy/fsdp2.py +0 -0
  161. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/fsdp/utils.py +0 -0
  162. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/__init__.py +0 -0
  163. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/megatron_model_manager.py +0 -0
  164. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/megatron/utils.py +0 -0
  165. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/__init__.py +0 -0
  166. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/detokenizer_manager.py +0 -0
  167. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/io_struct.py +0 -0
  168. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/sgl_engine.py +0 -0
  169. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/sgl_scheduler.py +0 -0
  170. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/sglang/common/tokenizer_manager.py +0 -0
  171. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/__init__.py +0 -0
  172. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/executor.py +0 -0
  173. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/weight_loader.py +0 -0
  174. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/hybrid_engines/vllm/vllm_0_8_5/worker.py +0 -0
  175. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/__init__.py +0 -0
  176. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/__init__.py +0 -0
  177. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/cnn_policy/__init__.py +0 -0
  178. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/dexbotic_pi/__init__.py +0 -0
  179. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/dexbotic_pi/dexbotic_pi_policy.py +0 -0
  180. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/flow_policy/__init__.py +0 -0
  181. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/flow_policy/flow_policy.py +0 -0
  182. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/__init__.py +0 -0
  183. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/embodiment_tags.py +0 -0
  184. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/gr00t_action_model.py +0 -0
  185. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/modality_config.py +0 -0
  186. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/simulation_io.py +0 -0
  187. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/gr00t/utils.py +0 -0
  188. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/mlp_policy/__init__.py +0 -0
  189. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/__init__.py +0 -0
  190. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/batch_renorm.py +0 -0
  191. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/entropy_tunning.py +0 -0
  192. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/explore_noise_net.py +0 -0
  193. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/flow_actor.py +0 -0
  194. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/mlp.py +0 -0
  195. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/q_head.py +0 -0
  196. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/resnet_utils.py +0 -0
  197. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/utils.py +0 -0
  198. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/modules/value_head.py +0 -0
  199. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/__init__.py +0 -0
  200. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/__init__.py +0 -0
  201. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/behavior_dataconfig.py +0 -0
  202. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/calvin_dataconfig.py +0 -0
  203. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/franka_dataconfig.py +0 -0
  204. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/gsenv_dataconfig.py +0 -0
  205. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/libero_dataconfig.py +0 -0
  206. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/maniskill_dataconfig.py +0 -0
  207. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/metaworld_dataconfig.py +0 -0
  208. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/robocasa_dataconfig.py +0 -0
  209. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/dataconfig/robotwin_aloha_dataconfig.py +0 -0
  210. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/openpi_action_model.py +0 -0
  211. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/__init__.py +0 -0
  212. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/aloha_policy.py +0 -0
  213. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/behavior_policy.py +0 -0
  214. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/calvin_policy.py +0 -0
  215. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/franka_policy.py +0 -0
  216. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/gsenv_policy.py +0 -0
  217. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/libero_policy.py +0 -0
  218. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/maniskill_policy.py +0 -0
  219. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/metaworld_policy.py +0 -0
  220. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openpi/policies/robocasa_policy.py +0 -0
  221. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla/__init__.py +0 -0
  222. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla/openvla_action_model.py +0 -0
  223. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/__init__.py +0 -0
  224. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/official/__init__.py +0 -0
  225. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/official/openvla_oft_action_model.py +0 -0
  226. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/openvla_utils.py +0 -0
  227. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/rlinf/__init__.py +0 -0
  228. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/openvla_oft/rlinf/openvla_oft_action_model.py +0 -0
  229. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/prismatic/__init__.py +0 -0
  230. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/models/embodiment/prismatic/processing_prismatic.py +0 -0
  231. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/__init__.py +0 -0
  232. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/agent_eval_runner.py +0 -0
  233. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/agent_runner.py +0 -0
  234. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/async_embodied_runner.py +0 -0
  235. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/coding_online_rl_runner.py +0 -0
  236. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/embodied_eval_runner.py +0 -0
  237. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/embodied_runner.py +0 -0
  238. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/reasoning_eval_runner.py +0 -0
  239. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/reasoning_runner.py +0 -0
  240. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/runners/sft_runner.py +0 -0
  241. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/__init__.py +0 -0
  242. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/__init__.py +0 -0
  243. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/channel.py +0 -0
  244. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/channel/channel_worker.py +0 -0
  245. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/__init__.py +0 -0
  246. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/cluster.py +0 -0
  247. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/config.py +0 -0
  248. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/node.py +0 -0
  249. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/cluster/utils.py +0 -0
  250. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/__init__.py +0 -0
  251. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/async_work.py +0 -0
  252. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/collective.py +0 -0
  253. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/collective_group.py +0 -0
  254. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/collective/multi_channel_pg.py +0 -0
  255. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/__init__.py +0 -0
  256. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/manager.py +0 -0
  257. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/scheduler_worker.py +0 -0
  258. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/dynamic_scheduler/utils.py +0 -0
  259. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/__init__.py +0 -0
  260. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/__init__.py +0 -0
  261. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/accelerator.py +0 -0
  262. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/amd_gpu.py +0 -0
  263. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/ascend_npu.py +0 -0
  264. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/intel_gpu.py +0 -0
  265. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/musa_gpu.py +0 -0
  266. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/accelerators/nvidia_gpu.py +0 -0
  267. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/hardware.py +0 -0
  268. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/robots/__init__.py +0 -0
  269. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/hardware/robots/franka.py +0 -0
  270. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/__init__.py +0 -0
  271. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/coll_manager.py +0 -0
  272. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/lock_manager.py +0 -0
  273. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/manager.py +0 -0
  274. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/node_manager.py +0 -0
  275. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/manager/worker_manager.py +0 -0
  276. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/__init__.py +0 -0
  277. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/flexible.py +0 -0
  278. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/node.py +0 -0
  279. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/packed.py +0 -0
  280. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/placement/placement.py +0 -0
  281. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/__init__.py +0 -0
  282. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/lock.py +0 -0
  283. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/worker.py +0 -0
  284. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/scheduler/worker/worker_group.py +0 -0
  285. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/__init__.py +0 -0
  286. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/__init__.py +0 -0
  287. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/convert_openpi_jax_to_python.py +0 -0
  288. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/__init__.py +0 -0
  289. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/config/fsdp_model_convertor.yaml +0 -0
  290. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/convert_dcp_to_pt.py +0 -0
  291. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/convert_pt_to_hf.py +0 -0
  292. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/fsdp_convertor/utils.py +0 -0
  293. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/__init__.py +0 -0
  294. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/config.py +0 -0
  295. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_hf_to_mg.py +0 -0
  296. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_hf_to_middle_file.py +0 -0
  297. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_mg_to_middle_file.py +0 -0
  298. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_middle_file_to_hf.py +0 -0
  299. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/convert_middle_file_to_mg.py +0 -0
  300. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/default_args.yaml +0 -0
  301. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/__init__.py +0 -0
  302. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/fp8_utils.py +0 -0
  303. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mg_loader.py +0 -0
  304. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mg_moe_groupgemm.py +0 -0
  305. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/mp_utils.py +0 -0
  306. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/safetensors_loader.py +0 -0
  307. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/ckpt_convertor/megatron_convertor/utils/tensor_operations.py +0 -0
  308. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/convertor/__init__.py +0 -0
  309. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/convertor/utils.py +0 -0
  310. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/data_iter_utils.py +0 -0
  311. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/data_process.py +0 -0
  312. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/distributed.py +0 -0
  313. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/drq.py +0 -0
  314. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/flops.py +0 -0
  315. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/initialize.py +0 -0
  316. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/logging.py +0 -0
  317. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/metric_logger.py +0 -0
  318. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/metric_utils.py +0 -0
  319. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/nested_dict_process.py +0 -0
  320. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/omega_resolver.py +0 -0
  321. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/patcher.py +0 -0
  322. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/placement.py +0 -0
  323. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/profiler.py +0 -0
  324. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/__init__.py +0 -0
  325. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/mcore_weight_reshard.py +0 -0
  326. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/reshard_config.py +0 -0
  327. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/resharding/utils.py +0 -0
  328. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/runner_utils.py +0 -0
  329. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/timers.py +0 -0
  330. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/torch_functionals.py +0 -0
  331. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/train_utils.py +0 -0
  332. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/utils/utils.py +0 -0
  333. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/__init__.py +0 -0
  334. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/__init__.py +0 -0
  335. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/async_fsdp_sac_policy_worker.py +0 -0
  336. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/fsdp_sac_policy_worker.py +0 -0
  337. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/actor/megatron_actor_worker.py +0 -0
  338. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/__init__.py +0 -0
  339. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/agent_loop.py +0 -0
  340. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/agent/tool_worker.py +0 -0
  341. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/__init__.py +0 -0
  342. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/env/async_env_worker.py +0 -0
  343. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/__init__.py +0 -0
  344. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/fsdp_inference_worker.py +0 -0
  345. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/megatron_inference_worker.py +0 -0
  346. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/inference/utils.py +0 -0
  347. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/reward/__init__.py +0 -0
  348. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/reward/reward_worker.py +0 -0
  349. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/__init__.py +0 -0
  350. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/__init__.py +0 -0
  351. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/async_huggingface_worker.py +0 -0
  352. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/hf/utils.py +0 -0
  353. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/__init__.py +0 -0
  354. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/online_router_worker.py +0 -0
  355. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/server/server_rollout_worker.py +0 -0
  356. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/sglang/__init__.py +0 -0
  357. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/sglang/sglang_worker.py +0 -0
  358. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/utils.py +0 -0
  359. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/vllm/__init__.py +0 -0
  360. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/rollout/vllm/vllm_worker.py +0 -0
  361. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf/workers/sft/__init__.py +0 -0
  362. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/dependency_links.txt +0 -0
  363. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/rlinf.egg-info/top_level.txt +0 -0
  364. {rlinf-0.2.0.dev1 → rlinf-0.2.0.dev2}/setup.cfg +0 -0
@@ -1,6 +1,8 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: rlinf
3
- Version: 0.2.0.dev1
3
+ Version: 0.2.0.dev2
4
+ Summary: Reinforcement Learning Infrastructure for Embodied and Agentic AI
5
+ Author: RLinf Contributors
4
6
  License: Apache License
5
7
  Version 2.0, January 2004
6
8
  https://www.apache.org/licenses/
@@ -202,6 +204,10 @@ License: Apache License
202
204
  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
203
205
  See the License for the specific language governing permissions and
204
206
  limitations under the License.
207
+ Project-URL: Homepage, https://github.com/RLinf/RLinf
208
+ Project-URL: Repository, https://github.com/RLinf/RLinf
209
+ Project-URL: Documentation, https://rlinf.readthedocs.io/
210
+ Project-URL: Bug Report, https://github.com/RLinf/RLinf/issues
205
211
  Keywords: reinforcement-learning,embodied-intelligence,large-language-models
206
212
  Classifier: Development Status :: 2 - Pre-Alpha
207
213
  Classifier: Environment :: GPU :: NVIDIA CUDA :: 12 :: 12.4
@@ -212,10 +218,10 @@ Requires-Python: <=3.11.14,>=3.10
212
218
  Description-Content-Type: text/markdown
213
219
  License-File: LICENSE
214
220
  Requires-Dist: ray[default]>=2.47.0
215
- Requires-Dist: torch==2.6.0
221
+ Requires-Dist: torch<=2.9.0,>=2.5.0
216
222
  Requires-Dist: hydra-core
217
223
  Requires-Dist: numpy
218
- Requires-Dist: datasets==3.6.0
224
+ Requires-Dist: datasets
219
225
  Requires-Dist: torchdata
220
226
  Requires-Dist: scipy
221
227
  Requires-Dist: accelerate
@@ -223,7 +229,7 @@ Requires-Dist: debugpy
223
229
  Requires-Dist: einops
224
230
  Requires-Dist: nvitop
225
231
  Requires-Dist: pybind11
226
- Requires-Dist: setuptools<75.9,>=69.5.1
232
+ Requires-Dist: setuptools
227
233
  Requires-Dist: ninja
228
234
  Requires-Dist: pytest
229
235
  Requires-Dist: gsutil
@@ -241,44 +247,35 @@ Requires-Dist: tensorboard
241
247
  Provides-Extra: agentic-sglang
242
248
  Requires-Dist: sglang[all]==0.4.6.post5; extra == "agentic-sglang"
243
249
  Requires-Dist: torch-memory-saver; extra == "agentic-sglang"
250
+ Requires-Dist: numpy==2.2; extra == "agentic-sglang"
244
251
  Requires-Dist: transformers==4.51.1; extra == "agentic-sglang"
245
252
  Requires-Dist: uvloop==0.21.0; extra == "agentic-sglang"
246
253
  Requires-Dist: hydra-core==1.4.0.dev1; extra == "agentic-sglang"
254
+ Requires-Dist: omegaconf==2.4.0.dev4; extra == "agentic-sglang"
247
255
  Requires-Dist: word2number; extra == "agentic-sglang"
248
256
  Requires-Dist: regex; extra == "agentic-sglang"
249
257
  Requires-Dist: peft==0.11.1; extra == "agentic-sglang"
250
258
  Requires-Dist: rlinf_latex2sympy2; extra == "agentic-sglang"
259
+ Requires-Dist: mcp; extra == "agentic-sglang"
251
260
  Provides-Extra: agentic-vllm
252
261
  Requires-Dist: vllm==0.8.5; extra == "agentic-vllm"
262
+ Requires-Dist: numpy==2.2; extra == "agentic-vllm"
253
263
  Requires-Dist: transformers==4.51.1; extra == "agentic-vllm"
254
264
  Requires-Dist: uvloop==0.21.0; extra == "agentic-vllm"
255
265
  Requires-Dist: hydra-core==1.4.0.dev1; extra == "agentic-vllm"
266
+ Requires-Dist: omegaconf==2.4.0.dev4; extra == "agentic-vllm"
256
267
  Requires-Dist: word2number; extra == "agentic-vllm"
257
268
  Requires-Dist: regex; extra == "agentic-vllm"
258
269
  Requires-Dist: peft==0.11.1; extra == "agentic-vllm"
259
270
  Requires-Dist: rlinf_latex2sympy2; extra == "agentic-vllm"
271
+ Requires-Dist: mcp; extra == "agentic-vllm"
260
272
  Provides-Extra: embodied
261
- Requires-Dist: transformers==4.40.1; extra == "embodied"
262
- Requires-Dist: draccus; extra == "embodied"
263
- Requires-Dist: rich; extra == "embodied"
264
- Requires-Dist: tensorflow; extra == "embodied"
265
- Requires-Dist: tensorflow_graphics; extra == "embodied"
266
- Requires-Dist: peft==0.11.1; extra == "embodied"
267
- Requires-Dist: timm==0.9.10; extra == "embodied"
268
- Requires-Dist: sapien==3.0.1; platform_system == "Linux" and extra == "embodied"
269
- Requires-Dist: tensordict; extra == "embodied"
273
+ Requires-Dist: transformers<=4.57.6; extra == "embodied"
274
+ Requires-Dist: peft; extra == "embodied"
275
+ Requires-Dist: timm; extra == "embodied"
270
276
  Requires-Dist: imageio[ffmpeg]; extra == "embodied"
271
- Requires-Dist: robosuite==1.4.1; extra == "embodied"
272
- Requires-Dist: bddl; extra == "embodied"
273
- Requires-Dist: easydict; extra == "embodied"
274
- Requires-Dist: cloudpickle; extra == "embodied"
275
- Requires-Dist: gym; extra == "embodied"
276
277
  Requires-Dist: gymnasium; extra == "embodied"
277
- Requires-Dist: av; extra == "embodied"
278
- Requires-Dist: open3d; extra == "embodied"
279
- Requires-Dist: zarr; extra == "embodied"
280
- Requires-Dist: openai; extra == "embodied"
281
- Requires-Dist: jax; extra == "embodied"
278
+ Requires-Dist: gym; extra == "embodied"
282
279
  Provides-Extra: franka
283
280
  Requires-Dist: pyyaml; extra == "franka"
284
281
  Requires-Dist: rospkg; extra == "franka"
@@ -294,7 +291,7 @@ Requires-Dist: pynput; extra == "franka"
294
291
  Dynamic: license-file
295
292
 
296
293
  <div align="center">
297
- <img src="docs/source-en/_static/svg/logo_white.svg" alt="RLinf-logo" width="600"/>
294
+ <img src="https://github.com/RLinf/misc/raw/main/pic/logo_white.svg" alt="RLinf-logo" width="600"/>
298
295
  </div>
299
296
 
300
297
  <div align="center">
@@ -320,7 +317,7 @@ Dynamic: license-file
320
317
  RLinf is a flexible and scalable open-source RL infrastructure designed for Embodied and Agentic AI. The 'inf' in RLinf stands for `Infrastructure`, highlighting its role as a robust backbone for next-generation training. It also stands for `Infinite`, symbolizing the system’s support for open-ended learning, continuous generalization, and limitless possibilities in intelligence development.
321
318
 
322
319
  <div align="center">
323
- <img src="docs/source-en/_static/svg/overview.svg" alt="RLinf-overview"/>
320
+ <img src="https://github.com/RLinf/misc/raw/main/pic/overview.svg" alt="RLinf-overview"/>
324
321
  </div>
325
322
 
326
323
 
@@ -417,7 +414,7 @@ Multiple Backend Integrations
417
414
  </ul>
418
415
  <li><b>Custom Models</b></li>
419
416
  <ul>
420
- <li><a href="https://github.com/RLinf/RLinf/blob/main/docs/source-en/rst_source/examples/embodied/mlp.rst">MLP-Policy</a> ✅</li>
417
+ <li><a href="https://rlinf.readthedocs.io/en/latest/rst_source/examples/embodied/mlp.html">MLP-Policy</a> ✅</li>
421
418
  <li>CNN-Policy ✅</li>
422
419
  </ul>
423
420
  </ul>
@@ -1,5 +1,5 @@
1
1
  <div align="center">
2
- <img src="docs/source-en/_static/svg/logo_white.svg" alt="RLinf-logo" width="600"/>
2
+ <img src="https://github.com/RLinf/misc/raw/main/pic/logo_white.svg" alt="RLinf-logo" width="600"/>
3
3
  </div>
4
4
 
5
5
  <div align="center">
@@ -25,7 +25,7 @@
25
25
  RLinf is a flexible and scalable open-source RL infrastructure designed for Embodied and Agentic AI. The 'inf' in RLinf stands for `Infrastructure`, highlighting its role as a robust backbone for next-generation training. It also stands for `Infinite`, symbolizing the system’s support for open-ended learning, continuous generalization, and limitless possibilities in intelligence development.
26
26
 
27
27
  <div align="center">
28
- <img src="docs/source-en/_static/svg/overview.svg" alt="RLinf-overview"/>
28
+ <img src="https://github.com/RLinf/misc/raw/main/pic/overview.svg" alt="RLinf-overview"/>
29
29
  </div>
30
30
 
31
31
 
@@ -122,7 +122,7 @@ Multiple Backend Integrations
122
122
  </ul>
123
123
  <li><b>Custom Models</b></li>
124
124
  <ul>
125
- <li><a href="https://github.com/RLinf/RLinf/blob/main/docs/source-en/rst_source/examples/embodied/mlp.rst">MLP-Policy</a> ✅</li>
125
+ <li><a href="https://rlinf.readthedocs.io/en/latest/rst_source/examples/embodied/mlp.html">MLP-Policy</a> ✅</li>
126
126
  <li>CNN-Policy ✅</li>
127
127
  </ul>
128
128
  </ul>
@@ -4,7 +4,9 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "rlinf"
7
- version = "0.2.0.dev1"
7
+ version = "0.2.0.dev2"
8
+ authors = [{ name = "RLinf Contributors" }]
9
+ description = "Reinforcement Learning Infrastructure for Embodied and Agentic AI"
8
10
  readme = {file = "README.md", content-type = "text/markdown"}
9
11
  requires-python = ">=3.10,<=3.11.14"
10
12
  license = {file = "LICENSE"}
@@ -25,16 +27,17 @@ classifiers = [
25
27
  "Programming Language :: Python :: 3.11",
26
28
  ]
27
29
 
30
+
28
31
  dependencies = [
29
32
  # Core System
30
33
  # These are the dependencies of the core scheduler
31
34
  "ray[default]>=2.47.0",
32
- "torch==2.6.0",
35
+ "torch>=2.5.0,<=2.9.0",
33
36
  "hydra-core",
34
37
  "numpy",
35
38
 
36
39
  # Data processing
37
- "datasets==3.6.0",
40
+ "datasets",
38
41
  "torchdata",
39
42
  "scipy",
40
43
 
@@ -44,7 +47,7 @@ dependencies = [
44
47
  "einops",
45
48
  "nvitop",
46
49
  "pybind11",
47
- "setuptools>=69.5.1,<75.9",
50
+ "setuptools",
48
51
  "ninja",
49
52
  "pytest",
50
53
  "gsutil",
@@ -63,52 +66,49 @@ dependencies = [
63
66
  "tensorboard",
64
67
  ]
65
68
 
69
+ [project.urls]
70
+ Homepage = "https://github.com/RLinf/RLinf"
71
+ Repository = "https://github.com/RLinf/RLinf"
72
+ Documentation = "https://rlinf.readthedocs.io/"
73
+ "Bug Report" = "https://github.com/RLinf/RLinf/issues"
74
+
66
75
  [project.optional-dependencies]
67
76
  agentic-sglang = [
68
77
  "sglang[all]==0.4.6.post5",
69
78
  "torch-memory-saver",
79
+ "numpy==2.2",
70
80
  "transformers==4.51.1",
71
81
  # uvloop is not compatible with simulators, put it here
72
82
  "uvloop==0.21.0",
73
83
  "hydra-core==1.4.0.dev1",
84
+ "omegaconf==2.4.0.dev4",
74
85
  "word2number",
75
86
  "regex",
76
87
  "peft==0.11.1",
77
88
  "rlinf_latex2sympy2",
89
+ "mcp",
78
90
  ]
79
91
  agentic-vllm = [
80
92
  "vllm==0.8.5",
93
+ "numpy==2.2",
81
94
  "transformers==4.51.1",
82
95
  # uvloop is not compatible with simulators, put it here
83
96
  "uvloop==0.21.0",
84
97
  "hydra-core==1.4.0.dev1",
98
+ "omegaconf==2.4.0.dev4",
85
99
  "word2number",
86
100
  "regex",
87
101
  "peft==0.11.1",
88
102
  "rlinf_latex2sympy2",
103
+ "mcp",
89
104
  ]
90
105
  embodied = [
91
- "transformers==4.40.1",
92
- "draccus",
93
- "rich",
94
- "tensorflow",
95
- "tensorflow_graphics",
96
- "peft==0.11.1",
97
- "timm==0.9.10",
98
- "sapien==3.0.1;platform_system=='Linux'",
99
- "tensordict",
106
+ "transformers<=4.57.6",
107
+ "peft",
108
+ "timm",
100
109
  "imageio[ffmpeg]",
101
- "robosuite==1.4.1",
102
- "bddl",
103
- "easydict",
104
- "cloudpickle",
105
- "gym",
106
110
  "gymnasium",
107
- "av",
108
- "open3d",
109
- "zarr",
110
- "openai",
111
- "jax",
111
+ "gym",
112
112
  ]
113
113
  franka = [
114
114
  "pyyaml",
@@ -142,6 +142,9 @@ override-dependencies = [
142
142
  "xgrammar==0.1.19",
143
143
  "uvloop==0.21.0",
144
144
  "tensorflow-addons==0.23.0",
145
+ "setuptools>=69.5.1,<75.9",
146
+ "datasets==3.6.0",
147
+ "peft==0.11.1",
145
148
  ]
146
149
 
147
150
  [tool.setuptools]
@@ -45,9 +45,14 @@ def get_env_cls(env_type: str, env_cfg=None):
45
45
  env_type = SupportedEnvType(env_type)
46
46
 
47
47
  if env_type == SupportedEnvType.MANISKILL:
48
- from rlinf.envs.maniskill.maniskill_env import ManiskillEnv
48
+ if env_cfg.get("enable_offload", False):
49
+ from rlinf.envs.maniskill.maniskill_offload_env import ManiskillOffloadEnv
49
50
 
50
- return ManiskillEnv
51
+ return ManiskillOffloadEnv
52
+ else:
53
+ from rlinf.envs.maniskill.maniskill_env import ManiskillEnv
54
+
55
+ return ManiskillEnv
51
56
  elif env_type == SupportedEnvType.LIBERO:
52
57
  from rlinf.envs.libero.libero_env import LiberoEnv
53
58