mani-skill-nightly 2025.4.28.835__py3-none-any.whl → 2025.4.29.2144__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -45,7 +45,7 @@ class PushCubeEnv(BaseEnv):
45
45
  - the target goal region is marked by a red/white circular target. The position of the target is fixed to be the cube xy position + [0.1 + goal_radius, 0]
46
46
 
47
47
  **Success Conditions:**
48
- - the cube's xy position is within goal_radius (default 0.1) of the target's xy position by euclidean distance.
48
+ - the cube's xy position is within goal_radius (default 0.1) of the target's xy position by euclidean distance and the cube is still on the table.
49
49
  """
50
50
 
51
51
  _sample_video_link = "https://github.com/haosulab/ManiSkill/raw/main/figures/environment_demos/PushCube-v1_rt.mp4"
@@ -226,12 +226,22 @@ class PushCubeEnv(BaseEnv):
226
226
  )
227
227
  place_reward = 1 - torch.tanh(5 * obj_to_goal_dist)
228
228
  reward += place_reward * reached
229
+
230
+ # Compute a z reward to encourage the robot to keep the cube on the table
231
+ desired_obj_z = self.cube_half_size
232
+ current_obj_z = self.obj.pose.p[..., 2]
233
+ z_deviation = torch.abs(current_obj_z - desired_obj_z)
234
+ z_reward = 1 - torch.tanh(5 * z_deviation)
235
+ # We multiply the z reward by the place_reward and reached mask so that
236
+ # we only add the z reward if the robot has reached the desired push pose
237
+ # and the z reward becomes more important as the robot gets closer to the goal.
238
+ reward += place_reward * z_reward * reached
229
239
 
230
240
  # assign rewards to parallel environments that achieved success to the maximum of 3.
231
- reward[info["success"]] = 3
241
+ reward[info["success"]] = 4
232
242
  return reward
233
243
 
234
244
  def compute_normalized_dense_reward(self, obs: Any, action: Array, info: Dict):
235
245
  # this should be equal to compute_dense_reward / max possible reward
236
- max_reward = 3.0
246
+ max_reward = 4.0
237
247
  return self.compute_dense_reward(obs=obs, action=action, info=info) / max_reward
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mani-skill-nightly
3
- Version: 2025.4.28.835
3
+ Version: 2025.4.29.2144
4
4
  Summary: ManiSkill3: A Unified Benchmark for Generalizable Manipulation Skills
5
5
  Home-page: https://github.com/haosulab/ManiSkill
6
6
  Author: ManiSkill contributors
@@ -606,7 +606,7 @@ mani_skill/envs/tasks/tabletop/plug_charger.py,sha256=0g-rkNf-oo2ovttlcQ58jqUq6S
606
606
  mani_skill/envs/tasks/tabletop/poke_cube.py,sha256=KV6mp-Xgm9h4GYUcAUop2AZ4IECTdQKEMRRd9NThyBo,9343
607
607
  mani_skill/envs/tasks/tabletop/pull_cube.py,sha256=txtWuIRFzTKxJtWbrygxVEgOPDvm73WlERXldjlUB-I,5546
608
608
  mani_skill/envs/tasks/tabletop/pull_cube_tool.py,sha256=NaZpdbYYL4zC41GVY__eq4uRIQpVXthzAqe5oSq8YWU,9951
609
- mani_skill/envs/tasks/tabletop/push_cube.py,sha256=fPy0BHpdsDhuKWI1eaMLkWnC1rTyXFmvorvm7LN2q8U,12062
609
+ mani_skill/envs/tasks/tabletop/push_cube.py,sha256=WZ4k89f8inbwbomYtJAxodQDcGUYhDMrn9UHoaqYODQ,12701
610
610
  mani_skill/envs/tasks/tabletop/push_t.py,sha256=MpANhMe6ay5Qhsipe2G1Wy-LSJqrgeOyH3M8fZW_L2c,23522
611
611
  mani_skill/envs/tasks/tabletop/roll_ball.py,sha256=OujblvDphjdQBzQiCUnm_gXFwGLubpr40VT7daCWlDo,6760
612
612
  mani_skill/envs/tasks/tabletop/stack_cube.py,sha256=_3auYI95uj6hMzTmHMty8pFmD5RhiVxw48MPg5BpREA,7459
@@ -802,8 +802,8 @@ mani_skill/vector/wrappers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJ
802
802
  mani_skill/vector/wrappers/gymnasium.py,sha256=v1MDPIrVACBKCulrpdXBK2jDZQI7LKYFZgGgaCC5avY,7408
803
803
  mani_skill/vector/wrappers/sb3.py,sha256=SlXdiEPqcNHYMhJCzA29kBU6zK7DKTe1nc0L6Z3QQtY,4722
804
804
  mani_skill/viewer/__init__.py,sha256=srvDBsk4LQU75K2VIttrhiQ68p_ro7PSDqQRls2PY5c,1722
805
- mani_skill_nightly-2025.4.28.835.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
806
- mani_skill_nightly-2025.4.28.835.dist-info/METADATA,sha256=awOwJzRk__I4FqOIt-W49Ib9BMygtR4CqOQO9Rr8up4,9291
807
- mani_skill_nightly-2025.4.28.835.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
808
- mani_skill_nightly-2025.4.28.835.dist-info/top_level.txt,sha256=bkBgOVl_MZMoQx2aRFsSFEYlZLxjWlip5vtJ39FB3jA,11
809
- mani_skill_nightly-2025.4.28.835.dist-info/RECORD,,
805
+ mani_skill_nightly-2025.4.29.2144.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
806
+ mani_skill_nightly-2025.4.29.2144.dist-info/METADATA,sha256=CGkhsy7GS5mSxmW1Ct1yTcDEVdO0043WxrUfAcJvdIQ,9292
807
+ mani_skill_nightly-2025.4.29.2144.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
808
+ mani_skill_nightly-2025.4.29.2144.dist-info/top_level.txt,sha256=bkBgOVl_MZMoQx2aRFsSFEYlZLxjWlip5vtJ39FB3jA,11
809
+ mani_skill_nightly-2025.4.29.2144.dist-info/RECORD,,