mani-skill-nightly 2025.4.29.817__py3-none-any.whl → 2025.4.29.2144__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mani_skill/envs/tasks/tabletop/push_cube.py +13 -3
- {mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/METADATA +1 -1
- {mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/RECORD +6 -6
- {mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/LICENSE +0 -0
- {mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/WHEEL +0 -0
- {mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/top_level.txt +0 -0
@@ -45,7 +45,7 @@ class PushCubeEnv(BaseEnv):
|
|
45
45
|
- the target goal region is marked by a red/white circular target. The position of the target is fixed to be the cube xy position + [0.1 + goal_radius, 0]
|
46
46
|
|
47
47
|
**Success Conditions:**
|
48
|
-
- the cube's xy position is within goal_radius (default 0.1) of the target's xy position by euclidean distance.
|
48
|
+
- the cube's xy position is within goal_radius (default 0.1) of the target's xy position by euclidean distance and the cube is still on the table.
|
49
49
|
"""
|
50
50
|
|
51
51
|
_sample_video_link = "https://github.com/haosulab/ManiSkill/raw/main/figures/environment_demos/PushCube-v1_rt.mp4"
|
@@ -226,12 +226,22 @@ class PushCubeEnv(BaseEnv):
|
|
226
226
|
)
|
227
227
|
place_reward = 1 - torch.tanh(5 * obj_to_goal_dist)
|
228
228
|
reward += place_reward * reached
|
229
|
+
|
230
|
+
# Compute a z reward to encourage the robot to keep the cube on the table
|
231
|
+
desired_obj_z = self.cube_half_size
|
232
|
+
current_obj_z = self.obj.pose.p[..., 2]
|
233
|
+
z_deviation = torch.abs(current_obj_z - desired_obj_z)
|
234
|
+
z_reward = 1 - torch.tanh(5 * z_deviation)
|
235
|
+
# We multiply the z reward by the place_reward and reached mask so that
|
236
|
+
# we only add the z reward if the robot has reached the desired push pose
|
237
|
+
# and the z reward becomes more important as the robot gets closer to the goal.
|
238
|
+
reward += place_reward * z_reward * reached
|
229
239
|
|
230
240
|
# assign rewards to parallel environments that achieved success to the maximum of 3.
|
231
|
-
reward[info["success"]] =
|
241
|
+
reward[info["success"]] = 4
|
232
242
|
return reward
|
233
243
|
|
234
244
|
def compute_normalized_dense_reward(self, obs: Any, action: Array, info: Dict):
|
235
245
|
# this should be equal to compute_dense_reward / max possible reward
|
236
|
-
max_reward =
|
246
|
+
max_reward = 4.0
|
237
247
|
return self.compute_dense_reward(obs=obs, action=action, info=info) / max_reward
|
{mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/RECORD
RENAMED
@@ -606,7 +606,7 @@ mani_skill/envs/tasks/tabletop/plug_charger.py,sha256=0g-rkNf-oo2ovttlcQ58jqUq6S
|
|
606
606
|
mani_skill/envs/tasks/tabletop/poke_cube.py,sha256=KV6mp-Xgm9h4GYUcAUop2AZ4IECTdQKEMRRd9NThyBo,9343
|
607
607
|
mani_skill/envs/tasks/tabletop/pull_cube.py,sha256=txtWuIRFzTKxJtWbrygxVEgOPDvm73WlERXldjlUB-I,5546
|
608
608
|
mani_skill/envs/tasks/tabletop/pull_cube_tool.py,sha256=NaZpdbYYL4zC41GVY__eq4uRIQpVXthzAqe5oSq8YWU,9951
|
609
|
-
mani_skill/envs/tasks/tabletop/push_cube.py,sha256=
|
609
|
+
mani_skill/envs/tasks/tabletop/push_cube.py,sha256=WZ4k89f8inbwbomYtJAxodQDcGUYhDMrn9UHoaqYODQ,12701
|
610
610
|
mani_skill/envs/tasks/tabletop/push_t.py,sha256=MpANhMe6ay5Qhsipe2G1Wy-LSJqrgeOyH3M8fZW_L2c,23522
|
611
611
|
mani_skill/envs/tasks/tabletop/roll_ball.py,sha256=OujblvDphjdQBzQiCUnm_gXFwGLubpr40VT7daCWlDo,6760
|
612
612
|
mani_skill/envs/tasks/tabletop/stack_cube.py,sha256=_3auYI95uj6hMzTmHMty8pFmD5RhiVxw48MPg5BpREA,7459
|
@@ -802,8 +802,8 @@ mani_skill/vector/wrappers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJ
|
|
802
802
|
mani_skill/vector/wrappers/gymnasium.py,sha256=v1MDPIrVACBKCulrpdXBK2jDZQI7LKYFZgGgaCC5avY,7408
|
803
803
|
mani_skill/vector/wrappers/sb3.py,sha256=SlXdiEPqcNHYMhJCzA29kBU6zK7DKTe1nc0L6Z3QQtY,4722
|
804
804
|
mani_skill/viewer/__init__.py,sha256=srvDBsk4LQU75K2VIttrhiQ68p_ro7PSDqQRls2PY5c,1722
|
805
|
-
mani_skill_nightly-2025.4.29.
|
806
|
-
mani_skill_nightly-2025.4.29.
|
807
|
-
mani_skill_nightly-2025.4.29.
|
808
|
-
mani_skill_nightly-2025.4.29.
|
809
|
-
mani_skill_nightly-2025.4.29.
|
805
|
+
mani_skill_nightly-2025.4.29.2144.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
806
|
+
mani_skill_nightly-2025.4.29.2144.dist-info/METADATA,sha256=CGkhsy7GS5mSxmW1Ct1yTcDEVdO0043WxrUfAcJvdIQ,9292
|
807
|
+
mani_skill_nightly-2025.4.29.2144.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
|
808
|
+
mani_skill_nightly-2025.4.29.2144.dist-info/top_level.txt,sha256=bkBgOVl_MZMoQx2aRFsSFEYlZLxjWlip5vtJ39FB3jA,11
|
809
|
+
mani_skill_nightly-2025.4.29.2144.dist-info/RECORD,,
|
{mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/LICENSE
RENAMED
File without changes
|
{mani_skill_nightly-2025.4.29.817.dist-info → mani_skill_nightly-2025.4.29.2144.dist-info}/WHEEL
RENAMED
File without changes
|
File without changes
|