evolutionary-policy-optimization 0.0.57__py3-none-any.whl → 0.0.58__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -856,10 +856,12 @@ class Agent(Module):
856
856
  dones
857
857
  ) = memories
858
858
 
859
+ masks = 1. - dones.float()
860
+
859
861
  advantages = self.calc_gae(
860
862
  rewards[:-1],
861
863
  values,
862
- dones[:-1],
864
+ masks[:-1],
863
865
  )
864
866
 
865
867
  valid_episode = episode_ids >= 0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: evolutionary-policy-optimization
3
- Version: 0.0.57
3
+ Version: 0.0.58
4
4
  Summary: EPO - Pytorch
5
5
  Project-URL: Homepage, https://pypi.org/project/evolutionary-policy-optimization/
6
6
  Project-URL: Repository, https://github.com/lucidrains/evolutionary-policy-optimization
@@ -1,9 +1,9 @@
1
1
  evolutionary_policy_optimization/__init__.py,sha256=0q0aBuFgWi06MLMD8FiHzBYQ3_W4LYWrwmCtF3u5H2A,201
2
2
  evolutionary_policy_optimization/distributed.py,sha256=7KgZdeS_wxBHo_du9XZFB1Cu318J-Bp66Xdr6Log_20,2423
3
- evolutionary_policy_optimization/epo.py,sha256=qPj5kRsISY1I6WjCc-ejpuiwOSxtPsSdMABmchXJ3s0,35252
3
+ evolutionary_policy_optimization/epo.py,sha256=2PlLBrhX5_kkV4NOhxC5VB_plR-_jw3krrmMSjWAiCY,35288
4
4
  evolutionary_policy_optimization/experimental.py,sha256=-IgqjJ_Wk_CMB1y9YYWpoYqTG9GZHAS6kbRdTluVevg,1563
5
5
  evolutionary_policy_optimization/mock_env.py,sha256=202KJ5g57wQvOzhGYzgHfBa7Y2do5uuDvl5kFg5o73g,934
6
- evolutionary_policy_optimization-0.0.57.dist-info/METADATA,sha256=WBHRK98s_lzWbqG4ouq620ayykPF9SHUz3HdvsRUywc,6213
7
- evolutionary_policy_optimization-0.0.57.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
8
- evolutionary_policy_optimization-0.0.57.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
9
- evolutionary_policy_optimization-0.0.57.dist-info/RECORD,,
6
+ evolutionary_policy_optimization-0.0.58.dist-info/METADATA,sha256=ni9pyD5CS2QbBmwEUhCYt_RAxz3YnnOv3IY3ywNagSs,6213
7
+ evolutionary_policy_optimization-0.0.58.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
8
+ evolutionary_policy_optimization-0.0.58.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
9
+ evolutionary_policy_optimization-0.0.58.dist-info/RECORD,,