evolutionary-policy-optimization 0.2.0__py3-none-any.whl → 0.2.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- evolutionary_policy_optimization/epo.py +8 -3
- {evolutionary_policy_optimization-0.2.0.dist-info → evolutionary_policy_optimization-0.2.3.dist-info}/METADATA +1 -1
- {evolutionary_policy_optimization-0.2.0.dist-info → evolutionary_policy_optimization-0.2.3.dist-info}/RECORD +5 -5
- {evolutionary_policy_optimization-0.2.0.dist-info → evolutionary_policy_optimization-0.2.3.dist-info}/WHEEL +0 -0
- {evolutionary_policy_optimization-0.2.0.dist-info → evolutionary_policy_optimization-0.2.3.dist-info}/licenses/LICENSE +0 -0
@@ -1044,7 +1044,14 @@ class Agent(Module):
|
|
1044
1044
|
actor.state_norm = critic.state_norm = state_norm
|
1045
1045
|
|
1046
1046
|
self.use_critic_ema = use_critic_ema
|
1047
|
-
|
1047
|
+
|
1048
|
+
self.critic_ema = EMA(
|
1049
|
+
critic,
|
1050
|
+
beta = critic_ema_beta,
|
1051
|
+
include_online_model = False,
|
1052
|
+
ignore_startswith_names = {'state_norm'},
|
1053
|
+
**ema_kwargs
|
1054
|
+
) if use_critic_ema else None
|
1048
1055
|
|
1049
1056
|
self.latent_gene_pool = latent_gene_pool
|
1050
1057
|
self.num_latents = latent_gene_pool.num_latents if exists(latent_gene_pool) else 1
|
@@ -1179,8 +1186,6 @@ class Agent(Module):
|
|
1179
1186
|
|
1180
1187
|
unwrap(self.critic).load_state_dict(pkg['critic'])
|
1181
1188
|
|
1182
|
-
unwrap(self.latent_gene_pool).load_state_dict(pkg['latents'])
|
1183
|
-
|
1184
1189
|
if self.use_critic_ema:
|
1185
1190
|
self.critic_ema.load_state_dict(pkg['critic_ema'])
|
1186
1191
|
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: evolutionary-policy-optimization
|
3
|
-
Version: 0.2.0
|
3
|
+
Version: 0.2.3
|
4
4
|
Summary: EPO - Pytorch
|
5
5
|
Project-URL: Homepage, https://pypi.org/project/evolutionary-policy-optimization/
|
6
6
|
Project-URL: Repository, https://github.com/lucidrains/evolutionary-policy-optimization
|
@@ -1,10 +1,10 @@
|
|
1
1
|
evolutionary_policy_optimization/__init__.py,sha256=NyiYDYU7DlpmOTM7xiBQET3r1WwX0ebrgMCBLSQrW3c,288
|
2
2
|
evolutionary_policy_optimization/distributed.py,sha256=MxyxqxANAuOm8GYb0Yu09EHd_aVLhK2uwgrfuVWciPU,2342
|
3
3
|
evolutionary_policy_optimization/env_wrappers.py,sha256=bDL06o9_b1iW6k3fw2xifnOnYlzs643tdW6Yv2gsIdw,803
|
4
|
-
evolutionary_policy_optimization/epo.py,sha256=
|
4
|
+
evolutionary_policy_optimization/epo.py,sha256=81rf249ykaPrAEMGk9KsF98qDkCUhW8xL3-2UXIvI2E,51838
|
5
5
|
evolutionary_policy_optimization/experimental.py,sha256=ZyOGHbE4dXmt4zCljSzcUklua4vlOwQtslhFEm0JN94,1716
|
6
6
|
evolutionary_policy_optimization/mock_env.py,sha256=TLyyRm6tOD0Kdn9QqJJQriaSnsR-YmNQHo4OohmZFG4,1410
|
7
|
-
evolutionary_policy_optimization-0.2.
|
8
|
-
evolutionary_policy_optimization-0.2.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
9
|
-
evolutionary_policy_optimization-0.2.0.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
10
|
-
evolutionary_policy_optimization-0.2.0.dist-info/RECORD,,
|
7
|
+
evolutionary_policy_optimization-0.2.3.dist-info/METADATA,sha256=syjis1-9dDCEwfGt7CeMfhC5k7OegIl4BBsKaTnYssQ,8697
|
8
|
+
evolutionary_policy_optimization-0.2.3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
9
|
+
evolutionary_policy_optimization-0.2.3.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
10
|
+
evolutionary_policy_optimization-0.2.3.dist-info/RECORD,,
|
File without changes
|