evolutionary-policy-optimization 0.0.17__py3-none-any.whl → 0.0.18__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- evolutionary_policy_optimization/epo.py +6 -0
- {evolutionary_policy_optimization-0.0.17.dist-info → evolutionary_policy_optimization-0.0.18.dist-info}/METADATA +2 -6
- evolutionary_policy_optimization-0.0.18.dist-info/RECORD +7 -0
- evolutionary_policy_optimization-0.0.17.dist-info/RECORD +0 -7
- {evolutionary_policy_optimization-0.0.17.dist-info → evolutionary_policy_optimization-0.0.18.dist-info}/WHEEL +0 -0
- {evolutionary_policy_optimization-0.0.17.dist-info → evolutionary_policy_optimization-0.0.18.dist-info}/licenses/LICENSE +0 -0
@@ -206,6 +206,8 @@ class Actor(Module):
|
|
206
206
|
assert len(dim_hiddens) >= 2
|
207
207
|
dim_first, *_, dim_last = dim_hiddens
|
208
208
|
|
209
|
+
self.dim_latent = dim_latent
|
210
|
+
|
209
211
|
self.init_layer = nn.Sequential(
|
210
212
|
nn.Linear(dim_state, dim_first),
|
211
213
|
nn.SiLU()
|
@@ -242,6 +244,8 @@ class Critic(Module):
|
|
242
244
|
assert len(dim_hiddens) >= 2
|
243
245
|
dim_first, *_, dim_last = dim_hiddens
|
244
246
|
|
247
|
+
self.dim_latent = dim_latent
|
248
|
+
|
245
249
|
self.init_layer = nn.Sequential(
|
246
250
|
nn.Linear(dim_state, dim_first),
|
247
251
|
nn.SiLU()
|
@@ -490,6 +494,8 @@ class Agent(Module):
|
|
490
494
|
|
491
495
|
self.latent_gene_pool = latent_gene_pool
|
492
496
|
|
497
|
+
assert actor.dim_latent == critic.dim_latent == latent_gene_pool.dim_latent
|
498
|
+
|
493
499
|
# optimizers
|
494
500
|
|
495
501
|
self.actor_optim = optim_klass(actor.parameters(), lr = actor_lr, **actor_optim_kwargs)
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: evolutionary-policy-optimization
|
3
|
-
Version: 0.0.17
|
3
|
+
Version: 0.0.18
|
4
4
|
Summary: EPO - Pytorch
|
5
5
|
Project-URL: Homepage, https://pypi.org/project/evolutionary-policy-optimization/
|
6
6
|
Project-URL: Repository, https://github.com/lucidrains/evolutionary-policy-optimization
|
@@ -33,7 +33,7 @@ Classifier: Intended Audience :: Developers
|
|
33
33
|
Classifier: License :: OSI Approved :: MIT License
|
34
34
|
Classifier: Programming Language :: Python :: 3.8
|
35
35
|
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
36
|
-
Requires-Python: >=3.
|
36
|
+
Requires-Python: >=3.9
|
37
37
|
Requires-Dist: adam-atan2-pytorch
|
38
38
|
Requires-Dist: assoc-scan
|
39
39
|
Requires-Dist: einops>=0.8.0
|
@@ -44,10 +44,6 @@ Provides-Extra: examples
|
|
44
44
|
Requires-Dist: numpy; extra == 'examples'
|
45
45
|
Requires-Dist: pufferlib>=2.0.6; extra == 'examples'
|
46
46
|
Requires-Dist: tqdm; extra == 'examples'
|
47
|
-
Provides-Extra: examples-gym
|
48
|
-
Requires-Dist: box2d-py; extra == 'examples-gym'
|
49
|
-
Requires-Dist: gymnasium[box2d]>=1.0.0; extra == 'examples-gym'
|
50
|
-
Requires-Dist: tqdm; extra == 'examples-gym'
|
51
47
|
Provides-Extra: test
|
52
48
|
Requires-Dist: pytest; extra == 'test'
|
53
49
|
Description-Content-Type: text/markdown
|
@@ -0,0 +1,7 @@
|
|
1
|
+
evolutionary_policy_optimization/__init__.py,sha256=Qavcia0n13jjaWIS_LPW7QrxSLT_BBeKujCjF9kQjbA,133
|
2
|
+
evolutionary_policy_optimization/epo.py,sha256=3pvYPwAEZdrxwwV95Ea1qG4CQjLnyaxAr40opk07LDw,17747
|
3
|
+
evolutionary_policy_optimization/experimental.py,sha256=ktBKxRF27Qsj7WIgBpYlWXqMVxO9zOx2oD1JuDYRAwM,548
|
4
|
+
evolutionary_policy_optimization-0.0.18.dist-info/METADATA,sha256=BIyCXw2IbMs-x2hDbFs9NR5s2dYEbfbeK_LadUeUc8Q,4860
|
5
|
+
evolutionary_policy_optimization-0.0.18.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
6
|
+
evolutionary_policy_optimization-0.0.18.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
7
|
+
evolutionary_policy_optimization-0.0.18.dist-info/RECORD,,
|
@@ -1,7 +0,0 @@
|
|
1
|
-
evolutionary_policy_optimization/__init__.py,sha256=Qavcia0n13jjaWIS_LPW7QrxSLT_BBeKujCjF9kQjbA,133
|
2
|
-
evolutionary_policy_optimization/epo.py,sha256=U1iROmPdJjU_tqd50XtBUibfOHtYUE7MzfPu-6bU2Pw,17586
|
3
|
-
evolutionary_policy_optimization/experimental.py,sha256=ktBKxRF27Qsj7WIgBpYlWXqMVxO9zOx2oD1JuDYRAwM,548
|
4
|
-
evolutionary_policy_optimization-0.0.17.dist-info/METADATA,sha256=okvM0b28MQBex5XUXVWwflYcf7hqG3I5dAh8PxWGhrM,5047
|
5
|
-
evolutionary_policy_optimization-0.0.17.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
6
|
-
evolutionary_policy_optimization-0.0.17.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
7
|
-
evolutionary_policy_optimization-0.0.17.dist-info/RECORD,,
|
File without changes
|