evolutionary-policy-optimization 0.1.10__py3-none-any.whl → 0.1.12__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- evolutionary_policy_optimization/epo.py +18 -0
- {evolutionary_policy_optimization-0.1.10.dist-info → evolutionary_policy_optimization-0.1.12.dist-info}/METADATA +12 -1
- {evolutionary_policy_optimization-0.1.10.dist-info → evolutionary_policy_optimization-0.1.12.dist-info}/RECORD +5 -5
- {evolutionary_policy_optimization-0.1.10.dist-info → evolutionary_policy_optimization-0.1.12.dist-info}/WHEEL +0 -0
- {evolutionary_policy_optimization-0.1.10.dist-info → evolutionary_policy_optimization-0.1.12.dist-info}/licenses/LICENSE +0 -0
@@ -146,6 +146,24 @@ def temp_batch_dim(fn):
|
|
146
146
|
|
147
147
|
return inner
|
148
148
|
|
149
|
+
# plasticity related
|
150
|
+
|
151
|
+
def shrink_and_perturb_(
    module,
    shrink_factor = 0.5,
    perturb_factor = 0.01
):
    """
    Shrink & Perturb - Ash et al. https://arxiv.org/abs/1910.08475

    Every parameter of `module` is modified in place through its `.data`:
    it is first scaled by `(1. - shrink_factor)`, then standard normal noise
    multiplied by `perturb_factor` is added to it.

    `shrink_factor` must lie in [0., 1.] - 0. leaves the weights unscaled, 1. zeroes
    them out so that only the noise remains.

    Returns the very same `module` that was passed in, for chaining.
    """

    assert 0. <= shrink_factor <= 1.

    # fraction of each weight that survives the shrink, same for all parameters

    retain_scale = 1. - shrink_factor

    for param in module.parameters():
        weights = param.data

        # gaussian perturbation, matching the parameter's shape, dtype and device

        jitter = torch.randn_like(weights) * perturb_factor

        weights.mul_(retain_scale)
        weights.add_(jitter)

    return module
|
166
|
+
|
149
167
|
# fitness related
|
150
168
|
|
151
169
|
def get_fitness_scores(
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: evolutionary-policy-optimization
|
3
|
-
Version: 0.1.10
|
3
|
+
Version: 0.1.12
|
4
4
|
Summary: EPO - Pytorch
|
5
5
|
Project-URL: Homepage, https://pypi.org/project/evolutionary-policy-optimization/
|
6
6
|
Project-URL: Repository, https://github.com/lucidrains/evolutionary-policy-optimization
|
@@ -215,4 +215,15 @@ agent.load('./agent.pt')
|
|
215
215
|
}
|
216
216
|
```
|
217
217
|
|
218
|
+
```bibtex
|
219
|
+
@article{Ash2019OnTD,
|
220
|
+
title = {On the Difficulty of Warm-Starting Neural Network Training},
|
221
|
+
author = {Jordan T. Ash and Ryan P. Adams},
|
222
|
+
journal = {ArXiv},
|
223
|
+
year = {2019},
|
224
|
+
volume = {abs/1910.08475},
|
225
|
+
url = {https://api.semanticscholar.org/CorpusID:204788802}
|
226
|
+
}
|
227
|
+
```
|
228
|
+
|
218
229
|
*Evolution is cleverer than you are.* - Leslie Orgel
|
@@ -1,10 +1,10 @@
|
|
1
1
|
evolutionary_policy_optimization/__init__.py,sha256=NyiYDYU7DlpmOTM7xiBQET3r1WwX0ebrgMCBLSQrW3c,288
|
2
2
|
evolutionary_policy_optimization/distributed.py,sha256=7KgZdeS_wxBHo_du9XZFB1Cu318J-Bp66Xdr6Log_20,2423
|
3
3
|
evolutionary_policy_optimization/env_wrappers.py,sha256=bDL06o9_b1iW6k3fw2xifnOnYlzs643tdW6Yv2gsIdw,803
|
4
|
-
evolutionary_policy_optimization/epo.py,sha256=
|
4
|
+
evolutionary_policy_optimization/epo.py,sha256=aOltJBkZVi2FxXao51zdfYaLynIi8T8v3qO1ex2HElg,46058
|
5
5
|
evolutionary_policy_optimization/experimental.py,sha256=-IgqjJ_Wk_CMB1y9YYWpoYqTG9GZHAS6kbRdTluVevg,1563
|
6
6
|
evolutionary_policy_optimization/mock_env.py,sha256=TLyyRm6tOD0Kdn9QqJJQriaSnsR-YmNQHo4OohmZFG4,1410
|
7
|
-
evolutionary_policy_optimization-0.1.
|
8
|
-
evolutionary_policy_optimization-0.1.10.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
9
|
-
evolutionary_policy_optimization-0.1.10.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
10
|
-
evolutionary_policy_optimization-0.1.10.dist-info/RECORD,,
|
7
|
+
evolutionary_policy_optimization-0.1.12.dist-info/METADATA,sha256=B_eK4c8-dp4rr4K0HxRiNJqY6fK10XmwBbsPm-PE0_k,7625
|
8
|
+
evolutionary_policy_optimization-0.1.12.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
9
|
+
evolutionary_policy_optimization-0.1.12.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
10
|
+
evolutionary_policy_optimization-0.1.12.dist-info/RECORD,,
|
File without changes
|