adv-optm 1.2.dev4__py3-none-any.whl → 1.2.dev5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of adv-optm might be problematic. Click here for more details.
- adv_optm/__init__.py +1 -1
- adv_optm/optim/AdaMuon_adv.py +5 -5
- {adv_optm-1.2.dev4.dist-info → adv_optm-1.2.dev5.dist-info}/METADATA +1 -1
- {adv_optm-1.2.dev4.dist-info → adv_optm-1.2.dev5.dist-info}/RECORD +7 -7
- {adv_optm-1.2.dev4.dist-info → adv_optm-1.2.dev5.dist-info}/WHEEL +0 -0
- {adv_optm-1.2.dev4.dist-info → adv_optm-1.2.dev5.dist-info}/licenses/LICENSE +0 -0
- {adv_optm-1.2.dev4.dist-info → adv_optm-1.2.dev5.dist-info}/top_level.txt +0 -0
adv_optm/__init__.py
CHANGED
adv_optm/optim/AdaMuon_adv.py
CHANGED
|
@@ -182,7 +182,11 @@ class AdaMuon_adv(torch.optim.Optimizer):
|
|
|
182
182
|
|
|
183
183
|
for key, value in defaults_to_use.items():
|
|
184
184
|
new_group.setdefault(key, value)
|
|
185
|
-
|
|
185
|
+
if '_kourkoutas_beta' not in new_group:
|
|
186
|
+
if optim_type == 'adam':
|
|
187
|
+
new_group['_kourkoutas_beta'] = False
|
|
188
|
+
else:
|
|
189
|
+
new_group['_kourkoutas_beta'] = muon_defaults['_kourkoutas_beta']
|
|
186
190
|
final_param_groups.append(new_group)
|
|
187
191
|
|
|
188
192
|
super().__init__(final_param_groups, {})
|
|
@@ -225,10 +229,6 @@ class AdaMuon_adv(torch.optim.Optimizer):
|
|
|
225
229
|
# We need to temporarily "lend" our state and param_groups
|
|
226
230
|
self.aux_adam.state = self.state
|
|
227
231
|
self.aux_adam.param_groups = self.param_groups
|
|
228
|
-
|
|
229
|
-
# Ensure the aux optimizer uses the same Kourkoutas helper instance.
|
|
230
|
-
if self._kourkoutas_helper is not None:
|
|
231
|
-
self.aux_adam.kourkoutas_helper = self._kourkoutas_helper
|
|
232
232
|
|
|
233
233
|
self.aux_adam.step_parameter(p, group, i)
|
|
234
234
|
return
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
adv_optm/__init__.py,sha256=
|
|
2
|
-
adv_optm/optim/AdaMuon_adv.py,sha256=
|
|
1
|
+
adv_optm/__init__.py,sha256=qN0PCs5LCVh4uMyLfaz48OfCa-g_HZc55JUjWu4o9lI,379
|
|
2
|
+
adv_optm/optim/AdaMuon_adv.py,sha256=hTGSH8wzmQ-NYIcqV6EAEbqCxxfEwmmMWaIadX1qiuQ,21009
|
|
3
3
|
adv_optm/optim/AdamW_adv.py,sha256=7IvdD1rqYeHZwQCZU9X0H7x87MCKcHQ5M68GLuMCkvE,17702
|
|
4
4
|
adv_optm/optim/Adopt_adv.py,sha256=C2FsEZGvCk9q4YNKAj0qIxdZ5AfPlda-1lIpSX0a1nE,21256
|
|
5
5
|
adv_optm/optim/Lion_Prodigy_adv.py,sha256=LEA3UYJpPeFnmxeniLNv1u2LKKj4ufx3Bq_MLw-nWXk,14617
|
|
@@ -17,8 +17,8 @@ adv_optm/util/Newton_Schulz.py,sha256=wJ_sKRaGVIsOofQ737my4ng494qX_pfgOqlDDmYtnC
|
|
|
17
17
|
adv_optm/util/One_Bit_Boolean.py,sha256=Wat49esdwohuN-OHOFMW8D0aOQgV9cP5Rl8z6yfmpos,1068
|
|
18
18
|
adv_optm/util/OrthoGrad.py,sha256=NzInuBQGy_Ja__M1R9XbvqVaQ0fhGbtGgFE9YON7B3I,707
|
|
19
19
|
adv_optm/util/__init__.py,sha256=jAaUfaAjFrTJ6-Q915ezAbq0efRbpYjriW2OdeCbSzo,433
|
|
20
|
-
adv_optm-1.2.
|
|
21
|
-
adv_optm-1.2.
|
|
22
|
-
adv_optm-1.2.
|
|
23
|
-
adv_optm-1.2.
|
|
24
|
-
adv_optm-1.2.
|
|
20
|
+
adv_optm-1.2.dev5.dist-info/licenses/LICENSE,sha256=HrhfyXIkWY2tGFK11kg7vPCqhgh5DcxleloqdhrpyMY,11558
|
|
21
|
+
adv_optm-1.2.dev5.dist-info/METADATA,sha256=7fZuoYwICMHtJ2-3azNC9Z5IOPnx9cJ6Wbyc5VTMo0I,14022
|
|
22
|
+
adv_optm-1.2.dev5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
23
|
+
adv_optm-1.2.dev5.dist-info/top_level.txt,sha256=iNfBIIzu-lPrQ7jyC56WBCcbkRwitM2nJ15-MRQ_6fg,9
|
|
24
|
+
adv_optm-1.2.dev5.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|