adv-optm 1.0.0__py3-none-any.whl → 1.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of adv-optm might be problematic. Click here for more details.

@@ -46,8 +46,8 @@ class Simplified_AdEMAMix(torch.optim.Optimizer):
46
46
  matrices to apply low-rank compression (default: True).
47
47
  stochastic_rounding (bool): whether to use stochastic
48
48
  rounding for BF16 parameter updates (default: True).
49
- use_orthograd (bool): whether to use OrthoGrad. (default: False)
50
- factored (bool): whether to use the factorization or disable it to use
49
+ orthogonal_gradient (bool): whether to use OrthoGrad. (default: False)
50
+ nnmf_factor (bool): whether to use the factorization or disable it to use
51
51
  the uncompressed optimizer. (default: False)
52
52
  """
53
53
 
@@ -64,8 +64,8 @@ class Simplified_AdEMAMix(torch.optim.Optimizer):
64
64
  use_bias_correction: bool = True,
65
65
  vector_reshape: bool = True,
66
66
  stochastic_rounding: bool = True,
67
- use_orthograd: bool = False,
68
- factored: bool = False,
67
+ orthogonal_gradient: bool = False,
68
+ nnmf_factor: bool = False,
69
69
  ):
70
70
  if not (lr >= 0.0):
71
71
  raise ValueError(f"Learning-rate should be >= 0.0. Got {lr}")
@@ -82,10 +82,10 @@ class Simplified_AdEMAMix(torch.optim.Optimizer):
82
82
  "lr": lr, "betas": betas, "eps": eps, "weight_decay": weight_decay,
83
83
  "alpha_grad": alpha_grad, "beta1_warmup": beta1_warmup, "min_beta1": min_beta1,
84
84
  "vector_reshape": vector_reshape,
85
- "use_orthograd": use_orthograd, "use_bias_correction": use_bias_correction,
85
+ "orthogonal_gradient": orthogonal_gradient, "use_bias_correction": use_bias_correction,
86
86
  }
87
87
  self.stochastic_rounding = stochastic_rounding
88
- self.factored = factored
88
+ self.factored = nnmf_factor
89
89
  super().__init__(params, defaults)
90
90
 
91
91
  @property
@@ -108,7 +108,7 @@ class Simplified_AdEMAMix(torch.optim.Optimizer):
108
108
  grad = p.grad
109
109
  if grad.dtype != torch.float32 and self.factored:
110
110
  grad = grad.float()
111
- if group["use_orthograd"]:
111
+ if group["orthogonal_gradient"]:
112
112
  grad = _orthogonalize_gradient(p, grad)
113
113
  state = self.state[p]
114
114
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: adv_optm
3
- Version: 1.0.0
3
+ Version: 1.0.3
4
4
  Summary: A family of highly efficient, lightweight yet powerful optimizers.
5
5
  Home-page: https://github.com/Koratahiu/Advanced_Optimizers
6
6
  Author: Koratahiu
@@ -0,0 +1,19 @@
1
+ adv_optm/__init__.py,sha256=zL7hnbPAHt7w-0fZQld04Pt58F-aYaRAqz15e-RZh-Y,306
2
+ adv_optm/optim/AdamW_adv.py,sha256=aTuYcJgd_EcZOrs6TDgBrBKw3wtU5LPzE5WvTBDDeEo,14317
3
+ adv_optm/optim/Adopt_adv.py,sha256=lElmraSiIZiGu9W6ELXnIPZNEEYi1ZWuvuemgPZOixk,17484
4
+ adv_optm/optim/Lion_Prodigy_adv.py,sha256=sGzhts9a6gHfCkuHTB5L9IrClo4c6UThzYYErBwqOaA,12844
5
+ adv_optm/optim/Lion_adv.py,sha256=6G1CukJB_pC7l9HwFEuY1ydsNHZFabVmOvcHDsHHVuQ,8295
6
+ adv_optm/optim/Prodigy_adv.py,sha256=8XUpu19BaBmHb-R9K3jgwySDbtVaLU1_Drtttc_zITs,22461
7
+ adv_optm/optim/Simplified_AdEMAMix.py,sha256=tb3d6Cw_nGwcTzYUhDnKqyP7GzjD1hn8k4WqGG5lhmw,9813
8
+ adv_optm/optim/__init__.py,sha256=pcP865H2j1tut2VfTUhzQh7V8TF_tzPjqFnjMfFed2k,382
9
+ adv_optm/util/BF16_Stochastic_Rounding.py,sha256=Q5H0BcogmE4atP65dLoI21HKSf50lRdsBDfeF6v9Tbg,1548
10
+ adv_optm/util/Effective_Shape.py,sha256=TBvIk1V8IuTbbBsxuekJA4e_v8JlR5Nujtut8RTWAm4,318
11
+ adv_optm/util/NNMF.py,sha256=yRf5IP5Sjq0Uf0DxN0Q8NxEGSdD-f1ULziLVDOjY8K4,639
12
+ adv_optm/util/One_Bit_Boolean.py,sha256=Wat49esdwohuN-OHOFMW8D0aOQgV9cP5Rl8z6yfmpos,1068
13
+ adv_optm/util/OrthoGrad.py,sha256=NzInuBQGy_Ja__M1R9XbvqVaQ0fhGbtGgFE9YON7B3I,707
14
+ adv_optm/util/__init__.py,sha256=qoyIF0jcLjs_vSEcsv36clw5LFNBEbifyXrrVxMH-G4,349
15
+ adv_optm-1.0.3.dist-info/licenses/LICENSE,sha256=HrhfyXIkWY2tGFK11kg7vPCqhgh5DcxleloqdhrpyMY,11558
16
+ adv_optm-1.0.3.dist-info/METADATA,sha256=Cx9bqS9VFt2nBey-H7GxVS0AXwNzTy0eW5NtSW6uXKk,8422
17
+ adv_optm-1.0.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
18
+ adv_optm-1.0.3.dist-info/top_level.txt,sha256=iNfBIIzu-lPrQ7jyC56WBCcbkRwitM2nJ15-MRQ_6fg,9
19
+ adv_optm-1.0.3.dist-info/RECORD,,
@@ -1,19 +0,0 @@
1
- adv_optm/__init__.py,sha256=2qu7FpN7btJdmkvyT4uVs8XOIrvSkyZdOf2pHm1JWRU,306
2
- adv_optm/optim/AdamW_adv.py,sha256=Pu0TB14dOhcq9kwXclMIeKCI6ef_P0emwzxPu6xuBM0,14252
3
- adv_optm/optim/Adopt_adv.py,sha256=71o9BHV3XFefJX21G37PKG96D09x-PSU0eW3Q7WkAjs,17427
4
- adv_optm/optim/Lion_Prodigy_adv.py,sha256=kIAGXoMbDNRg5reKXtUC_vQQ2gyM-NXPB-Pv9zSpiE8,12787
5
- adv_optm/optim/Lion_adv.py,sha256=05j_j6LIzHW5b79DVwMIf1FZHVNB8xnStNVjlOdVkCE,8256
6
- adv_optm/optim/Prodigy_adv.py,sha256=0BsCNYnq5O0UBvvyUuV385oMTJmNOyv5IQ3wEFuNfeM,21929
7
- adv_optm/optim/Simplified_AdEMAMix.py,sha256=opIZjnGJ03-DDAIHTZyJBMReVfgusGDb8FZSWMU3-UM,9774
8
- adv_optm/optim/__init__.py,sha256=pcP865H2j1tut2VfTUhzQh7V8TF_tzPjqFnjMfFed2k,382
9
- adv_optm/util/BF16_Stochastic_Rounding.py,sha256=Q5H0BcogmE4atP65dLoI21HKSf50lRdsBDfeF6v9Tbg,1548
10
- adv_optm/util/Effective_Shape.py,sha256=TBvIk1V8IuTbbBsxuekJA4e_v8JlR5Nujtut8RTWAm4,318
11
- adv_optm/util/NNMF.py,sha256=yRf5IP5Sjq0Uf0DxN0Q8NxEGSdD-f1ULziLVDOjY8K4,639
12
- adv_optm/util/One_Bit_Boolean.py,sha256=Wat49esdwohuN-OHOFMW8D0aOQgV9cP5Rl8z6yfmpos,1068
13
- adv_optm/util/OrthoGrad.py,sha256=NzInuBQGy_Ja__M1R9XbvqVaQ0fhGbtGgFE9YON7B3I,707
14
- adv_optm/util/__init__.py,sha256=qoyIF0jcLjs_vSEcsv36clw5LFNBEbifyXrrVxMH-G4,349
15
- adv_optm-1.0.0.dist-info/licenses/LICENSE,sha256=HrhfyXIkWY2tGFK11kg7vPCqhgh5DcxleloqdhrpyMY,11558
16
- adv_optm-1.0.0.dist-info/METADATA,sha256=sxxTU-62diwjtJPWHFeL6gMWuX8xmlWzEzqk9KfpXvA,8422
17
- adv_optm-1.0.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
18
- adv_optm-1.0.0.dist-info/top_level.txt,sha256=iNfBIIzu-lPrQ7jyC56WBCcbkRwitM2nJ15-MRQ_6fg,9
19
- adv_optm-1.0.0.dist-info/RECORD,,