broccoli-ml 0.38.0__py3-none-any.whl → 0.39.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
broccoli/linear.py CHANGED
@@ -34,7 +34,8 @@ class SpectralNormLinear(nn.Module):
34
34
 
35
35
  def reset_parameters(self) -> None:
36
36
  weights = torch.empty(self.out_features, self.in_features)
37
- nn.init.kaiming_uniform_(weights, a=math.sqrt(5))
37
+ stdv = 1.0 / math.sqrt(self.in_features)
38
+ nn.init.uniform_(weights, a=-stdv, b=stdv)
38
39
  if self.use_bias:
39
40
  fan_in, _ = nn.init._calculate_fan_in_and_fan_out(weights)
40
41
  bound = 1 / math.sqrt(fan_in) if fan_in > 0 else 0
@@ -77,7 +78,8 @@ class AnchoredLinear(nn.Module):
77
78
 
78
79
  def reset_parameters(self) -> None:
79
80
  weights = torch.empty(self.out_features, self.in_features)
80
- nn.init.kaiming_uniform_(weights, a=math.sqrt(5))
81
+ stdv = 1.0 / math.sqrt(self.in_features)
82
+ nn.init.uniform_(weights, a=-stdv, b=stdv)
81
83
  if self.use_bias:
82
84
  fan_in, _ = nn.init._calculate_fan_in_and_fan_out(weights)
83
85
  bound = 1 / math.sqrt(fan_in) if fan_in > 0 else 0
@@ -120,7 +122,8 @@ class WeightNormedLinear(nn.Module):
120
122
 
121
123
  def reset_parameters(self) -> None:
122
124
  weights = torch.empty(self.out_features, self.in_features)
123
- nn.init.kaiming_uniform_(weights, a=math.sqrt(5))
125
+ stdv = 1.0 / math.sqrt(self.in_features)
126
+ nn.init.uniform_(weights, a=-stdv, b=stdv)
124
127
  if self.use_bias:
125
128
  fan_in, _ = nn.init._calculate_fan_in_and_fan_out(weights)
126
129
  bound = 1 / math.sqrt(fan_in) if fan_in > 0 else 0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: broccoli-ml
3
- Version: 0.38.0
3
+ Version: 0.39.0
4
4
  Summary: Some useful Pytorch models, circa 2025
5
5
  License: MIT
6
6
  Author: Nicholas Bailey
@@ -5,13 +5,13 @@ broccoli/assets/cifar100_eigenvectors_size_2.pt,sha256=DjXDOXMeuMpIqNuGhX9z-OWYV
5
5
  broccoli/assets/cifar100_eigenvectors_size_3.pt,sha256=gL6k0xtXYiYP6ZSvEiMBdJ7kIkT0AngTpDJHFQqwgxA,7173
6
6
  broccoli/cnn.py,sha256=jeRyKIAMWu1E3iyI14MGgSZuZivPMh12iqkqW9ilNjo,17785
7
7
  broccoli/eigenpatches.py,sha256=J6n2usN1oQuHEHYiBNyYpn_a9eQcHjOBiIlvSei520Y,2413
8
- broccoli/linear.py,sha256=zlFDij9TngqDzTTpUlZtX0PXAQgxyWWnTIXpiO1rBk0,4768
8
+ broccoli/linear.py,sha256=w021EDzWVDEu9odzrf9QwBZ3G8Ydu3nroV8soIJeRng,4894
9
9
  broccoli/rope.py,sha256=hw7kBPNR9GQXj4GxyIAffsGKPfcTPOFh8Bc7oEHtaZY,12108
10
10
  broccoli/tensor.py,sha256=um8mrxkYbvNDo-QvHlmJm8Aw6qcngOlUZPoAk_PMReA,4480
11
11
  broccoli/transformer.py,sha256=Xw1oBLsvVeHmMqgurhorRa49nrjfooLev5uBPFeK9og,17004
12
12
  broccoli/utils.py,sha256=htq_hOsdhUhL0nJi9WkKiEYOjEoWqFpK5X49PtgTf-0,299
13
13
  broccoli/vit.py,sha256=RaSJZh2ogqNAvAkQDuZpNqdtRTWaW_8ug4BsBCBK_f4,17728
14
- broccoli_ml-0.38.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
15
- broccoli_ml-0.38.0.dist-info/METADATA,sha256=8lcwJvmlPT_-SkJZ5Qd6nFc4Njz7mQD-JefeUxhk8Xw,1257
16
- broccoli_ml-0.38.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
17
- broccoli_ml-0.38.0.dist-info/RECORD,,
14
+ broccoli_ml-0.39.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
15
+ broccoli_ml-0.39.0.dist-info/METADATA,sha256=wR3glIOttDNALtYadYXNBbwjHS3p5wtBoWGwjLEg8c8,1257
16
+ broccoli_ml-0.39.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
17
+ broccoli_ml-0.39.0.dist-info/RECORD,,