broccoli-ml 13.0.0__py3-none-any.whl → 13.0.2__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.
broccoli/transformer.py CHANGED
@@ -387,13 +387,6 @@ class FeedforwardBlock(nn.Module):
387
387
  self.beta = beta
388
388
  self.xglu = activation.__name__.endswith("GLU")
389
389
 
390
- if self.residual_path and (output_features < input_features):
391
- raise ValueError(
392
- "If the number of output features will be less than "
393
- "the number of input features, then `residual_path` "
394
- "should be set to False."
395
- )
396
-
397
390
  if self.post_norm:
398
391
  self.layernorm = nn.LayerNorm(output_features)
399
392
 
broccoli/vit.py CHANGED
@@ -187,9 +187,14 @@ class ViTEncoder(nn.Module):
187
187
  transformer_stochastic_depth=0.1,
188
188
  transformer_checkpoint_ff=True,
189
189
  linear_module=nn.Linear,
190
+ alpha=1.0,
191
+ beta=1.0,
190
192
  ):
191
193
  super().__init__()
192
194
 
195
+ self.alpha = alpha
196
+ self.beta = beta
197
+
193
198
  if cnn_activation_kwargs is not None:
194
199
  self.cnn_activation = cnn_activation(**cnn_activation_kwargs)
195
200
  else:
@@ -491,6 +496,8 @@ class ViT(nn.Module):
491
496
  batch_norm_logits=True,
492
497
  logit_projection_layer=nn.Linear,
493
498
  linear_module=nn.Linear,
499
+ alpha=1.0,
500
+ beta=1.0,
494
501
  ):
495
502
 
496
503
  super().__init__()
@@ -511,6 +518,9 @@ class ViT(nn.Module):
511
518
  "SwiGLU": SwiGLU,
512
519
  }[transformer_activation]
513
520
 
521
+ self.alpha = alpha
522
+ self.beta = beta
523
+
514
524
  self.encoder = ViTEncoder(
515
525
  input_size=input_size,
516
526
  initial_batch_norm=initial_batch_norm,
@@ -559,6 +569,8 @@ class ViT(nn.Module):
559
569
  transformer_stochastic_depth=transformer_stochastic_depth,
560
570
  transformer_checkpoint_ff=transformer_checkpoint_ff,
561
571
  linear_module=linear_module,
572
+ alpha=alpha,
573
+ beta=beta,
562
574
  )
563
575
 
564
576
  self.pool = head(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: broccoli-ml
3
- Version: 13.0.0
3
+ Version: 13.0.2
4
4
  Summary: Some useful Pytorch models, circa 2025
5
5
  License: MIT
6
6
  Author: Nicholas Bailey
@@ -4,10 +4,10 @@ broccoli/cnn.py,sha256=WjoPDSpe3ttwxCBNfCVRdaCHvbeZ7G-a5_i8fUsK_d8,4889
4
4
  broccoli/linear.py,sha256=W-3aNpBjd_0xRyzbCKkmg4H1qmslQOIQhB-WDDay2nM,13125
5
5
  broccoli/rope.py,sha256=GRqApBNmYCFaDak0WL1xE_BC5CTTYKQU_PBdeTcQcjc,12557
6
6
  broccoli/tensor.py,sha256=um8mrxkYbvNDo-QvHlmJm8Aw6qcngOlUZPoAk_PMReA,4480
7
- broccoli/transformer.py,sha256=3vAQQ75SAyr4-m3e7vSru8M-RpUy2Enp5cVUafaVYMU,28410
7
+ broccoli/transformer.py,sha256=LoQk41Wpio2AECHLGyDxwKiR_HFoJ5l_YNpPga4Ki0I,28113
8
8
  broccoli/utils.py,sha256=oOWzn6dJ5nC_9r4zq0emmfmaYACJXJNFS48AOpW2jqc,358
9
- broccoli/vit.py,sha256=ZOrbfORhl29HXRDWvLt2A2WbEANJlkNdiiucFB-1CmU,22244
10
- broccoli_ml-13.0.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
11
- broccoli_ml-13.0.0.dist-info/METADATA,sha256=aiwPYSEkNHgJU89jT3tYoNaF_WsaFHoRC2DhgUN7IUE,1369
12
- broccoli_ml-13.0.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
13
- broccoli_ml-13.0.0.dist-info/RECORD,,
9
+ broccoli/vit.py,sha256=jd4e6MjL2JKB8ynSQssWRh6Hs36RuLj4uWyUNVhIMUY,22472
10
+ broccoli_ml-13.0.2.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
11
+ broccoli_ml-13.0.2.dist-info/METADATA,sha256=JKnTpiCVV7mo300gauy1DNHvZnv7P1-4zHIxcUTFpQ0,1369
12
+ broccoli_ml-13.0.2.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
13
+ broccoli_ml-13.0.2.dist-info/RECORD,,