broccoli-ml 0.39.0__py3-none-any.whl → 0.40.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
broccoli/vit.py CHANGED
@@ -120,6 +120,7 @@ class ViTEncoder(nn.Module):
120
120
  transformer_initial_ff_residual_path=True,
121
121
  transformer_initial_ff_linear_module_up=None,
122
122
  transformer_initial_ff_linear_module_down=None,
123
+ transformer_initial_ff_mlp_dropout=None,
123
124
  transformer_pre_norm=True,
124
125
  transformer_normformer=False,
125
126
  transformer_post_norm=False,
@@ -307,7 +308,12 @@ class ViTEncoder(nn.Module):
307
308
  transformer_embedding_size,
308
309
  activation=transformer_activation,
309
310
  activation_kwargs=transformer_activation_kwargs,
310
- dropout=transformer_mlp_dropout,
311
+ dropout=(
312
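+ # Use the initial-FF dropout when it is explicitly set (not None, so 0.0 is honored); otherwise fall back to transformer_mlp_dropout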
313
+ transformer_initial_ff_mlp_dropout
314
+ if transformer_initial_ff_mlp_dropout is not None
315
+ else transformer_mlp_dropout
316
+ ),
311
317
  linear_module_up=(
312
318
  # First truthy assigned value
313
319
  transformer_initial_ff_linear_module_up
@@ -349,11 +355,7 @@ class ViTEncoder(nn.Module):
349
355
 
350
356
  class ViT(nn.Module):
351
357
  """
352
- Denoising convolutional transformer
353
- Based on the Compact Convolutional Transformer (CCT) of [Hasani et al. (2021)
354
- *''Escaping the Big Data Paradigm with Compact Transformers''*](
355
- https://arxiv.org/abs/2104.05704). It's a convolutional neural network
356
- leading into a transformer encoder, followed by a sequence pooling layer.
358
+ ...
357
359
  """
358
360
 
359
361
  def __init__(
@@ -380,6 +382,7 @@ class ViT(nn.Module):
380
382
  transformer_initial_ff_residual_path=True,
381
383
  transformer_initial_ff_linear_module_up=None,
382
384
  transformer_initial_ff_linear_module_down=None,
385
+ transformer_initial_ff_mlp_dropout=None,
383
386
  transformer_pre_norm=True,
384
387
  transformer_normformer=False,
385
388
  transformer_post_norm=False,
@@ -442,6 +445,7 @@ class ViT(nn.Module):
442
445
  transformer_initial_ff_residual_path=transformer_initial_ff_residual_path,
443
446
  transformer_initial_ff_linear_module_up=transformer_initial_ff_linear_module_up,
444
447
  transformer_initial_ff_linear_module_down=transformer_initial_ff_linear_module_down,
448
+ transformer_initial_ff_mlp_dropout=transformer_initial_ff_mlp_dropout,
445
449
  transformer_pre_norm=transformer_pre_norm,
446
450
  transformer_normformer=transformer_normformer,
447
451
  transformer_post_norm=transformer_post_norm,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: broccoli-ml
3
- Version: 0.39.0
3
+ Version: 0.40.0
4
4
  Summary: Some useful Pytorch models, circa 2025
5
5
  License: MIT
6
6
  Author: Nicholas Bailey
@@ -10,8 +10,8 @@ broccoli/rope.py,sha256=hw7kBPNR9GQXj4GxyIAffsGKPfcTPOFh8Bc7oEHtaZY,12108
10
10
  broccoli/tensor.py,sha256=um8mrxkYbvNDo-QvHlmJm8Aw6qcngOlUZPoAk_PMReA,4480
11
11
  broccoli/transformer.py,sha256=Xw1oBLsvVeHmMqgurhorRa49nrjfooLev5uBPFeK9og,17004
12
12
  broccoli/utils.py,sha256=htq_hOsdhUhL0nJi9WkKiEYOjEoWqFpK5X49PtgTf-0,299
13
- broccoli/vit.py,sha256=RaSJZh2ogqNAvAkQDuZpNqdtRTWaW_8ug4BsBCBK_f4,17728
14
- broccoli_ml-0.39.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
15
- broccoli_ml-0.39.0.dist-info/METADATA,sha256=wR3glIOttDNALtYadYXNBbwjHS3p5wtBoWGwjLEg8c8,1257
16
- broccoli_ml-0.39.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
17
- broccoli_ml-0.39.0.dist-info/RECORD,,
13
+ broccoli/vit.py,sha256=qnA7Utyp83CQ2o7kdkDB0d9Yj2UHFOVhNF8TtqwefIc,17781
14
+ broccoli_ml-0.40.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
15
+ broccoli_ml-0.40.0.dist-info/METADATA,sha256=f9pHDub9pIvrB5SIoiTsfAKrHRhHyZGFNdWNJhDwnH0,1257
16
+ broccoli_ml-0.40.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
17
+ broccoli_ml-0.40.0.dist-info/RECORD,,