broccoli-ml 0.39.0__py3-none-any.whl → 0.40.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- broccoli/vit.py +10 -6
- {broccoli_ml-0.39.0.dist-info → broccoli_ml-0.40.0.dist-info}/METADATA +1 -1
- {broccoli_ml-0.39.0.dist-info → broccoli_ml-0.40.0.dist-info}/RECORD +5 -5
- {broccoli_ml-0.39.0.dist-info → broccoli_ml-0.40.0.dist-info}/LICENSE +0 -0
- {broccoli_ml-0.39.0.dist-info → broccoli_ml-0.40.0.dist-info}/WHEEL +0 -0
broccoli/vit.py
CHANGED
@@ -120,6 +120,7 @@ class ViTEncoder(nn.Module):
|
|
120
120
|
transformer_initial_ff_residual_path=True,
|
121
121
|
transformer_initial_ff_linear_module_up=None,
|
122
122
|
transformer_initial_ff_linear_module_down=None,
|
123
|
+
transformer_initial_ff_mlp_dropout=None,
|
123
124
|
transformer_pre_norm=True,
|
124
125
|
transformer_normformer=False,
|
125
126
|
transformer_post_norm=False,
|
@@ -307,7 +308,12 @@ class ViTEncoder(nn.Module):
|
|
307
308
|
transformer_embedding_size,
|
308
309
|
activation=transformer_activation,
|
309
310
|
activation_kwargs=transformer_activation_kwargs,
|
310
|
-
dropout=
|
311
|
+
dropout=(
|
312
|
+
# First non-None value wins (an explicit 0.0 is kept, not treated as unset)
|
313
|
+
transformer_initial_ff_mlp_dropout
|
314
|
+
if transformer_initial_ff_mlp_dropout is not None
|
315
|
+
else transformer_mlp_dropout
|
316
|
+
),
|
311
317
|
linear_module_up=(
|
312
318
|
# First truthy assigned value
|
313
319
|
transformer_initial_ff_linear_module_up
|
@@ -349,11 +355,7 @@ class ViTEncoder(nn.Module):
|
|
349
355
|
|
350
356
|
class ViT(nn.Module):
|
351
357
|
"""
|
352
|
-
|
353
|
-
Based on the Compact Convolutional Transformer (CCT) of [Hasani et al. (2021)
|
354
|
-
*''Escaping the Big Data Paradigm with Compact Transformers''*](
|
355
|
-
https://arxiv.org/abs/2104.05704). It's a convolutional neural network
|
356
|
-
leading into a transformer encoder, followed by a sequence pooling layer.
|
358
|
+
...
|
357
359
|
"""
|
358
360
|
|
359
361
|
def __init__(
|
@@ -380,6 +382,7 @@ class ViT(nn.Module):
|
|
380
382
|
transformer_initial_ff_residual_path=True,
|
381
383
|
transformer_initial_ff_linear_module_up=None,
|
382
384
|
transformer_initial_ff_linear_module_down=None,
|
385
|
+
transformer_initial_ff_mlp_dropout=None,
|
383
386
|
transformer_pre_norm=True,
|
384
387
|
transformer_normformer=False,
|
385
388
|
transformer_post_norm=False,
|
@@ -442,6 +445,7 @@ class ViT(nn.Module):
|
|
442
445
|
transformer_initial_ff_residual_path=transformer_initial_ff_residual_path,
|
443
446
|
transformer_initial_ff_linear_module_up=transformer_initial_ff_linear_module_up,
|
444
447
|
transformer_initial_ff_linear_module_down=transformer_initial_ff_linear_module_down,
|
448
|
+
transformer_initial_ff_mlp_dropout=transformer_initial_ff_mlp_dropout,
|
445
449
|
transformer_pre_norm=transformer_pre_norm,
|
446
450
|
transformer_normformer=transformer_normformer,
|
447
451
|
transformer_post_norm=transformer_post_norm,
|
@@ -10,8 +10,8 @@ broccoli/rope.py,sha256=hw7kBPNR9GQXj4GxyIAffsGKPfcTPOFh8Bc7oEHtaZY,12108
|
|
10
10
|
broccoli/tensor.py,sha256=um8mrxkYbvNDo-QvHlmJm8Aw6qcngOlUZPoAk_PMReA,4480
|
11
11
|
broccoli/transformer.py,sha256=Xw1oBLsvVeHmMqgurhorRa49nrjfooLev5uBPFeK9og,17004
|
12
12
|
broccoli/utils.py,sha256=htq_hOsdhUhL0nJi9WkKiEYOjEoWqFpK5X49PtgTf-0,299
|
13
|
-
broccoli/vit.py,sha256=
|
14
|
-
broccoli_ml-0.
|
15
|
-
broccoli_ml-0.
|
16
|
-
broccoli_ml-0.
|
17
|
-
broccoli_ml-0.
|
13
|
+
broccoli/vit.py,sha256=qnA7Utyp83CQ2o7kdkDB0d9Yj2UHFOVhNF8TtqwefIc,17781
|
14
|
+
broccoli_ml-0.40.0.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
|
15
|
+
broccoli_ml-0.40.0.dist-info/METADATA,sha256=f9pHDub9pIvrB5SIoiTsfAKrHRhHyZGFNdWNJhDwnH0,1257
|
16
|
+
broccoli_ml-0.40.0.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
|
17
|
+
broccoli_ml-0.40.0.dist-info/RECORD,,
|
File without changes
|
File without changes
|