broccoli-ml 0.5.1__py3-none-any.whl → 0.5.3__py3-none-any.whl
This diff shows the changes between two publicly available versions of a package, each released to one of the supported registries. It is provided for informational purposes only and reflects the contents of those versions as they appear in their respective public registries.
- broccoli/vit.py +8 -8
- {broccoli_ml-0.5.1.dist-info → broccoli_ml-0.5.3.dist-info}/METADATA +1 -1
- {broccoli_ml-0.5.1.dist-info → broccoli_ml-0.5.3.dist-info}/RECORD +5 -5
- {broccoli_ml-0.5.1.dist-info → broccoli_ml-0.5.3.dist-info}/LICENSE +0 -0
- {broccoli_ml-0.5.1.dist-info → broccoli_ml-0.5.3.dist-info}/WHEEL +0 -0
broccoli/vit.py
CHANGED
@@ -91,7 +91,7 @@ class ViTEncoder(nn.Module):
|
|
91
91
|
transformer_activation_kwargs: Optional[dict] = None,
|
92
92
|
transformer_mlp_dropout=0.0,
|
93
93
|
transformer_msa_dropout=0.1,
|
94
|
-
|
94
|
+
transformer_stochastic_depth=0.1,
|
95
95
|
linear_module=nn.Linear,
|
96
96
|
initial_batch_norm=True,
|
97
97
|
):
|
@@ -285,9 +285,9 @@ class ViTEncoder(nn.Module):
|
|
285
285
|
mlp_ratio=transformer_mlp_ratio,
|
286
286
|
activation=transformer_activation,
|
287
287
|
activation_kwargs=transformer_activation_kwargs,
|
288
|
-
|
289
|
-
|
290
|
-
stochastic_depth=
|
288
|
+
transformer_mlp_dropout=transformer_mlp_dropout,
|
289
|
+
transformer_msa_dropout=transformer_msa_dropout,
|
290
|
+
stochastic_depth=transformer_stochastic_depth,
|
291
291
|
causal=False,
|
292
292
|
linear_module=linear_module,
|
293
293
|
bos_tokens=transformer_bos_tokens,
|
@@ -359,7 +359,7 @@ class CCT(nn.Module):
|
|
359
359
|
transformer_activation_kwargs: Optional[dict] = None,
|
360
360
|
transformer_mlp_dropout=0.0,
|
361
361
|
transformer_msa_dropout=0.1,
|
362
|
-
|
362
|
+
transformer_stochastic_depth=0.1,
|
363
363
|
batch_norm_outputs=True,
|
364
364
|
initial_batch_norm=True,
|
365
365
|
linear_module=nn.Linear,
|
@@ -409,9 +409,9 @@ class CCT(nn.Module):
|
|
409
409
|
transformer_bos_tokens=transformer_bos_tokens,
|
410
410
|
transformer_activation=transformer_activation,
|
411
411
|
transformer_activation_kwargs=transformer_activation_kwargs,
|
412
|
-
|
413
|
-
|
414
|
-
|
412
|
+
transformer_mlp_dropout=transformer_mlp_dropout,
|
413
|
+
transformer_msa_dropout=transformer_msa_dropout,
|
414
|
+
transformer_stochastic_depth=transformer_stochastic_depth,
|
415
415
|
linear_module=linear_module,
|
416
416
|
initial_batch_norm=initial_batch_norm,
|
417
417
|
)
|
@@ -10,8 +10,8 @@ broccoli/rope.py,sha256=hw7kBPNR9GQXj4GxyIAffsGKPfcTPOFh8Bc7oEHtaZY,12108
|
|
10
10
|
broccoli/tensor.py,sha256=E2JK5mQwJf75e23-JGcDoT7QxQf89DJReUo2et1LhRY,1716
|
11
11
|
broccoli/transformer.py,sha256=SwvutiYOiPlqLzbO_twye7Hna5DsJukVOzzAx9CTCyU,16417
|
12
12
|
broccoli/utils.py,sha256=htq_hOsdhUhL0nJi9WkKiEYOjEoWqFpK5X49PtgTf-0,299
|
13
|
-
broccoli/vit.py,sha256=
|
14
|
-
broccoli_ml-0.5.
|
15
|
-
broccoli_ml-0.5.
|
16
|
-
broccoli_ml-0.5.
|
17
|
-
broccoli_ml-0.5.
|
13
|
+
broccoli/vit.py,sha256=DzpZPrvSJrXitKgu3TDJ4r6Pq_I4XDKjZsjbL5LUGYU,15380
|
14
|
+
broccoli_ml-0.5.3.dist-info/LICENSE,sha256=0BAzJE5BqQ7Iixp_AFdB2W1uO-HCRX-Qfun8PHt6yVM,1073
|
15
|
+
broccoli_ml-0.5.3.dist-info/METADATA,sha256=0WcAWopuuskj2IagQhTcEjxcuWyHXqOlAuRGEjcoGA0,1256
|
16
|
+
broccoli_ml-0.5.3.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
|
17
|
+
broccoli_ml-0.5.3.dist-info/RECORD,,
|
File without changes
|
File without changes
|