x-transformers 1.28.5__py3-none-any.whl → 1.29.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- x_transformers/x_transformers.py +14 -2
- {x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/METADATA +1 -1
- {x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/RECORD +6 -6
- {x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/LICENSE +0 -0
- {x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/WHEEL +0 -0
- {x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/top_level.txt +0 -0
x_transformers/x_transformers.py
CHANGED
@@ -1001,7 +1001,7 @@ class AttentionLayers(Module):
     def __init__(
         self,
         dim,
-        depth,
+        depth = None,
         heads = 8,
         causal = False,
         cross_attend = False,
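The only signature change is that `depth` becomes an optional keyword defaulting to `None`. It keeps its slot in the signature, so existing positional and keyword calls are unaffected. A minimal sketch of both call styles (hypothetical usage; `AttentionLayers` is normally constructed through its `Encoder`/`Decoder` subclasses):

```python
# a minimal sketch, assuming AttentionLayers is importable from x_transformers.x_transformers;
# `depth` stays in the same position, so both existing call styles are unchanged
from x_transformers.x_transformers import AttentionLayers

layers_positional = AttentionLayers(512, 6)                # dim = 512, depth = 6, as before
layers_keyword    = AttentionLayers(dim = 512, depth = 6)  # equivalent keyword form
```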
@@ -1054,10 +1054,11 @@ class AttentionLayers(Module):
         attn_kwargs, kwargs = groupby_prefix_and_trim('attn_', kwargs)
         cross_attn_kwargs, kwargs = groupby_prefix_and_trim('cross_attn_', kwargs)
 
+        assert len(kwargs) == 0, f'unrecognized kwargs passed in {kwargs.keys()}'
+
         dim_head = attn_kwargs.get('dim_head', DEFAULT_DIM_HEAD)
 
         self.dim = dim
-        self.depth = depth
         self.causal = causal
         self.layers = ModuleList([])
 
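With the new assert, any keyword left over after the `attn_`/`cross_attn_` prefix grouping now fails fast and names the offending keys instead of being silently dropped. A hedged sketch of what that looks like for a misspelled keyword (hypothetical call; the message text comes from the assert above):

```python
# hypothetical illustration: a typo such as `head` (instead of `heads`) is no
# longer silently ignored; the constructor now raises and names the bad key
from x_transformers import Encoder

try:
    enc = Encoder(dim = 512, depth = 6, head = 8)   # typo: should be `heads = 8`
except AssertionError as err:
    print(err)   # e.g. "unrecognized kwargs passed in dict_keys(['head'])"
```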
@@ -1138,9 +1139,12 @@ class AttentionLayers(Module):
 
         # setup weight tying, which is a special case of `layer_execute_order`
 
+        assert not (exists(layers_execute_order) and exists(custom_layers) and exists(depth)), 'depth should not be passed in if using custom layers and custom layer execution order'
+
         assert not (weight_tie_layers and any([*map(exists, (custom_layers, par_ratio, sandwich_coef))]))
 
         if weight_tie_layers:
+            assert exists(depth), 'depth must be passed in with `weight_tie_layers` = True'
             assert not exists(layers_execute_order)
             layers_execute_order = tuple(range(len(default_block))) * depth
             depth = 1
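Weight tying builds a single block of parameters and replays it, so the constructor still needs an explicit `depth` to know how many replays to schedule; the new asserts spell out both that requirement and the rule that `depth` must not accompany a custom layer layout plus a custom execution order. A sketch of the weight-tied case, assuming the usual `Encoder` wrapper forwards these keywords:

```python
# a minimal sketch, assuming `weight_tie_layers` is forwarded to AttentionLayers
from x_transformers import Encoder

tied = Encoder(
    dim = 512,
    depth = 6,                # still required when weight_tie_layers = True
    weight_tie_layers = True  # one shared block of weights, executed 6 times
)
```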
@@ -1164,6 +1168,7 @@ class AttentionLayers(Module):
             assert sandwich_coef > 0 and sandwich_coef <= depth, 'sandwich coefficient should be less than the depth'
             layer_types = ('a',) * sandwich_coef + default_block * (depth - sandwich_coef) + ('f',) * sandwich_coef
         else:
+            assert exists(depth), '`depth` must be passed in for `Decoder` or `Encoder`'
             layer_types = default_block * depth
 
         self.layer_types = layer_types
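For the default layer layout (no `custom_layers`, `par_ratio`, or `sandwich_coef`), `depth` remains mandatory; the new assert simply replaces the missing-positional-argument `TypeError` the old required parameter produced with a clearer message. A hedged illustration:

```python
# hypothetical illustration of the clearer error when depth is omitted
from x_transformers import Decoder

try:
    dec = Decoder(dim = 512)   # no depth, no custom layer layout
except AssertionError as err:
    print(err)   # "`depth` must be passed in for `Decoder` or `Encoder`"
```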
@@ -1173,6 +1178,13 @@ class AttentionLayers(Module):
 
         self.num_attn_layers = len(list(filter(equals('a'), layer_types)))
 
+        # validate and set the depth
+
+        depth = default(depth, len(self.layers_execute_order))
+        assert depth == len(self.layers_execute_order)
+
+        self.depth = depth
+
         # stochastic depth
 
         self.layer_dropouts = cast_tuple(layer_dropout, len(layer_types))
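This final block is what the optional `depth` is for: when a custom execution order is supplied, the depth is inferred as `len(layers_execute_order)` and stored on `self.depth`, while the earlier assert rejects passing `depth` redundantly alongside `custom_layers` and `layers_execute_order`. A sketch with hypothetical layer values:

```python
# a minimal sketch: depth is omitted and inferred from the execution order
from x_transformers import Encoder

enc = Encoder(
    dim = 512,
    custom_layers = ('a', 'f'),          # one attention block, one feedforward block
    layers_execute_order = (0, 1, 0, 1)  # replay the two blocks twice
)

assert enc.depth == 4   # len(layers_execute_order)
```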
{x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/RECORD
CHANGED
@@ -4,11 +4,11 @@ x_transformers/autoregressive_wrapper.py,sha256=gYKIN5Rm8dMYSTX5yHpg9sPYyZf9rsRT
 x_transformers/continuous.py,sha256=dpHK4NSMDQAJQ_N3Uj9rip0fYGXyu0QCCO_OfEdbRGs,6192
 x_transformers/dpo.py,sha256=LjvWgCkqTl-UuehrzQ8nkX5guLr4whYwsmm7SKSwdls,3450
 x_transformers/nonautoregressive_wrapper.py,sha256=ys_p8obc7lTeeodCqvkRKxOXQ1C9T3j5Jwr-JbVgnXk,10432
-x_transformers/x_transformers.py,sha256=
+x_transformers/x_transformers.py,sha256=jj87ALpQpHGgvG1oHn4Z6UDmc1pqkoO6dY7YtY038w8,65269
 x_transformers/xl_autoregressive_wrapper.py,sha256=DCx4n0_c1tFai4nOqaWVnqx2p9eutsZsDMiMP1ckxNU,4117
 x_transformers/xval.py,sha256=EN3hxxleTRGYeAz6i4x3U_PrOm9TjxMF3eDhMKGx59E,8575
-x_transformers-1.
-x_transformers-1.
-x_transformers-1.
-x_transformers-1.
-x_transformers-1.
+x_transformers-1.29.1.dist-info/LICENSE,sha256=As9u198X-U-vph5noInuUfqsAG2zX_oXPHDmdjwlPPY,1066
+x_transformers-1.29.1.dist-info/METADATA,sha256=4Nnxc5THUI-d21Szj2mPLTlZYF0A9xVjHN4laFiLCIE,661
+x_transformers-1.29.1.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
+x_transformers-1.29.1.dist-info/top_level.txt,sha256=hO6KGpFuGucRNEtRfme4A_rGcM53AKwGP7RVlRIxS5Q,15
+x_transformers-1.29.1.dist-info/RECORD,,
{x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/LICENSE
File without changes

{x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/WHEEL
File without changes

{x_transformers-1.28.5.dist-info → x_transformers-1.29.1.dist-info}/top_level.txt
File without changes