x-transformers 1.40.0__py3-none-any.whl → 1.40.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- x_transformers/attend.py +7 -2
- x_transformers/x_transformers.py +2 -1
- {x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/METADATA +1 -1
- {x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/RECORD +7 -7
- {x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/LICENSE +0 -0
- {x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/WHEEL +0 -0
- {x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/top_level.txt +0 -0
x_transformers/attend.py
CHANGED
@@ -119,7 +119,12 @@ def one_hot_straight_through(logits, temperature = 1.):
 # sparse topk attention - only keep topk attn logits for softmax
 # optional straight through with masked out logits by setting `attn_sparse_topk_straight_through = True`
 
-def sparse_topk_attn(logits, sparse_topk, temperature = 1., straight_through = False):
+def sparse_topk_attn(
+    logits,
+    sparse_topk,
+    temperature = 1.,
+    straight_through = False
+):
     orig_logits = logits
 
     mask_value = -torch.finfo(logits.dtype).max
@@ -132,7 +137,7 @@ def sparse_topk_attn(logits, sparse_topk, temperature = 1., straight_through = F
         return topk_attn
 
     soft_attn = (orig_logits / temperature).softmax(dim = -1)
-    return topk_attn + soft_attn - soft_attn.detach()
+    return topk_attn.detach() + soft_attn - soft_attn.detach()
 
 # functions for creating causal mask
 # need a special one for onnx cpu (no support for .triu)
x_transformers/x_transformers.py
CHANGED
@@ -1107,6 +1107,7 @@ class Attention(Module):
         context_mask = None,
         attn_mask = None,
         rel_pos = None,
+        attn_bias = None,
         rotary_pos_emb = None,
         prev_attn = None,
         mem = None,
@@ -1237,8 +1238,8 @@ class Attention(Module):
 
         # prepare relative positional bias, if needed
 
-        attn_bias = None
         if exists(rel_pos):
+            assert not exists(attn_bias)
             attn_bias = rel_pos(i, j)
             attn_bias = pad_at_dim(attn_bias, (num_mem_kv, 0), value = 0.) # handle memory key / values
 
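Here attn_bias is promoted from a local variable to a forward argument, so callers can inject a precomputed additive bias over the attention logits; the new assert rejects combining it with a rel_pos module, which would otherwise overwrite it. A hedged sketch of the resulting control flow (simplified names of our own, not the full Attention.forward):

def exists(val):
    return val is not None

def attend_with_bias(sim, attn_bias = None, rel_pos = None):
    # sim: raw attention logits, shape (batch, heads, i, j)
    i, j = sim.shape[-2:]
    if exists(rel_pos):
        # a caller-supplied bias would be silently overwritten here,
        # hence the assert added in 1.40.2
        assert not exists(attn_bias)
        attn_bias = rel_pos(i, j)
    if exists(attn_bias):
        sim = sim + attn_bias  # additive bias, broadcast over batch
    return sim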
{x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/RECORD
CHANGED
@@ -1,15 +1,15 @@
 x_transformers/__init__.py,sha256=-MkQrSc37cTVDX7AOykxunYnqVtFlQ7lb0Cse5dsGWU,793
-x_transformers/attend.py,sha256=
+x_transformers/attend.py,sha256=VbB0fi-ETgAF4dc2a_Meaqvt14LMaRVIjZ8NexUX8F0,17239
 x_transformers/autoregressive_wrapper.py,sha256=DOJJCMMDOqDYKWy_IaG5IyKsXD3AW6amzfUgdAADOLY,10500
 x_transformers/continuous.py,sha256=cIVEdhfei258__ziV7kQBrJMxCel54bExBTDrO9rfCI,6450
 x_transformers/dpo.py,sha256=LjvWgCkqTl-UuehrzQ8nkX5guLr4whYwsmm7SKSwdls,3450
 x_transformers/multi_input.py,sha256=tCh-fTJDj2ib4SMGtsa-AM8MxKzJAQSwqAXOu3HU2mg,9252
 x_transformers/nonautoregressive_wrapper.py,sha256=2NU58hYMgn-4Jzg3mie-mXb0XH_dCN7fjlzd3K1rLUY,10510
-x_transformers/x_transformers.py,sha256=
+x_transformers/x_transformers.py,sha256=SfM0ql3wK7t8KzBXRNnGTdcyq3tQVmHB4VIcfg5sSv4,84604
 x_transformers/xl_autoregressive_wrapper.py,sha256=CvZMJ6A6PA-Y_bQAhnORwjJBSl6Vjq2IdW5KTdk8NI8,4195
 x_transformers/xval.py,sha256=QE1ltYZTR_eGgIHPP2BrMWVWVLqMW-OpDZh87BSmQEg,8563
-x_transformers-1.40.
-x_transformers-1.40.
-x_transformers-1.40.
-x_transformers-1.40.
-x_transformers-1.40.
+x_transformers-1.40.2.dist-info/LICENSE,sha256=As9u198X-U-vph5noInuUfqsAG2zX_oXPHDmdjwlPPY,1066
+x_transformers-1.40.2.dist-info/METADATA,sha256=G1LWuKpy25e1rXV7MFRT5r2F4bHjvyMUrgxTgJIQLic,661
+x_transformers-1.40.2.dist-info/WHEEL,sha256=OVMc5UfuAQiSplgO0_WdW7vXVGAt9Hdd6qtN4HotdyA,91
+x_transformers-1.40.2.dist-info/top_level.txt,sha256=hO6KGpFuGucRNEtRfme4A_rGcM53AKwGP7RVlRIxS5Q,15
+x_transformers-1.40.2.dist-info/RECORD,,
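For reference, each RECORD row is path,sha256=&lt;digest&gt;,&lt;size&gt;, where the digest is the urlsafe-base64 SHA-256 of the file with the trailing '=' padding stripped (per the wheel spec), and the RECORD file itself leaves its own hash and size fields empty. A small sketch that reproduces an entry:

import base64
import hashlib
from pathlib import Path

def record_entry(path):
    # "path,sha256=<urlsafe b64 of sha256, '=' padding stripped>,<size in bytes>"
    data = Path(path).read_bytes()
    digest = base64.urlsafe_b64encode(hashlib.sha256(data).digest()).rstrip(b"=").decode("ascii")
    return f"{path},sha256={digest},{len(data)}"

# e.g. record_entry('x_transformers/attend.py'), run against the unpacked
# 1.40.2 wheel, should reproduce the corresponding '+' line above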
{x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/LICENSE
File without changes
{x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/WHEEL
File without changes
{x_transformers-1.40.0.dist-info → x_transformers-1.40.2.dist-info}/top_level.txt
File without changes