x-transformers 1.42.21__tar.gz → 1.42.23__tar.gz
Sign up to get free protection for your applications and to get access to all the features.
- {x_transformers-1.42.21/x_transformers.egg-info → x_transformers-1.42.23}/PKG-INFO +1 -1
- {x_transformers-1.42.21 → x_transformers-1.42.23}/setup.py +1 -1
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/x_transformers.py +4 -4
- {x_transformers-1.42.21 → x_transformers-1.42.23/x_transformers.egg-info}/PKG-INFO +1 -1
- {x_transformers-1.42.21 → x_transformers-1.42.23}/LICENSE +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/README.md +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/setup.cfg +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/tests/test_x_transformers.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/__init__.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/attend.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/autoregressive_wrapper.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/continuous.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/dpo.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/multi_input.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/neo_mlp.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/nonautoregressive_wrapper.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/xl_autoregressive_wrapper.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/xval.py +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers.egg-info/SOURCES.txt +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers.egg-info/dependency_links.txt +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers.egg-info/requires.txt +0 -0
- {x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers.egg-info/top_level.txt +0 -0
@@ -1079,6 +1079,7 @@ class Attention(Module):
|
|
1079
1079
|
neutreno_alpha = 0.4,
|
1080
1080
|
learned_value_residual_mix = False,
|
1081
1081
|
laser = False, # https://arxiv.org/abs/2411.03493v1
|
1082
|
+
laser_softclamp_value = 15.,
|
1082
1083
|
onnxable = False,
|
1083
1084
|
attend_sdp_kwargs: dict = dict(
|
1084
1085
|
enable_flash = True,
|
@@ -1119,9 +1120,9 @@ class Attention(Module):
|
|
1119
1120
|
self.to_v = LinearNoBias(dim_kv, v_dim) if not shared_kv else None
|
1120
1121
|
|
1121
1122
|
# enhancing gradients to attention through exponentiated values
|
1122
|
-
# todo - compare it to `attn = attn * large_value + attn.detach() * (1. - large_value)`
|
1123
1123
|
|
1124
1124
|
self.laser = laser
|
1125
|
+
self.laser_softclamp_value = laser_softclamp_value
|
1125
1126
|
|
1126
1127
|
# relations projection from tp-attention
|
1127
1128
|
|
@@ -1449,8 +1450,7 @@ class Attention(Module):
|
|
1449
1450
|
attn_bias = pad_at_dim(attn_bias, (num_mem_kv, 0))
|
1450
1451
|
|
1451
1452
|
if self.laser:
|
1452
|
-
|
1453
|
-
v = v - values_max
|
1453
|
+
v = softclamp(v, self.laser_softclamp_value)
|
1454
1454
|
v = v.exp()
|
1455
1455
|
|
1456
1456
|
# attention is all we need
|
@@ -1465,7 +1465,7 @@ class Attention(Module):
|
|
1465
1465
|
# laser
|
1466
1466
|
|
1467
1467
|
if self.laser:
|
1468
|
-
out = log(out) + values_max
|
1468
|
+
out = log(out)
|
1469
1469
|
|
1470
1470
|
# store the values for resformer or Neutreno
|
1471
1471
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/nonautoregressive_wrapper.py
RENAMED
File without changes
|
{x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers/xl_autoregressive_wrapper.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{x_transformers-1.42.21 → x_transformers-1.42.23}/x_transformers.egg-info/dependency_links.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|