x-transformers 2.1.35__py3-none-any.whl → 2.1.36__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- x_transformers/x_transformers.py +5 -4
- {x_transformers-2.1.35.dist-info → x_transformers-2.1.36.dist-info}/METADATA +1 -1
- {x_transformers-2.1.35.dist-info → x_transformers-2.1.36.dist-info}/RECORD +5 -5
- {x_transformers-2.1.35.dist-info → x_transformers-2.1.36.dist-info}/WHEEL +0 -0
- {x_transformers-2.1.35.dist-info → x_transformers-2.1.36.dist-info}/licenses/LICENSE +0 -0
x_transformers/x_transformers.py
CHANGED
@@ -864,14 +864,15 @@ class DynamicTanh(Module):
|
|
864
864
|
self.gamma = nn.Parameter(torch.ones(dim))
|
865
865
|
self.beta = nn.Parameter(torch.zeros(dim))
|
866
866
|
|
867
|
-
self.
|
867
|
+
self.pre_tanh_scale_offset = init_alpha if unit_offset else 0.
|
868
|
+
self.gamma_offset = float(unit_offset)
|
868
869
|
|
869
|
-
nn.init.constant_(self.pre_tanh_scale,
|
870
|
+
nn.init.constant_(self.pre_tanh_scale, 0 if unit_offset else init_alpha)
|
870
871
|
nn.init.constant_(self.gamma, 1. - float(unit_offset))
|
871
872
|
|
872
873
|
def forward(self, x):
|
873
|
-
pre_tanh_scale = self.pre_tanh_scale + self.
|
874
|
-
gamma = self.gamma + self.
|
874
|
+
pre_tanh_scale = self.pre_tanh_scale + self.pre_tanh_scale_offset
|
875
|
+
gamma = self.gamma + self.gamma_offset
|
875
876
|
return (x * pre_tanh_scale).tanh() * gamma + self.beta
|
876
877
|
|
877
878
|
# residual and residual gates
|
@@ -7,10 +7,10 @@ x_transformers/dpo.py,sha256=xt4OuOWhU8pN3OKN2LZAaC2NC8iiEnchqqcrPWVqf0o,3521
|
|
7
7
|
x_transformers/multi_input.py,sha256=tCh-fTJDj2ib4SMGtsa-AM8MxKzJAQSwqAXOu3HU2mg,9252
|
8
8
|
x_transformers/neo_mlp.py,sha256=XCNnnop9WLarcxap1kGuYc1x8GHvwkZiDRnXOxSl3Po,3452
|
9
9
|
x_transformers/nonautoregressive_wrapper.py,sha256=2NU58hYMgn-4Jzg3mie-mXb0XH_dCN7fjlzd3K1rLUY,10510
|
10
|
-
x_transformers/x_transformers.py,sha256=
|
10
|
+
x_transformers/x_transformers.py,sha256=voN-uEBEKxpUu9K4MVcneSTrzdgJWnZGuQ1QRZQw4Q4,111596
|
11
11
|
x_transformers/xl_autoregressive_wrapper.py,sha256=CvZMJ6A6PA-Y_bQAhnORwjJBSl6Vjq2IdW5KTdk8NI8,4195
|
12
12
|
x_transformers/xval.py,sha256=7S00kCuab4tWQa-vf-z-XfzADjVj48MoFIr7VSIvttg,8575
|
13
|
-
x_transformers-2.1.
|
14
|
-
x_transformers-2.1.
|
15
|
-
x_transformers-2.1.
|
16
|
-
x_transformers-2.1.
|
13
|
+
x_transformers-2.1.36.dist-info/METADATA,sha256=D0qdMRucK3PWwEi8WwdiJdZ8X_hGTm1r3_7bJzYiWSM,88161
|
14
|
+
x_transformers-2.1.36.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
15
|
+
x_transformers-2.1.36.dist-info/licenses/LICENSE,sha256=As9u198X-U-vph5noInuUfqsAG2zX_oXPHDmdjwlPPY,1066
|
16
|
+
x_transformers-2.1.36.dist-info/RECORD,,
|
File without changes
|
File without changes
|