liger-kernel-nightly 0.5.10.dev20250614003833__py3-none-any.whl → 0.5.10.dev20250618170631__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- liger_kernel/ops/dyt.py +0 -2
- liger_kernel/transformers/monkey_patch.py +2 -1
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/METADATA +1 -1
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/RECORD +8 -8
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/WHEEL +0 -0
- {liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/top_level.txt +0 -0
liger_kernel/ops/dyt.py
CHANGED
@@ -4,8 +4,6 @@ import torch
|
|
4
4
|
import triton
|
5
5
|
import triton.language as tl
|
6
6
|
|
7
|
-
from triton.language.extra.libdevice import tanh
|
8
|
-
|
9
7
|
from liger_kernel.ops.utils import compare_version
|
10
8
|
from liger_kernel.ops.utils import ensure_contiguous
|
11
9
|
from liger_kernel.ops.utils import infer_device
|
liger_kernel/transformers/monkey_patch.py
CHANGED
@@ -1208,7 +1208,8 @@ def apply_liger_kernel_to_qwen3_moe(
|
|
1208
1208
|
_patch_rms_norm_module(base_model.norm)
|
1209
1209
|
for decoder_layer in base_model.layers:
|
1210
1210
|
if swiglu:
|
1211
|
-
|
1211
|
+
for mlp_expert in decoder_layer.mlp.experts:
|
1212
|
+
_patch_swiglu_module(mlp_expert, LigerQwen3MoeSwiGLUMLP)
|
1212
1213
|
if rms_norm:
|
1213
1214
|
_patch_rms_norm_module(decoder_layer.input_layernorm)
|
1214
1215
|
_patch_rms_norm_module(decoder_layer.post_attention_layernorm)
|
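{liger_kernel_nightly-0.5.10.dev20250614003833.dist-info → liger_kernel_nightly-0.5.10.dev20250618170631.dist-info}/RECORD
CHANGED
@@ -17,7 +17,7 @@ liger_kernel/chunked_loss/orpo_loss.py,sha256=nu9UYG16dcMw93lvHi4_hYs3Q0FK1KnlmM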
|
|
17
17
|
liger_kernel/chunked_loss/simpo_loss.py,sha256=fy2w8KbhMrBv7b1jdIeH3bBFxY52bPQPZb3KwBvmurM,5385
|
18
18
|
liger_kernel/ops/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
19
19
|
liger_kernel/ops/cross_entropy.py,sha256=e8THGnhOcy_0SbOLABx67HEM7-B8a8pG7nDKbCRpQKM,19123
|
20
|
-
liger_kernel/ops/dyt.py,sha256=
|
20
|
+
liger_kernel/ops/dyt.py,sha256=gCLz4S8aul8SY9nvIGaoK67aGb7U9MJRQdo3ONqmQYs,5417
|
21
21
|
liger_kernel/ops/fused_linear_cross_entropy.py,sha256=5fbGhN85n3zf0uIdJ7PYHWIRzTf0VTFiS0ARtOmqIP0,11020
|
22
22
|
liger_kernel/ops/fused_linear_jsd.py,sha256=CSoprxb-YcJy-YUKiTcYkxN8sb9h2kdk_iHuncvSV5c,9683
|
23
23
|
liger_kernel/ops/fused_neighborhood_attention.py,sha256=vPi5xbnh6wxyZehaqo6Tuilqo2fN5SGDiONjnNmIKqs,35556
|
@@ -53,7 +53,7 @@ liger_kernel/transformers/grpo_loss.py,sha256=uAkUNKSnUGEOqa82L9w2e6AI1kcmG8K45-
|
|
53
53
|
liger_kernel/transformers/jsd.py,sha256=DGqRnxIZxsvxo0_tbbxX3b-sDbDjC_yKufyRIHCcScY,2979
|
54
54
|
liger_kernel/transformers/kl_div.py,sha256=WLffFbh1EExD2Eb1F7lN11fo9JJC-0751WJjZAF1Fj8,409
|
55
55
|
liger_kernel/transformers/layer_norm.py,sha256=c9pk3PEasOKYR0rhe5e5nNrnYKVCEW4VC8S6LpCq9EQ,906
|
56
|
-
liger_kernel/transformers/monkey_patch.py,sha256=
|
56
|
+
liger_kernel/transformers/monkey_patch.py,sha256=pB9qQPKfaA3MS-qtsOTG1YEAC6kRYyrsdk7JhMLrwSE,77594
|
57
57
|
liger_kernel/transformers/multi_token_attention.py,sha256=l9VDICK0dfmifUDW668hGscP8AHq2rYcM2oGUa3baRQ,1751
|
58
58
|
liger_kernel/transformers/qwen2vl_mrope.py,sha256=5EwSqrMdsL9MYspeBMXBsNJKvH0MOmRrtJXAJlnnlOI,1047
|
59
59
|
liger_kernel/transformers/rms_norm.py,sha256=eErIr1n-13oVrc1VJY07lqazYelw_vlu9Az__RmXPSE,2717
|
@@ -87,9 +87,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
|
|
87
87
|
liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
|
88
88
|
liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
|
89
89
|
liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
|
90
|
-
liger_kernel_nightly-0.5.10.
|
91
|
-
liger_kernel_nightly-0.5.10.
|
92
|
-
liger_kernel_nightly-0.5.10.
|
93
|
-
liger_kernel_nightly-0.5.10.
|
94
|
-
liger_kernel_nightly-0.5.10.
|
95
|
-
liger_kernel_nightly-0.5.10.
|
90
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
91
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/METADATA,sha256=sxNO4_4HQ8OZ23Qx5TUIbXSHesEBgYfJGXM4qCOFn_8,24358
|
92
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
93
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
94
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
95
|
+
liger_kernel_nightly-0.5.10.dev20250618170631.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|