liger-kernel-nightly 0.3.1.dev20241026002338__py3-none-any.whl → 0.3.1.dev20241030171531__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- liger_kernel/ops/fused_linear_jsd.py +3 -1
- liger_kernel/ops/jsd.py +1 -1
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/METADATA +1 -1
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/RECORD +13 -13
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/WHEEL +1 -1
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE-MIT-Efficient Cross Entropy +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.3.1.dev20241026002338.dist-info → liger_kernel_nightly-0.3.1.dev20241030171531.dist-info}/top_level.txt +0 -0
|
@@ -92,7 +92,9 @@ def fused_linear_jsd_forward(
|
|
|
92
92
|
dX_ptr=student_prob_chunk,
|
|
93
93
|
dX_stride=student_prob_chunk.stride(-2),
|
|
94
94
|
label_ptr=(
|
|
95
|
-
shift_labels
|
|
95
|
+
shift_labels[start_idx:end_idx]
|
|
96
|
+
if has_label
|
|
97
|
+
else torch.empty(1, device=device)
|
|
96
98
|
), # dummy ptr if no label
|
|
97
99
|
beta=jsd_beta,
|
|
98
100
|
n_non_ignore=n_non_ignore,
|
liger_kernel/ops/jsd.py
CHANGED
|
@@ -2,9 +2,9 @@ liger_kernel/env_report.py,sha256=LFUJ6UMkFFGPBYXBlqHFGy4bhsemEpSI-_1edSazlHI,11
|
|
|
2
2
|
liger_kernel/ops/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
3
3
|
liger_kernel/ops/cross_entropy.py,sha256=OB3nvIONLB_sj9LO6UQv1qLnf861k-pR58RtwgoiyYA,11192
|
|
4
4
|
liger_kernel/ops/fused_linear_cross_entropy.py,sha256=qg7qBQFLDJClnkUOGhFFHPSW_x7rPvQekbm_4OOYxys,9331
|
|
5
|
-
liger_kernel/ops/fused_linear_jsd.py,sha256=
|
|
5
|
+
liger_kernel/ops/fused_linear_jsd.py,sha256=eZ8y4GPtPRE0QcNNMLX8l4gSEMPzA3ZuzknfbAbiREA,9234
|
|
6
6
|
liger_kernel/ops/geglu.py,sha256=MQL4zyzneZqZYUGPvb1QjI_EYT9_pKfSDgR25WD9jrI,4127
|
|
7
|
-
liger_kernel/ops/jsd.py,sha256=
|
|
7
|
+
liger_kernel/ops/jsd.py,sha256=anWfdioucxZy4JQfTvbHBR-IQrZKeH-gBF1MHwwTuTQ,5781
|
|
8
8
|
liger_kernel/ops/kl_div.py,sha256=qnmtFQwuO3FR7Ovup_DDzpkD1A1LpwOaWlcO6K9ysHk,8342
|
|
9
9
|
liger_kernel/ops/layer_norm.py,sha256=unGMYMOPqtkM9aTrokhcqgPmsV2AUN7Yzv86isVB9OI,7422
|
|
10
10
|
liger_kernel/ops/rms_norm.py,sha256=9S9wyZLmzNyJlBxV4vbv4p5es7bGP-m_5wK9JC6JIdA,10911
|
|
@@ -40,14 +40,14 @@ liger_kernel/transformers/model/qwen2.py,sha256=3inWFXGHYT7wA10OR6bq3mDUBrr10AS5
|
|
|
40
40
|
liger_kernel/transformers/model/qwen2_vl.py,sha256=ymsm9aQpSUiSU12GY8FO608p9dSHOz4TCnNI1htX5bk,6975
|
|
41
41
|
liger_kernel/triton/__init__.py,sha256=yfRe0zMb47QnqjecZWG7LnanfCTzeku7SgWRAwNVmzU,101
|
|
42
42
|
liger_kernel/triton/monkey_patch.py,sha256=5BcGKTtdqeYchypBIBopGIWPx1-cFALz7sOKoEsqXJ0,1584
|
|
43
|
-
liger_kernel_nightly-0.3.1.
|
|
44
|
-
liger_kernel_nightly-0.3.1.
|
|
45
|
-
liger_kernel_nightly-0.3.1.
|
|
46
|
-
liger_kernel_nightly-0.3.1.
|
|
47
|
-
liger_kernel_nightly-0.3.1.
|
|
48
|
-
liger_kernel_nightly-0.3.1.
|
|
49
|
-
liger_kernel_nightly-0.3.1.
|
|
50
|
-
liger_kernel_nightly-0.3.1.
|
|
51
|
-
liger_kernel_nightly-0.3.1.
|
|
52
|
-
liger_kernel_nightly-0.3.1.
|
|
53
|
-
liger_kernel_nightly-0.3.1.
|
|
43
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
|
44
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE-Apache-2.0,sha256=NRaCIsL9eblGS35gk4WKTC0usNYnR_mgRHJTKqz2_UE,11348
|
|
45
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE-MIT-AutoAWQ,sha256=pfiOyInrAPY3xQbvV1i-gOqNZK7QEyIepT1IbqOYYYo,1067
|
|
46
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE-MIT-Efficient Cross Entropy,sha256=PaC9HqyFYTy-ClS0H8Zfa2motJuTppjECXmjHwJcaOk,1063
|
|
47
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE-MIT-llmc,sha256=kyFLt_XUcXS88CuxQt5-PjOcLjpJP2m-T4gtqZf3GLc,1071
|
|
48
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/LICENSE-MIT-triton,sha256=wL6W8IwsKiyHtzXubg8TCXhRZuo8S83EPdqXffYtqWg,1131
|
|
49
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/METADATA,sha256=kU0TUWpAqa7tZ2gXlmkZWpwnBT2OOUNjBm6C0sxdem8,27717
|
|
50
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
|
51
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
|
52
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
|
53
|
+
liger_kernel_nightly-0.3.1.dev20241030171531.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|