liger-kernel-nightly 0.4.2.dev20241210001927__py3-none-any.whl → 0.4.2.dev20241210002150__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -285,11 +285,12 @@ def cross_entropy_forward(
285
285
  num_warps=32 if not is_hip() else 16,
286
286
  )
287
287
 
288
- loss = torch.sum(loss_1d)
289
- if return_z_loss == _TRUE.value:
290
- z_loss = torch.sum(z_loss_1d)
288
+ if reduction == "none":
289
+ loss = loss_1d
290
+ z_loss = z_loss_1d if return_z_loss == _TRUE.value else None
291
291
  else:
292
- z_loss = None
292
+ loss = torch.sum(loss_1d)
293
+ z_loss = torch.sum(z_loss_1d) if return_z_loss == _TRUE.value else None
293
294
 
294
295
  return loss, z_loss, _input
295
296
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.4.2.dev20241210001927
3
+ Version: 0.4.2.dev20241210002150
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -10,7 +10,7 @@ liger_kernel/chunked_loss/fused_linear_preference.py,sha256=vlWfaaIECWvCQhY9PM7z
10
10
  liger_kernel/chunked_loss/orpo_loss.py,sha256=ZuKGjbkIYzV4UzvupNdq6vyxCp7-BztQkUt8ZnFvKos,3531
11
11
  liger_kernel/chunked_loss/simpo_loss.py,sha256=Wa4LOlDG9PbJkOOkKg8hbKvnKgg7OTBz6-qIkwPK1yw,3275
12
12
  liger_kernel/ops/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
13
- liger_kernel/ops/cross_entropy.py,sha256=VqaYB9Zirc51eZ28OmjEZRrrV9UysRjS_vhIftB9sKo,15753
13
+ liger_kernel/ops/cross_entropy.py,sha256=oG5hfrlmnlF5lOoZRhHRglObxgH4B0KadjWMJj9EWPM,15860
14
14
  liger_kernel/ops/fused_linear_cross_entropy.py,sha256=Tnw4gyAYVVdnCOqhOuLEzbUQ3goOTnoAfk3pqSIM5ac,9301
15
15
  liger_kernel/ops/fused_linear_jsd.py,sha256=nOv4zwfxHqqepKEmMsQuz-B3H-gRjyo8uClpmqSGLYA,9693
16
16
  liger_kernel/ops/geglu.py,sha256=MQL4zyzneZqZYUGPvb1QjI_EYT9_pKfSDgR25WD9jrI,4127
@@ -56,9 +56,9 @@ liger_kernel/transformers/model/qwen2.py,sha256=EyhSSzQOskGjSnCsKMZpd1s5IAIlHd5P
56
56
  liger_kernel/transformers/model/qwen2_vl.py,sha256=bIQe2bWiY--G84FhCD29Gdi64_qHP6vbcGsK6vKysQE,8547
57
57
  liger_kernel/triton/__init__.py,sha256=yfRe0zMb47QnqjecZWG7LnanfCTzeku7SgWRAwNVmzU,101
58
58
  liger_kernel/triton/monkey_patch.py,sha256=5BcGKTtdqeYchypBIBopGIWPx1-cFALz7sOKoEsqXJ0,1584
59
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
60
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/METADATA,sha256=wrWkymMyq_0vPXBK37t2PuzS_aWbuIa0Xu_DBMUPPZ0,19485
61
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
62
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
63
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
64
- liger_kernel_nightly-0.4.2.dev20241210001927.dist-info/RECORD,,
59
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
60
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/METADATA,sha256=XMk5DN74rqGLsOWe-dmLLHrueliPJ-XBn9zsyanKt9o,19485
61
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
62
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
63
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
64
+ liger_kernel_nightly-0.4.2.dev20241210002150.dist-info/RECORD,,