liger-kernel-nightly 0.6.1.dev20250809233744__py3-none-any.whl → 0.6.1.dev20250812205818__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -13,6 +13,7 @@ def fixed_fused_linear_cross_entropy(
13
13
  num_items_in_batch: Optional[int] = None,
14
14
  ignore_index: int = -100,
15
15
  final_logit_softcapping: Optional[float] = None,
16
+ accum_dtype: Optional[torch.dtype] = None,
16
17
  **kwargs,
17
18
  ):
18
19
  reduction = "sum" if num_items_in_batch is not None else "mean"
@@ -23,6 +24,7 @@ def fixed_fused_linear_cross_entropy(
23
24
  reduction=reduction,
24
25
  ignore_index=ignore_index,
25
26
  softcap=final_logit_softcapping,
27
+ accum_dtype=accum_dtype,
26
28
  )
27
29
  if reduction == "sum":
28
30
  loss = loss / num_items_in_batch
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.6.1.dev20250809233744
3
+ Version: 0.6.1.dev20250812205818
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -77,7 +77,7 @@ liger_kernel/transformers/model/glm4.py,sha256=GlnEhdGJuDIqp2R9qC54biY3HwV1tWmfp
77
77
  liger_kernel/transformers/model/llama.py,sha256=i8jJgyZsMKWQ-zKloETLugtwFpUOdaWxLDceciFXKd4,12832
78
78
  liger_kernel/transformers/model/llama4.py,sha256=IgbB8sTh3dlETQnaNNy1bZLuXy-Nt7qmeAjF27ydGpg,4210
79
79
  liger_kernel/transformers/model/llava.py,sha256=bLCioday_SOm69ogMDBhy_4UsVkH2-BSl93-EXY6-7I,15076
80
- liger_kernel/transformers/model/loss_utils.py,sha256=WWAMdiONPaXpIvxyOim_0igLrYh0yyOok5Q9_L9xvZw,1787
80
+ liger_kernel/transformers/model/loss_utils.py,sha256=YiYsmRHIuoRnFjGpwyIM18DCsrPPmO32YWMWqkEm1UQ,1867
81
81
  liger_kernel/transformers/model/mistral.py,sha256=syYNL8dLThX2-4uC13Lu0krEZ5zw3InviDUR3AJmc-I,5500
82
82
  liger_kernel/transformers/model/mixtral.py,sha256=VY-y73IyjcCyWyI7ahxXLw0fJrhgjYfr1xwRYtsHX0o,11396
83
83
  liger_kernel/transformers/model/mllama.py,sha256=my29NXk-p6ckQaP8qDIN8e318yI_9mQZHt38MV3SqLY,11280
@@ -94,9 +94,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
94
94
  liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
95
95
  liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
96
96
  liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
97
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
98
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/METADATA,sha256=nClPzQutLCx1b5T1KZGIsCPMTAaYbSw6PVkt9EJjhVw,24504
99
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
100
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
101
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
102
- liger_kernel_nightly-0.6.1.dev20250809233744.dist-info/RECORD,,
97
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
98
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/METADATA,sha256=1s-igyDBWH7I09Q1f-7-h5BtStzEN30M_ffGQk5ZE4M,24504
99
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
100
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
101
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
102
+ liger_kernel_nightly-0.6.1.dev20250812205818.dist-info/RECORD,,