liger-kernel-nightly 0.5.2.dev20250130172806__py3-none-any.whl → 0.5.2.dev20250203052716__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- liger_kernel/chunked_loss/dpo_loss.py +5 -2
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/METADATA +2 -1
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/RECORD +7 -7
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/WHEEL +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250203052716.dist-info}/top_level.txt +0 -0
@@ -45,9 +45,12 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
|
|
45
45
|
chosen_logratios = chosen_logps - ref_chosen_logps
|
46
46
|
rejected_logratios = rejected_logps - ref_rejected_logps
|
47
47
|
|
48
|
+
chosen_rewards = beta * (chosen_logps - ref_chosen_logps)
|
49
|
+
rejected_rewards = beta * (rejected_logps - ref_rejected_logps)
|
50
|
+
|
48
51
|
logits_diff = beta * (chosen_logratios - rejected_logratios)
|
49
52
|
loss = -F.logsigmoid(logits_diff).sum() / (full_target.shape[0] // 2)
|
50
|
-
return loss
|
53
|
+
return loss, chosen_rewards, rejected_rewards
|
51
54
|
|
52
55
|
@staticmethod
|
53
56
|
def forward(
|
@@ -99,7 +102,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
99
102
|
beta: float = 0.1,
|
100
103
|
compute_nll_loss: bool = False,
|
101
104
|
compiled: bool = True,
|
102
|
-
use_ref_model: bool = False,
|
105
|
+
use_ref_model: bool = True,
|
103
106
|
):
|
104
107
|
"""
|
105
108
|
Args:
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.5.2.dev20250130172806
|
3
|
+
Version: 0.5.2.dev20250203052716
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -356,6 +356,7 @@ loss.backward()
|
|
356
356
|
|
357
357
|
## Sponsorship and Collaboration
|
358
358
|
|
359
|
+
- [Glows.ai](https://platform.glows.ai/): Sponsoring NVIDIA GPUs for our open source developers.
|
359
360
|
- [AMD](https://www.amd.com/en.html): Providing AMD GPUs for our AMD CI.
|
360
361
|
- [Intel](https://www.intel.com/): Providing Intel GPUs for our Intel CI.
|
361
362
|
- [Modal](https://modal.com/): Free 3000 credits from GPU MODE IRL for our NVIDIA CI.
|
@@ -4,7 +4,7 @@ liger_kernel/utils.py,sha256=HJa-xVKOohDn6pLVIx-Fv0V9h0QAL3qZGQNRICI-OpI,249
|
|
4
4
|
liger_kernel/chunked_loss/README.md,sha256=0FmkFC3hKBqyoDT5uTlIYmrvRkF-EOCR1y-EBU1LpWU,2248
|
5
5
|
liger_kernel/chunked_loss/__init__.py,sha256=48m-8IMOAReZbi0HK5aV-KGBp2IsZSwFvdnzTNrS4bk,516
|
6
6
|
liger_kernel/chunked_loss/cpo_loss.py,sha256=OdBR8WYdHTKpLI_c9DcuwqKSWPeAAeTyREz46Vu_cAY,3682
|
7
|
-
liger_kernel/chunked_loss/dpo_loss.py,sha256=
|
7
|
+
liger_kernel/chunked_loss/dpo_loss.py,sha256=enFVgqIvWWOamOV3cl_dbq2HsjX7PF2d0kibDNyuCW4,4545
|
8
8
|
liger_kernel/chunked_loss/functional.py,sha256=THWWpCnRVhTVfnPnyvQjdBvo1JDtxhwLmtZE_yiBBqM,817
|
9
9
|
liger_kernel/chunked_loss/fused_linear_distillation.py,sha256=5V8rdva89WyHVbmJ8JOmC4DYNOR6ByXfx3qlUieOZkI,11002
|
10
10
|
liger_kernel/chunked_loss/fused_linear_preference.py,sha256=idK9V9NivoVITqVpiG0fEGUHSvinYWkn9-EYXZjR-KQ,18356
|
@@ -61,9 +61,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
|
|
61
61
|
liger_kernel/transformers/trainer/orpo_trainer.py,sha256=pdekW7l6Qg_aqa5SYKYlSWUF8m3lkOFvFLcIMEHrz9s,8338
|
62
62
|
liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
|
63
63
|
liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
|
64
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
65
|
-
liger_kernel_nightly-0.5.2.
|
66
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
67
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
68
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
69
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/RECORD,,
|
64
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
65
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/METADATA,sha256=7P3fadHkpsB_m9i4oZAC5lpO_3U_k3gQ39BX6qPSY04,21302
|
66
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
67
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
68
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
69
|
+
liger_kernel_nightly-0.5.2.dev20250203052716.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|