liger-kernel-nightly 0.5.2.dev20250130172806__py3-none-any.whl → 0.5.2.dev20250130213846__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- liger_kernel/chunked_loss/dpo_loss.py +5 -2
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/METADATA +1 -1
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/RECORD +7 -7
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/WHEEL +0 -0
- {liger_kernel_nightly-0.5.2.dev20250130172806.dist-info → liger_kernel_nightly-0.5.2.dev20250130213846.dist-info}/top_level.txt +0 -0
@@ -45,9 +45,12 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
|
|
45
45
|
chosen_logratios = chosen_logps - ref_chosen_logps
|
46
46
|
rejected_logratios = rejected_logps - ref_rejected_logps
|
47
47
|
|
48
|
+
chosen_rewards = beta * (chosen_logps - ref_chosen_logps)
|
49
|
+
rejected_rewards = beta * (rejected_logps - ref_rejected_logps)
|
50
|
+
|
48
51
|
logits_diff = beta * (chosen_logratios - rejected_logratios)
|
49
52
|
loss = -F.logsigmoid(logits_diff).sum() / (full_target.shape[0] // 2)
|
50
|
-
return loss
|
53
|
+
return loss, chosen_rewards, rejected_rewards
|
51
54
|
|
52
55
|
@staticmethod
|
53
56
|
def forward(
|
@@ -99,7 +102,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
99
102
|
beta: float = 0.1,
|
100
103
|
compute_nll_loss: bool = False,
|
101
104
|
compiled: bool = True,
|
102
|
-
use_ref_model: bool = False,
|
105
|
+
use_ref_model: bool = True,
|
103
106
|
):
|
104
107
|
"""
|
105
108
|
Args:
|
@@ -4,7 +4,7 @@ liger_kernel/utils.py,sha256=HJa-xVKOohDn6pLVIx-Fv0V9h0QAL3qZGQNRICI-OpI,249
|
|
4
4
|
liger_kernel/chunked_loss/README.md,sha256=0FmkFC3hKBqyoDT5uTlIYmrvRkF-EOCR1y-EBU1LpWU,2248
|
5
5
|
liger_kernel/chunked_loss/__init__.py,sha256=48m-8IMOAReZbi0HK5aV-KGBp2IsZSwFvdnzTNrS4bk,516
|
6
6
|
liger_kernel/chunked_loss/cpo_loss.py,sha256=OdBR8WYdHTKpLI_c9DcuwqKSWPeAAeTyREz46Vu_cAY,3682
|
7
|
-
liger_kernel/chunked_loss/dpo_loss.py,sha256=
|
7
|
+
liger_kernel/chunked_loss/dpo_loss.py,sha256=enFVgqIvWWOamOV3cl_dbq2HsjX7PF2d0kibDNyuCW4,4545
|
8
8
|
liger_kernel/chunked_loss/functional.py,sha256=THWWpCnRVhTVfnPnyvQjdBvo1JDtxhwLmtZE_yiBBqM,817
|
9
9
|
liger_kernel/chunked_loss/fused_linear_distillation.py,sha256=5V8rdva89WyHVbmJ8JOmC4DYNOR6ByXfx3qlUieOZkI,11002
|
10
10
|
liger_kernel/chunked_loss/fused_linear_preference.py,sha256=idK9V9NivoVITqVpiG0fEGUHSvinYWkn9-EYXZjR-KQ,18356
|
@@ -61,9 +61,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
|
|
61
61
|
liger_kernel/transformers/trainer/orpo_trainer.py,sha256=pdekW7l6Qg_aqa5SYKYlSWUF8m3lkOFvFLcIMEHrz9s,8338
|
62
62
|
liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
|
63
63
|
liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
|
64
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
65
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/METADATA,sha256=
|
66
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
67
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
68
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
69
|
-
liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/RECORD,,
|
64
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
65
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/METADATA,sha256=piBJYHmJpYyIojWrErmhbQnpy29ILTI03ttIe1ekUZU,21205
|
66
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
67
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
|
68
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
69
|
+
liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|