liger-kernel-nightly 0.5.2.dev20250130172806__py3-none-any.whl → 0.5.2.dev20250130213846__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
@@ -45,9 +45,12 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
45
45
  chosen_logratios = chosen_logps - ref_chosen_logps
46
46
  rejected_logratios = rejected_logps - ref_rejected_logps
47
47
 
48
+ chosen_rewards = beta * (chosen_logps - ref_chosen_logps)
49
+ rejected_rewards = beta * (rejected_logps - ref_rejected_logps)
50
+
48
51
  logits_diff = beta * (chosen_logratios - rejected_logratios)
49
52
  loss = -F.logsigmoid(logits_diff).sum() / (full_target.shape[0] // 2)
50
- return loss
53
+ return loss, chosen_rewards, rejected_rewards
51
54
 
52
55
  @staticmethod
53
56
  def forward(
@@ -99,7 +102,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
99
102
  beta: float = 0.1,
100
103
  compute_nll_loss: bool = False,
101
104
  compiled: bool = True,
102
- use_ref_model: bool = False,
105
+ use_ref_model: bool = True,
103
106
  ):
104
107
  """
105
108
  Args:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.2.dev20250130172806
3
+ Version: 0.5.2.dev20250130213846
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -4,7 +4,7 @@ liger_kernel/utils.py,sha256=HJa-xVKOohDn6pLVIx-Fv0V9h0QAL3qZGQNRICI-OpI,249
4
4
  liger_kernel/chunked_loss/README.md,sha256=0FmkFC3hKBqyoDT5uTlIYmrvRkF-EOCR1y-EBU1LpWU,2248
5
5
  liger_kernel/chunked_loss/__init__.py,sha256=48m-8IMOAReZbi0HK5aV-KGBp2IsZSwFvdnzTNrS4bk,516
6
6
  liger_kernel/chunked_loss/cpo_loss.py,sha256=OdBR8WYdHTKpLI_c9DcuwqKSWPeAAeTyREz46Vu_cAY,3682
7
- liger_kernel/chunked_loss/dpo_loss.py,sha256=VYZMOafdvE8xlhvTtwjrz81tIzxR1mHF4lXdsADnIQg,4373
7
+ liger_kernel/chunked_loss/dpo_loss.py,sha256=enFVgqIvWWOamOV3cl_dbq2HsjX7PF2d0kibDNyuCW4,4545
8
8
  liger_kernel/chunked_loss/functional.py,sha256=THWWpCnRVhTVfnPnyvQjdBvo1JDtxhwLmtZE_yiBBqM,817
9
9
  liger_kernel/chunked_loss/fused_linear_distillation.py,sha256=5V8rdva89WyHVbmJ8JOmC4DYNOR6ByXfx3qlUieOZkI,11002
10
10
  liger_kernel/chunked_loss/fused_linear_preference.py,sha256=idK9V9NivoVITqVpiG0fEGUHSvinYWkn9-EYXZjR-KQ,18356
@@ -61,9 +61,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
61
61
  liger_kernel/transformers/trainer/orpo_trainer.py,sha256=pdekW7l6Qg_aqa5SYKYlSWUF8m3lkOFvFLcIMEHrz9s,8338
62
62
  liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
63
63
  liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
64
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
65
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/METADATA,sha256=LCLD7LcN4x7h1_LMuYPAtIUrhHGi2eoON-NOBtofCN0,21205
66
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
67
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
68
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
69
- liger_kernel_nightly-0.5.2.dev20250130172806.dist-info/RECORD,,
64
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
65
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/METADATA,sha256=piBJYHmJpYyIojWrErmhbQnpy29ILTI03ttIe1ekUZU,21205
66
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
67
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
68
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
69
+ liger_kernel_nightly-0.5.2.dev20250130213846.dist-info/RECORD,,