liger-kernel-nightly 0.5.2.dev20241220220835__py3-none-any.whl → 0.5.2.dev20241220231758__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
@@ -36,8 +36,8 @@ class LigerFusedLinearCPOFunction(LigerFusedLinearPreferenceBase):
36
36
  """
37
37
  logits = beta * (chosen_logps - rejected_logps)
38
38
  loss = (
39
- F.logsigmoid(logits) * (1 - label_smoothing)
40
- + F.logsigmoid(-logits) * label_smoothing
39
+ - F.logsigmoid(logits) * (1 - label_smoothing)
40
+ - F.logsigmoid(-logits) * label_smoothing
41
41
  ).sum() / (full_target.shape[0] // 2)
42
42
 
43
43
  return loss
@@ -408,7 +408,7 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
408
408
  else:
409
409
  preference_loss, aux_outputs = preference_loss_outputs, []
410
410
 
411
- loss = alpha * chosen_nll_loss - preference_loss
411
+ loss = alpha * chosen_nll_loss + preference_loss
412
412
  return_vars = (
413
413
  chosen_logps,
414
414
  rejected_logps,
@@ -36,7 +36,7 @@ class LigerFusedLinearORPOFunction(LigerFusedLinearPreferenceBase):
36
36
  - torch.log1p(-torch.exp(rejected_logps))
37
37
  )
38
38
  ratio = F.logsigmoid(log_odds)
39
- loss = beta * ratio.sum() / (full_target.shape[0] // 2)
39
+ loss = -beta * ratio.sum() / (full_target.shape[0] // 2)
40
40
 
41
41
  chosen_rewards = beta * chosen_logps
42
42
  rejected_rewards = beta * rejected_logps
@@ -42,8 +42,8 @@ class LigerFusedLinearSimPOFunction(LigerFusedLinearPreferenceBase):
42
42
  """
43
43
  logits = beta * (chosen_logps - rejected_logps) - gamma
44
44
  loss = (
45
- F.logsigmoid(logits) * (1 - label_smoothing)
46
- + F.logsigmoid(-logits) * label_smoothing
45
+ - F.logsigmoid(logits) * (1 - label_smoothing)
46
+ - F.logsigmoid(-logits) * label_smoothing
47
47
  ).sum() / (full_target.shape[0] // 2)
48
48
 
49
49
  return loss
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.2.dev20241220220835
3
+ Version: 0.5.2.dev20241220231758
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -3,13 +3,13 @@ liger_kernel/env_report.py,sha256=ok9PMXtO-8uLj_feCJI4h9hz2NtolZ2AG_OJTW5qmo4,18
3
3
  liger_kernel/utils.py,sha256=HJa-xVKOohDn6pLVIx-Fv0V9h0QAL3qZGQNRICI-OpI,249
4
4
  liger_kernel/chunked_loss/README.md,sha256=K6rucm6nqHpWCmxUOhBYcE3apwQxAy0TfRUippR7Icw,2243
5
5
  liger_kernel/chunked_loss/__init__.py,sha256=R2wCcz4Y0kTAve926DH3k182XKezpXeACMHj05g9Mm8,346
6
- liger_kernel/chunked_loss/cpo_loss.py,sha256=_0phkDQg_SG239xNVlaAvGoL33myt0Zt6avDJfg6HC0,3552
6
+ liger_kernel/chunked_loss/cpo_loss.py,sha256=3PdSp1gju1u0ffFGpUufbZPIva8aI3SW1TfqkJOpw1g,3554
7
7
  liger_kernel/chunked_loss/dpo_loss.py,sha256=jbTno1pKEc-HxAGFY3NSycBzdWyTacyRCzH3FhrMUMo,4383
8
8
  liger_kernel/chunked_loss/functional.py,sha256=9Gr-YXIuEzEJkBUhDx3G2fuQayckLor7cC7svhmPML4,549
9
9
  liger_kernel/chunked_loss/fused_linear_distillation.py,sha256=2BH6DCPjsR2zS6zcwFPcIIZRhLF8SohjGdKsAJ_301o,10222
10
- liger_kernel/chunked_loss/fused_linear_preference.py,sha256=AsovMdfsOjgWVxtDhZ_rXqpahMsKTg8YueXnZcHt1XQ,16376
11
- liger_kernel/chunked_loss/orpo_loss.py,sha256=ZuKGjbkIYzV4UzvupNdq6vyxCp7-BztQkUt8ZnFvKos,3531
12
- liger_kernel/chunked_loss/simpo_loss.py,sha256=Lb7v-a1nmapiCZGxgoWtoLRBiSLI3arFJ-WstjTqIAs,3757
10
+ liger_kernel/chunked_loss/fused_linear_preference.py,sha256=vvratrj8rba8NaGbO2ffbUfWMVEvDMxDCo6SI8nCtbo,16376
11
+ liger_kernel/chunked_loss/orpo_loss.py,sha256=xHsKjlCWQVew7_hhpyUp3a1wd0tdpgx-zQAezNjk3Q4,3532
12
+ liger_kernel/chunked_loss/simpo_loss.py,sha256=_5gXIkEAT0Kt_AufziQlYhBjzDJVSQVk7oSDHcrw1xw,3759
13
13
  liger_kernel/ops/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
14
14
  liger_kernel/ops/cross_entropy.py,sha256=oG5hfrlmnlF5lOoZRhHRglObxgH4B0KadjWMJj9EWPM,15860
15
15
  liger_kernel/ops/fused_linear_cross_entropy.py,sha256=Tnw4gyAYVVdnCOqhOuLEzbUQ3goOTnoAfk3pqSIM5ac,9301
@@ -58,9 +58,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=c4OQVJmhNOloj0JYSEc0j_cQuBb
58
58
  liger_kernel/transformers/trainer/orpo_trainer.py,sha256=O2k2vdHl-O1S-U61aEmyUFu3QrEuNAipQa2oUBb3HAA,7679
59
59
  liger_kernel/triton/__init__.py,sha256=yfRe0zMb47QnqjecZWG7LnanfCTzeku7SgWRAwNVmzU,101
60
60
  liger_kernel/triton/monkey_patch.py,sha256=5BcGKTtdqeYchypBIBopGIWPx1-cFALz7sOKoEsqXJ0,1584
61
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
62
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/METADATA,sha256=TKTsG1OaMEqrbqun7C_JsCMT3Ui6ED2G0CPLnno79QA,21055
63
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
64
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
65
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
66
- liger_kernel_nightly-0.5.2.dev20241220220835.dist-info/RECORD,,
61
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
62
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/METADATA,sha256=o8KNSXeyS1E1vgQVqX7pZRdbzCXPDeG2iaGDZ2a2_mM,21055
63
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
64
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
65
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
66
+ liger_kernel_nightly-0.5.2.dev20241220231758.dist-info/RECORD,,