liger-kernel-nightly 0.5.2.dev20241211213024__tar.gz → 0.5.2.dev20241211231633__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.2.dev20241211213024/src/liger_kernel_nightly.egg-info → liger_kernel_nightly-0.5.2.dev20241211231633}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/fused_linear_preference.py +2 -6
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633/src/liger_kernel_nightly.egg-info}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/README.md +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.2.dev20241211213024"
|
7
|
+
version = "0.5.2.dev20241211231633"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -29,7 +29,7 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
29
29
|
compute_nll_loss=True,
|
30
30
|
compiled=True,
|
31
31
|
use_ref_model=False,
|
32
|
-
ref_input=None,
|
32
|
+
# TODO: ref input
|
33
33
|
ref_weight=None,
|
34
34
|
ref_bias=None,
|
35
35
|
**loss_kwargs,
|
@@ -59,7 +59,6 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
59
59
|
compute_nll_loss (bool): Whether to compute NLL loss.
|
60
60
|
compiled (bool): Whether to use torch compile for chunk accumulation.
|
61
61
|
use_ref_model (bool): Whether to use a reference model for the alignment loss.
|
62
|
-
ref_input (torch.Tensor): Reference input tensor. Shape: (batch_size, seq_len, hidden_size).
|
63
62
|
ref_weight (torch.Tensor): Reference weight tensor. Shape: (vocab_size, hidden_size).
|
64
63
|
ref_bias (torch.Tensor, optional): Reference bias tensor. Shape: (vocab_size,).
|
65
64
|
loss_kwargs (dict): Other possible arguments that a loss function might need
|
@@ -93,7 +92,6 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
93
92
|
compute_nll_loss=compute_nll_loss,
|
94
93
|
full_target=target,
|
95
94
|
use_ref_model=use_ref_model,
|
96
|
-
ref_input=ref_input,
|
97
95
|
ref_weight=ref_weight,
|
98
96
|
ref_bias=ref_bias,
|
99
97
|
**loss_kwargs,
|
@@ -303,7 +301,6 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
303
301
|
beta=0.1,
|
304
302
|
compute_nll_loss=True,
|
305
303
|
use_ref_model=False,
|
306
|
-
ref_input=None,
|
307
304
|
ref_weight=None,
|
308
305
|
ref_bias=None,
|
309
306
|
**loss_kwargs,
|
@@ -322,7 +319,6 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
322
319
|
beta (float): Weight for the preference loss.
|
323
320
|
compute_nll_loss (bool): Whether to compute NLL loss.
|
324
321
|
use_ref_model (bool): Whether to use a reference model for the alignment loss.
|
325
|
-
ref_input (torch.Tensor): Reference input tensor. Shape: (2 * chunk_size, sequence_length, hidden_size).
|
326
322
|
ref_weight (torch.Tensor): Reference weight tensor. Shape: (vocab_size, hidden_size).
|
327
323
|
ref_bias (torch.Tensor, optional): Reference bias tensor. Shape: (vocab_size,).
|
328
324
|
loss_kwargs (dict): Additional arguments for the loss function.
|
@@ -361,7 +357,7 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
361
357
|
ref_rejected_logits,
|
362
358
|
ref_chosen_nll_loss,
|
363
359
|
) = LigerFusedLinearPreferenceBase.chunk_forward(
|
364
|
-
|
360
|
+
input_chunk,
|
365
361
|
ref_weight,
|
366
362
|
target_chunk,
|
367
363
|
ref_bias,
|
File without changes
|
{liger_kernel_nightly-0.5.2.dev20241211213024 → liger_kernel_nightly-0.5.2.dev20241211231633}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|