liger-kernel-nightly 0.5.8.dev20250416185644__tar.gz → 0.5.8.dev20250422210723__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/intel-ci.yml +24 -11
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/dpo_loss.py +8 -1
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/bf16/test_mini_models_multimodal.py +1 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/fp32/test_mini_models_multimodal.py +7 -4
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/Makefile +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/setup.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/gema3_rms.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/test/utils.py +0 -0
@@ -45,27 +45,40 @@ jobs:
|
|
45
45
|
run: make checkstyle
|
46
46
|
|
47
47
|
tests:
|
48
|
-
runs-on: linux-max1550-
|
48
|
+
runs-on: linux-max1550-pvc-8
|
49
49
|
needs: [checkstyle]
|
50
|
-
|
50
|
+
if: success()
|
51
|
+
container:
|
52
|
+
image: intel/oneapi-basekit:2025.0.1-0-devel-ubuntu24.04
|
53
|
+
options: --privileged -v /dev/dri/by-path:/dev/dri/by-path --device=/dev/dri --ipc=host
|
51
54
|
steps:
|
55
|
+
- name: Set up python
|
56
|
+
shell: bash
|
57
|
+
run: |
|
58
|
+
apt-get update && \
|
59
|
+
apt-get install -y python3.12-venv python3-pip && \
|
60
|
+
ln -sf /usr/bin/python3 /usr/bin/python && \
|
61
|
+
apt-get clean && rm -rf /var/lib/apt/lists/*
|
62
|
+
|
52
63
|
- name: Checkout code
|
53
64
|
uses: actions/checkout@v3
|
54
|
-
|
55
|
-
- name: Set up Python
|
56
|
-
uses: actions/setup-python@v3
|
57
|
-
with:
|
58
|
-
python-version: '3.10'
|
59
|
-
|
65
|
+
|
60
66
|
- name: Setup Dependencies
|
67
|
+
shell: bash
|
61
68
|
run: |
|
62
|
-
python -m
|
69
|
+
python -m venv test-env
|
70
|
+
. test-env/bin/activate
|
63
71
|
pip install -e .[dev] --extra-index-url https://download.pytorch.org/whl/test/xpu
|
64
|
-
|
72
|
+
|
65
73
|
- name: List Python Environments
|
66
|
-
|
74
|
+
shell: bash
|
75
|
+
run: |
|
76
|
+
. test-env/bin/activate
|
77
|
+
python -m pip list
|
67
78
|
|
68
79
|
- name: Run Unit Tests
|
80
|
+
shell: bash
|
69
81
|
run: |
|
82
|
+
. test-env/bin/activate
|
70
83
|
make test
|
71
84
|
make test-convergence
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.8.dev20250416185644"
|
7
|
+
version = "0.5.8.dev20250422210723"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -68,6 +68,7 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
|
|
68
68
|
compute_nll_loss=False,
|
69
69
|
compiled=True,
|
70
70
|
use_ref_model=True,
|
71
|
+
average_log_prob=False,
|
71
72
|
chunk_size=1,
|
72
73
|
):
|
73
74
|
"""
|
@@ -85,6 +86,7 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
|
|
85
86
|
compute_nll_loss (bool): Whether to compute the NLL loss
|
86
87
|
compiled (bool): Whether to use torch compile
|
87
88
|
use_ref_model (bool): Whether to use a reference model
|
89
|
+
average_log_prob (bool): Whether to average the log probability per non-masked token
|
88
90
|
chunk_size (int): Size of chunks for processing.
|
89
91
|
Returns:
|
90
92
|
torch.Tensor: Computed loss
|
@@ -104,13 +106,14 @@ class LigerFusedLinearDPOFunction(LigerFusedLinearPreferenceBase):
|
|
104
106
|
ref_input=ref_input,
|
105
107
|
ref_weight=ref_weight,
|
106
108
|
ref_bias=ref_bias,
|
109
|
+
average_log_prob=average_log_prob,
|
107
110
|
chunk_size=chunk_size,
|
108
111
|
)
|
109
112
|
|
110
113
|
@staticmethod
|
111
114
|
def backward(ctx, *grad_output):
|
112
115
|
grads = LigerFusedLinearPreferenceBase.backward(ctx, grad_output)[:4]
|
113
|
-
return *grads, None, None, None, None, None, None, None, None, None
|
116
|
+
return *grads, None, None, None, None, None, None, None, None, None, None
|
114
117
|
|
115
118
|
|
116
119
|
class LigerFusedLinearDPOLoss(torch.nn.Module):
|
@@ -125,6 +128,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
125
128
|
compute_nll_loss: bool = False,
|
126
129
|
compiled: bool = True,
|
127
130
|
use_ref_model: bool = True,
|
131
|
+
average_log_prob: bool = True,
|
128
132
|
chunk_size: int = 1,
|
129
133
|
):
|
130
134
|
"""
|
@@ -134,6 +138,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
134
138
|
compute_nll_loss (bool): Whether to compute the NLL loss.
|
135
139
|
compiled (bool): Whether to use the torch compiled kernel.
|
136
140
|
use_ref_model (bool): Whether to use a reference model for the DPO loss.
|
141
|
+
average_log_prob (bool): Whether to average the log probability per non-masked token.
|
137
142
|
chunk_size (int): Size of chunks for processing.
|
138
143
|
"""
|
139
144
|
super().__init__()
|
@@ -142,6 +147,7 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
142
147
|
self.compute_nll_loss = compute_nll_loss
|
143
148
|
self.compiled = compiled
|
144
149
|
self.use_ref_model = use_ref_model
|
150
|
+
self.average_log_prob = average_log_prob
|
145
151
|
self.chunk_size = chunk_size
|
146
152
|
|
147
153
|
def forward(
|
@@ -167,5 +173,6 @@ class LigerFusedLinearDPOLoss(torch.nn.Module):
|
|
167
173
|
self.compute_nll_loss,
|
168
174
|
self.compiled,
|
169
175
|
self.use_ref_model,
|
176
|
+
self.average_log_prob,
|
170
177
|
self.chunk_size,
|
171
178
|
)
|
@@ -862,10 +862,13 @@ def run_mini_model_multimodal(
|
|
862
862
|
1e-5,
|
863
863
|
5e-3,
|
864
864
|
1e-5,
|
865
|
-
marks=
|
866
|
-
|
867
|
-
|
868
|
-
|
865
|
+
marks=[
|
866
|
+
pytest.mark.skipif(
|
867
|
+
not GEMMA3_AVAILABLE,
|
868
|
+
reason="Gemma3 not available in this version of transformers",
|
869
|
+
),
|
870
|
+
pytest.mark.skipif(device == "xpu", reason="skip for XPU"),
|
871
|
+
],
|
869
872
|
),
|
870
873
|
],
|
871
874
|
)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.5.8.dev20250416185644 → liger_kernel_nightly-0.5.8.dev20250422210723}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|