liger-kernel-nightly 0.6.0.dev20250722224228__tar.gz → 0.6.0.dev20250722231330__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/benchmark.yml +15 -6
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/layer_norm.py +1 -2
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/Makefile +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/setup.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/test/utils.py +0 -0
@@ -1,6 +1,8 @@
|
|
1
1
|
name: Benchmarks
|
2
2
|
|
3
3
|
on:
|
4
|
+
release:
|
5
|
+
types: [published]
|
4
6
|
schedule:
|
5
7
|
# Runs at 00:00 UTC every Friday
|
6
8
|
- cron: '0 0 * * 5'
|
@@ -69,10 +71,8 @@ jobs:
|
|
69
71
|
|
70
72
|
# Save benchmark folder from main
|
71
73
|
cp -r benchmark /tmp/benchmark_main
|
72
|
-
|
73
74
|
# Checkout back to target commit
|
74
75
|
git checkout $ORIG_COMMIT
|
75
|
-
|
76
76
|
# Replace old benchmark with one from main
|
77
77
|
rm -rf benchmark
|
78
78
|
cp -r /tmp/benchmark_main benchmark
|
@@ -124,8 +124,17 @@ jobs:
|
|
124
124
|
|
125
125
|
# Step 6: Copy benchmark CSV to gh-pages directory
|
126
126
|
- name: Copy generated benchmark to gh-pages
|
127
|
+
id: copy_benchmark
|
127
128
|
run: |
|
128
|
-
|
129
|
+
if [[ "${{ github.event_name }}" == "release" ]]; then
|
130
|
+
echo "Release event detected"
|
131
|
+
path=${{steps.choose_commit.outputs.hash}}-${{ github.event.release.tag_name }}
|
132
|
+
else
|
133
|
+
echo "Not a release event"
|
134
|
+
path=${{steps.choose_commit.outputs.hash}}
|
135
|
+
fi
|
136
|
+
COMMIT_DIR="gh-pages/${OUTPUT_DIR}/${path}"
|
137
|
+
|
129
138
|
mkdir -p "$COMMIT_DIR"
|
130
139
|
|
131
140
|
if [ -f "$COMMIT_DIR/${OUTPUT_FILENAME}" ]; then
|
@@ -144,7 +153,8 @@ jobs:
|
|
144
153
|
mkdir -p ${OUTPUT_DIR}
|
145
154
|
touch ${OUTPUT_DIR}/commits.txt
|
146
155
|
|
147
|
-
echo "${{ steps.
|
156
|
+
echo "${{ steps.copy_benchmark.outputs.path }}" >> ${OUTPUT_DIR}/commits.txt
|
157
|
+
|
148
158
|
echo "Added commit hash to commits.txt"
|
149
159
|
# Step 7: Commit and push
|
150
160
|
- name: Commit and push to gh-pages
|
@@ -153,6 +163,5 @@ jobs:
|
|
153
163
|
git config user.name github-actions[bot]
|
154
164
|
git config user.email 41898282+github-actions[bot]@users.noreply.github.com
|
155
165
|
git add .
|
156
|
-
git commit -m "Add benchmark for commit ${{ steps.
|
166
|
+
git commit -m "Add benchmark for commit ${{ steps.copy_benchmark.outputs.path }}" || echo "No changes to commit"
|
157
167
|
git push origin gh-pages
|
158
|
-
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.0.
|
7
|
+
version = "0.6.0.dev20250722231330"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -256,8 +256,8 @@ def layer_norm_backward(dY, X, W, B, Mean, RSTD):
|
|
256
256
|
# Use float32 for atomic operations if bfloat16 is not supported
|
257
257
|
atomic_dtype = tl.float32 if triton_dtype == tl.bfloat16 else triton_dtype
|
258
258
|
|
259
|
+
kernel_args = {"num_warps": num_warps}
|
259
260
|
# XPU-specific optimization
|
260
|
-
kernel_args = {}
|
261
261
|
if X.device.type == "xpu":
|
262
262
|
kernel_args.update({"grf_mode": "large", "num_warps": 32, "num_stages": 4})
|
263
263
|
|
@@ -279,7 +279,6 @@ def layer_norm_backward(dY, X, W, B, Mean, RSTD):
|
|
279
279
|
BLOCK_SIZE=BLOCK_SIZE,
|
280
280
|
dtype=triton_dtype,
|
281
281
|
atomic_dtype=atomic_dtype,
|
282
|
-
num_warps=num_warps,
|
283
282
|
**kernel_args,
|
284
283
|
)
|
285
284
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.0.dev20250722224228 → liger_kernel_nightly-0.6.0.dev20250722231330}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|