liger-kernel-nightly 0.6.0.dev20250716142659__tar.gz → 0.6.0.dev20250718050347__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- liger_kernel_nightly-0.6.0.dev20250718050347/.github/workflows/benchmark.yml +158 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_embedding.py +8 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/dev/modal/benchmarks.py +1 -1
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- liger_kernel_nightly-0.6.0.dev20250716142659/.github/workflows/benchmark.yml +0 -93
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/Makefile +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/setup.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/test/utils.py +0 -0
@@ -0,0 +1,158 @@
|
|
1
|
+
name: Benchmarks
|
2
|
+
|
3
|
+
on:
|
4
|
+
schedule:
|
5
|
+
# Runs at 00:00 UTC every Friday
|
6
|
+
- cron: '0 0 * * 5'
|
7
|
+
workflow_dispatch: # Enables manual trigger
|
8
|
+
inputs:
|
9
|
+
commit_hash:
|
10
|
+
description: 'Commit hash to benchmark'
|
11
|
+
default: 'main'
|
12
|
+
overwrite:
|
13
|
+
description: 'Overwrite existing benchmark data if it exists'
|
14
|
+
type: boolean
|
15
|
+
default: false
|
16
|
+
|
17
|
+
permissions:
|
18
|
+
contents: write
|
19
|
+
|
20
|
+
concurrency:
|
21
|
+
# Cancel any previous in-progress run of this workflow on the same PR / branch.
|
22
|
+
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
|
23
|
+
cancel-in-progress: true
|
24
|
+
|
25
|
+
jobs:
|
26
|
+
benchmarks:
|
27
|
+
runs-on: ubuntu-latest
|
28
|
+
env:
|
29
|
+
MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
|
30
|
+
MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
|
31
|
+
GITHUB_USERNAME: linkedin
|
32
|
+
REPO_NAME: Liger-Kernel
|
33
|
+
OUTPUT_DIR: benchmarks
|
34
|
+
OUTPUT_FILENAME: benchmark.csv
|
35
|
+
GENERATED_CSV: benchmark/data/all_benchmark_data.csv
|
36
|
+
|
37
|
+
|
38
|
+
steps:
|
39
|
+
# Step: Decide the commit hash to use
|
40
|
+
- name: Determine commit hash to checkout
|
41
|
+
id: choose_commit
|
42
|
+
run: |
|
43
|
+
if [ "${{ github.event.inputs.commit_hash }}" != "" ]; then
|
44
|
+
echo "Using manual input commit: ${{ github.event.inputs.commit_hash }}"
|
45
|
+
echo "hash=${{ github.event.inputs.commit_hash }}" >> $GITHUB_OUTPUT
|
46
|
+
else
|
47
|
+
echo "Using latest commit from main"
|
48
|
+
git fetch origin main
|
49
|
+
echo "hash=$(git rev-parse origin/main)" >> $GITHUB_OUTPUT
|
50
|
+
fi
|
51
|
+
|
52
|
+
# Step: Checkout full history so we can check out any commit
|
53
|
+
- name: Checkout full repo history
|
54
|
+
uses: actions/checkout@v3
|
55
|
+
with:
|
56
|
+
fetch-depth: 0 # Important: so we can checkout arbitrary commit
|
57
|
+
# Step: Conditionally replace benchmark folder from main
|
58
|
+
- name: Replace benchmark folder from main (manual only, commit ≠ main)
|
59
|
+
if: ${{ github.event_name == 'workflow_dispatch' && github.event.inputs.commit_hash != 'main' }}
|
60
|
+
run: |
|
61
|
+
echo "Detected manual trigger with commit_hash = ${{ github.event.inputs.commit_hash }}"
|
62
|
+
|
63
|
+
# Record the target commit (from the manual input) to return to afterwards
|
64
|
+
ORIG_COMMIT=${{ github.event.inputs.commit_hash }}
|
65
|
+
|
66
|
+
# Fetch main and check out only its benchmark/ directory
|
67
|
+
git fetch origin main
|
68
|
+
git checkout origin/main -- benchmark/
|
69
|
+
|
70
|
+
# Save benchmark folder from main
|
71
|
+
cp -r benchmark /tmp/benchmark_main
|
72
|
+
|
73
|
+
# Checkout back to target commit
|
74
|
+
git checkout $ORIG_COMMIT
|
75
|
+
|
76
|
+
# Replace old benchmark with one from main
|
77
|
+
rm -rf benchmark
|
78
|
+
cp -r /tmp/benchmark_main benchmark
|
79
|
+
|
80
|
+
# Step: Check if benchmark exists and exit if overwrite is false
|
81
|
+
- name: Check existing benchmark
|
82
|
+
run: |
|
83
|
+
COMMIT_HASH="${{ steps.choose_commit.outputs.hash }}"
|
84
|
+
BENCHMARK_URL="https://raw.githubusercontent.com/linkedin/Liger-Kernel/refs/heads/gh-pages/benchmarks/${COMMIT_HASH}/benchmark.csv"
|
85
|
+
|
86
|
+
if curl --output /dev/null --silent --head --fail "$BENCHMARK_URL"; then
|
87
|
+
echo "Benchmark already exists for commit $COMMIT_HASH"
|
88
|
+
if [ "${{ github.event.inputs.overwrite }}" != "true" ]; then
|
89
|
+
echo "Overwrite is false - exiting"
|
90
|
+
exit 1
|
91
|
+
else
|
92
|
+
echo "Overwrite is true - proceeding"
|
93
|
+
fi
|
94
|
+
else
|
95
|
+
echo "No existing benchmark found - proceeding"
|
96
|
+
fi
|
97
|
+
|
98
|
+
- name: Set up Python
|
99
|
+
uses: actions/setup-python@v3
|
100
|
+
with:
|
101
|
+
python-version: '3.10'
|
102
|
+
|
103
|
+
# Install dependencies
|
104
|
+
- name: Install dependencies
|
105
|
+
run: |
|
106
|
+
python -m pip install --upgrade pip
|
107
|
+
pip install modal
|
108
|
+
|
109
|
+
# Delete previous benchmark results.
|
110
|
+
- name: Remove previous benchmark data
|
111
|
+
run: |
|
112
|
+
rm -f benchmark/data/all_benchmark_data.csv
|
113
|
+
|
114
|
+
- name: Run benchmarks on GPU
|
115
|
+
run: |
|
116
|
+
modal run dev.modal.benchmarks
|
117
|
+
|
118
|
+
# Step 5: Checkout gh-pages branch in a subfolder
|
119
|
+
- name: Checkout gh-pages
|
120
|
+
uses: actions/checkout@v3
|
121
|
+
with:
|
122
|
+
ref: gh-pages
|
123
|
+
path: gh-pages
|
124
|
+
|
125
|
+
# Step 6: Copy benchmark CSV to gh-pages directory
|
126
|
+
- name: Copy generated benchmark to gh-pages
|
127
|
+
run: |
|
128
|
+
COMMIT_DIR="gh-pages/${OUTPUT_DIR}/${{ steps.choose_commit.outputs.hash }}"
|
129
|
+
mkdir -p "$COMMIT_DIR"
|
130
|
+
|
131
|
+
if [ -f "$COMMIT_DIR/${OUTPUT_FILENAME}" ]; then
|
132
|
+
echo "Removing existing benchmark.csv for this commit"
|
133
|
+
rm "$COMMIT_DIR/${OUTPUT_FILENAME}"
|
134
|
+
fi
|
135
|
+
|
136
|
+
cp "${GENERATED_CSV}" "$COMMIT_DIR/${OUTPUT_FILENAME}"
|
137
|
+
|
138
|
+
# Step 7: Append commit hash to commits.txt (appended unconditionally; duplicates are not filtered)
|
139
|
+
- name: Update commits.txt
|
140
|
+
run: |
|
141
|
+
cd gh-pages
|
142
|
+
echo "commits.txt file path: ${OUTPUT_DIR}/commits.txt"
|
143
|
+
# Create file if it doesn't exist
|
144
|
+
mkdir -p ${OUTPUT_DIR}
|
145
|
+
touch ${OUTPUT_DIR}/commits.txt
|
146
|
+
|
147
|
+
echo "${{ steps.choose_commit.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
|
148
|
+
echo "Added commit hash to commits.txt"
|
149
|
+
# Step 8: Commit and push
|
150
|
+
- name: Commit and push to gh-pages
|
151
|
+
run: |
|
152
|
+
cd gh-pages
|
153
|
+
git config user.name github-actions[bot]
|
154
|
+
git config user.email 41898282+github-actions[bot]@users.noreply.github.com
|
155
|
+
git add .
|
156
|
+
git commit -m "Add benchmark for commit ${{ steps.choose_commit.outputs.hash }}" || echo "No changes to commit"
|
157
|
+
git push origin gh-pages
|
158
|
+
|
@@ -48,6 +48,14 @@ def bench_speed_embedding(input: SingleBenchmarkRunInput) -> SingleBenchmarkRunO
|
|
48
48
|
|
49
49
|
if mode == "forward":
|
50
50
|
ms_50, ms_20, ms_80 = triton.testing.do_bench(fwd, quantiles=QUANTILES, rep=100)
|
51
|
+
elif mode == "backward":
|
52
|
+
output = fwd()
|
53
|
+
ms_50, ms_20, ms_80 = triton.testing.do_bench(
|
54
|
+
lambda: output.backward(torch.randn_like(output), retain_graph=True),
|
55
|
+
quantiles=QUANTILES,
|
56
|
+
grad_to_none=[input_ids],
|
57
|
+
rep=100,
|
58
|
+
)
|
51
59
|
elif mode == "full":
|
52
60
|
ms_50, ms_20, ms_80 = triton.testing.do_bench(full, quantiles=QUANTILES, rep=100)
|
53
61
|
return SingleBenchmarkRunOutput(
|
@@ -14,7 +14,7 @@ app = modal.App("liger_benchmarks", image=image)
|
|
14
14
|
repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
|
15
15
|
|
16
16
|
|
17
|
-
@app.function(gpu=
|
17
|
+
@app.function(gpu="H100!", image=repo, timeout=60 * 90)
|
18
18
|
def liger_benchmarks():
|
19
19
|
import os
|
20
20
|
import subprocess
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.0.dev20250716142659"
|
7
|
+
version = "0.6.0.dev20250718050347"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -1,93 +0,0 @@
|
|
1
|
-
name: Benchmarks
|
2
|
-
|
3
|
-
on:
|
4
|
-
schedule:
|
5
|
-
# Runs at 00:00 UTC every Friday
|
6
|
-
- cron: '0 0 * * 5'
|
7
|
-
workflow_dispatch: # Enables manual trigger
|
8
|
-
|
9
|
-
permissions:
|
10
|
-
contents: write
|
11
|
-
|
12
|
-
concurrency:
|
13
|
-
# This causes it to cancel previous in-progress actions on the same PR / branch,
|
14
|
-
group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
|
15
|
-
cancel-in-progress: true
|
16
|
-
|
17
|
-
jobs:
|
18
|
-
benchmarks:
|
19
|
-
runs-on: ubuntu-latest
|
20
|
-
env:
|
21
|
-
MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
|
22
|
-
MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
|
23
|
-
GITHUB_USERNAME: linkedin
|
24
|
-
REPO_NAME: Liger-Kernel
|
25
|
-
OUTPUT_DIR: benchmarks
|
26
|
-
OUTPUT_FILENAME: benchmark.csv
|
27
|
-
GENERATED_CSV: benchmark/data/all_benchmark_data.csv
|
28
|
-
|
29
|
-
|
30
|
-
steps:
|
31
|
-
- name: Checkout code
|
32
|
-
uses: actions/checkout@v3
|
33
|
-
|
34
|
-
# Get the latest commit hash from main branch
|
35
|
-
- name: Get commit hash
|
36
|
-
id: get_hash
|
37
|
-
run: echo "hash=$(git rev-parse --short HEAD)" >> $GITHUB_OUTPUT
|
38
|
-
|
39
|
-
- name: Set up Python
|
40
|
-
uses: actions/setup-python@v3
|
41
|
-
with:
|
42
|
-
python-version: '3.10'
|
43
|
-
|
44
|
-
# Install dependencies
|
45
|
-
- name: Install dependencies
|
46
|
-
run: |
|
47
|
-
python -m pip install --upgrade pip
|
48
|
-
pip install modal
|
49
|
-
pip install pandas
|
50
|
-
|
51
|
-
# Delete previous benchmark results.
|
52
|
-
- name: Remove previous benchmark data
|
53
|
-
run: |
|
54
|
-
rm -f benchmark/data/all_benchmark_data.csv
|
55
|
-
|
56
|
-
- name: Run benchmarks on GPU
|
57
|
-
run: |
|
58
|
-
modal run dev.modal.benchmarks
|
59
|
-
|
60
|
-
# Step 5: Checkout gh-pages branch in a subfolder
|
61
|
-
- name: Checkout gh-pages
|
62
|
-
uses: actions/checkout@v3
|
63
|
-
with:
|
64
|
-
ref: gh-pages
|
65
|
-
path: gh-pages
|
66
|
-
|
67
|
-
# Step 6: Copy benchmark CSV to gh-pages directory
|
68
|
-
- name: Copy generated benchmark to gh-pages
|
69
|
-
run: |
|
70
|
-
mkdir -p gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}
|
71
|
-
cp ${GENERATED_CSV} gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}/${OUTPUT_FILENAME}
|
72
|
-
# Step 7: Append commit hash to commits.txt if not already present
|
73
|
-
- name: Update commits.txt
|
74
|
-
run: |
|
75
|
-
cd gh-pages
|
76
|
-
echo "commits.txt file path: ${OUTPUT_DIR}/commits.txt"
|
77
|
-
# Create file if it doesn't exist
|
78
|
-
mkdir -p ${OUTPUT_DIR}
|
79
|
-
touch ${OUTPUT_DIR}/commits.txt
|
80
|
-
# Append only if not already present
|
81
|
-
if ! grep -q "${{ steps.get_hash.outputs.hash }}" ${OUTPUT_DIR}/commits.txt; then
|
82
|
-
echo "${{ steps.get_hash.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
|
83
|
-
fi
|
84
|
-
# Step 7: Commit and push
|
85
|
-
- name: Commit and push to gh-pages
|
86
|
-
run: |
|
87
|
-
cd gh-pages
|
88
|
-
git config user.name github-actions[bot]
|
89
|
-
git config user.email 41898282+github-actions[bot]@users.noreply.github.com
|
90
|
-
git add .
|
91
|
-
git commit -m "Add benchmark for commit ${{ steps.get_hash.outputs.hash }}" || echo "No changes to commit"
|
92
|
-
git push origin gh-pages
|
93
|
-
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.0.dev20250716142659 → liger_kernel_nightly-0.6.0.dev20250718050347}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|