liger-kernel-nightly 0.5.10.dev20250611191801__tar.gz → 0.5.10.dev20250613192702__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/PKG-INFO +2 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cpo_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cross_entropy.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_distill_jsd_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dpo_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_embedding.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_jsd.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_jsd.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kl_div.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kto_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_layer_norm.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_orpo_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_simpo_loss.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_softmax.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_swiglu.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_tvd.py +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/utils.py +1 -1
- liger_kernel_nightly-0.5.10.dev20250613192702/dev/modal/benchmarks.py +73 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.py +1 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/PKG-INFO +2 -1
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/requires.txt +1 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_multimodal.py +3 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_multimodal.py +3 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/utils.py +7 -0
- liger_kernel_nightly-0.5.10.dev20250611191801/dev/modal/benchmarks.py +0 -28
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/benchmark.yml +2 -2
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.idea/workspace.xml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/Makefile +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/triton/test_triton_monkey_patch.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.5.10.dev20250611191801
|
3
|
+
Version: 0.5.10.dev20250613192702
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
|
|
45
45
|
Requires-Dist: seaborn; extra == "dev"
|
46
46
|
Requires-Dist: mkdocs; extra == "dev"
|
47
47
|
Requires-Dist: mkdocs-material; extra == "dev"
|
48
|
+
Requires-Dist: torchvision>=0.20; extra == "dev"
|
48
49
|
|
49
50
|
<a name="readme-top"></a>
|
50
51
|
|
@@ -147,7 +147,7 @@ if __name__ == "__main__":
|
|
147
147
|
|
148
148
|
run_benchmarks(
|
149
149
|
bench_test_fn=bench_speed_fused_linear_cpo_loss,
|
150
|
-
kernel_operation_modes=["forward", "full"],
|
150
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
151
151
|
metric_name="speed",
|
152
152
|
metric_unit="ms",
|
153
153
|
**common_configs,
|
@@ -109,7 +109,7 @@ if __name__ == "__main__":
|
|
109
109
|
|
110
110
|
run_benchmarks(
|
111
111
|
bench_test_fn=bench_speed_cross_entropy,
|
112
|
-
kernel_operation_modes=["forward", "full"],
|
112
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
113
113
|
metric_name="speed",
|
114
114
|
metric_unit="ms",
|
115
115
|
**common_configs,
|
@@ -248,7 +248,7 @@ if __name__ == "__main__":
|
|
248
248
|
|
249
249
|
run_benchmarks(
|
250
250
|
bench_test_fn=bench_speed_jsd_loss,
|
251
|
-
kernel_operation_modes=["forward", "full"],
|
251
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
252
252
|
metric_name="speed",
|
253
253
|
metric_unit="ms",
|
254
254
|
**common_configs,
|
@@ -166,7 +166,7 @@ if __name__ == "__main__":
|
|
166
166
|
|
167
167
|
run_benchmarks(
|
168
168
|
bench_test_fn=bench_speed_dpo_loss,
|
169
|
-
kernel_operation_modes=["forward", "full"],
|
169
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
170
170
|
metric_name="speed",
|
171
171
|
metric_unit="ms",
|
172
172
|
**common_configs,
|
@@ -112,7 +112,7 @@ if __name__ == "__main__":
|
|
112
112
|
|
113
113
|
run_benchmarks(
|
114
114
|
bench_test_fn=bench_speed_embedding,
|
115
|
-
kernel_operation_modes=["forward", "full"],
|
115
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
116
116
|
metric_name="speed",
|
117
117
|
metric_unit="ms",
|
118
118
|
**common_configs,
|
@@ -156,7 +156,7 @@ if __name__ == "__main__":
|
|
156
156
|
|
157
157
|
run_benchmarks(
|
158
158
|
bench_test_fn=bench_speed_fused_linear_cross_entropy,
|
159
|
-
kernel_operation_modes=["forward", "full"],
|
159
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
160
160
|
metric_name="speed",
|
161
161
|
metric_unit="ms",
|
162
162
|
**common_configs,
|
@@ -246,7 +246,7 @@ if __name__ == "__main__":
|
|
246
246
|
|
247
247
|
run_benchmarks(
|
248
248
|
bench_test_fn=bench_speed_fused_linear_jsd,
|
249
|
-
kernel_operation_modes=["forward", "full"],
|
249
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
250
250
|
metric_name="speed",
|
251
251
|
metric_unit="ms",
|
252
252
|
**common_configs,
|
@@ -143,7 +143,7 @@ if __name__ == "__main__":
|
|
143
143
|
|
144
144
|
run_benchmarks(
|
145
145
|
bench_test_fn=bench_speed_jsd,
|
146
|
-
kernel_operation_modes=["forward", "full"],
|
146
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
147
147
|
metric_name="speed",
|
148
148
|
metric_unit="ms",
|
149
149
|
**common_args,
|
@@ -110,7 +110,7 @@ if __name__ == "__main__":
|
|
110
110
|
|
111
111
|
run_benchmarks(
|
112
112
|
bench_test_fn=bench_speed_kldiv,
|
113
|
-
kernel_operation_modes=["forward", "full"],
|
113
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
114
114
|
metric_name="speed",
|
115
115
|
metric_unit="ms",
|
116
116
|
**common_args,
|
@@ -299,7 +299,7 @@ if __name__ == "__main__":
|
|
299
299
|
|
300
300
|
run_benchmarks(
|
301
301
|
bench_test_fn=bench_speed_kto_loss,
|
302
|
-
kernel_operation_modes=["forward", "full"],
|
302
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
303
303
|
metric_name="speed",
|
304
304
|
metric_unit="ms",
|
305
305
|
**common_configs,
|
@@ -111,7 +111,7 @@ if __name__ == "__main__":
|
|
111
111
|
|
112
112
|
run_benchmarks(
|
113
113
|
bench_test_fn=bench_speed_layer_norm,
|
114
|
-
kernel_operation_modes=["forward", "full"],
|
114
|
+
kernel_operation_modes=["forward", "backward", "full"],
|
115
115
|
metric_name="speed",
|
116
116
|
metric_unit="ms",
|
117
117
|
**common_configs,
|
@@ -149,7 +149,7 @@ if __name__ == "__main__":
|
|
149
149
|
|
150
150
|
run_benchmarks(
|
151
151
|
bench_test_fn=bench_speed_fused_linear_orpo_loss,
|
152
|
-
kernel_operation_modes=["forward", "full"],
|
152
|
+
kernel_operation_modes=["forward", "full", "backward"],
|
153
153
|
metric_name="speed",
|
154
154
|
metric_unit="ms",
|
155
155
|
**common_configs,
|
@@ -147,7 +147,7 @@ if __name__ == "__main__":
|
|
147
147
|
|
148
148
|
run_benchmarks(
|
149
149
|
bench_test_fn=bench_speed_fused_linear_simpo_loss,
|
150
|
-
kernel_operation_modes=["forward", "full"],
|
150
|
+
kernel_operation_modes=["forward", "full", "backward"],
|
151
151
|
metric_name="speed",
|
152
152
|
metric_unit="ms",
|
153
153
|
**common_configs,
|
@@ -124,7 +124,7 @@ if __name__ == "__main__":
|
|
124
124
|
|
125
125
|
run_benchmarks(
|
126
126
|
bench_test_fn=bench_speed_softmax,
|
127
|
-
kernel_operation_modes=["forward", "full"],
|
127
|
+
kernel_operation_modes=["forward", "full", "backward"],
|
128
128
|
metric_name="speed",
|
129
129
|
metric_unit="ms",
|
130
130
|
overwrite=args.overwrite,
|
@@ -161,7 +161,7 @@ if __name__ == "__main__":
|
|
161
161
|
|
162
162
|
run_benchmarks(
|
163
163
|
bench_test_fn=bench_speed_swiglu,
|
164
|
-
kernel_operation_modes=["forward"],
|
164
|
+
kernel_operation_modes=["forward", "full", "backward"],
|
165
165
|
metric_name="speed",
|
166
166
|
metric_unit="ms",
|
167
167
|
**common_configs,
|
@@ -126,7 +126,7 @@ if __name__ == "__main__":
|
|
126
126
|
|
127
127
|
run_benchmarks(
|
128
128
|
bench_test_fn=bench_speed_tvd,
|
129
|
-
kernel_operation_modes=["forward", "full"],
|
129
|
+
kernel_operation_modes=["forward", "full", "backward"],
|
130
130
|
metric_name="speed",
|
131
131
|
metric_unit="ms",
|
132
132
|
**common_args,
|
@@ -235,7 +235,7 @@ def update_benchmark_data_csv(
|
|
235
235
|
pass
|
236
236
|
else:
|
237
237
|
existing_data_dict[row_key] = row_dict
|
238
|
-
|
238
|
+
os.makedirs(os.path.dirname(filename_abs_path), exist_ok=True)
|
239
239
|
with open(filename_abs_path, mode="w", newline="") as file:
|
240
240
|
writer = csv.DictWriter(file, fieldnames=fieldnames)
|
241
241
|
writer.writeheader()
|
@@ -0,0 +1,73 @@
|
|
1
|
+
from pathlib import Path
|
2
|
+
|
3
|
+
import modal
|
4
|
+
|
5
|
+
ROOT_PATH = Path(__file__).parent.parent.parent
|
6
|
+
REMOTE_ROOT_PATH = "/root/liger-kernel"
|
7
|
+
PYTHON_VERSION = "3.12"
|
8
|
+
|
9
|
+
image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
|
10
|
+
|
11
|
+
app = modal.App("liger_benchmarks", image=image)
|
12
|
+
|
13
|
+
# mount: add local files to the remote container
|
14
|
+
repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
|
15
|
+
|
16
|
+
|
17
|
+
@app.function(gpu="H100", image=repo, timeout=60 * 45)
|
18
|
+
def liger_benchmarks():
|
19
|
+
import subprocess
|
20
|
+
import os
|
21
|
+
|
22
|
+
subprocess.run(
|
23
|
+
["uv pip install -e '.[dev]' --system"],
|
24
|
+
check=True,
|
25
|
+
shell=True,
|
26
|
+
cwd=REMOTE_ROOT_PATH,
|
27
|
+
)
|
28
|
+
subprocess.run(["make run-benchmarks"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
|
29
|
+
|
30
|
+
file_path = Path(REMOTE_ROOT_PATH) / "benchmark" / "data" / "all_benchmark_data.csv"
|
31
|
+
print(f"Checking if file exists at: {file_path}")
|
32
|
+
print(f"File exists: {os.path.exists(file_path)}")
|
33
|
+
|
34
|
+
if not os.path.exists(file_path):
|
35
|
+
print("Listing directory contents:")
|
36
|
+
data_dir = file_path.parent
|
37
|
+
if os.path.exists(data_dir):
|
38
|
+
print(f"Contents of {data_dir}:")
|
39
|
+
print(os.listdir(data_dir))
|
40
|
+
else:
|
41
|
+
print(f"Data directory {data_dir} does not exist")
|
42
|
+
raise FileNotFoundError(f"Benchmark data file not found at {file_path}")
|
43
|
+
|
44
|
+
with open(file_path, "rb") as f:
|
45
|
+
data = f.read()
|
46
|
+
print(f"Successfully read {len(data)} bytes of data")
|
47
|
+
return data
|
48
|
+
|
49
|
+
|
50
|
+
@app.local_entrypoint()
|
51
|
+
def main():
|
52
|
+
try:
|
53
|
+
# Run the benchmarks and get the data
|
54
|
+
print("Starting benchmark run...")
|
55
|
+
benchmark_data = liger_benchmarks.remote()
|
56
|
+
|
57
|
+
if not benchmark_data:
|
58
|
+
raise ValueError("No data received from remote function")
|
59
|
+
|
60
|
+
# Save the data locally
|
61
|
+
local_data_path = ROOT_PATH / "benchmark" / "data" / "all_benchmark_data.csv"
|
62
|
+
print(f"Attempting to save data to: {local_data_path}")
|
63
|
+
|
64
|
+
local_data_path.parent.mkdir(parents=True, exist_ok=True)
|
65
|
+
|
66
|
+
with open(local_data_path, "wb") as f:
|
67
|
+
f.write(benchmark_data)
|
68
|
+
|
69
|
+
print(f"Successfully saved {len(benchmark_data)} bytes to: {local_data_path}")
|
70
|
+
|
71
|
+
except Exception as e:
|
72
|
+
print(f"Error occurred: {str(e)}")
|
73
|
+
raise
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.10.dev20250611191801"
|
7
|
+
version = "0.5.10.dev20250613192702"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.5.10.dev20250611191801
|
3
|
+
Version: 0.5.10.dev20250613192702
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
|
|
45
45
|
Requires-Dist: seaborn; extra == "dev"
|
46
46
|
Requires-Dist: mkdocs; extra == "dev"
|
47
47
|
Requires-Dist: mkdocs-material; extra == "dev"
|
48
|
+
Requires-Dist: torchvision>=0.20; extra == "dev"
|
48
49
|
|
49
50
|
<a name="readme-top"></a>
|
50
51
|
|
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
|
|
20
20
|
from test.utils import UNTOKENIZED_DATASET_PATH
|
21
21
|
from test.utils import MiniModelConfig
|
22
22
|
from test.utils import assert_verbose_allclose
|
23
|
+
from test.utils import is_torchvision_available
|
23
24
|
from test.utils import load_image_processing_config
|
24
25
|
from test.utils import load_processor_config
|
25
26
|
from test.utils import load_tokenizer_config
|
@@ -788,6 +789,7 @@ def run_mini_model_multimodal(
|
|
788
789
|
not QWEN2_VL_AVAILABLE,
|
789
790
|
reason="Qwen2-VL not available in this version of transformers",
|
790
791
|
),
|
792
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
791
793
|
],
|
792
794
|
),
|
793
795
|
pytest.param(
|
@@ -826,6 +828,7 @@ def run_mini_model_multimodal(
|
|
826
828
|
not QWEN2_5_VL_AVAILABLE,
|
827
829
|
reason="Qwen2.5-VL not available in this version of transformers",
|
828
830
|
),
|
831
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
829
832
|
],
|
830
833
|
),
|
831
834
|
pytest.param(
|
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
|
|
20
20
|
from test.utils import UNTOKENIZED_DATASET_PATH
|
21
21
|
from test.utils import MiniModelConfig
|
22
22
|
from test.utils import assert_verbose_allclose
|
23
|
+
from test.utils import is_torchvision_available
|
23
24
|
from test.utils import load_image_processing_config
|
24
25
|
from test.utils import load_processor_config
|
25
26
|
from test.utils import load_tokenizer_config
|
@@ -783,6 +784,7 @@ def run_mini_model_multimodal(
|
|
783
784
|
not QWEN2_VL_AVAILABLE,
|
784
785
|
reason="Qwen2-VL not available in this version of transformers",
|
785
786
|
),
|
787
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
786
788
|
],
|
787
789
|
),
|
788
790
|
pytest.param(
|
@@ -817,6 +819,7 @@ def run_mini_model_multimodal(
|
|
817
819
|
not QWEN2_5_VL_AVAILABLE,
|
818
820
|
reason="Qwen2.5-VL not available in this version of transformers",
|
819
821
|
),
|
822
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
820
823
|
],
|
821
824
|
),
|
822
825
|
pytest.param(
|
@@ -228,6 +228,13 @@ def supports_bfloat16():
|
|
228
228
|
return False
|
229
229
|
|
230
230
|
|
231
|
+
def is_torchvision_available():
|
232
|
+
if importlib.util.find_spec("torchvision") is not None:
|
233
|
+
return True
|
234
|
+
else:
|
235
|
+
return False
|
236
|
+
|
237
|
+
|
231
238
|
def revert_liger_kernel_to_granite(model_config: MiniModelConfig):
|
232
239
|
"""
|
233
240
|
Revert all Liger kernel patches applied to Granite.
|
@@ -1,28 +0,0 @@
|
|
1
|
-
from pathlib import Path
|
2
|
-
|
3
|
-
import modal
|
4
|
-
|
5
|
-
ROOT_PATH = Path(__file__).parent.parent.parent
|
6
|
-
REMOTE_ROOT_PATH = "/root/liger-kernel"
|
7
|
-
PYTHON_VERSION = "3.12"
|
8
|
-
|
9
|
-
image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
|
10
|
-
|
11
|
-
app = modal.App("liger_benchmarks", image=image)
|
12
|
-
|
13
|
-
# mount: add local files to the remote container
|
14
|
-
repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
|
15
|
-
|
16
|
-
|
17
|
-
@app.function(gpu="H100", image=repo, timeout=60 * 45)
|
18
|
-
def liger_benchmarks():
|
19
|
-
import subprocess
|
20
|
-
|
21
|
-
subprocess.run(
|
22
|
-
["uv pip install -e '.[dev]' --system"],
|
23
|
-
check=True,
|
24
|
-
shell=True,
|
25
|
-
cwd=REMOTE_ROOT_PATH,
|
26
|
-
)
|
27
|
-
subprocess.run(["python benchmark/scripts/benchmark_kto_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
|
28
|
-
subprocess.run(["python benchmark/scripts/benchmark_cpo_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
@@ -29,6 +29,7 @@ jobs:
|
|
29
29
|
OUTPUT_FILENAME: benchmark.csv
|
30
30
|
GENERATED_CSV: benchmark/data/all_benchmark_data.csv
|
31
31
|
|
32
|
+
|
32
33
|
steps:
|
33
34
|
- name: Checkout code
|
34
35
|
uses: actions/checkout@v3
|
@@ -71,7 +72,6 @@ jobs:
|
|
71
72
|
run: |
|
72
73
|
mkdir -p gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}
|
73
74
|
cp ${GENERATED_CSV} gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}/${OUTPUT_FILENAME}
|
74
|
-
|
75
75
|
# Step 7: Append commit hash to commits.txt if not already present
|
76
76
|
- name: Update commits.txt
|
77
77
|
run: |
|
@@ -84,7 +84,6 @@ jobs:
|
|
84
84
|
if ! grep -q "${{ steps.get_hash.outputs.hash }}" ${OUTPUT_DIR}/commits.txt; then
|
85
85
|
echo "${{ steps.get_hash.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
|
86
86
|
fi
|
87
|
-
|
88
87
|
# Step 7: Commit and push
|
89
88
|
- name: Commit and push to gh-pages
|
90
89
|
run: |
|
@@ -94,3 +93,4 @@ jobs:
|
|
94
93
|
git add .
|
95
94
|
git commit -m "Add benchmark for commit ${{ steps.get_hash.outputs.hash }}" || echo "No changes to commit"
|
96
95
|
git push origin gh-pages
|
96
|
+
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|