liger-kernel-nightly 0.5.10.dev20250611064616__tar.gz → 0.5.10.dev20250611215839__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/benchmark.yml +5 -11
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/docs.yml +2 -5
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/PKG-INFO +2 -1
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/setup.py +1 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel_nightly.egg-info/PKG-INFO +2 -1
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel_nightly.egg-info/requires.txt +1 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/bf16/test_mini_models_multimodal.py +3 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/fp32/test_mini_models_multimodal.py +3 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/utils.py +7 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/.idea/workspace.xml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/Makefile +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250611064616 → liger_kernel_nightly-0.5.10.dev20250611215839}/test/triton/test_triton_monkey_patch.py +0 -0
@@ -33,30 +33,28 @@ jobs:
|
|
33
33
|
- name: Checkout code
|
34
34
|
uses: actions/checkout@v3
|
35
35
|
|
36
|
-
|
36
|
+
# Get the latest commit hash from main branch
|
37
37
|
- name: Get commit hash
|
38
38
|
id: get_hash
|
39
39
|
run: echo "hash=$(git rev-parse --short HEAD)" >> $GITHUB_OUTPUT
|
40
40
|
|
41
|
-
|
42
41
|
- name: Set up Python
|
43
42
|
uses: actions/setup-python@v3
|
44
43
|
with:
|
45
44
|
python-version: '3.10'
|
46
45
|
|
47
|
-
|
46
|
+
# Install dependencies
|
48
47
|
- name: Install dependencies
|
49
48
|
run: |
|
50
49
|
python -m pip install --upgrade pip
|
51
50
|
pip install modal
|
52
51
|
pip install pandas
|
53
52
|
|
54
|
-
|
55
|
-
|
53
|
+
# Delete previous benchmark results.
|
54
|
+
- name: Remove previous benchmark data
|
56
55
|
run: |
|
57
56
|
rm -f benchmark/data/all_benchmark_data.csv
|
58
|
-
|
59
|
-
|
57
|
+
|
60
58
|
- name: Run benchmarks on GPU
|
61
59
|
run: |
|
62
60
|
modal run dev.modal.benchmarks
|
@@ -79,11 +77,9 @@ jobs:
|
|
79
77
|
run: |
|
80
78
|
cd gh-pages
|
81
79
|
echo "commits.txt file path: ${OUTPUT_DIR}/commits.txt"
|
82
|
-
|
83
80
|
# Create file if it doesn't exist
|
84
81
|
mkdir -p ${OUTPUT_DIR}
|
85
82
|
touch ${OUTPUT_DIR}/commits.txt
|
86
|
-
|
87
83
|
# Append only if not already present
|
88
84
|
if ! grep -q "${{ steps.get_hash.outputs.hash }}" ${OUTPUT_DIR}/commits.txt; then
|
89
85
|
echo "${{ steps.get_hash.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
|
@@ -98,5 +94,3 @@ jobs:
|
|
98
94
|
git add .
|
99
95
|
git commit -m "Add benchmark for commit ${{ steps.get_hash.outputs.hash }}" || echo "No changes to commit"
|
100
96
|
git push origin gh-pages
|
101
|
-
|
102
|
-
|
@@ -4,14 +4,11 @@ on:
|
|
4
4
|
branches:
|
5
5
|
- main
|
6
6
|
|
7
|
-
env:
|
8
|
-
ENABLE_DEPLOY: false
|
9
|
-
|
10
7
|
permissions:
|
11
8
|
contents: write
|
12
9
|
jobs:
|
13
10
|
deploy:
|
14
|
-
if:
|
11
|
+
if: False
|
15
12
|
runs-on: ubuntu-latest
|
16
13
|
steps:
|
17
14
|
- uses: actions/checkout@v4
|
@@ -30,4 +27,4 @@ jobs:
|
|
30
27
|
restore-keys: |
|
31
28
|
mkdocs-material-
|
32
29
|
- run: pip install mkdocs-material
|
33
|
-
- run: mkdocs gh-deploy --force
|
30
|
+
- run: mkdocs gh-deploy --force
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.5.10.dev20250611064616
|
3
|
+
Version: 0.5.10.dev20250611215839
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
|
|
45
45
|
Requires-Dist: seaborn; extra == "dev"
|
46
46
|
Requires-Dist: mkdocs; extra == "dev"
|
47
47
|
Requires-Dist: mkdocs-material; extra == "dev"
|
48
|
+
Requires-Dist: torchvision>=0.20; extra == "dev"
|
48
49
|
|
49
50
|
<a name="readme-top"></a>
|
50
51
|
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.10.dev20250611064616"
|
7
|
+
version = "0.5.10.dev20250611215839"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.5.10.dev20250611064616
|
3
|
+
Version: 0.5.10.dev20250611215839
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
|
|
45
45
|
Requires-Dist: seaborn; extra == "dev"
|
46
46
|
Requires-Dist: mkdocs; extra == "dev"
|
47
47
|
Requires-Dist: mkdocs-material; extra == "dev"
|
48
|
+
Requires-Dist: torchvision>=0.20; extra == "dev"
|
48
49
|
|
49
50
|
<a name="readme-top"></a>
|
50
51
|
|
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
|
|
20
20
|
from test.utils import UNTOKENIZED_DATASET_PATH
|
21
21
|
from test.utils import MiniModelConfig
|
22
22
|
from test.utils import assert_verbose_allclose
|
23
|
+
from test.utils import is_torchvision_available
|
23
24
|
from test.utils import load_image_processing_config
|
24
25
|
from test.utils import load_processor_config
|
25
26
|
from test.utils import load_tokenizer_config
|
@@ -788,6 +789,7 @@ def run_mini_model_multimodal(
|
|
788
789
|
not QWEN2_VL_AVAILABLE,
|
789
790
|
reason="Qwen2-VL not available in this version of transformers",
|
790
791
|
),
|
792
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
791
793
|
],
|
792
794
|
),
|
793
795
|
pytest.param(
|
@@ -826,6 +828,7 @@ def run_mini_model_multimodal(
|
|
826
828
|
not QWEN2_5_VL_AVAILABLE,
|
827
829
|
reason="Qwen2.5-VL not available in this version of transformers",
|
828
830
|
),
|
831
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
829
832
|
],
|
830
833
|
),
|
831
834
|
pytest.param(
|
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
|
|
20
20
|
from test.utils import UNTOKENIZED_DATASET_PATH
|
21
21
|
from test.utils import MiniModelConfig
|
22
22
|
from test.utils import assert_verbose_allclose
|
23
|
+
from test.utils import is_torchvision_available
|
23
24
|
from test.utils import load_image_processing_config
|
24
25
|
from test.utils import load_processor_config
|
25
26
|
from test.utils import load_tokenizer_config
|
@@ -783,6 +784,7 @@ def run_mini_model_multimodal(
|
|
783
784
|
not QWEN2_VL_AVAILABLE,
|
784
785
|
reason="Qwen2-VL not available in this version of transformers",
|
785
786
|
),
|
787
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
786
788
|
],
|
787
789
|
),
|
788
790
|
pytest.param(
|
@@ -817,6 +819,7 @@ def run_mini_model_multimodal(
|
|
817
819
|
not QWEN2_5_VL_AVAILABLE,
|
818
820
|
reason="Qwen2.5-VL not available in this version of transformers",
|
819
821
|
),
|
822
|
+
pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
|
820
823
|
],
|
821
824
|
),
|
822
825
|
pytest.param(
|
@@ -228,6 +228,13 @@ def supports_bfloat16():
|
|
228
228
|
return False
|
229
229
|
|
230
230
|
|
231
|
+
def is_torchvision_available():
|
232
|
+
if importlib.util.find_spec("torchvision") is not None:
|
233
|
+
return True
|
234
|
+
else:
|
235
|
+
return False
|
236
|
+
|
237
|
+
|
231
238
|
def revert_liger_kernel_to_granite(model_config: MiniModelConfig):
|
232
239
|
"""
|
233
240
|
Revert all Liger kernel patches applied to Granite.
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|