liger-kernel-nightly 0.6.2.dev20251011154427__tar.gz → 0.6.2.dev20251013144132__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/monkey_patch.py +5 -2
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_monkey_patch.py +26 -4
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/Makefile +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/setup.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/experimental/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/falcon_h1.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/glm4v.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/glm4v_moe.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/internvl.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/OpenGVLab/InternVL3-1B-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.2.dev20251011154427"
|
7
|
+
version = "0.6.2.dev20251013144132"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -469,7 +469,7 @@ def apply_liger_kernel_to_llama4(
|
|
469
469
|
`cross_entropy` and `fused_linear_cross_entropy` cannot both be True.
|
470
470
|
If `fused_linear_cross_entropy` is True, the logits will not be materialized but more memory efficient.
|
471
471
|
rms_norm (bool): Whether to apply Liger's RMSNorm. Default is True.
|
472
|
-
swiglu (bool): Whether to apply Liger's SwiGLU MLP. Default is
|
472
|
+
swiglu (bool): Whether to apply Liger's SwiGLU MLP. Default is True.
|
473
473
|
model (PreTrainedModel): The model instance to apply Liger kernels to, if the model has already been
|
474
474
|
loaded. Default is None.
|
475
475
|
"""
|
@@ -522,7 +522,10 @@ def apply_liger_kernel_to_llama4(
|
|
522
522
|
_patch_rms_norm_module(text_model.norm)
|
523
523
|
for decoder_layer in text_model.layers:
|
524
524
|
if swiglu:
|
525
|
-
|
525
|
+
if decoder_layer.is_moe_layer:
|
526
|
+
_patch_swiglu_module(decoder_layer.feed_forward.shared_expert, LigerSwiGLUMLP)
|
527
|
+
else:
|
528
|
+
_patch_swiglu_module(decoder_layer.feed_forward, LigerSwiGLUMLP)
|
526
529
|
if rms_norm:
|
527
530
|
_patch_rms_norm_module(decoder_layer.input_layernorm)
|
528
531
|
_patch_rms_norm_module(decoder_layer.post_attention_layernorm)
|
@@ -600,13 +600,19 @@ def test_apply_liger_kernel_to_instance_for_llama4_for_causal_lm():
|
|
600
600
|
intermediate_size=64,
|
601
601
|
hidden_act="silu",
|
602
602
|
num_hidden_layers=2,
|
603
|
+
moe_layers=[1],
|
603
604
|
)
|
604
605
|
dummy_model_instance = Llama4ForCausalLM._from_config(config)
|
605
606
|
|
606
607
|
# Check that model instance variables are not yet patched with Liger modules
|
607
608
|
assert inspect.getsource(dummy_model_instance.model.norm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
608
609
|
for layer in dummy_model_instance.model.layers:
|
609
|
-
|
610
|
+
if layer.is_moe_layer:
|
611
|
+
assert inspect.getsource(layer.feed_forward.shared_expert.forward) != inspect.getsource(
|
612
|
+
LigerSwiGLUMLP.forward
|
613
|
+
)
|
614
|
+
else:
|
615
|
+
assert inspect.getsource(layer.feed_forward.forward) != inspect.getsource(LigerSwiGLUMLP.forward)
|
610
616
|
assert inspect.getsource(layer.input_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
611
617
|
assert inspect.getsource(layer.post_attention_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
612
618
|
|
@@ -616,7 +622,12 @@ def test_apply_liger_kernel_to_instance_for_llama4_for_causal_lm():
|
|
616
622
|
# Check that the model's instance variables were correctly patched with Liger modules
|
617
623
|
assert inspect.getsource(dummy_model_instance.model.norm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
618
624
|
for layer in dummy_model_instance.model.layers:
|
619
|
-
|
625
|
+
if layer.is_moe_layer:
|
626
|
+
assert inspect.getsource(layer.feed_forward.shared_expert.forward) == inspect.getsource(
|
627
|
+
LigerSwiGLUMLP.forward
|
628
|
+
)
|
629
|
+
else:
|
630
|
+
assert inspect.getsource(layer.feed_forward.forward) == inspect.getsource(LigerSwiGLUMLP.forward)
|
620
631
|
assert inspect.getsource(layer.input_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
621
632
|
assert inspect.getsource(layer.post_attention_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
622
633
|
|
@@ -642,6 +653,7 @@ def test_apply_liger_kernel_to_instance_for_llama4_for_conditional_generation():
|
|
642
653
|
intermediate_size=64,
|
643
654
|
hidden_act="silu",
|
644
655
|
num_hidden_layers=2,
|
656
|
+
moe_layers=[1],
|
645
657
|
),
|
646
658
|
vision_config=transformers.models.llama4.configuration_llama4.Llama4VisionConfig(
|
647
659
|
rms_norm_eps=1e-5,
|
@@ -662,7 +674,12 @@ def test_apply_liger_kernel_to_instance_for_llama4_for_conditional_generation():
|
|
662
674
|
LigerRMSNorm.forward
|
663
675
|
)
|
664
676
|
for layer in dummy_model_instance.language_model.model.layers:
|
665
|
-
|
677
|
+
if layer.is_moe_layer:
|
678
|
+
assert inspect.getsource(layer.feed_forward.shared_expert.forward) != inspect.getsource(
|
679
|
+
LigerSwiGLUMLP.forward
|
680
|
+
)
|
681
|
+
else:
|
682
|
+
assert inspect.getsource(layer.feed_forward.forward) != inspect.getsource(LigerSwiGLUMLP.forward)
|
666
683
|
assert inspect.getsource(layer.input_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
667
684
|
assert inspect.getsource(layer.post_attention_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
668
685
|
|
@@ -686,7 +703,12 @@ def test_apply_liger_kernel_to_instance_for_llama4_for_conditional_generation():
|
|
686
703
|
LigerRMSNorm.forward
|
687
704
|
)
|
688
705
|
for layer in dummy_model_instance.language_model.model.layers:
|
689
|
-
|
706
|
+
if layer.is_moe_layer:
|
707
|
+
assert inspect.getsource(layer.feed_forward.shared_expert.forward) == inspect.getsource(
|
708
|
+
LigerSwiGLUMLP.forward
|
709
|
+
)
|
710
|
+
else:
|
711
|
+
assert inspect.getsource(layer.feed_forward.forward) == inspect.getsource(LigerSwiGLUMLP.forward)
|
690
712
|
assert inspect.getsource(layer.input_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
691
713
|
assert inspect.getsource(layer.post_attention_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
692
714
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.2.dev20251011154427 → liger_kernel_nightly-0.6.2.dev20251013144132}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|