liger-kernel-nightly 0.5.10.dev20250708114334__tar.gz → 0.6.0.dev20250709030408__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/monkey_patch.py +4 -2
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_monkey_patch.py +67 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/Makefile +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/setup.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250708114334 → liger_kernel_nightly-0.6.0.dev20250709030408}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.10.dev20250708114334"
|
7
|
+
version = "0.6.0.dev20250709030408"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -1096,7 +1096,9 @@ def apply_liger_kernel_to_paligemma(
|
|
1096
1096
|
# PaliGemma submodules are ['vision_tower', 'multi_modal_projector', 'language_model']
|
1097
1097
|
|
1098
1098
|
from transformers.models.gemma.modeling_gemma import GemmaForCausalLM
|
1099
|
+
from transformers.models.gemma.modeling_gemma import GemmaModel
|
1099
1100
|
from transformers.models.gemma2.modeling_gemma2 import Gemma2ForCausalLM
|
1101
|
+
from transformers.models.gemma2.modeling_gemma2 import Gemma2Model
|
1100
1102
|
from transformers.models.paligemma import modeling_paligemma
|
1101
1103
|
from transformers.models.paligemma.modeling_paligemma import PaliGemmaForConditionalGeneration
|
1102
1104
|
from transformers.models.siglip import modeling_siglip
|
@@ -1155,7 +1157,7 @@ def apply_liger_kernel_to_paligemma(
|
|
1155
1157
|
|
1156
1158
|
language_model = model.language_model
|
1157
1159
|
|
1158
|
-
if isinstance(language_model, GemmaForCausalLM):
|
1160
|
+
if isinstance(language_model, (GemmaForCausalLM, GemmaModel)):
|
1159
1161
|
apply_liger_kernel_to_gemma(
|
1160
1162
|
rope=rope,
|
1161
1163
|
cross_entropy=False,
|
@@ -1165,7 +1167,7 @@ def apply_liger_kernel_to_paligemma(
|
|
1165
1167
|
model=language_model,
|
1166
1168
|
)
|
1167
1169
|
|
1168
|
-
elif isinstance(language_model, Gemma2ForCausalLM):
|
1170
|
+
elif isinstance(language_model, (Gemma2ForCausalLM, Gemma2Model)):
|
1169
1171
|
apply_liger_kernel_to_gemma2(
|
1170
1172
|
rope=rope,
|
1171
1173
|
cross_entropy=False,
|
@@ -38,6 +38,7 @@ if transformer_version >= version.parse(SUPPORTED_TRANSFORMER_VERSION):
|
|
38
38
|
from liger_kernel.transformers.model.mistral import lce_forward as mistral_lce_forward
|
39
39
|
from liger_kernel.transformers.model.mixtral import lce_forward as mixtral_lce_forward
|
40
40
|
from liger_kernel.transformers.model.mllama import lce_forward as mllama_lce_forward
|
41
|
+
from liger_kernel.transformers.model.paligemma import lce_forward as paligemma_lce_forward
|
41
42
|
from liger_kernel.transformers.model.phi3 import lce_forward as phi3_lce_forward
|
42
43
|
from liger_kernel.transformers.model.qwen2 import lce_forward as qwen2_lce_forward
|
43
44
|
else:
|
@@ -49,6 +50,7 @@ else:
|
|
49
50
|
)
|
50
51
|
from liger_kernel.transformers.model.mixtral import lce_forward_deprecated as mixtral_lce_forward
|
51
52
|
from liger_kernel.transformers.model.mllama import lce_forward_deprecated as mllama_lce_forward
|
53
|
+
from liger_kernel.transformers.model.paligemma import lce_forward_deprecated as paligemma_lce_forward
|
52
54
|
from liger_kernel.transformers.model.phi3 import lce_forward_deprecated as phi3_lce_forward
|
53
55
|
from liger_kernel.transformers.model.qwen2 import lce_forward_deprecated as qwen2_lce_forward
|
54
56
|
|
@@ -126,6 +128,15 @@ def is_gemma3_available():
|
|
126
128
|
return False
|
127
129
|
|
128
130
|
|
131
|
+
def is_paligemma_available():
|
132
|
+
try:
|
133
|
+
import transformers.models.paligemma # noqa: F401
|
134
|
+
|
135
|
+
return True
|
136
|
+
except ImportError:
|
137
|
+
return False
|
138
|
+
|
139
|
+
|
129
140
|
def test_import_from_root():
|
130
141
|
try:
|
131
142
|
from liger_kernel.transformers import AutoLigerKernelForCausalLM # noqa: F401
|
@@ -793,6 +804,62 @@ def test_apply_liger_kernel_to_instance_for_gemma2():
|
|
793
804
|
pytest.fail(f"An exception occured in extra_expr: {type(e).__name__} - {e}")
|
794
805
|
|
795
806
|
|
807
|
+
@pytest.mark.skipif(not is_paligemma_available(), reason="paligemma module not available")
|
808
|
+
def test_apply_liger_kernel_to_instance_for_paligemma():
|
809
|
+
# Ensure any monkey patching is cleaned up for subsequent tests
|
810
|
+
with patch("transformers.models.paligemma.modeling_paligemma"):
|
811
|
+
from transformers.models.paligemma.modeling_paligemma import PaliGemmaForConditionalGeneration
|
812
|
+
|
813
|
+
# Instantiate a dummy model
|
814
|
+
config = transformers.models.paligemma.configuration_paligemma.PaliGemmaConfig(
|
815
|
+
torch_dtype=torch.bfloat16,
|
816
|
+
text_config={
|
817
|
+
"num_hidden_layers": 2,
|
818
|
+
"rms_norm_eps": 1e-5,
|
819
|
+
"hidden_size": 32,
|
820
|
+
"intermediate_size": 64,
|
821
|
+
"hidden_act": "silu",
|
822
|
+
},
|
823
|
+
vision_config={
|
824
|
+
"num_hidden_layers": 2,
|
825
|
+
"layer_norm_eps": 1e-5,
|
826
|
+
"hidden_size": 48,
|
827
|
+
"intermediate_size": 64,
|
828
|
+
},
|
829
|
+
)
|
830
|
+
|
831
|
+
dummy_model_instance = PaliGemmaForConditionalGeneration(config)
|
832
|
+
assert isinstance(dummy_model_instance, PaliGemmaForConditionalGeneration)
|
833
|
+
|
834
|
+
# Check that model instance variables are not yet patched with Liger modules
|
835
|
+
assert inspect.getsource(dummy_model_instance.forward) != inspect.getsource(paligemma_lce_forward)
|
836
|
+
assert inspect.getsource(
|
837
|
+
dummy_model_instance.vision_tower.vision_model.post_layernorm.forward
|
838
|
+
) != inspect.getsource(LigerLayerNorm.forward)
|
839
|
+
|
840
|
+
for layer in dummy_model_instance.vision_tower.vision_model.encoder.layers:
|
841
|
+
assert inspect.getsource(layer.layer_norm1.forward) != inspect.getsource(LigerLayerNorm.forward)
|
842
|
+
assert inspect.getsource(layer.layer_norm2.forward) != inspect.getsource(LigerLayerNorm.forward)
|
843
|
+
|
844
|
+
# Test applying kernels to the model instance
|
845
|
+
_apply_liger_kernel_to_instance(model=dummy_model_instance)
|
846
|
+
|
847
|
+
# Check that the model's instance variables were correctly patched with Liger modules
|
848
|
+
assert inspect.getsource(dummy_model_instance.forward) == inspect.getsource(paligemma_lce_forward)
|
849
|
+
assert inspect.getsource(
|
850
|
+
dummy_model_instance.vision_tower.vision_model.post_layernorm.forward
|
851
|
+
) == inspect.getsource(LigerLayerNorm.forward)
|
852
|
+
|
853
|
+
for layer in dummy_model_instance.vision_tower.vision_model.encoder.layers:
|
854
|
+
assert inspect.getsource(layer.layer_norm1.forward) == inspect.getsource(LigerLayerNorm.forward)
|
855
|
+
assert inspect.getsource(layer.layer_norm2.forward) == inspect.getsource(LigerLayerNorm.forward)
|
856
|
+
|
857
|
+
try:
|
858
|
+
print(dummy_model_instance)
|
859
|
+
except Exception as e:
|
860
|
+
pytest.fail(f"An exception occured in extra_expr: {type(e).__name__} - {e}")
|
861
|
+
|
862
|
+
|
796
863
|
@pytest.mark.skipif(not is_gemma3_available(), reason="gemma3 module not available")
|
797
864
|
def test_apply_liger_kernel_to_instance_for_gemma3_text():
|
798
865
|
# Ensure any monkey patching is cleaned up for subsequent tests
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|