liger-kernel-nightly 0.6.1.dev20250812205818__tar.gz → 0.6.1.dev20250819172918__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/__init__.py +8 -0
- liger_kernel_nightly-0.6.1.dev20250819172918/src/liger_kernel/transformers/experimental/__init__.py +5 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/mllama.py +4 -2
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel_nightly.egg-info/SOURCES.txt +1 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/bf16/test_mini_models_multimodal.py +12 -1
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/fp32/test_mini_models_multimodal.py +1 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/Makefile +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/setup.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.1.dev20250812205818"
|
7
|
+
version = "0.6.1.dev20250819172918"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -10,11 +10,15 @@ from liger_kernel.transformers.fused_linear_cross_entropy import LigerFusedLinea
|
|
10
10
|
from liger_kernel.transformers.fused_linear_jsd import LigerFusedLinearJSD # noqa: F401
|
11
11
|
from liger_kernel.transformers.geglu import LigerGEGLUMLP # noqa: F401
|
12
12
|
from liger_kernel.transformers.jsd import LigerJSD # noqa: F401
|
13
|
+
from liger_kernel.transformers.kl_div import LigerKLDIVLoss # noqa: F401
|
13
14
|
from liger_kernel.transformers.layer_norm import LigerLayerNorm # noqa: F401
|
14
15
|
from liger_kernel.transformers.llama4_rope import liger_llama4_text_rotary_pos_emb # noqa: F401
|
15
16
|
from liger_kernel.transformers.llama4_rope import liger_llama4_vision_rotary_pos_emb # noqa: F401
|
17
|
+
from liger_kernel.transformers.multi_token_attention import LigerMultiTokenAttention # noqa: F401
|
16
18
|
from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
|
17
19
|
from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
|
20
|
+
from liger_kernel.transformers.softmax import LigerSoftmax # noqa: F401
|
21
|
+
from liger_kernel.transformers.sparsemax import LigerSparsemax # noqa: F401
|
18
22
|
from liger_kernel.transformers.swiglu import LigerBlockSparseTop2MLP # noqa: F401
|
19
23
|
from liger_kernel.transformers.swiglu import LigerPhi3SwiGLUMLP # noqa: F401
|
20
24
|
from liger_kernel.transformers.swiglu import LigerQwen3MoeSwiGLUMLP # noqa: F401
|
@@ -134,6 +138,10 @@ __all__ = [
|
|
134
138
|
"LigerQwen3MoeSwiGLUMLP",
|
135
139
|
"LigerSwiGLUMLP",
|
136
140
|
"LigerTVDLoss",
|
141
|
+
"LigerKLDIVLoss",
|
142
|
+
"LigerMultiTokenAttention",
|
143
|
+
"LigerSoftmax",
|
144
|
+
"LigerSparsemax",
|
137
145
|
]
|
138
146
|
|
139
147
|
# Add transformer-dependent symbols only if available
|
@@ -190,7 +190,9 @@ def lce_forward(
|
|
190
190
|
output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
|
191
191
|
)
|
192
192
|
return_dict = return_dict if return_dict is not None else self.config.use_return_dict
|
193
|
-
|
193
|
+
# Filter out accum_dtype from kwargs for model call as MllamaTextModel doesn't accept it in transformers 4.49.0
|
194
|
+
# but preserve it for loss function calls
|
195
|
+
model_kwargs = {k: v for k, v in kwargs.items() if k != "accum_dtype"}
|
194
196
|
# decoder outputs consists of (dec_features, layer_state, dec_hidden, dec_attn)
|
195
197
|
outputs = self.model(
|
196
198
|
input_ids=input_ids,
|
@@ -206,7 +208,7 @@ def lce_forward(
|
|
206
208
|
output_hidden_states=output_hidden_states,
|
207
209
|
return_dict=return_dict,
|
208
210
|
cache_position=cache_position,
|
209
|
-
**kwargs,
|
211
|
+
**model_kwargs,
|
210
212
|
)
|
211
213
|
|
212
214
|
hidden_states = outputs[0]
|
@@ -183,6 +183,7 @@ src/liger_kernel/transformers/sparsemax.py
|
|
183
183
|
src/liger_kernel/transformers/swiglu.py
|
184
184
|
src/liger_kernel/transformers/trainer_integration.py
|
185
185
|
src/liger_kernel/transformers/tvd.py
|
186
|
+
src/liger_kernel/transformers/experimental/__init__.py
|
186
187
|
src/liger_kernel/transformers/experimental/embedding.py
|
187
188
|
src/liger_kernel/transformers/model/__init__.py
|
188
189
|
src/liger_kernel/transformers/model/gemma.py
|
@@ -557,6 +557,7 @@ if QWEN2_5_VL_AVAILABLE:
|
|
557
557
|
"hidden_size": 128, # 1280
|
558
558
|
"num_heads": 16,
|
559
559
|
"in_chans": 3,
|
560
|
+
"out_hidden_size": 1024,
|
560
561
|
},
|
561
562
|
attn_implementation="sdpa",
|
562
563
|
),
|
@@ -860,7 +861,17 @@ def run_mini_model_multimodal(
|
|
860
861
|
for i in range(num_steps):
|
861
862
|
batch = next(loader_iter).to(model.device)
|
862
863
|
optimizer.zero_grad()
|
863
|
-
|
864
|
+
supports_accum = getattr(model, "_supports_accum_dtype", None)
|
865
|
+
if supports_accum is None:
|
866
|
+
import inspect
|
867
|
+
|
868
|
+
params = inspect.signature(model.forward).parameters
|
869
|
+
supports_accum = ("accum_dtype" in params) or any(
|
870
|
+
p.kind == inspect.Parameter.VAR_KEYWORD for p in params.values()
|
871
|
+
)
|
872
|
+
setattr(model, "_supports_accum_dtype", supports_accum)
|
873
|
+
|
874
|
+
output = model(**batch, accum_dtype=torch.float32) if supports_accum else model(**batch)
|
864
875
|
output.loss.backward()
|
865
876
|
optimizer.step()
|
866
877
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.1.dev20250812205818 → liger_kernel_nightly-0.6.1.dev20250819172918}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|