liger-kernel-nightly 0.6.2.dev20250822031319__tar.gz → 0.6.2.dev20250823034010__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/jsd_loss.py +5 -2
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_jsd_loss.py +5 -2
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_monkey_patch.py +5 -17
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/Makefile +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/setup.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/experimental/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/glm4v.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.2.dev20250822031319"
|
7
|
+
version = "0.6.2.dev20250823034010"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -1,3 +1,5 @@
|
|
1
|
+
import math
|
2
|
+
|
1
3
|
import torch
|
2
4
|
import torch.nn.functional as F
|
3
5
|
|
@@ -25,8 +27,9 @@ class LigerFusedLinearJSDFunction(LigerFusedLinearDistillationBase):
|
|
25
27
|
jsd_loss = F.kl_div(teacher_log_probs, student_log_probs, reduction="sum", log_target=True)
|
26
28
|
else:
|
27
29
|
# Compute probabilities (only required for mean calculation)
|
28
|
-
|
29
|
-
|
30
|
+
log_mean_probs = torch.logsumexp(
|
31
|
+
torch.stack([student_log_probs + math.log(1 - beta), teacher_log_probs + math.log(beta)], dim=0), dim=0
|
32
|
+
)
|
30
33
|
|
31
34
|
student_kl = F.kl_div(log_mean_probs, student_log_probs, reduction="sum", log_target=True)
|
32
35
|
teacher_kl = F.kl_div(log_mean_probs, teacher_log_probs, reduction="sum", log_target=True)
|
@@ -1,3 +1,5 @@
|
|
1
|
+
import math
|
2
|
+
|
1
3
|
import pytest
|
2
4
|
import torch
|
3
5
|
import torch.nn.functional as F
|
@@ -54,8 +56,9 @@ class HFJSDLoss(HFDistillationLoss):
|
|
54
56
|
jsd_loss = F.kl_div(teacher_log_probs, student_log_probs, reduction="none", log_target=True)
|
55
57
|
else:
|
56
58
|
# Compute probabilities (only required for mean calculation)
|
57
|
-
|
58
|
-
|
59
|
+
log_mean_probs = torch.logsumexp(
|
60
|
+
torch.stack([student_log_probs + math.log(1 - beta), teacher_log_probs + math.log(beta)], dim=0), dim=0
|
61
|
+
)
|
59
62
|
|
60
63
|
student_kl = F.kl_div(log_mean_probs, student_log_probs, reduction="batchmean", log_target=True)
|
61
64
|
teacher_kl = F.kl_div(log_mean_probs, teacher_log_probs, reduction="batchmean", log_target=True)
|
@@ -1617,38 +1617,26 @@ def test_apply_liger_kernel_to_instance_for_glm4():
|
|
1617
1617
|
|
1618
1618
|
# Check that model instance variables are not yet patched with Liger modules
|
1619
1619
|
assert inspect.getsource(dummy_model_instance.forward) != inspect.getsource(glm4_lce_forward)
|
1620
|
-
assert inspect.getsource(dummy_model_instance.
|
1621
|
-
|
1622
|
-
)
|
1623
|
-
for layer in dummy_model_instance.language_model.layers:
|
1620
|
+
assert inspect.getsource(dummy_model_instance.model.norm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1621
|
+
for layer in dummy_model_instance.model.layers:
|
1624
1622
|
assert inspect.getsource(layer.mlp.forward) != inspect.getsource(LigerPhi3SwiGLUMLP.forward)
|
1625
1623
|
assert inspect.getsource(layer.input_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1626
1624
|
assert inspect.getsource(layer.post_attention_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1627
1625
|
assert inspect.getsource(layer.post_self_attn_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1628
1626
|
assert inspect.getsource(layer.post_mlp_layernorm.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1629
|
-
for vision_block in dummy_model_instance.visual.blocks:
|
1630
|
-
assert inspect.getsource(vision_block.norm1.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1631
|
-
assert inspect.getsource(vision_block.norm2.forward) != inspect.getsource(LigerRMSNorm.forward)
|
1632
|
-
assert inspect.getsource(vision_block.mlp.forward) != inspect.getsource(LigerSwiGLUMLP.forward)
|
1633
1627
|
|
1634
1628
|
# Test applying kernels to the model instance
|
1635
1629
|
_apply_liger_kernel_to_instance(model=dummy_model_instance)
|
1636
1630
|
|
1637
1631
|
# Check that the model's instance variables were correctly patched with Liger modules
|
1638
|
-
assert inspect.getsource(dummy_model_instance.forward)
|
1639
|
-
assert inspect.getsource(dummy_model_instance.
|
1640
|
-
|
1641
|
-
)
|
1642
|
-
for layer in dummy_model_instance.language_model.layers:
|
1632
|
+
assert inspect.getsource(dummy_model_instance.forward) == inspect.getsource(glm4_lce_forward)
|
1633
|
+
assert inspect.getsource(dummy_model_instance.model.norm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1634
|
+
for layer in dummy_model_instance.model.layers:
|
1643
1635
|
assert inspect.getsource(layer.mlp.forward) == inspect.getsource(LigerPhi3SwiGLUMLP.forward)
|
1644
1636
|
assert inspect.getsource(layer.input_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1645
1637
|
assert inspect.getsource(layer.post_attention_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1646
1638
|
assert inspect.getsource(layer.post_self_attn_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1647
1639
|
assert inspect.getsource(layer.post_mlp_layernorm.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1648
|
-
for vision_block in dummy_model_instance.visual.blocks:
|
1649
|
-
assert inspect.getsource(vision_block.norm1.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1650
|
-
assert inspect.getsource(vision_block.norm2.forward) == inspect.getsource(LigerRMSNorm.forward)
|
1651
|
-
assert inspect.getsource(vision_block.mlp.forward) == inspect.getsource(LigerSwiGLUMLP.forward)
|
1652
1640
|
|
1653
1641
|
try:
|
1654
1642
|
print(dummy_model_instance)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.2.dev20250822031319 → liger_kernel_nightly-0.6.2.dev20250823034010}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|