liger-kernel-nightly 0.6.3.dev20251105190428__tar.gz → 0.6.3.dev20251105224413__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/monkey_patch.py +4 -2
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/fp32/test_mini_models_multimodal.py +3 -3
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_monkey_patch.py +8 -8
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/Makefile +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/setup.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/experimental/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/falcon_h1.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/glm4v.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/glm4v_moe.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/internvl.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen3_next.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen3_vl.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/qwen3_vl_moe.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/model/smolvlm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/HuggingFaceTB/SmolVLM2-256M-Video-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/OpenGVLab/InternVL3-1B-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/Qwen/Qwen3-VL-4B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/test/utils.py +0 -0
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "liger_kernel_nightly"
|
|
7
|
-
version = "0.6.3.dev20251105190428"
|
|
7
|
+
version = "0.6.3.dev20251105224413"
|
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
|
@@ -30,8 +30,6 @@ from liger_kernel.transformers.model.mixtral import lce_forward_deprecated as mi
|
|
|
30
30
|
from liger_kernel.transformers.model.phi3 import lce_forward as phi3_lce_forward
|
|
31
31
|
from liger_kernel.transformers.model.qwen2 import lce_forward as qwen2_lce_forward
|
|
32
32
|
from liger_kernel.transformers.model.qwen2 import lce_forward_deprecated as qwen2_lce_forward_deprecated
|
|
33
|
-
from liger_kernel.transformers.model.qwen3_vl import lce_forward as qwen3_vl_lce_forward
|
|
34
|
-
from liger_kernel.transformers.model.qwen3_vl_moe import lce_forward as qwen3_vl_moe_lce_forward
|
|
35
33
|
from liger_kernel.transformers.model.smollm3 import lce_forward as smollm3_lce_forward
|
|
36
34
|
from liger_kernel.transformers.qwen2vl_mrope import liger_multimodal_rotary_pos_emb
|
|
37
35
|
from liger_kernel.transformers.rms_norm import LigerRMSNorm
|
|
@@ -1679,6 +1677,8 @@ def apply_liger_kernel_to_qwen3_vl(
|
|
|
1679
1677
|
from transformers.models.qwen3_vl.modeling_qwen3_vl import Qwen3VLModel
|
|
1680
1678
|
from transformers.models.qwen3_vl.modeling_qwen3_vl import Qwen3VLTextModel
|
|
1681
1679
|
|
|
1680
|
+
from liger_kernel.transformers.model.qwen3_vl import lce_forward as qwen3_vl_lce_forward
|
|
1681
|
+
|
|
1682
1682
|
if rope:
|
|
1683
1683
|
modeling_qwen3_vl.apply_rotary_pos_emb = liger_rotary_pos_emb_with_cast
|
|
1684
1684
|
modeling_qwen3_vl.apply_rotary_pos_emb_vision = liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
@@ -1752,6 +1752,8 @@ def apply_liger_kernel_to_qwen3_vl_moe(
|
|
|
1752
1752
|
from transformers.models.qwen3_vl_moe.modeling_qwen3_vl_moe import Qwen3VLMoeModel
|
|
1753
1753
|
from transformers.models.qwen3_vl_moe.modeling_qwen3_vl_moe import Qwen3VLMoeTextModel
|
|
1754
1754
|
|
|
1755
|
+
from liger_kernel.transformers.model.qwen3_vl_moe import lce_forward as qwen3_vl_moe_lce_forward
|
|
1756
|
+
|
|
1755
1757
|
if rope:
|
|
1756
1758
|
modeling_qwen3_vl_moe.apply_rotary_pos_emb = liger_rotary_pos_emb_with_cast
|
|
1757
1759
|
modeling_qwen3_vl_moe.apply_rotary_pos_emb_vision = liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
@@ -1001,8 +1001,8 @@ def test_apply_liger_kernel_to_instance_for_qwen3_vl_moe_text():
|
|
|
1001
1001
|
def test_qwen3_vl_rope_hooks_applied():
|
|
1002
1002
|
# Ensure any monkey patching is cleaned up for subsequent tests
|
|
1003
1003
|
with patch("transformers.models.qwen3_vl.modeling_qwen3_vl") as modeling_mod:
|
|
1004
|
-
from liger_kernel.transformers.monkey_patch import
|
|
1005
|
-
from liger_kernel.transformers.monkey_patch import
|
|
1004
|
+
from liger_kernel.transformers.monkey_patch import liger_rotary_pos_emb_with_cast
|
|
1005
|
+
from liger_kernel.transformers.monkey_patch import liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
1006
1006
|
|
|
1007
1007
|
# Before applying, make sure attributes exist but are not the liger implementations
|
|
1008
1008
|
setattr(modeling_mod, "apply_rotary_pos_emb", object())
|
|
@@ -1010,16 +1010,16 @@ def test_qwen3_vl_rope_hooks_applied():
|
|
|
1010
1010
|
|
|
1011
1011
|
_apply_liger_kernel("qwen3_vl")
|
|
1012
1012
|
|
|
1013
|
-
assert modeling_mod.apply_rotary_pos_emb is
|
|
1014
|
-
assert modeling_mod.apply_rotary_pos_emb_vision is
|
|
1013
|
+
assert modeling_mod.apply_rotary_pos_emb is liger_rotary_pos_emb_with_cast
|
|
1014
|
+
assert modeling_mod.apply_rotary_pos_emb_vision is liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
1015
1015
|
|
|
1016
1016
|
|
|
1017
1017
|
@pytest.mark.skipif(not is_qwen3_vl_moe_available(), reason="qwen3_vl_moe module not available")
|
|
1018
1018
|
def test_qwen3_vl_moe_rope_hooks_applied():
|
|
1019
1019
|
# Ensure any monkey patching is cleaned up for subsequent tests
|
|
1020
1020
|
with patch("transformers.models.qwen3_vl_moe.modeling_qwen3_vl_moe") as modeling_mod:
|
|
1021
|
-
from liger_kernel.transformers.monkey_patch import
|
|
1022
|
-
from liger_kernel.transformers.monkey_patch import
|
|
1021
|
+
from liger_kernel.transformers.monkey_patch import liger_rotary_pos_emb_with_cast
|
|
1022
|
+
from liger_kernel.transformers.monkey_patch import liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
1023
1023
|
|
|
1024
1024
|
# Before applying, make sure attributes exist but are not the liger implementations
|
|
1025
1025
|
setattr(modeling_mod, "apply_rotary_pos_emb", object())
|
|
@@ -1027,8 +1027,8 @@ def test_qwen3_vl_moe_rope_hooks_applied():
|
|
|
1027
1027
|
|
|
1028
1028
|
_apply_liger_kernel("qwen3_vl_moe")
|
|
1029
1029
|
|
|
1030
|
-
assert modeling_mod.apply_rotary_pos_emb is
|
|
1031
|
-
assert modeling_mod.apply_rotary_pos_emb_vision is
|
|
1030
|
+
assert modeling_mod.apply_rotary_pos_emb is liger_rotary_pos_emb_with_cast
|
|
1031
|
+
assert modeling_mod.apply_rotary_pos_emb_vision is liger_rotary_pos_emb_with_cast_and_leading_batch
|
|
1032
1032
|
|
|
1033
1033
|
|
|
1034
1034
|
@pytest.mark.skipif(not is_falcon_h1_available(), reason="falcon_h1 module not available")
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{liger_kernel_nightly-0.6.3.dev20251105190428 → liger_kernel_nightly-0.6.3.dev20251105224413}/NOTICE
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|