liger-kernel-nightly 0.5.10.dev20250526105714__tar.gz → 0.5.10.dev20250526154218__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.gitignore +1 -1
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/Makefile +1 -1
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_qwen2vl_mrope.py +3 -3
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/.idea/workspace.xml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/setup.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/gema3_rms.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.10.dev20250526105714 → liger_kernel_nightly-0.5.10.dev20250526154218}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.10.dev20250526105714"
|
7
|
+
version = "0.5.10.dev20250526154218"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -4,7 +4,7 @@ import torch
|
|
4
4
|
from test.utils import supports_bfloat16
|
5
5
|
|
6
6
|
try:
|
7
|
-
from transformers.models.qwen2_vl.configuration_qwen2_vl import
|
7
|
+
from transformers.models.qwen2_vl.configuration_qwen2_vl import Qwen2VLTextConfig
|
8
8
|
from transformers.models.qwen2_vl.modeling_qwen2_vl import Qwen2VLRotaryEmbedding
|
9
9
|
from transformers.models.qwen2_vl.modeling_qwen2_vl import apply_multimodal_rotary_pos_emb
|
10
10
|
|
@@ -45,7 +45,7 @@ device = infer_device()
|
|
45
45
|
],
|
46
46
|
)
|
47
47
|
def test_correctness(bsz, seq_len, num_q_heads, num_kv_heads, head_dim, mrope_section, dtype, atol, rtol):
|
48
|
-
rotary_emb = Qwen2VLRotaryEmbedding(config=
|
48
|
+
rotary_emb = Qwen2VLRotaryEmbedding(config=Qwen2VLTextConfig(head_dim=head_dim), device=device)
|
49
49
|
|
50
50
|
_tensor_q = torch.randn((bsz, seq_len, num_q_heads, head_dim), device=device).transpose(1, 2).to(dtype)
|
51
51
|
|
@@ -105,7 +105,7 @@ def test_functional_correctness(bsz, seq_len, num_q_heads, num_kv_heads, head_di
|
|
105
105
|
k1 = _k.clone().requires_grad_(True)
|
106
106
|
k2 = _k.clone().requires_grad_(True)
|
107
107
|
|
108
|
-
rotary_emb = Qwen2VLRotaryEmbedding(config=
|
108
|
+
rotary_emb = Qwen2VLRotaryEmbedding(config=Qwen2VLTextConfig(head_dim=head_dim), device=device)
|
109
109
|
|
110
110
|
pos_ids = torch.arange(seq_len * 3 * bsz, device=device, dtype=torch.long).view(3, bsz, seq_len)
|
111
111
|
cos, sin = rotary_emb(k1, pos_ids)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|