liger-kernel-nightly 0.6.4.dev20251201192513__tar.gz → 0.6.4.dev20251202094519__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/setup.py +20 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/cross_entropy.py +2 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/dyt.py +5 -2
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/fused_add_rms_norm.py +5 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/geglu.py +2 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/group_norm.py +2 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/layer_norm.py +2 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/poly_norm.py +5 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/rms_norm.py +5 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/utils.py +2 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/gemma3.py +1 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/paligemma.py +1 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/utils.py +25 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/conftest.py +4 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/utils.py +5 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/Makefile +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_tiled_mlp.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/tiled_mlp.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/experimental/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/llama4_rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/falcon_h1.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/glm4v.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/glm4v_moe.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/hunyuan_v1.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/internvl.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/olmo3.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/output_classes.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen3_next.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen3_vl.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/qwen3_vl_moe.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/model/smolvlm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/tiled_mlp.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/HuggingFaceTB/SmolVLM2-256M-Video-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/OpenGVLab/InternVL3-1B-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/Qwen/Qwen3-VL-4B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_poly_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_tiled_mlp.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/test/triton/test_triton_monkey_patch.py +0 -0
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "liger_kernel_nightly"
|
|
7
|
-
version = "0.6.4.dev20251201192513"
|
|
7
|
+
version = "0.6.4.dev20251202094519"
|
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
|
@@ -24,6 +24,8 @@ def get_default_dependencies():
|
|
|
24
24
|
return [
|
|
25
25
|
"torch>=2.6.0",
|
|
26
26
|
]
|
|
27
|
+
elif platform == "npu":
|
|
28
|
+
return ["torch_npu==2.6.0", "triton-ascend"]
|
|
27
29
|
|
|
28
30
|
|
|
29
31
|
def get_optional_dependencies():
|
|
@@ -67,7 +69,21 @@ def is_xpu_available():
|
|
|
67
69
|
return False
|
|
68
70
|
|
|
69
71
|
|
|
70
|
-
def get_platform() -> Literal["cuda", "rocm", "cpu", "xpu"]:
|
|
72
|
+
def is_ascend_available() -> bool:
|
|
73
|
+
"""Best-effort Ascend detection.
|
|
74
|
+
|
|
75
|
+
Checks for common Ascend environment variables and a possible `npu-smi`
|
|
76
|
+
utility if present.
|
|
77
|
+
"""
|
|
78
|
+
try:
|
|
79
|
+
subprocess.run(["npu-smi", "info"], check=True)
|
|
80
|
+
return True
|
|
81
|
+
except (subprocess.SubprocessError, FileNotFoundError):
|
|
82
|
+
pass
|
|
83
|
+
return False
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
def get_platform() -> Literal["cuda", "rocm", "cpu", "xpu", "npu"]:
|
|
71
87
|
"""
|
|
72
88
|
Detect whether the system has NVIDIA or AMD GPU without torch dependency.
|
|
73
89
|
"""
|
|
@@ -86,6 +102,9 @@ def get_platform() -> Literal["cuda", "rocm", "cpu", "xpu"]:
|
|
|
86
102
|
if is_xpu_available():
|
|
87
103
|
print("Intel GPU detected")
|
|
88
104
|
return "xpu"
|
|
105
|
+
elif is_ascend_available():
|
|
106
|
+
print("Ascend NPU detected")
|
|
107
|
+
return "npu"
|
|
89
108
|
else:
|
|
90
109
|
print("No GPU detected")
|
|
91
110
|
return "cpu"
|
|
@@ -10,8 +10,9 @@ from liger_kernel.ops.utils import compare_version
|
|
|
10
10
|
from liger_kernel.ops.utils import element_mul_kernel
|
|
11
11
|
from liger_kernel.ops.utils import is_hip
|
|
12
12
|
from liger_kernel.utils import infer_device
|
|
13
|
+
from liger_kernel.utils import is_npu_available
|
|
13
14
|
|
|
14
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
15
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
15
16
|
try:
|
|
16
17
|
# typical import path with dispatch available
|
|
17
18
|
from triton.language.extra.libdevice import tanh
|
|
@@ -7,8 +7,10 @@ import triton.language as tl
|
|
|
7
7
|
from liger_kernel.ops.utils import compare_version
|
|
8
8
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
9
9
|
from liger_kernel.ops.utils import infer_device
|
|
10
|
+
from liger_kernel.utils import get_npu_multi_processor_count
|
|
11
|
+
from liger_kernel.utils import is_npu_available
|
|
10
12
|
|
|
11
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
13
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
12
14
|
try:
|
|
13
15
|
# typical import path with dispatch available
|
|
14
16
|
from triton.language.extra.libdevice import tanh
|
|
@@ -125,7 +127,8 @@ def liger_dyt_bwd(dy, x, alpha, gamma, beta):
|
|
|
125
127
|
NUM_SMS = torch.cuda.get_device_properties(x.device).multi_processor_count
|
|
126
128
|
elif device == "xpu":
|
|
127
129
|
NUM_SMS = torch.xpu.get_device_properties(x.device).gpu_subslice_count
|
|
128
|
-
|
|
130
|
+
elif device == "npu":
|
|
131
|
+
NUM_SMS = get_npu_multi_processor_count()
|
|
129
132
|
da = torch.zeros(NUM_SMS, triton.cdiv(N, 512), dtype=torch.float32, device=x.device)
|
|
130
133
|
dg = torch.empty(NUM_SMS, N, dtype=torch.float32, device=x.device)
|
|
131
134
|
db = torch.empty(NUM_SMS, N, dtype=torch.float32, device=x.device) if HAVE_BETA else None
|
|
@@ -9,8 +9,10 @@ from liger_kernel.ops.utils import calculate_settings
|
|
|
9
9
|
from liger_kernel.ops.utils import compare_version
|
|
10
10
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
11
11
|
from liger_kernel.ops.utils import torch_to_triton_dtype
|
|
12
|
+
from liger_kernel.utils import get_npu_multi_processor_count
|
|
13
|
+
from liger_kernel.utils import is_npu_available
|
|
12
14
|
|
|
13
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
15
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
14
16
|
try:
|
|
15
17
|
# typical import path with dispatch available
|
|
16
18
|
from triton.language.extra.libdevice import rsqrt
|
|
@@ -293,6 +295,8 @@ def fused_add_rms_norm_backward(dY, dS_out, S, W, RSTD, offset, casting_mode, BL
|
|
|
293
295
|
sm_count = torch.cuda.get_device_properties(S.device).multi_processor_count
|
|
294
296
|
elif S.device.type == "xpu":
|
|
295
297
|
sm_count = torch.xpu.get_device_properties(S.device).gpu_eu_count
|
|
298
|
+
elif S.device.type == "npu":
|
|
299
|
+
sm_count = get_npu_multi_processor_count()
|
|
296
300
|
|
|
297
301
|
# fp32 for numerical stability especially.
|
|
298
302
|
_dW = torch.empty((sm_count, n_cols), dtype=torch.float32, device=W.device)
|
|
@@ -7,8 +7,9 @@ import triton.language as tl
|
|
|
7
7
|
from liger_kernel.ops.utils import calculate_settings
|
|
8
8
|
from liger_kernel.ops.utils import compare_version
|
|
9
9
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
10
|
+
from liger_kernel.utils import is_npu_available
|
|
10
11
|
|
|
11
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
12
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
12
13
|
try:
|
|
13
14
|
# typical import path with dispatch available
|
|
14
15
|
from triton.language.extra.libdevice import tanh
|
|
@@ -6,8 +6,9 @@ import triton.language as tl
|
|
|
6
6
|
|
|
7
7
|
from liger_kernel.ops.utils import compare_version
|
|
8
8
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
9
|
+
from liger_kernel.utils import is_npu_available
|
|
9
10
|
|
|
10
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
11
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
11
12
|
try:
|
|
12
13
|
# typical import path with dispatch available
|
|
13
14
|
from triton.language.extra.libdevice import rsqrt
|
|
@@ -8,8 +8,9 @@ import triton.language as tl
|
|
|
8
8
|
from liger_kernel.ops.utils import calculate_settings
|
|
9
9
|
from liger_kernel.ops.utils import compare_version
|
|
10
10
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
11
|
+
from liger_kernel.utils import is_npu_available
|
|
11
12
|
|
|
12
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
13
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
13
14
|
try:
|
|
14
15
|
# typical import path with dispatch available
|
|
15
16
|
from triton.language.extra.libdevice import rsqrt
|
|
@@ -7,8 +7,10 @@ import triton.language as tl
|
|
|
7
7
|
from liger_kernel.ops.utils import calculate_settings
|
|
8
8
|
from liger_kernel.ops.utils import compare_version
|
|
9
9
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
10
|
+
from liger_kernel.utils import get_npu_multi_processor_count
|
|
11
|
+
from liger_kernel.utils import is_npu_available
|
|
10
12
|
|
|
11
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
13
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
12
14
|
try:
|
|
13
15
|
from triton.language.extra.libdevice import rsqrt
|
|
14
16
|
except ModuleNotFoundError:
|
|
@@ -290,6 +292,8 @@ def poly_norm_backward(dY, X, W, RSTD, BLOCK_SIZE, num_warps, in_place):
|
|
|
290
292
|
sm_count = torch.cuda.get_device_properties(X.device).multi_processor_count
|
|
291
293
|
elif X.device.type == "xpu":
|
|
292
294
|
sm_count = torch.xpu.get_device_properties(X.device).gpu_eu_count
|
|
295
|
+
elif X.device.type == "npu":
|
|
296
|
+
sm_count = get_npu_multi_processor_count()
|
|
293
297
|
|
|
294
298
|
# Allocate or reuse gradients
|
|
295
299
|
if in_place is True:
|
|
@@ -21,8 +21,10 @@ from liger_kernel.ops.utils import calculate_settings
|
|
|
21
21
|
from liger_kernel.ops.utils import compare_version
|
|
22
22
|
from liger_kernel.ops.utils import ensure_contiguous
|
|
23
23
|
from liger_kernel.ops.utils import torch_to_triton_dtype
|
|
24
|
+
from liger_kernel.utils import get_npu_multi_processor_count
|
|
25
|
+
from liger_kernel.utils import is_npu_available
|
|
24
26
|
|
|
25
|
-
if compare_version("triton", operator.ge, "3.0.0"):
|
|
27
|
+
if compare_version("triton", operator.ge, "3.0.0") and not is_npu_available():
|
|
26
28
|
try:
|
|
27
29
|
# typical import path with dispatch available
|
|
28
30
|
from triton.language.extra.libdevice import rsqrt
|
|
@@ -450,6 +452,8 @@ def rms_norm_backward(dY, X, W, RSTD, offset, casting_mode, BLOCK_SIZE, num_warp
|
|
|
450
452
|
sm_count = torch.cuda.get_device_properties(X.device).multi_processor_count
|
|
451
453
|
elif X.device.type == "xpu":
|
|
452
454
|
sm_count = torch.xpu.get_device_properties(X.device).gpu_eu_count
|
|
455
|
+
elif X.device.type == "npu":
|
|
456
|
+
sm_count = get_npu_multi_processor_count()
|
|
453
457
|
|
|
454
458
|
# fp32 for numerical stability especially.
|
|
455
459
|
_dW = torch.empty((sm_count, n_cols), dtype=torch.float32, device=W.device)
|
|
@@ -78,6 +78,8 @@ def get_amp_custom_fwd_bwd() -> Callable:
|
|
|
78
78
|
functools.partial(torch.amp.custom_fwd, device_type=device),
|
|
79
79
|
functools.partial(torch.amp.custom_bwd, device_type=device),
|
|
80
80
|
)
|
|
81
|
+
if hasattr(torch, "npu") and getattr(torch.npu, "amp", None) is not None:
|
|
82
|
+
return torch.npu.amp.custom_fwd, torch.npu.amp.custom_bwd
|
|
81
83
|
return torch.cuda.amp.custom_fwd, torch.cuda.amp.custom_bwd
|
|
82
84
|
|
|
83
85
|
|
|
@@ -18,12 +18,37 @@ def infer_device():
|
|
|
18
18
|
"""
|
|
19
19
|
if torch.cuda.is_available(): # Works for both Nvidia and AMD
|
|
20
20
|
return "cuda"
|
|
21
|
+
# Use Ascend NPU if available (torch.npu)
|
|
22
|
+
elif is_npu_available():
|
|
23
|
+
return "npu"
|
|
24
|
+
# XPU (Intel) if available
|
|
21
25
|
elif torch.xpu.is_available():
|
|
22
26
|
return "xpu"
|
|
23
27
|
else:
|
|
24
28
|
return "cpu"
|
|
25
29
|
|
|
26
30
|
|
|
31
|
+
def is_npu_available() -> bool:
|
|
32
|
+
"""Detect Ascend NPU availability."""
|
|
33
|
+
try:
|
|
34
|
+
from transformers.utils import is_torch_npu_available
|
|
35
|
+
|
|
36
|
+
return is_torch_npu_available()
|
|
37
|
+
except Exception:
|
|
38
|
+
return False
|
|
39
|
+
|
|
40
|
+
|
|
41
|
+
def get_npu_multi_processor_count() -> int:
|
|
42
|
+
"""Return a heuristic multi-processor count for NPU."""
|
|
43
|
+
if is_npu_available():
|
|
44
|
+
NPU_MULTI_PROCESSOR_COUNT = 48
|
|
45
|
+
dev_props = torch.npu.get_device_properties()
|
|
46
|
+
# The vector_core_num attribute is supported in the torch.npu v7.2.0 release version.
|
|
47
|
+
return dev_props.vector_core_num if hasattr(dev_props, "vector_core_num") else NPU_MULTI_PROCESSOR_COUNT
|
|
48
|
+
# Reasonable default to avoid division by zero
|
|
49
|
+
return 1
|
|
50
|
+
|
|
51
|
+
|
|
27
52
|
def transformers_version_dispatch(
|
|
28
53
|
required_version: str,
|
|
29
54
|
before_fn,
|
|
@@ -1,11 +1,15 @@
|
|
|
1
1
|
import pytest
|
|
2
2
|
import torch
|
|
3
3
|
|
|
4
|
+
from liger_kernel.utils import is_npu_available
|
|
5
|
+
|
|
4
6
|
|
|
5
7
|
@pytest.fixture(autouse=True)
|
|
6
8
|
def clear_gpu_cache():
|
|
7
9
|
yield
|
|
8
10
|
if torch.cuda.is_available():
|
|
9
11
|
torch.cuda.empty_cache()
|
|
12
|
+
elif is_npu_available():
|
|
13
|
+
torch.npu.empty_cache()
|
|
10
14
|
elif torch.xpu.is_available():
|
|
11
15
|
torch.xpu.empty_cache()
|
|
@@ -55,6 +55,9 @@ def set_seed(seed=42):
|
|
|
55
55
|
# If you are using XPU
|
|
56
56
|
torch.xpu.manual_seed(seed)
|
|
57
57
|
torch.xpu.manual_seed_all(seed)
|
|
58
|
+
elif device == "npu":
|
|
59
|
+
torch.npu.manual_seed(seed)
|
|
60
|
+
torch.npu.manual_seed_all(seed)
|
|
58
61
|
|
|
59
62
|
# Python hash seed
|
|
60
63
|
os.environ["PYTHONHASHSEED"] = str(seed)
|
|
@@ -258,6 +261,8 @@ def supports_bfloat16():
|
|
|
258
261
|
return torch.cuda.get_device_capability() >= (8, 0) # Ampere and newer
|
|
259
262
|
elif device == "xpu":
|
|
260
263
|
return True
|
|
264
|
+
elif device == "npu":
|
|
265
|
+
return True
|
|
261
266
|
else:
|
|
262
267
|
return False
|
|
263
268
|
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{liger_kernel_nightly-0.6.4.dev20251201192513 → liger_kernel_nightly-0.6.4.dev20251202094519}/NOTICE
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|