liger-kernel-nightly 0.5.6.dev20250403190551__tar.gz → 0.5.6.dev20250403230052__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_grpo_loss.py +9 -13
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/bf16/test_mini_models_multimodal.py +2 -2
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/Makefile +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/setup.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/gema3_rms.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/test/utils.py +0 -0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.6.dev20250403190551"
|
7
|
+
version = "0.5.6.dev20250403230052"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -14,9 +14,6 @@ device = infer_device()
|
|
14
14
|
# set random seed globally
|
15
15
|
set_seed()
|
16
16
|
|
17
|
-
# reset torch compiler cache
|
18
|
-
torch.compiler.reset()
|
19
|
-
|
20
17
|
|
21
18
|
class TorchLMHeadGRPO(torch.nn.Module):
|
22
19
|
def __init__(
|
@@ -52,7 +49,7 @@ class TorchLMHeadGRPO(torch.nn.Module):
|
|
52
49
|
):
|
53
50
|
logits = x @ self.lin.weight.t()
|
54
51
|
if self.lin.bias is not None:
|
55
|
-
logits = logits + self.lin.bias
|
52
|
+
logits = logits + self.lin.bias.float()
|
56
53
|
if self.temperature != 1.0:
|
57
54
|
logits = logits / self.temperature
|
58
55
|
# Get log probabilities
|
@@ -258,10 +255,11 @@ def test_correctness(
|
|
258
255
|
|
259
256
|
# Compute per-token logps
|
260
257
|
with torch.no_grad():
|
261
|
-
|
258
|
+
logits = _input @ torch_lm_head_grpo.lin.weight.t()
|
262
259
|
if torch_lm_head_grpo.lin.bias is not None:
|
263
|
-
|
264
|
-
|
260
|
+
logits = logits + torch_lm_head_grpo.lin.bias
|
261
|
+
logits = logits / temperature
|
262
|
+
logps = F.log_softmax(logits.float(), dim=-1)
|
265
263
|
per_token_logps = logps.gather(dim=-1, index=selected_token_ids.unsqueeze(-1)).squeeze(-1)
|
266
264
|
|
267
265
|
# Create attention mask with random padding [B, T]
|
@@ -314,9 +312,8 @@ def test_correctness(
|
|
314
312
|
# Check metrics match
|
315
313
|
assert len(aux1) == len(aux2)
|
316
314
|
# aggregated metrics are unstable for bfloat16
|
317
|
-
|
318
|
-
|
319
|
-
assert_verbose_allclose(metric1, metric2, atol=atol, rtol=rtol)
|
315
|
+
for metric1, metric2 in zip(aux1, aux2):
|
316
|
+
assert_verbose_allclose(metric1, metric2, atol=atol, rtol=rtol)
|
320
317
|
|
321
318
|
# Backward pass
|
322
319
|
loss1.backward()
|
@@ -455,9 +452,8 @@ def test_functional_correctness(
|
|
455
452
|
# Check metrics match
|
456
453
|
assert len(aux1) == len(aux2)
|
457
454
|
# aggregated metrics are unstable for bfloat16
|
458
|
-
|
459
|
-
|
460
|
-
assert_verbose_allclose(metric1, metric2, atol=atol, rtol=rtol)
|
455
|
+
for metric1, metric2 in zip(aux1, aux2):
|
456
|
+
assert_verbose_allclose(metric1, metric2, atol=atol, rtol=rtol)
|
461
457
|
|
462
458
|
# Backward pass
|
463
459
|
loss1.backward()
|
@@ -876,8 +876,8 @@ def run_mini_model_multimodal(
|
|
876
876
|
torch.bfloat16,
|
877
877
|
1e-3,
|
878
878
|
1e-2,
|
879
|
-
|
880
|
-
1e-
|
879
|
+
0.25, # Increase the absolute tolerance for the logits of Gemma-3.
|
880
|
+
1e-1,
|
881
881
|
1e-2,
|
882
882
|
1e-2,
|
883
883
|
marks=[
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.5.6.dev20250403190551 → liger_kernel_nightly-0.5.6.dev20250403230052}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|