liger-kernel-nightly 0.5.9.dev20250504194613__tar.gz → 0.5.9.dev20250505192105__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/benchmarks_visualizer.py +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/training_multimodal.py +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/train.py +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/bf16/test_mini_models.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/bf16/test_mini_models_multimodal.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/bf16/test_mini_models_with_logits.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/fp32/test_mini_models.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/fp32/test_mini_models_multimodal.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/fp32/test_mini_models_with_logits.py +0 -1
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/.gitignore +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/LICENSE +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/Makefile +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/NOTICE +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/index.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/docs/license.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/setup.cfg +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/setup.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/gema3_rms.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/phi3.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/test/utils.py +0 -0
@@ -123,7 +123,7 @@ def plot_data(df: pd.DataFrame, config: VisualizationsConfig):
|
|
123
123
|
lines = ax.get_lines()
|
124
124
|
colors = [line.get_color() for line in lines]
|
125
125
|
|
126
|
-
for (_, group_data), color in zip(df.groupby("kernel_provider"), colors, strict=False):
|
126
|
+
for (_, group_data), color in zip(df.groupby("kernel_provider"), colors):
|
127
127
|
# for i, row in group_data.iterrows():
|
128
128
|
y_error_lower = group_data["y_value_50"] - group_data["y_value_20"]
|
129
129
|
y_error_upper = group_data["y_value_80"] - group_data["y_value_50"]
|
@@ -68,7 +68,7 @@ def construct_model_and_processor(model_name: str, use_liger: bool) -> torch.nn.
|
|
68
68
|
def _validate_and_extract_the_cauldron(examples) -> dict[str, list]:
|
69
69
|
batch_texts = []
|
70
70
|
batch_images = []
|
71
|
-
for images, texts in zip(examples["images"], examples["texts"], strict=False):
|
71
|
+
for images, texts in zip(examples["images"], examples["texts"]):
|
72
72
|
if not images:
|
73
73
|
raise ValueError("No image found in example from the_cauldron dataset")
|
74
74
|
if len(images) > 1:
|
@@ -175,7 +175,7 @@ def preprocess(
|
|
175
175
|
input_ids = encoding.input_ids
|
176
176
|
|
177
177
|
# Mask targets. Only compute loss on the assistant outputs.
|
178
|
-
for conv_index, (conversation, target, prompt) in enumerate(zip(conversations, targets, prompts, strict=False)):
|
178
|
+
for conv_index, (conversation, target, prompt) in enumerate(zip(conversations, targets, prompts)):
|
179
179
|
# print(conv_index)
|
180
180
|
for turn in conversation:
|
181
181
|
if turn["role"] == "assistant":
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.5.9.dev20250504194613"
|
7
|
+
version = "0.5.9.dev20250505192105"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -222,7 +222,6 @@ class LigerFusedLinearPreferenceBase(torch.autograd.Function):
|
|
222
222
|
(_ref_chosen_input_chunks if use_ref_model else [None] * len(_chosen_input_chunks)),
|
223
223
|
(_ref_rejected_input_chunks if use_ref_model else [None] * len(_rejected_input_chunks)),
|
224
224
|
(_chosen_nll_target_chunks if nll_target is not None else [None] * len(_chosen_input_chunks)),
|
225
|
-
strict=False,
|
226
225
|
):
|
227
226
|
input_chunk = torch.cat([chosen_input_chunk, rejected_input_chunk], dim=0)
|
228
227
|
ref_input_chunk = (
|
@@ -1130,6 +1130,5 @@ def test_mini_model(
|
|
1130
1130
|
for expected_param, actual_param in zip(
|
1131
1131
|
expected_output["model"].named_parameters(),
|
1132
1132
|
actual_output["model"].named_parameters(),
|
1133
|
-
strict=False,
|
1134
1133
|
):
|
1135
1134
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
@@ -929,6 +929,5 @@ def test_mini_model_multimodal(
|
|
929
929
|
for expected_param, actual_param in zip(
|
930
930
|
expected_output["model"].named_parameters(),
|
931
931
|
actual_output["model"].named_parameters(),
|
932
|
-
strict=False,
|
933
932
|
):
|
934
933
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
@@ -1129,6 +1129,5 @@ def test_mini_model(
|
|
1129
1129
|
for expected_param, actual_param in zip(
|
1130
1130
|
expected_output["model"].named_parameters(),
|
1131
1131
|
actual_output["model"].named_parameters(),
|
1132
|
-
strict=False,
|
1133
1132
|
):
|
1134
1133
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
@@ -1000,6 +1000,5 @@ def test_mini_model(
|
|
1000
1000
|
for expected_param, actual_param in zip(
|
1001
1001
|
expected_output["model"].named_parameters(),
|
1002
1002
|
actual_output["model"].named_parameters(),
|
1003
|
-
strict=False,
|
1004
1003
|
):
|
1005
1004
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
@@ -910,6 +910,5 @@ def test_mini_model_multimodal(
|
|
910
910
|
for expected_param, actual_param in zip(
|
911
911
|
expected_output["model"].named_parameters(),
|
912
912
|
actual_output["model"].named_parameters(),
|
913
|
-
strict=False,
|
914
913
|
):
|
915
914
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
@@ -1000,6 +1000,5 @@ def test_mini_model(
|
|
1000
1000
|
for expected_param, actual_param in zip(
|
1001
1001
|
expected_output["model"].named_parameters(),
|
1002
1002
|
actual_output["model"].named_parameters(),
|
1003
|
-
strict=False,
|
1004
1003
|
):
|
1005
1004
|
assert_verbose_allclose(expected_param[1], actual_param[1], atol=param_atol, rtol=param_rtol)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.5.9.dev20250504194613 → liger_kernel_nightly-0.5.9.dev20250505192105}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|