liger-kernel-nightly 0.6.1.dev20250730201750__tar.gz → 0.6.1.dev20250805235815__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/PKG-INFO +2 -2
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/README.md +1 -1
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/pyproject.toml +1 -1
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/phi3.py +0 -14
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel_nightly.egg-info/PKG-INFO +2 -2
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/fp32/test_mini_models_multimodal.py +1 -1
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/pull_request_template.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/amd-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/benchmark.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/docs.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/intel-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/nvi-ci.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/publish-nightly.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.github/workflows/publish-release.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/.gitignore +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/Makefile +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/benchmarks_visualizer.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/data/all_benchmark_data.csv +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_distill_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/benchmark_tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/benchmark/scripts/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/dev/fmt-requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/dev/modal/benchmarks.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/dev/modal/tests.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/dev/modal/tests_bwd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/Examples.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/Getting-Started.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/High-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/Low-Level-APIs.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/acknowledgement.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/contributing.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/banner.GIF +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/compose.gif +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/e2e-memory.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/e2e-tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/logo-banner.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/patch.gif +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/images/post-training.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/index.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/docs/license.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/alignment/accelerate_config.yaml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/alignment/run_orpo.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/callback.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/config/fsdp_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/gemma_7b_mem.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/gemma_7b_tp.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/llama_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/llama_tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/img/qwen_tps.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/launch_on_modal.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/run_benchmarks.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/run_gemma.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/run_llama.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/run_qwen.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/run_qwen2_vl.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/training.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/huggingface/training_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/lightning/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/lightning/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/lightning/training.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/callback.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/medusa_util.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/requirements.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/examples/medusa/train.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/licenses/LICENSE-Apache-2.0 +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/licenses/LICENSE-MIT-AutoAWQ +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/licenses/LICENSE-MIT-llmc +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/licenses/LICENSE-MIT-triton +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/mkdocs.yml +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/setup.cfg +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/setup.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/README.md +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/cosine_similarity_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/functional.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/env_report.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/ops/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/auto_model.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/fsdp.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/functional.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/gemma.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/gemma2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/gemma3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/glm4.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/llama.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/llama4.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/llava.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/mistral.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/mixtral.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/mllama.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/olmo2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/paligemma.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/qwen2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/qwen3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/model/smollm3.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/transformers/tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/triton/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/triton/monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel/utils.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_cosine_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_cpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_dpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_jsd_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_kto_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_orpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/chunked_loss/test_simpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/conftest.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/bf16/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/bf16/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/fp32/__init__.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/fp32/test_mini_models.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/fake_configs/meta-llama/Llama-4-Scout-17B-16E-Instruct/tokenizer_config.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/tiny_shakespeare.txt +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_auto_model.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_dyt.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_embedding.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_flex_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_fused_add_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_fused_linear_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_fused_neighborhood_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_geglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_group_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_grpo_loss.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_jsd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_kl_div.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_layer_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_mm_int8int2.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_multi_token_attention.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_qwen2vl_mrope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_rms_norm.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_rope.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_softmax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_sparsemax.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_swiglu.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_trainer_integration.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_transformers.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/transformers/test_tvd.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/triton/test_triton_monkey_patch.py +0 -0
- {liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/test/utils.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.6.1.dev20250730201750
|
3
|
+
Version: 0.6.1.dev20250805235815
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -397,7 +397,7 @@ loss.backward()
|
|
397
397
|
</a>
|
398
398
|
</div>
|
399
399
|
<div style="display: block;">
|
400
|
-
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/
|
400
|
+
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml">
|
401
401
|
<img src="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml/badge.svg?event=schedule" alt="Build">
|
402
402
|
</a>
|
403
403
|
</div>
|
@@ -348,7 +348,7 @@ loss.backward()
|
|
348
348
|
</a>
|
349
349
|
</div>
|
350
350
|
<div style="display: block;">
|
351
|
-
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/
|
351
|
+
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml">
|
352
352
|
<img src="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml/badge.svg?event=schedule" alt="Build">
|
353
353
|
</a>
|
354
354
|
</div>
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "liger_kernel_nightly"
|
7
|
-
version = "0.6.1.dev20250730201750"
|
7
|
+
version = "0.6.1.dev20250805235815"
|
8
8
|
description = "Efficient Triton kernels for LLM Training"
|
9
9
|
urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
|
10
10
|
readme = { file = "README.md", content-type = "text/markdown" }
|
@@ -180,20 +180,6 @@ def lce_forward(
|
|
180
180
|
'This is an example script .\n Certainly! Below is a sample script that demonstrates a simple task, such as calculating the sum'
|
181
181
|
```"""
|
182
182
|
|
183
|
-
from transformers.models.phi3.modeling_phi3 import logging
|
184
|
-
|
185
|
-
logger = logging.get_logger(__name__)
|
186
|
-
|
187
|
-
if (
|
188
|
-
use_cache
|
189
|
-
and self.config.rope_scaling
|
190
|
-
and cache_position is not None
|
191
|
-
and cache_position[0] == self.config.original_max_position_embeddings
|
192
|
-
):
|
193
|
-
logger.warning(
|
194
|
-
f"If you are not using the generate method, you may encounter nonsensical outputs after the {self.config.original_max_position_embeddings}th token, as the KV cache needs to be recomputed."
|
195
|
-
)
|
196
|
-
|
197
183
|
output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
|
198
184
|
output_hidden_states = (
|
199
185
|
output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: liger_kernel_nightly
|
3
|
-
Version: 0.6.1.dev20250730201750
|
3
|
+
Version: 0.6.1.dev20250805235815
|
4
4
|
Summary: Efficient Triton kernels for LLM Training
|
5
5
|
License: BSD 2-CLAUSE LICENSE
|
6
6
|
Copyright 2024 LinkedIn Corporation
|
@@ -397,7 +397,7 @@ loss.backward()
|
|
397
397
|
</a>
|
398
398
|
</div>
|
399
399
|
<div style="display: block;">
|
400
|
-
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/
|
400
|
+
<a href="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml">
|
401
401
|
<img src="https://github.com/linkedin/Liger-Kernel/actions/workflows/intel-ci.yml/badge.svg?event=schedule" alt="Build">
|
402
402
|
</a>
|
403
403
|
</div>
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{liger_kernel_nightly-0.6.1.dev20250730201750 → liger_kernel_nightly-0.6.1.dev20250805235815}/NOTICE
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|