liger-kernel-nightly 0.5.10.dev20250611191801__tar.gz → 0.5.10.dev20250613192702__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (270)
  1. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/PKG-INFO +2 -1
  2. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cpo_loss.py +1 -1
  3. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cross_entropy.py +1 -1
  4. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_distill_jsd_loss.py +1 -1
  5. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dpo_loss.py +1 -1
  6. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_embedding.py +1 -1
  7. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +1 -1
  8. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_jsd.py +1 -1
  9. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_jsd.py +1 -1
  10. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kl_div.py +1 -1
  11. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kto_loss.py +1 -1
  12. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_layer_norm.py +1 -1
  13. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_orpo_loss.py +1 -1
  14. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_simpo_loss.py +1 -1
  15. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_softmax.py +1 -1
  16. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_swiglu.py +1 -1
  17. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_tvd.py +1 -1
  18. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/utils.py +1 -1
  19. liger_kernel_nightly-0.5.10.dev20250613192702/dev/modal/benchmarks.py +73 -0
  20. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/pyproject.toml +1 -1
  21. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.py +1 -0
  22. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/PKG-INFO +2 -1
  23. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/requires.txt +1 -0
  24. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_multimodal.py +3 -0
  25. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_multimodal.py +3 -0
  26. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/utils.py +7 -0
  27. liger_kernel_nightly-0.5.10.dev20250611191801/dev/modal/benchmarks.py +0 -28
  28. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
  29. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
  30. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/pull_request_template.md +0 -0
  31. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/amd-ci.yml +0 -0
  32. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/benchmark.yml +2 -2
  33. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/docs.yml +0 -0
  34. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/intel-ci.yml +0 -0
  35. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/nvi-ci.yml +0 -0
  36. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-nightly.yml +0 -0
  37. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-release.yml +0 -0
  38. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.gitignore +0 -0
  39. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/.idea/workspace.xml +0 -0
  40. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/LICENSE +0 -0
  41. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/Makefile +0 -0
  42. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/NOTICE +0 -0
  43. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/README.md +0 -0
  44. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/README.md +0 -0
  45. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/__init__.py +0 -0
  46. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/benchmarks_visualizer.py +0 -0
  47. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/data/all_benchmark_data.csv +0 -0
  48. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/__init__.py +0 -0
  49. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dyt.py +0 -0
  50. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
  51. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_geglu.py +0 -0
  52. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_group_norm.py +0 -0
  53. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
  54. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
  55. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rms_norm.py +0 -0
  56. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rope.py +0 -0
  57. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
  58. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparsemax.py +0 -0
  59. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/fmt-requirements.txt +0 -0
  60. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests.py +0 -0
  61. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests_bwd.py +0 -0
  62. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Examples.md +0 -0
  63. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Getting-Started.md +0 -0
  64. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/High-Level-APIs.md +0 -0
  65. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Low-Level-APIs.md +0 -0
  66. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/acknowledgement.md +0 -0
  67. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/contributing.md +0 -0
  68. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/banner.GIF +0 -0
  69. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/compose.gif +0 -0
  70. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-memory.png +0 -0
  71. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-tps.png +0 -0
  72. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/logo-banner.png +0 -0
  73. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/patch.gif +0 -0
  74. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/post-training.png +0 -0
  75. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/index.md +0 -0
  76. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/license.md +0 -0
  77. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/accelerate_config.yaml +0 -0
  78. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/run_orpo.py +0 -0
  79. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/README.md +0 -0
  80. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/callback.py +0 -0
  81. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/config/fsdp_config.json +0 -0
  82. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_mem.png +0 -0
  83. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_tp.png +0 -0
  84. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_mem_alloc.png +0 -0
  85. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_tps.png +0 -0
  86. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
  87. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_tps.png +0 -0
  88. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/launch_on_modal.py +0 -0
  89. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/requirements.txt +0 -0
  90. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_benchmarks.sh +0 -0
  91. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_gemma.sh +0 -0
  92. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_llama.sh +0 -0
  93. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen.sh +0 -0
  94. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen2_vl.sh +0 -0
  95. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training.py +0 -0
  96. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training_multimodal.py +0 -0
  97. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/README.md +0 -0
  98. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/requirements.txt +0 -0
  99. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/training.py +0 -0
  100. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/README.md +0 -0
  101. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/callback.py +0 -0
  102. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
  103. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
  104. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
  105. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
  106. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
  107. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
  108. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
  109. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
  110. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
  111. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/medusa_util.py +0 -0
  112. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/requirements.txt +0 -0
  113. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
  114. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/train.py +0 -0
  115. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-Apache-2.0 +0 -0
  116. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-AutoAWQ +0 -0
  117. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
  118. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-llmc +0 -0
  119. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-triton +0 -0
  120. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/mkdocs.yml +0 -0
  121. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.cfg +0 -0
  122. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/__init__.py +0 -0
  123. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/README.md +0 -0
  124. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/__init__.py +0 -0
  125. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
  126. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
  127. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/functional.py +0 -0
  128. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
  129. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
  130. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
  131. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
  132. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
  133. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
  134. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
  135. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
  136. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
  137. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/env_report.py +0 -0
  138. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/__init__.py +0 -0
  139. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/cross_entropy.py +0 -0
  140. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/dyt.py +0 -0
  141. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/embedding.py +0 -0
  142. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
  143. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
  144. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
  145. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
  146. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/geglu.py +0 -0
  147. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/group_norm.py +0 -0
  148. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/grpo_loss.py +0 -0
  149. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/jsd.py +0 -0
  150. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/kl_div.py +0 -0
  151. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/layer_norm.py +0 -0
  152. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/multi_token_attention.py +0 -0
  153. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
  154. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rms_norm.py +0 -0
  155. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rope.py +0 -0
  156. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/softmax.py +0 -0
  157. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/sparsemax.py +0 -0
  158. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/swiglu.py +0 -0
  159. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/tvd.py +0 -0
  160. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/utils.py +0 -0
  161. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/__init__.py +0 -0
  162. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/auto_model.py +0 -0
  163. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/cross_entropy.py +0 -0
  164. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/dyt.py +0 -0
  165. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
  166. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fsdp.py +0 -0
  167. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/functional.py +0 -0
  168. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
  169. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
  170. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
  171. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/geglu.py +0 -0
  172. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/group_norm.py +0 -0
  173. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/grpo_loss.py +0 -0
  174. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/jsd.py +0 -0
  175. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/kl_div.py +0 -0
  176. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/layer_norm.py +0 -0
  177. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/__init__.py +0 -0
  178. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma.py +0 -0
  179. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma2.py +0 -0
  180. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma3.py +0 -0
  181. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/glm4.py +0 -0
  182. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llama.py +0 -0
  183. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llava.py +0 -0
  184. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
  185. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mistral.py +0 -0
  186. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mixtral.py +0 -0
  187. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mllama.py +0 -0
  188. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/olmo2.py +0 -0
  189. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/paligemma.py +0 -0
  190. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/phi3.py +0 -0
  191. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2.py +0 -0
  192. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
  193. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
  194. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3.py +0 -0
  195. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
  196. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/monkey_patch.py +0 -0
  197. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
  198. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
  199. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rms_norm.py +0 -0
  200. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rope.py +0 -0
  201. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/softmax.py +0 -0
  202. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/sparsemax.py +0 -0
  203. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/swiglu.py +0 -0
  204. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
  205. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
  206. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer_integration.py +0 -0
  207. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/tvd.py +0 -0
  208. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/__init__.py +0 -0
  209. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/monkey_patch.py +0 -0
  210. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/utils.py +0 -0
  211. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
  212. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
  213. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
  214. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/__init__.py +0 -0
  215. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/__init__.py +0 -0
  216. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_cpo_loss.py +0 -0
  217. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_dpo_loss.py +0 -0
  218. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_grpo_loss.py +0 -0
  219. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_jsd_loss.py +0 -0
  220. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_kto_loss.py +0 -0
  221. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_orpo_loss.py +0 -0
  222. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_simpo_loss.py +0 -0
  223. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/conftest.py +0 -0
  224. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/__init__.py +0 -0
  225. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/__init__.py +0 -0
  226. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models.py +0 -0
  227. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
  228. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/__init__.py +0 -0
  229. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models.py +0 -0
  230. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
  231. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
  232. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
  233. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
  234. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
  235. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
  236. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
  237. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
  238. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
  239. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
  240. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare.txt +0 -0
  241. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
  242. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
  243. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
  244. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_auto_model.py +0 -0
  245. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_cross_entropy.py +0 -0
  246. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_dyt.py +0 -0
  247. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_embedding.py +0 -0
  248. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_flex_attention.py +0 -0
  249. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
  250. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_jsd.py +0 -0
  251. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_neighborhood_attention.py +0 -0
  252. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_geglu.py +0 -0
  253. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_group_norm.py +0 -0
  254. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_grpo_loss.py +0 -0
  255. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_jsd.py +0 -0
  256. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_kl_div.py +0 -0
  257. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_layer_norm.py +0 -0
  258. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_mm_int8int2.py +0 -0
  259. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_monkey_patch.py +0 -0
  260. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_multi_token_attention.py +0 -0
  261. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_qwen2vl_mrope.py +0 -0
  262. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rms_norm.py +0 -0
  263. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rope.py +0 -0
  264. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_softmax.py +0 -0
  265. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_sparsemax.py +0 -0
  266. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_swiglu.py +0 -0
  267. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_trainer_integration.py +0 -0
  268. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_transformers.py +0 -0
  269. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_tvd.py +0 -0
  270. {liger_kernel_nightly-0.5.10.dev20250611191801 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/triton/test_triton_monkey_patch.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.10.dev20250611191801
3
+ Version: 0.5.10.dev20250613192702
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
45
45
  Requires-Dist: seaborn; extra == "dev"
46
46
  Requires-Dist: mkdocs; extra == "dev"
47
47
  Requires-Dist: mkdocs-material; extra == "dev"
48
+ Requires-Dist: torchvision>=0.20; extra == "dev"
48
49
 
49
50
  <a name="readme-top"></a>
50
51
 
@@ -147,7 +147,7 @@ if __name__ == "__main__":
147
147
 
148
148
  run_benchmarks(
149
149
  bench_test_fn=bench_speed_fused_linear_cpo_loss,
150
- kernel_operation_modes=["forward", "full"],
150
+ kernel_operation_modes=["forward", "backward", "full"],
151
151
  metric_name="speed",
152
152
  metric_unit="ms",
153
153
  **common_configs,
@@ -109,7 +109,7 @@ if __name__ == "__main__":
109
109
 
110
110
  run_benchmarks(
111
111
  bench_test_fn=bench_speed_cross_entropy,
112
- kernel_operation_modes=["forward", "full"],
112
+ kernel_operation_modes=["forward", "backward", "full"],
113
113
  metric_name="speed",
114
114
  metric_unit="ms",
115
115
  **common_configs,
@@ -248,7 +248,7 @@ if __name__ == "__main__":
248
248
 
249
249
  run_benchmarks(
250
250
  bench_test_fn=bench_speed_jsd_loss,
251
- kernel_operation_modes=["forward", "full"],
251
+ kernel_operation_modes=["forward", "backward", "full"],
252
252
  metric_name="speed",
253
253
  metric_unit="ms",
254
254
  **common_configs,
@@ -166,7 +166,7 @@ if __name__ == "__main__":
166
166
 
167
167
  run_benchmarks(
168
168
  bench_test_fn=bench_speed_dpo_loss,
169
- kernel_operation_modes=["forward", "full"],
169
+ kernel_operation_modes=["forward", "backward", "full"],
170
170
  metric_name="speed",
171
171
  metric_unit="ms",
172
172
  **common_configs,
@@ -112,7 +112,7 @@ if __name__ == "__main__":
112
112
 
113
113
  run_benchmarks(
114
114
  bench_test_fn=bench_speed_embedding,
115
- kernel_operation_modes=["forward", "full"],
115
+ kernel_operation_modes=["forward", "backward", "full"],
116
116
  metric_name="speed",
117
117
  metric_unit="ms",
118
118
  **common_configs,
@@ -156,7 +156,7 @@ if __name__ == "__main__":
156
156
 
157
157
  run_benchmarks(
158
158
  bench_test_fn=bench_speed_fused_linear_cross_entropy,
159
- kernel_operation_modes=["forward", "full"],
159
+ kernel_operation_modes=["forward", "backward", "full"],
160
160
  metric_name="speed",
161
161
  metric_unit="ms",
162
162
  **common_configs,
@@ -246,7 +246,7 @@ if __name__ == "__main__":
246
246
 
247
247
  run_benchmarks(
248
248
  bench_test_fn=bench_speed_fused_linear_jsd,
249
- kernel_operation_modes=["forward", "full"],
249
+ kernel_operation_modes=["forward", "backward", "full"],
250
250
  metric_name="speed",
251
251
  metric_unit="ms",
252
252
  **common_configs,
@@ -143,7 +143,7 @@ if __name__ == "__main__":
143
143
 
144
144
  run_benchmarks(
145
145
  bench_test_fn=bench_speed_jsd,
146
- kernel_operation_modes=["forward", "full"],
146
+ kernel_operation_modes=["forward", "backward", "full"],
147
147
  metric_name="speed",
148
148
  metric_unit="ms",
149
149
  **common_args,
@@ -110,7 +110,7 @@ if __name__ == "__main__":
110
110
 
111
111
  run_benchmarks(
112
112
  bench_test_fn=bench_speed_kldiv,
113
- kernel_operation_modes=["forward", "full"],
113
+ kernel_operation_modes=["forward", "backward", "full"],
114
114
  metric_name="speed",
115
115
  metric_unit="ms",
116
116
  **common_args,
@@ -299,7 +299,7 @@ if __name__ == "__main__":
299
299
 
300
300
  run_benchmarks(
301
301
  bench_test_fn=bench_speed_kto_loss,
302
- kernel_operation_modes=["forward", "full"],
302
+ kernel_operation_modes=["forward", "backward", "full"],
303
303
  metric_name="speed",
304
304
  metric_unit="ms",
305
305
  **common_configs,
@@ -111,7 +111,7 @@ if __name__ == "__main__":
111
111
 
112
112
  run_benchmarks(
113
113
  bench_test_fn=bench_speed_layer_norm,
114
- kernel_operation_modes=["forward", "full"],
114
+ kernel_operation_modes=["forward", "backward", "full"],
115
115
  metric_name="speed",
116
116
  metric_unit="ms",
117
117
  **common_configs,
@@ -149,7 +149,7 @@ if __name__ == "__main__":
149
149
 
150
150
  run_benchmarks(
151
151
  bench_test_fn=bench_speed_fused_linear_orpo_loss,
152
- kernel_operation_modes=["forward", "full"],
152
+ kernel_operation_modes=["forward", "full", "backward"],
153
153
  metric_name="speed",
154
154
  metric_unit="ms",
155
155
  **common_configs,
@@ -147,7 +147,7 @@ if __name__ == "__main__":
147
147
 
148
148
  run_benchmarks(
149
149
  bench_test_fn=bench_speed_fused_linear_simpo_loss,
150
- kernel_operation_modes=["forward", "full"],
150
+ kernel_operation_modes=["forward", "full", "backward"],
151
151
  metric_name="speed",
152
152
  metric_unit="ms",
153
153
  **common_configs,
@@ -124,7 +124,7 @@ if __name__ == "__main__":
124
124
 
125
125
  run_benchmarks(
126
126
  bench_test_fn=bench_speed_softmax,
127
- kernel_operation_modes=["forward", "full"],
127
+ kernel_operation_modes=["forward", "full", "backward"],
128
128
  metric_name="speed",
129
129
  metric_unit="ms",
130
130
  overwrite=args.overwrite,
@@ -161,7 +161,7 @@ if __name__ == "__main__":
161
161
 
162
162
  run_benchmarks(
163
163
  bench_test_fn=bench_speed_swiglu,
164
- kernel_operation_modes=["forward"],
164
+ kernel_operation_modes=["forward", "full", "backward"],
165
165
  metric_name="speed",
166
166
  metric_unit="ms",
167
167
  **common_configs,
@@ -126,7 +126,7 @@ if __name__ == "__main__":
126
126
 
127
127
  run_benchmarks(
128
128
  bench_test_fn=bench_speed_tvd,
129
- kernel_operation_modes=["forward", "full"],
129
+ kernel_operation_modes=["forward", "full", "backward"],
130
130
  metric_name="speed",
131
131
  metric_unit="ms",
132
132
  **common_args,
@@ -235,7 +235,7 @@ def update_benchmark_data_csv(
235
235
  pass
236
236
  else:
237
237
  existing_data_dict[row_key] = row_dict
238
-
238
+ os.makedirs(os.path.dirname(filename_abs_path), exist_ok=True)
239
239
  with open(filename_abs_path, mode="w", newline="") as file:
240
240
  writer = csv.DictWriter(file, fieldnames=fieldnames)
241
241
  writer.writeheader()
@@ -0,0 +1,73 @@
1
+ from pathlib import Path
2
+
3
+ import modal
4
+
5
+ ROOT_PATH = Path(__file__).parent.parent.parent
6
+ REMOTE_ROOT_PATH = "/root/liger-kernel"
7
+ PYTHON_VERSION = "3.12"
8
+
9
+ image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
10
+
11
+ app = modal.App("liger_benchmarks", image=image)
12
+
13
+ # mount: add local files to the remote container
14
+ repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
15
+
16
+
17
+ @app.function(gpu="H100", image=repo, timeout=60 * 45)
18
+ def liger_benchmarks():
19
+ import subprocess
20
+ import os
21
+
22
+ subprocess.run(
23
+ ["uv pip install -e '.[dev]' --system"],
24
+ check=True,
25
+ shell=True,
26
+ cwd=REMOTE_ROOT_PATH,
27
+ )
28
+ subprocess.run(["make run-benchmarks"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
29
+
30
+ file_path = Path(REMOTE_ROOT_PATH) / "benchmark" / "data" / "all_benchmark_data.csv"
31
+ print(f"Checking if file exists at: {file_path}")
32
+ print(f"File exists: {os.path.exists(file_path)}")
33
+
34
+ if not os.path.exists(file_path):
35
+ print("Listing directory contents:")
36
+ data_dir = file_path.parent
37
+ if os.path.exists(data_dir):
38
+ print(f"Contents of {data_dir}:")
39
+ print(os.listdir(data_dir))
40
+ else:
41
+ print(f"Data directory {data_dir} does not exist")
42
+ raise FileNotFoundError(f"Benchmark data file not found at {file_path}")
43
+
44
+ with open(file_path, "rb") as f:
45
+ data = f.read()
46
+ print(f"Successfully read {len(data)} bytes of data")
47
+ return data
48
+
49
+
50
+ @app.local_entrypoint()
51
+ def main():
52
+ try:
53
+ # Run the benchmarks and get the data
54
+ print("Starting benchmark run...")
55
+ benchmark_data = liger_benchmarks.remote()
56
+
57
+ if not benchmark_data:
58
+ raise ValueError("No data received from remote function")
59
+
60
+ # Save the data locally
61
+ local_data_path = ROOT_PATH / "benchmark" / "data" / "all_benchmark_data.csv"
62
+ print(f"Attempting to save data to: {local_data_path}")
63
+
64
+ local_data_path.parent.mkdir(parents=True, exist_ok=True)
65
+
66
+ with open(local_data_path, "wb") as f:
67
+ f.write(benchmark_data)
68
+
69
+ print(f"Successfully saved {len(benchmark_data)} bytes to: {local_data_path}")
70
+
71
+ except Exception as e:
72
+ print(f"Error occurred: {str(e)}")
73
+ raise
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "liger_kernel_nightly"
7
- version = "0.5.10.dev20250611191801"
7
+ version = "0.5.10.dev20250613192702"
8
8
  description = "Efficient Triton kernels for LLM Training"
9
9
  urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
10
10
  readme = { file = "README.md", content-type = "text/markdown" }
@@ -43,6 +43,7 @@ def get_optional_dependencies():
43
43
  "seaborn",
44
44
  "mkdocs",
45
45
  "mkdocs-material",
46
+ "torchvision>=0.20",
46
47
  ]
47
48
  }
48
49
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.10.dev20250611191801
3
+ Version: 0.5.10.dev20250613192702
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -45,6 +45,7 @@ Requires-Dist: datasets>=2.19.2; extra == "dev"
45
45
  Requires-Dist: seaborn; extra == "dev"
46
46
  Requires-Dist: mkdocs; extra == "dev"
47
47
  Requires-Dist: mkdocs-material; extra == "dev"
48
+ Requires-Dist: torchvision>=0.20; extra == "dev"
48
49
 
49
50
  <a name="readme-top"></a>
50
51
 
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
20
20
  from test.utils import UNTOKENIZED_DATASET_PATH
21
21
  from test.utils import MiniModelConfig
22
22
  from test.utils import assert_verbose_allclose
23
+ from test.utils import is_torchvision_available
23
24
  from test.utils import load_image_processing_config
24
25
  from test.utils import load_processor_config
25
26
  from test.utils import load_tokenizer_config
@@ -788,6 +789,7 @@ def run_mini_model_multimodal(
788
789
  not QWEN2_VL_AVAILABLE,
789
790
  reason="Qwen2-VL not available in this version of transformers",
790
791
  ),
792
+ pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
791
793
  ],
792
794
  ),
793
795
  pytest.param(
@@ -826,6 +828,7 @@ def run_mini_model_multimodal(
826
828
  not QWEN2_5_VL_AVAILABLE,
827
829
  reason="Qwen2.5-VL not available in this version of transformers",
828
830
  ),
831
+ pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
829
832
  ],
830
833
  ),
831
834
  pytest.param(
@@ -20,6 +20,7 @@ from test.utils import FAKE_CONFIGS_PATH
20
20
  from test.utils import UNTOKENIZED_DATASET_PATH
21
21
  from test.utils import MiniModelConfig
22
22
  from test.utils import assert_verbose_allclose
23
+ from test.utils import is_torchvision_available
23
24
  from test.utils import load_image_processing_config
24
25
  from test.utils import load_processor_config
25
26
  from test.utils import load_tokenizer_config
@@ -783,6 +784,7 @@ def run_mini_model_multimodal(
783
784
  not QWEN2_VL_AVAILABLE,
784
785
  reason="Qwen2-VL not available in this version of transformers",
785
786
  ),
787
+ pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
786
788
  ],
787
789
  ),
788
790
  pytest.param(
@@ -817,6 +819,7 @@ def run_mini_model_multimodal(
817
819
  not QWEN2_5_VL_AVAILABLE,
818
820
  reason="Qwen2.5-VL not available in this version of transformers",
819
821
  ),
822
+ pytest.mark.skipif(not is_torchvision_available(), reason="Qwen2VLVideoProcessor requires torchvision"),
820
823
  ],
821
824
  ),
822
825
  pytest.param(
@@ -228,6 +228,13 @@ def supports_bfloat16():
228
228
  return False
229
229
 
230
230
 
231
+ def is_torchvision_available():
232
+ if importlib.util.find_spec("torchvision") is not None:
233
+ return True
234
+ else:
235
+ return False
236
+
237
+
231
238
  def revert_liger_kernel_to_granite(model_config: MiniModelConfig):
232
239
  """
233
240
  Revert all Liger kernel patches applied to Granite.
@@ -1,28 +0,0 @@
1
- from pathlib import Path
2
-
3
- import modal
4
-
5
- ROOT_PATH = Path(__file__).parent.parent.parent
6
- REMOTE_ROOT_PATH = "/root/liger-kernel"
7
- PYTHON_VERSION = "3.12"
8
-
9
- image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
10
-
11
- app = modal.App("liger_benchmarks", image=image)
12
-
13
- # mount: add local files to the remote container
14
- repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
15
-
16
-
17
- @app.function(gpu="H100", image=repo, timeout=60 * 45)
18
- def liger_benchmarks():
19
- import subprocess
20
-
21
- subprocess.run(
22
- ["uv pip install -e '.[dev]' --system"],
23
- check=True,
24
- shell=True,
25
- cwd=REMOTE_ROOT_PATH,
26
- )
27
- subprocess.run(["python benchmark/scripts/benchmark_kto_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
28
- subprocess.run(["python benchmark/scripts/benchmark_cpo_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
@@ -29,6 +29,7 @@ jobs:
29
29
  OUTPUT_FILENAME: benchmark.csv
30
30
  GENERATED_CSV: benchmark/data/all_benchmark_data.csv
31
31
 
32
+
32
33
  steps:
33
34
  - name: Checkout code
34
35
  uses: actions/checkout@v3
@@ -71,7 +72,6 @@ jobs:
71
72
  run: |
72
73
  mkdir -p gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}
73
74
  cp ${GENERATED_CSV} gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}/${OUTPUT_FILENAME}
74
-
75
75
  # Step 7: Append commit hash to commits.txt if not already present
76
76
  - name: Update commits.txt
77
77
  run: |
@@ -84,7 +84,6 @@ jobs:
84
84
  if ! grep -q "${{ steps.get_hash.outputs.hash }}" ${OUTPUT_DIR}/commits.txt; then
85
85
  echo "${{ steps.get_hash.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
86
86
  fi
87
-
88
87
  # Step 8: Commit and push
89
88
  - name: Commit and push to gh-pages
90
89
  run: |
@@ -94,3 +93,4 @@ jobs:
94
93
  git add .
95
94
  git commit -m "Add benchmark for commit ${{ steps.get_hash.outputs.hash }}" || echo "No changes to commit"
96
95
  git push origin gh-pages
96
+