liger-kernel-nightly 0.5.10.dev20250611215839__tar.gz → 0.5.10.dev20250613192702__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (270)
  1. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/PKG-INFO +1 -1
  2. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cpo_loss.py +1 -1
  3. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_cross_entropy.py +1 -1
  4. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_distill_jsd_loss.py +1 -1
  5. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dpo_loss.py +1 -1
  6. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_embedding.py +1 -1
  7. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +1 -1
  8. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_linear_jsd.py +1 -1
  9. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_jsd.py +1 -1
  10. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kl_div.py +1 -1
  11. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_kto_loss.py +1 -1
  12. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_layer_norm.py +1 -1
  13. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_orpo_loss.py +1 -1
  14. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_simpo_loss.py +1 -1
  15. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_softmax.py +1 -1
  16. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_swiglu.py +1 -1
  17. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_tvd.py +1 -1
  18. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/utils.py +1 -1
  19. liger_kernel_nightly-0.5.10.dev20250613192702/dev/modal/benchmarks.py +73 -0
  20. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/pyproject.toml +1 -1
  21. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
  22. liger_kernel_nightly-0.5.10.dev20250611215839/dev/modal/benchmarks.py +0 -28
  23. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
  24. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
  25. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/pull_request_template.md +0 -0
  26. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/amd-ci.yml +0 -0
  27. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/benchmark.yml +2 -2
  28. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/docs.yml +0 -0
  29. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/intel-ci.yml +0 -0
  30. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/nvi-ci.yml +0 -0
  31. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-nightly.yml +0 -0
  32. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.github/workflows/publish-release.yml +0 -0
  33. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.gitignore +0 -0
  34. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/.idea/workspace.xml +0 -0
  35. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/LICENSE +0 -0
  36. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/Makefile +0 -0
  37. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/NOTICE +0 -0
  38. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/README.md +0 -0
  39. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/README.md +0 -0
  40. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/__init__.py +0 -0
  41. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/benchmarks_visualizer.py +0 -0
  42. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/data/all_benchmark_data.csv +0 -0
  43. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/__init__.py +0 -0
  44. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_dyt.py +0 -0
  45. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_fused_neighborhood_attention.py +0 -0
  46. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_geglu.py +0 -0
  47. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_group_norm.py +0 -0
  48. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_multi_token_attention.py +0 -0
  49. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
  50. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rms_norm.py +0 -0
  51. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_rope.py +0 -0
  52. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparse_multi_token_attention.py +0 -0
  53. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/benchmark/scripts/benchmark_sparsemax.py +0 -0
  54. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/fmt-requirements.txt +0 -0
  55. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests.py +0 -0
  56. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/dev/modal/tests_bwd.py +0 -0
  57. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Examples.md +0 -0
  58. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Getting-Started.md +0 -0
  59. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/High-Level-APIs.md +0 -0
  60. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/Low-Level-APIs.md +0 -0
  61. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/acknowledgement.md +0 -0
  62. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/contributing.md +0 -0
  63. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/banner.GIF +0 -0
  64. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/compose.gif +0 -0
  65. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-memory.png +0 -0
  66. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/e2e-tps.png +0 -0
  67. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/logo-banner.png +0 -0
  68. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/patch.gif +0 -0
  69. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/images/post-training.png +0 -0
  70. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/index.md +0 -0
  71. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/docs/license.md +0 -0
  72. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/accelerate_config.yaml +0 -0
  73. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/alignment/run_orpo.py +0 -0
  74. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/README.md +0 -0
  75. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/callback.py +0 -0
  76. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/config/fsdp_config.json +0 -0
  77. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_mem.png +0 -0
  78. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/gemma_7b_tp.png +0 -0
  79. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_mem_alloc.png +0 -0
  80. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/llama_tps.png +0 -0
  81. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
  82. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/img/qwen_tps.png +0 -0
  83. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/launch_on_modal.py +0 -0
  84. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/requirements.txt +0 -0
  85. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_benchmarks.sh +0 -0
  86. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_gemma.sh +0 -0
  87. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_llama.sh +0 -0
  88. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen.sh +0 -0
  89. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/run_qwen2_vl.sh +0 -0
  90. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training.py +0 -0
  91. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/huggingface/training_multimodal.py +0 -0
  92. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/README.md +0 -0
  93. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/requirements.txt +0 -0
  94. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/lightning/training.py +0 -0
  95. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/README.md +0 -0
  96. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/callback.py +0 -0
  97. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
  98. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
  99. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
  100. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
  101. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
  102. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
  103. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
  104. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
  105. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
  106. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/medusa_util.py +0 -0
  107. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/requirements.txt +0 -0
  108. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
  109. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/examples/medusa/train.py +0 -0
  110. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-Apache-2.0 +0 -0
  111. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-AutoAWQ +0 -0
  112. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
  113. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-llmc +0 -0
  114. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/licenses/LICENSE-MIT-triton +0 -0
  115. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/mkdocs.yml +0 -0
  116. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.cfg +0 -0
  117. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/setup.py +0 -0
  118. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/__init__.py +0 -0
  119. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/README.md +0 -0
  120. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/__init__.py +0 -0
  121. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
  122. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
  123. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/functional.py +0 -0
  124. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
  125. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
  126. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
  127. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
  128. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
  129. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
  130. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
  131. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
  132. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
  133. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/env_report.py +0 -0
  134. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/__init__.py +0 -0
  135. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/cross_entropy.py +0 -0
  136. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/dyt.py +0 -0
  137. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/embedding.py +0 -0
  138. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
  139. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
  140. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
  141. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/fused_neighborhood_attention.py +0 -0
  142. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/geglu.py +0 -0
  143. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/group_norm.py +0 -0
  144. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/grpo_loss.py +0 -0
  145. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/jsd.py +0 -0
  146. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/kl_div.py +0 -0
  147. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/layer_norm.py +0 -0
  148. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/multi_token_attention.py +0 -0
  149. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
  150. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rms_norm.py +0 -0
  151. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/rope.py +0 -0
  152. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/softmax.py +0 -0
  153. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/sparsemax.py +0 -0
  154. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/swiglu.py +0 -0
  155. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/tvd.py +0 -0
  156. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/ops/utils.py +0 -0
  157. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/__init__.py +0 -0
  158. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/auto_model.py +0 -0
  159. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/cross_entropy.py +0 -0
  160. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/dyt.py +0 -0
  161. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
  162. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fsdp.py +0 -0
  163. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/functional.py +0 -0
  164. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
  165. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
  166. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/fused_neighborhood_attention.py +0 -0
  167. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/geglu.py +0 -0
  168. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/group_norm.py +0 -0
  169. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/grpo_loss.py +0 -0
  170. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/jsd.py +0 -0
  171. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/kl_div.py +0 -0
  172. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/layer_norm.py +0 -0
  173. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/__init__.py +0 -0
  174. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma.py +0 -0
  175. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma2.py +0 -0
  176. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/gemma3.py +0 -0
  177. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/glm4.py +0 -0
  178. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llama.py +0 -0
  179. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/llava.py +0 -0
  180. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
  181. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mistral.py +0 -0
  182. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mixtral.py +0 -0
  183. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/mllama.py +0 -0
  184. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/olmo2.py +0 -0
  185. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/paligemma.py +0 -0
  186. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/phi3.py +0 -0
  187. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2.py +0 -0
  188. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
  189. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
  190. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3.py +0 -0
  191. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/model/qwen3_moe.py +0 -0
  192. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/monkey_patch.py +0 -0
  193. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/multi_token_attention.py +0 -0
  194. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
  195. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rms_norm.py +0 -0
  196. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/rope.py +0 -0
  197. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/softmax.py +0 -0
  198. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/sparsemax.py +0 -0
  199. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/swiglu.py +0 -0
  200. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
  201. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
  202. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/trainer_integration.py +0 -0
  203. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/transformers/tvd.py +0 -0
  204. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/__init__.py +0 -0
  205. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/triton/monkey_patch.py +0 -0
  206. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel/utils.py +0 -0
  207. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
  208. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
  209. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
  210. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
  211. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/__init__.py +0 -0
  212. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/__init__.py +0 -0
  213. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_cpo_loss.py +0 -0
  214. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_dpo_loss.py +0 -0
  215. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_grpo_loss.py +0 -0
  216. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_jsd_loss.py +0 -0
  217. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_kto_loss.py +0 -0
  218. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_orpo_loss.py +0 -0
  219. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/chunked_loss/test_simpo_loss.py +0 -0
  220. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/conftest.py +0 -0
  221. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/__init__.py +0 -0
  222. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/__init__.py +0 -0
  223. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models.py +0 -0
  224. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
  225. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
  226. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/__init__.py +0 -0
  227. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models.py +0 -0
  228. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
  229. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
  230. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
  231. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
  232. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
  233. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
  234. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
  235. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
  236. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
  237. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
  238. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
  239. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare.txt +0 -0
  240. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
  241. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
  242. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
  243. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_auto_model.py +0 -0
  244. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_cross_entropy.py +0 -0
  245. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_dyt.py +0 -0
  246. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_embedding.py +0 -0
  247. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_flex_attention.py +0 -0
  248. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
  249. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_linear_jsd.py +0 -0
  250. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_fused_neighborhood_attention.py +0 -0
  251. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_geglu.py +0 -0
  252. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_group_norm.py +0 -0
  253. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_grpo_loss.py +0 -0
  254. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_jsd.py +0 -0
  255. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_kl_div.py +0 -0
  256. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_layer_norm.py +0 -0
  257. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_mm_int8int2.py +0 -0
  258. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_monkey_patch.py +0 -0
  259. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_multi_token_attention.py +0 -0
  260. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_qwen2vl_mrope.py +0 -0
  261. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rms_norm.py +0 -0
  262. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_rope.py +0 -0
  263. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_softmax.py +0 -0
  264. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_sparsemax.py +0 -0
  265. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_swiglu.py +0 -0
  266. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_trainer_integration.py +0 -0
  267. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_transformers.py +0 -0
  268. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/transformers/test_tvd.py +0 -0
  269. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/triton/test_triton_monkey_patch.py +0 -0
  270. {liger_kernel_nightly-0.5.10.dev20250611215839 → liger_kernel_nightly-0.5.10.dev20250613192702}/test/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.10.dev20250611215839
3
+ Version: 0.5.10.dev20250613192702
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -147,7 +147,7 @@ if __name__ == "__main__":
147
147
 
148
148
  run_benchmarks(
149
149
  bench_test_fn=bench_speed_fused_linear_cpo_loss,
150
- kernel_operation_modes=["forward", "full"],
150
+ kernel_operation_modes=["forward", "backward", "full"],
151
151
  metric_name="speed",
152
152
  metric_unit="ms",
153
153
  **common_configs,
@@ -109,7 +109,7 @@ if __name__ == "__main__":
109
109
 
110
110
  run_benchmarks(
111
111
  bench_test_fn=bench_speed_cross_entropy,
112
- kernel_operation_modes=["forward", "full"],
112
+ kernel_operation_modes=["forward", "backward", "full"],
113
113
  metric_name="speed",
114
114
  metric_unit="ms",
115
115
  **common_configs,
@@ -248,7 +248,7 @@ if __name__ == "__main__":
248
248
 
249
249
  run_benchmarks(
250
250
  bench_test_fn=bench_speed_jsd_loss,
251
- kernel_operation_modes=["forward", "full"],
251
+ kernel_operation_modes=["forward", "backward", "full"],
252
252
  metric_name="speed",
253
253
  metric_unit="ms",
254
254
  **common_configs,
@@ -166,7 +166,7 @@ if __name__ == "__main__":
166
166
 
167
167
  run_benchmarks(
168
168
  bench_test_fn=bench_speed_dpo_loss,
169
- kernel_operation_modes=["forward", "full"],
169
+ kernel_operation_modes=["forward", "backward", "full"],
170
170
  metric_name="speed",
171
171
  metric_unit="ms",
172
172
  **common_configs,
@@ -112,7 +112,7 @@ if __name__ == "__main__":
112
112
 
113
113
  run_benchmarks(
114
114
  bench_test_fn=bench_speed_embedding,
115
- kernel_operation_modes=["forward", "full"],
115
+ kernel_operation_modes=["forward", "backward", "full"],
116
116
  metric_name="speed",
117
117
  metric_unit="ms",
118
118
  **common_configs,
@@ -156,7 +156,7 @@ if __name__ == "__main__":
156
156
 
157
157
  run_benchmarks(
158
158
  bench_test_fn=bench_speed_fused_linear_cross_entropy,
159
- kernel_operation_modes=["forward", "full"],
159
+ kernel_operation_modes=["forward", "backward", "full"],
160
160
  metric_name="speed",
161
161
  metric_unit="ms",
162
162
  **common_configs,
@@ -246,7 +246,7 @@ if __name__ == "__main__":
246
246
 
247
247
  run_benchmarks(
248
248
  bench_test_fn=bench_speed_fused_linear_jsd,
249
- kernel_operation_modes=["forward", "full"],
249
+ kernel_operation_modes=["forward", "backward", "full"],
250
250
  metric_name="speed",
251
251
  metric_unit="ms",
252
252
  **common_configs,
@@ -143,7 +143,7 @@ if __name__ == "__main__":
143
143
 
144
144
  run_benchmarks(
145
145
  bench_test_fn=bench_speed_jsd,
146
- kernel_operation_modes=["forward", "full"],
146
+ kernel_operation_modes=["forward", "backward", "full"],
147
147
  metric_name="speed",
148
148
  metric_unit="ms",
149
149
  **common_args,
@@ -110,7 +110,7 @@ if __name__ == "__main__":
110
110
 
111
111
  run_benchmarks(
112
112
  bench_test_fn=bench_speed_kldiv,
113
- kernel_operation_modes=["forward", "full"],
113
+ kernel_operation_modes=["forward", "backward", "full"],
114
114
  metric_name="speed",
115
115
  metric_unit="ms",
116
116
  **common_args,
@@ -299,7 +299,7 @@ if __name__ == "__main__":
299
299
 
300
300
  run_benchmarks(
301
301
  bench_test_fn=bench_speed_kto_loss,
302
- kernel_operation_modes=["forward", "full"],
302
+ kernel_operation_modes=["forward", "backward", "full"],
303
303
  metric_name="speed",
304
304
  metric_unit="ms",
305
305
  **common_configs,
@@ -111,7 +111,7 @@ if __name__ == "__main__":
111
111
 
112
112
  run_benchmarks(
113
113
  bench_test_fn=bench_speed_layer_norm,
114
- kernel_operation_modes=["forward", "full"],
114
+ kernel_operation_modes=["forward", "backward", "full"],
115
115
  metric_name="speed",
116
116
  metric_unit="ms",
117
117
  **common_configs,
@@ -149,7 +149,7 @@ if __name__ == "__main__":
149
149
 
150
150
  run_benchmarks(
151
151
  bench_test_fn=bench_speed_fused_linear_orpo_loss,
152
- kernel_operation_modes=["forward", "full"],
152
+ kernel_operation_modes=["forward", "full", "backward"],
153
153
  metric_name="speed",
154
154
  metric_unit="ms",
155
155
  **common_configs,
@@ -147,7 +147,7 @@ if __name__ == "__main__":
147
147
 
148
148
  run_benchmarks(
149
149
  bench_test_fn=bench_speed_fused_linear_simpo_loss,
150
- kernel_operation_modes=["forward", "full"],
150
+ kernel_operation_modes=["forward", "full", "backward"],
151
151
  metric_name="speed",
152
152
  metric_unit="ms",
153
153
  **common_configs,
@@ -124,7 +124,7 @@ if __name__ == "__main__":
124
124
 
125
125
  run_benchmarks(
126
126
  bench_test_fn=bench_speed_softmax,
127
- kernel_operation_modes=["forward", "full"],
127
+ kernel_operation_modes=["forward", "full", "backward"],
128
128
  metric_name="speed",
129
129
  metric_unit="ms",
130
130
  overwrite=args.overwrite,
@@ -161,7 +161,7 @@ if __name__ == "__main__":
161
161
 
162
162
  run_benchmarks(
163
163
  bench_test_fn=bench_speed_swiglu,
164
- kernel_operation_modes=["forward"],
164
+ kernel_operation_modes=["forward", "full", "backward"],
165
165
  metric_name="speed",
166
166
  metric_unit="ms",
167
167
  **common_configs,
@@ -126,7 +126,7 @@ if __name__ == "__main__":
126
126
 
127
127
  run_benchmarks(
128
128
  bench_test_fn=bench_speed_tvd,
129
- kernel_operation_modes=["forward", "full"],
129
+ kernel_operation_modes=["forward", "full", "backward"],
130
130
  metric_name="speed",
131
131
  metric_unit="ms",
132
132
  **common_args,
@@ -235,7 +235,7 @@ def update_benchmark_data_csv(
235
235
  pass
236
236
  else:
237
237
  existing_data_dict[row_key] = row_dict
238
-
238
+ os.makedirs(os.path.dirname(filename_abs_path), exist_ok=True)
239
239
  with open(filename_abs_path, mode="w", newline="") as file:
240
240
  writer = csv.DictWriter(file, fieldnames=fieldnames)
241
241
  writer.writeheader()
@@ -0,0 +1,73 @@
1
+ from pathlib import Path
2
+
3
+ import modal
4
+
5
+ ROOT_PATH = Path(__file__).parent.parent.parent
6
+ REMOTE_ROOT_PATH = "/root/liger-kernel"
7
+ PYTHON_VERSION = "3.12"
8
+
9
+ image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
10
+
11
+ app = modal.App("liger_benchmarks", image=image)
12
+
13
+ # mount: add local files to the remote container
14
+ repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
15
+
16
+
17
+ @app.function(gpu="H100", image=repo, timeout=60 * 45)
18
+ def liger_benchmarks():
19
+ import subprocess
20
+ import os
21
+
22
+ subprocess.run(
23
+ ["uv pip install -e '.[dev]' --system"],
24
+ check=True,
25
+ shell=True,
26
+ cwd=REMOTE_ROOT_PATH,
27
+ )
28
+ subprocess.run(["make run-benchmarks"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
29
+
30
+ file_path = Path(REMOTE_ROOT_PATH) / "benchmark" / "data" / "all_benchmark_data.csv"
31
+ print(f"Checking if file exists at: {file_path}")
32
+ print(f"File exists: {os.path.exists(file_path)}")
33
+
34
+ if not os.path.exists(file_path):
35
+ print("Listing directory contents:")
36
+ data_dir = file_path.parent
37
+ if os.path.exists(data_dir):
38
+ print(f"Contents of {data_dir}:")
39
+ print(os.listdir(data_dir))
40
+ else:
41
+ print(f"Data directory {data_dir} does not exist")
42
+ raise FileNotFoundError(f"Benchmark data file not found at {file_path}")
43
+
44
+ with open(file_path, "rb") as f:
45
+ data = f.read()
46
+ print(f"Successfully read {len(data)} bytes of data")
47
+ return data
48
+
49
+
50
+ @app.local_entrypoint()
51
+ def main():
52
+ try:
53
+ # Run the benchmarks and get the data
54
+ print("Starting benchmark run...")
55
+ benchmark_data = liger_benchmarks.remote()
56
+
57
+ if not benchmark_data:
58
+ raise ValueError("No data received from remote function")
59
+
60
+ # Save the data locally
61
+ local_data_path = ROOT_PATH / "benchmark" / "data" / "all_benchmark_data.csv"
62
+ print(f"Attempting to save data to: {local_data_path}")
63
+
64
+ local_data_path.parent.mkdir(parents=True, exist_ok=True)
65
+
66
+ with open(local_data_path, "wb") as f:
67
+ f.write(benchmark_data)
68
+
69
+ print(f"Successfully saved {len(benchmark_data)} bytes to: {local_data_path}")
70
+
71
+ except Exception as e:
72
+ print(f"Error occurred: {str(e)}")
73
+ raise
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "liger_kernel_nightly"
7
- version = "0.5.10.dev20250611215839"
7
+ version = "0.5.10.dev20250613192702"
8
8
  description = "Efficient Triton kernels for LLM Training"
9
9
  urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
10
10
  readme = { file = "README.md", content-type = "text/markdown" }
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.10.dev20250611215839
3
+ Version: 0.5.10.dev20250613192702
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -1,28 +0,0 @@
1
- from pathlib import Path
2
-
3
- import modal
4
-
5
- ROOT_PATH = Path(__file__).parent.parent.parent
6
- REMOTE_ROOT_PATH = "/root/liger-kernel"
7
- PYTHON_VERSION = "3.12"
8
-
9
- image = modal.Image.debian_slim(python_version=PYTHON_VERSION).pip_install("uv")
10
-
11
- app = modal.App("liger_benchmarks", image=image)
12
-
13
- # mount: add local files to the remote container
14
- repo = image.add_local_dir(ROOT_PATH, remote_path=REMOTE_ROOT_PATH)
15
-
16
-
17
- @app.function(gpu="H100", image=repo, timeout=60 * 45)
18
- def liger_benchmarks():
19
- import subprocess
20
-
21
- subprocess.run(
22
- ["uv pip install -e '.[dev]' --system"],
23
- check=True,
24
- shell=True,
25
- cwd=REMOTE_ROOT_PATH,
26
- )
27
- subprocess.run(["python benchmark/scripts/benchmark_kto_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
28
- subprocess.run(["python benchmark/scripts/benchmark_cpo_loss.py"], check=True, shell=True, cwd=REMOTE_ROOT_PATH)
@@ -29,6 +29,7 @@ jobs:
29
29
  OUTPUT_FILENAME: benchmark.csv
30
30
  GENERATED_CSV: benchmark/data/all_benchmark_data.csv
31
31
 
32
+
32
33
  steps:
33
34
  - name: Checkout code
34
35
  uses: actions/checkout@v3
@@ -71,7 +72,6 @@ jobs:
71
72
  run: |
72
73
  mkdir -p gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}
73
74
  cp ${GENERATED_CSV} gh-pages/${OUTPUT_DIR}/${{ steps.get_hash.outputs.hash }}/${OUTPUT_FILENAME}
74
-
75
75
  # Step 7: Append commit hash to commits.txt if not already present
76
76
  - name: Update commits.txt
77
77
  run: |
@@ -84,7 +84,6 @@ jobs:
84
84
  if ! grep -q "${{ steps.get_hash.outputs.hash }}" ${OUTPUT_DIR}/commits.txt; then
85
85
  echo "${{ steps.get_hash.outputs.hash }}" >> ${OUTPUT_DIR}/commits.txt
86
86
  fi
87
-
88
87
  # Step 8: Commit and push
89
88
  - name: Commit and push to gh-pages
90
89
  run: |
@@ -94,3 +93,4 @@ jobs:
94
93
  git add .
95
94
  git commit -m "Add benchmark for commit ${{ steps.get_hash.outputs.hash }}" || echo "No changes to commit"
96
95
  git push origin gh-pages
96
+