liger-kernel-nightly 0.5.6.dev20250407214804__tar.gz → 0.5.6.dev20250408194537__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (244)
  1. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/PKG-INFO +1 -1
  2. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/pyproject.toml +1 -1
  3. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/layer_norm.py +14 -1
  4. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/rms_norm.py +12 -1
  5. liger_kernel_nightly-0.5.6.dev20250408194537/src/liger_kernel/transformers/__init__.py +120 -0
  6. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
  7. liger_kernel_nightly-0.5.6.dev20250407214804/src/liger_kernel/transformers/__init__.py +0 -32
  8. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
  9. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
  10. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/pull_request_template.md +0 -0
  11. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/amd-ci.yml +0 -0
  12. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/docs.yml +0 -0
  13. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/intel-ci.yml +0 -0
  14. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/nvi-ci.yml +0 -0
  15. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/publish-nightly.yml +0 -0
  16. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.github/workflows/publish-release.yml +0 -0
  17. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/.gitignore +0 -0
  18. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/LICENSE +0 -0
  19. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/Makefile +0 -0
  20. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/NOTICE +0 -0
  21. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/README.md +0 -0
  22. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/README.md +0 -0
  23. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/__init__.py +0 -0
  24. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/benchmarks_visualizer.py +0 -0
  25. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/data/all_benchmark_data.csv +0 -0
  26. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/__init__.py +0 -0
  27. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
  28. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
  29. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
  30. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
  31. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_dyt.py +0 -0
  32. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_embedding.py +0 -0
  33. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
  34. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
  35. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_geglu.py +0 -0
  36. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_group_norm.py +0 -0
  37. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_jsd.py +0 -0
  38. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_kl_div.py +0 -0
  39. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_kto_loss.py +0 -0
  40. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_layer_norm.py +0 -0
  41. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
  42. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
  43. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_rms_norm.py +0 -0
  44. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_rope.py +0 -0
  45. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
  46. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_swiglu.py +0 -0
  47. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/benchmark_tvd.py +0 -0
  48. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/benchmark/scripts/utils.py +0 -0
  49. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/dev/fmt-requirements.txt +0 -0
  50. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/dev/modal/tests.py +0 -0
  51. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/dev/modal/tests_bwd.py +0 -0
  52. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/Examples.md +0 -0
  53. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/Getting-Started.md +0 -0
  54. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/High-Level-APIs.md +0 -0
  55. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/Low-Level-APIs.md +0 -0
  56. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/acknowledgement.md +0 -0
  57. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/contributing.md +0 -0
  58. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/banner.GIF +0 -0
  59. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/compose.gif +0 -0
  60. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/e2e-memory.png +0 -0
  61. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/e2e-tps.png +0 -0
  62. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/logo-banner.png +0 -0
  63. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/patch.gif +0 -0
  64. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/images/post-training.png +0 -0
  65. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/index.md +0 -0
  66. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/docs/license.md +0 -0
  67. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/alignment/accelerate_config.yaml +0 -0
  68. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/alignment/run_orpo.py +0 -0
  69. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/README.md +0 -0
  70. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/callback.py +0 -0
  71. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/config/fsdp_config.json +0 -0
  72. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/gemma_7b_mem.png +0 -0
  73. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/gemma_7b_tp.png +0 -0
  74. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/llama_mem_alloc.png +0 -0
  75. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/llama_tps.png +0 -0
  76. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
  77. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/img/qwen_tps.png +0 -0
  78. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/launch_on_modal.py +0 -0
  79. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/requirements.txt +0 -0
  80. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/run_benchmarks.sh +0 -0
  81. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/run_gemma.sh +0 -0
  82. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/run_llama.sh +0 -0
  83. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/run_qwen.sh +0 -0
  84. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/run_qwen2_vl.sh +0 -0
  85. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/training.py +0 -0
  86. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/huggingface/training_multimodal.py +0 -0
  87. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/lightning/README.md +0 -0
  88. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/lightning/requirements.txt +0 -0
  89. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/lightning/training.py +0 -0
  90. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/README.md +0 -0
  91. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/callback.py +0 -0
  92. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
  93. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
  94. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
  95. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
  96. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
  97. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
  98. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
  99. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
  100. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
  101. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/medusa_util.py +0 -0
  102. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/requirements.txt +0 -0
  103. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
  104. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/examples/medusa/train.py +0 -0
  105. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/licenses/LICENSE-Apache-2.0 +0 -0
  106. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/licenses/LICENSE-MIT-AutoAWQ +0 -0
  107. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
  108. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/licenses/LICENSE-MIT-llmc +0 -0
  109. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/licenses/LICENSE-MIT-triton +0 -0
  110. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/mkdocs.yml +0 -0
  111. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/setup.cfg +0 -0
  112. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/setup.py +0 -0
  113. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/__init__.py +0 -0
  114. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/README.md +0 -0
  115. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/__init__.py +0 -0
  116. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
  117. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
  118. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/functional.py +0 -0
  119. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
  120. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
  121. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
  122. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
  123. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
  124. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
  125. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
  126. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
  127. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
  128. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/env_report.py +0 -0
  129. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/__init__.py +0 -0
  130. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/cross_entropy.py +0 -0
  131. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/dyt.py +0 -0
  132. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/experimental/embedding.py +0 -0
  133. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
  134. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
  135. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
  136. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/geglu.py +0 -0
  137. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/group_norm.py +0 -0
  138. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/jsd.py +0 -0
  139. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/kl_div.py +0 -0
  140. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
  141. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/rope.py +0 -0
  142. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/swiglu.py +0 -0
  143. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/tvd.py +0 -0
  144. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/ops/utils.py +0 -0
  145. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/auto_model.py +0 -0
  146. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/cross_entropy.py +0 -0
  147. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/dyt.py +0 -0
  148. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
  149. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/functional.py +0 -0
  150. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
  151. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
  152. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/geglu.py +0 -0
  153. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/gema3_rms.py +0 -0
  154. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/group_norm.py +0 -0
  155. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/jsd.py +0 -0
  156. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/kl_div.py +0 -0
  157. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/layer_norm.py +0 -0
  158. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/__init__.py +0 -0
  159. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/gemma.py +0 -0
  160. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/gemma2.py +0 -0
  161. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/gemma3.py +0 -0
  162. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/llama.py +0 -0
  163. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/llava.py +0 -0
  164. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
  165. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/mistral.py +0 -0
  166. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/mixtral.py +0 -0
  167. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/mllama.py +0 -0
  168. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/olmo2.py +0 -0
  169. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/paligemma.py +0 -0
  170. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/phi3.py +0 -0
  171. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/qwen2.py +0 -0
  172. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
  173. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
  174. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/monkey_patch.py +0 -0
  175. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
  176. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/rms_norm.py +0 -0
  177. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/rope.py +0 -0
  178. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/swiglu.py +0 -0
  179. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
  180. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
  181. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/trainer_integration.py +0 -0
  182. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/transformers/tvd.py +0 -0
  183. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/triton/__init__.py +0 -0
  184. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/triton/monkey_patch.py +0 -0
  185. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel/utils.py +0 -0
  186. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
  187. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
  188. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
  189. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
  190. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/__init__.py +0 -0
  191. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/__init__.py +0 -0
  192. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_cpo_loss.py +0 -0
  193. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_dpo_loss.py +0 -0
  194. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_grpo_loss.py +0 -0
  195. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_jsd_loss.py +0 -0
  196. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_kto_loss.py +0 -0
  197. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_orpo_loss.py +0 -0
  198. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/chunked_loss/test_simpo_loss.py +0 -0
  199. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/conftest.py +0 -0
  200. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/__init__.py +0 -0
  201. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/bf16/__init__.py +0 -0
  202. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/bf16/test_mini_models.py +0 -0
  203. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
  204. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
  205. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/fp32/__init__.py +0 -0
  206. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/fp32/test_mini_models.py +0 -0
  207. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
  208. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
  209. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
  210. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
  211. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
  212. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
  213. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
  214. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
  215. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
  216. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
  217. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
  218. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/tiny_shakespeare.txt +0 -0
  219. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
  220. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
  221. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
  222. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_auto_model.py +0 -0
  223. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_cross_entropy.py +0 -0
  224. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_dyt.py +0 -0
  225. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_embedding.py +0 -0
  226. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_flex_attention.py +0 -0
  227. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
  228. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_fused_linear_jsd.py +0 -0
  229. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_geglu.py +0 -0
  230. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_group_norm.py +0 -0
  231. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_jsd.py +0 -0
  232. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_kl_div.py +0 -0
  233. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_layer_norm.py +0 -0
  234. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_mm_int8int2.py +0 -0
  235. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_monkey_patch.py +0 -0
  236. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_qwen2vl_mrope.py +0 -0
  237. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_rms_norm.py +0 -0
  238. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_rope.py +0 -0
  239. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_swiglu.py +0 -0
  240. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_trainer_integration.py +0 -0
  241. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_transformers.py +0 -0
  242. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/transformers/test_tvd.py +0 -0
  243. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/triton/test_triton_monkey_patch.py +0 -0
  244. {liger_kernel_nightly-0.5.6.dev20250407214804 → liger_kernel_nightly-0.5.6.dev20250408194537}/test/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.6.dev20250407214804
3
+ Version: 0.5.6.dev20250408194537
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "liger_kernel_nightly"
7
- version = "0.5.6.dev20250407214804"
7
+ version = "0.5.6.dev20250408194537"
8
8
  description = "Efficient Triton kernels for LLM Training"
9
9
  urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
10
10
  readme = { file = "README.md", content-type = "text/markdown" }
@@ -154,6 +154,11 @@ def layer_norm_forward(X, W, B, eps):
154
154
  f"must match weight size (W.shape[0]={W.shape[0]})"
155
155
  )
156
156
 
157
+ # XPU-specific optimization
158
+ kernel_args = {}
159
+ if X.device.type == "xpu":
160
+ kernel_args["grf_mode"] = "large"
161
+
157
162
  _layer_norm_forward_kernel[(n_rows,)](
158
163
  Y,
159
164
  Y.stride(0),
@@ -171,6 +176,7 @@ def layer_norm_forward(X, W, B, eps):
171
176
  eps,
172
177
  BLOCK_SIZE=BLOCK_SIZE,
173
178
  num_warps=num_warps,
179
+ **kernel_args, # XPU-specific optimization
174
180
  )
175
181
  return Y.view(*shape), X, Mean, RSTD, BLOCK_SIZE, num_warps
176
182
 
@@ -185,7 +191,7 @@ def layer_norm_backward(dY, X, W, B, Mean, RSTD):
185
191
  if X.device.type == "cuda":
186
192
  sm_count = torch.cuda.get_device_properties(X.device).multi_processor_count
187
193
  elif X.device.type == "xpu":
188
- sm_count = torch.xpu.get_device_properties(X.device).gpu_subslice_count
194
+ sm_count = torch.xpu.get_device_properties(X.device).gpu_eu_count
189
195
 
190
196
  DX = torch.empty((n_rows, n_cols), dtype=X.dtype, device=X.device)
191
197
  _DW = torch.empty((sm_count, n_cols), dtype=W.dtype, device=W.device)
@@ -208,6 +214,12 @@ def layer_norm_backward(dY, X, W, B, Mean, RSTD):
208
214
  if X.dtype == torch.float16
209
215
  else tl.float32 # fallback to float32 for other types
210
216
  )
217
+
218
+ # XPU-specific optimization
219
+ kernel_args = {}
220
+ if X.device.type == "xpu":
221
+ kernel_args.update({"grf_mode": "large", "num_warps": 32, "num_stages": 4})
222
+
211
223
  _layer_norm_backward_kernel[grid](
212
224
  X,
213
225
  W,
@@ -227,6 +239,7 @@ def layer_norm_backward(dY, X, W, B, Mean, RSTD):
227
239
  rows_per_program,
228
240
  BLOCK_SIZE=BLOCK_SIZE,
229
241
  dtype=triton_dtype,
242
+ **kernel_args, # XPU-specific optimization
230
243
  )
231
244
 
232
245
  DW = _DW.sum(dim=0).to(W.dtype)
@@ -223,6 +223,10 @@ def rms_norm_forward(X, W, eps, offset, casting_mode):
223
223
  # Check constraints.
224
224
  assert X.shape[1] == W.shape[0], "Incompatible hidden size dimension between tensor1.shape[1] and tensor2.shape[0]"
225
225
 
226
+ # XPU-specific optimization
227
+ kernel_args = {}
228
+ if X.device.type == "xpu":
229
+ kernel_args["grf_mode"] = "large"
226
230
  _rms_norm_forward_kernel[(n_rows,)](
227
231
  Y,
228
232
  Y.stride(0),
@@ -238,6 +242,7 @@ def rms_norm_forward(X, W, eps, offset, casting_mode):
238
242
  casting_mode,
239
243
  BLOCK_SIZE=BLOCK_SIZE,
240
244
  num_warps=num_warps,
245
+ **kernel_args, # XPU-specific optimization
241
246
  )
242
247
  return Y.view(*shape), X, RSTD, BLOCK_SIZE, num_warps, casting_mode
243
248
 
@@ -252,7 +257,7 @@ def rms_norm_backward(dY, X, W, RSTD, offset, casting_mode, BLOCK_SIZE, num_warp
252
257
  if X.device.type == "cuda":
253
258
  sm_count = torch.cuda.get_device_properties(X.device).multi_processor_count
254
259
  elif X.device.type == "xpu":
255
- sm_count = torch.xpu.get_device_properties(X.device).gpu_subslice_count
260
+ sm_count = torch.xpu.get_device_properties(X.device).gpu_eu_count
256
261
 
257
262
  # fp32 for numerical stability especially.
258
263
  _dW = torch.empty((sm_count, n_cols), dtype=torch.float32, device=W.device)
@@ -267,6 +272,11 @@ def rms_norm_backward(dY, X, W, RSTD, offset, casting_mode, BLOCK_SIZE, num_warp
267
272
  else:
268
273
  dX = torch.zeros_like(dY)
269
274
 
275
+ # XPU-specific optimization
276
+ kernel_args = {}
277
+ if X.device.type == "xpu":
278
+ kernel_args["grf_mode"] = "large"
279
+
270
280
  _rms_norm_backward_kernel[grid](
271
281
  dY,
272
282
  dY.stride(0),
@@ -288,6 +298,7 @@ def rms_norm_backward(dY, X, W, RSTD, offset, casting_mode, BLOCK_SIZE, num_warp
288
298
  casting_mode,
289
299
  BLOCK_SIZE=BLOCK_SIZE,
290
300
  num_warps=num_warps,
301
+ **kernel_args, # XPU-specific optimization
291
302
  )
292
303
  dX = dX.view(*shape)
293
304
  dW = _dW.sum(dim=0).to(W.dtype)
@@ -0,0 +1,120 @@
1
+ import importlib
2
+
3
+ # Always-safe imports (independent of 'transformers')
4
+ from liger_kernel.transformers.cross_entropy import LigerCrossEntropyLoss # noqa: F401
5
+ from liger_kernel.transformers.dyt import LigerDyT # noqa: F401
6
+ from liger_kernel.transformers.fused_linear_cross_entropy import LigerFusedLinearCrossEntropyLoss # noqa: F401
7
+ from liger_kernel.transformers.fused_linear_jsd import LigerFusedLinearJSD # noqa: F401
8
+ from liger_kernel.transformers.geglu import LigerGEGLUMLP # noqa: F401
9
+ from liger_kernel.transformers.jsd import LigerJSD # noqa: F401
10
+ from liger_kernel.transformers.layer_norm import LigerLayerNorm # noqa: F401
11
+ from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
12
+ from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
13
+ from liger_kernel.transformers.swiglu import LigerBlockSparseTop2MLP # noqa: F401
14
+ from liger_kernel.transformers.swiglu import LigerPhi3SwiGLUMLP # noqa: F401
15
+ from liger_kernel.transformers.swiglu import LigerSwiGLUMLP # noqa: F401
16
+ from liger_kernel.transformers.tvd import LigerTVDLoss # noqa: F401
17
+
18
+ # Check if 'transformers' is installed
19
+ try:
20
+ import transformers # noqa: F401
21
+
22
+ _TRANSFORMERS_AVAILABLE = True
23
+ except ImportError:
24
+ _TRANSFORMERS_AVAILABLE = False
25
+
26
+
27
def is_transformers_available() -> bool:
    """Report whether the optional 'transformers' package could be imported.

    The result is the module-level flag set by the import probe that runs
    when this package is loaded, so downstream code can branch on it
    without attempting the import itself.
    """
    return _TRANSFORMERS_AVAILABLE
33
+
34
+
35
def __getattr__(name: str):
    """
    Lazily resolve the transformers-dependent attributes of this package.

    Python calls this module-level hook only after normal attribute lookup
    on the module has failed. The name is classified first, and the
    availability of 'transformers' is checked only for names this package
    really exports lazily.

    Args:
        name: The attribute being looked up on the module.

    Returns:
        The object called ``name`` from ``auto_model`` (for
        ``AutoLigerKernelForCausalLM``) or from ``monkey_patch`` (for the
        ``apply_liger_kernel_*`` family).

    Raises:
        AttributeError: ``name`` is not one of the lazily exported symbols.
        ImportError: ``name`` is a lazy symbol but 'transformers' is not
            installed.
    """
    monkey_patch_symbols = {
        "_apply_liger_kernel",
        "_apply_liger_kernel_to_instance",
        "apply_liger_kernel_to_gemma",
        "apply_liger_kernel_to_gemma2",
        "apply_liger_kernel_to_gemma3",
        "apply_liger_kernel_to_gemma3_text",
        "apply_liger_kernel_to_granite",
        "apply_liger_kernel_to_llama",
        "apply_liger_kernel_to_llava",
        "apply_liger_kernel_to_mistral",
        "apply_liger_kernel_to_mixtral",
        "apply_liger_kernel_to_mllama",
        "apply_liger_kernel_to_olmo2",
        "apply_liger_kernel_to_paligemma",
        "apply_liger_kernel_to_phi3",
        "apply_liger_kernel_to_qwen2",
        "apply_liger_kernel_to_qwen2_5_vl",
        "apply_liger_kernel_to_qwen2_vl",
    }

    if name == "AutoLigerKernelForCausalLM":
        module_path = "liger_kernel.transformers.auto_model"
    elif name in monkey_patch_symbols:
        module_path = "liger_kernel.transformers.monkey_patch"
    else:
        # Unknown names must raise AttributeError, never ImportError:
        # hasattr() and getattr(obj, name, default) only swallow
        # AttributeError, so anything else would break introspection of this
        # module when 'transformers' is not installed.
        raise AttributeError(f"module {__name__} has no attribute {name}")

    if not _TRANSFORMERS_AVAILABLE:
        raise ImportError(
            f"The attribute '{name}' requires the 'transformers' library, which is not installed.\n"
            f"Please install it with `pip install transformers` to use this functionality."
        )

    # Import on first access so that importing this package stays cheap and
    # does not require 'transformers' up front.
    return getattr(importlib.import_module(module_path), name)
76
+
77
+
78
# Names exported in every environment, with or without 'transformers'.
__all__ = [
    "is_transformers_available",
    "LigerCrossEntropyLoss",
    "LigerDyT",
    "LigerFusedLinearCrossEntropyLoss",
    "LigerFusedLinearJSD",
    "LigerGEGLUMLP",
    "LigerJSD",
    "LigerLayerNorm",
    "LigerRMSNorm",
    "liger_rotary_pos_emb",
    "LigerBlockSparseTop2MLP",
    "LigerPhi3SwiGLUMLP",
    "LigerSwiGLUMLP",
    "LigerTVDLoss",
]

# The lazily resolved, transformers-dependent names are advertised only when
# 'transformers' could be imported.
if _TRANSFORMERS_AVAILABLE:
    __all__ += [
        "AutoLigerKernelForCausalLM",
        "_apply_liger_kernel",
        "_apply_liger_kernel_to_instance",
        "apply_liger_kernel_to_gemma",
        "apply_liger_kernel_to_gemma2",
        "apply_liger_kernel_to_gemma3",
        "apply_liger_kernel_to_gemma3_text",
        "apply_liger_kernel_to_granite",
        "apply_liger_kernel_to_llama",
        "apply_liger_kernel_to_llava",
        "apply_liger_kernel_to_mistral",
        "apply_liger_kernel_to_mixtral",
        "apply_liger_kernel_to_mllama",
        "apply_liger_kernel_to_olmo2",
        "apply_liger_kernel_to_paligemma",
        "apply_liger_kernel_to_phi3",
        "apply_liger_kernel_to_qwen2",
        "apply_liger_kernel_to_qwen2_5_vl",
        "apply_liger_kernel_to_qwen2_vl",
    ]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.6.dev20250407214804
3
+ Version: 0.5.6.dev20250408194537
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -1,32 +0,0 @@
1
- from liger_kernel.transformers.auto_model import AutoLigerKernelForCausalLM # noqa: F401
2
- from liger_kernel.transformers.cross_entropy import LigerCrossEntropyLoss # noqa: F401
3
- from liger_kernel.transformers.dyt import LigerDyT # noqa: F401
4
- from liger_kernel.transformers.fused_linear_cross_entropy import LigerFusedLinearCrossEntropyLoss # noqa: F401
5
- from liger_kernel.transformers.fused_linear_jsd import LigerFusedLinearJSD # noqa: F401
6
- from liger_kernel.transformers.geglu import LigerGEGLUMLP # noqa: F401
7
- from liger_kernel.transformers.jsd import LigerJSD # noqa: F401
8
- from liger_kernel.transformers.layer_norm import LigerLayerNorm # noqa: F401
9
- from liger_kernel.transformers.monkey_patch import _apply_liger_kernel # noqa: F401
10
- from liger_kernel.transformers.monkey_patch import _apply_liger_kernel_to_instance # noqa: F401
11
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma # noqa: F401
12
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma2 # noqa: F401
13
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3 # noqa: F401
14
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3_text # noqa: F401
15
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_granite # noqa: F401
16
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llama # noqa: F401
17
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llava # noqa: F401
18
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mistral # noqa: F401
19
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mixtral # noqa: F401
20
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mllama # noqa: F401
21
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_olmo2 # noqa: F401
22
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_paligemma # noqa: F401
23
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_phi3 # noqa: F401
24
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2 # noqa: F401
25
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_5_vl # noqa: F401
26
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_vl # noqa: F401
27
- from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
28
- from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
29
- from liger_kernel.transformers.swiglu import LigerBlockSparseTop2MLP # noqa: F401
30
- from liger_kernel.transformers.swiglu import LigerPhi3SwiGLUMLP # noqa: F401
31
- from liger_kernel.transformers.swiglu import LigerSwiGLUMLP # noqa: F401
32
- from liger_kernel.transformers.tvd import LigerTVDLoss # noqa: F401