liger-kernel-nightly 0.5.6.dev20250408182156__tar.gz → 0.5.6.dev20250408223717__tar.gz

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (244)
  1. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/PKG-INFO +1 -1
  2. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/pyproject.toml +1 -1
  3. liger_kernel_nightly-0.5.6.dev20250408223717/src/liger_kernel/transformers/__init__.py +145 -0
  4. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel_nightly.egg-info/PKG-INFO +1 -1
  5. liger_kernel_nightly-0.5.6.dev20250408182156/src/liger_kernel/transformers/__init__.py +0 -32
  6. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/ISSUE_TEMPLATE/bug_report.yaml +0 -0
  7. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
  8. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/pull_request_template.md +0 -0
  9. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/amd-ci.yml +0 -0
  10. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/docs.yml +0 -0
  11. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/intel-ci.yml +0 -0
  12. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/nvi-ci.yml +0 -0
  13. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/publish-nightly.yml +0 -0
  14. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.github/workflows/publish-release.yml +0 -0
  15. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/.gitignore +0 -0
  16. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/LICENSE +0 -0
  17. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/Makefile +0 -0
  18. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/NOTICE +0 -0
  19. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/README.md +0 -0
  20. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/README.md +0 -0
  21. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/__init__.py +0 -0
  22. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/benchmarks_visualizer.py +0 -0
  23. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/data/all_benchmark_data.csv +0 -0
  24. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/__init__.py +0 -0
  25. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_cpo_loss.py +0 -0
  26. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_cross_entropy.py +0 -0
  27. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_distill_jsd_loss.py +0 -0
  28. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_dpo_loss.py +0 -0
  29. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_dyt.py +0 -0
  30. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_embedding.py +0 -0
  31. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_fused_linear_cross_entropy.py +0 -0
  32. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_fused_linear_jsd.py +0 -0
  33. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_geglu.py +0 -0
  34. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_group_norm.py +0 -0
  35. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_jsd.py +0 -0
  36. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_kl_div.py +0 -0
  37. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_kto_loss.py +0 -0
  38. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_layer_norm.py +0 -0
  39. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_orpo_loss.py +0 -0
  40. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_qwen2vl_mrope.py +0 -0
  41. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_rms_norm.py +0 -0
  42. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_rope.py +0 -0
  43. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_simpo_loss.py +0 -0
  44. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_swiglu.py +0 -0
  45. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/benchmark_tvd.py +0 -0
  46. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/benchmark/scripts/utils.py +0 -0
  47. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/dev/fmt-requirements.txt +0 -0
  48. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/dev/modal/tests.py +0 -0
  49. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/dev/modal/tests_bwd.py +0 -0
  50. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/Examples.md +0 -0
  51. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/Getting-Started.md +0 -0
  52. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/High-Level-APIs.md +0 -0
  53. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/Low-Level-APIs.md +0 -0
  54. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/acknowledgement.md +0 -0
  55. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/contributing.md +0 -0
  56. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/banner.GIF +0 -0
  57. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/compose.gif +0 -0
  58. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/e2e-memory.png +0 -0
  59. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/e2e-tps.png +0 -0
  60. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/logo-banner.png +0 -0
  61. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/patch.gif +0 -0
  62. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/images/post-training.png +0 -0
  63. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/index.md +0 -0
  64. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/docs/license.md +0 -0
  65. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/alignment/accelerate_config.yaml +0 -0
  66. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/alignment/run_orpo.py +0 -0
  67. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/README.md +0 -0
  68. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/callback.py +0 -0
  69. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/config/fsdp_config.json +0 -0
  70. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/gemma_7b_mem.png +0 -0
  71. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/gemma_7b_tp.png +0 -0
  72. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/llama_mem_alloc.png +0 -0
  73. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/llama_tps.png +0 -0
  74. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/qwen_mem_alloc.png +0 -0
  75. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/img/qwen_tps.png +0 -0
  76. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/launch_on_modal.py +0 -0
  77. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/requirements.txt +0 -0
  78. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/run_benchmarks.sh +0 -0
  79. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/run_gemma.sh +0 -0
  80. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/run_llama.sh +0 -0
  81. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/run_qwen.sh +0 -0
  82. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/run_qwen2_vl.sh +0 -0
  83. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/training.py +0 -0
  84. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/huggingface/training_multimodal.py +0 -0
  85. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/lightning/README.md +0 -0
  86. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/lightning/requirements.txt +0 -0
  87. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/lightning/training.py +0 -0
  88. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/README.md +0 -0
  89. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/callback.py +0 -0
  90. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Memory_Stage1_num_head_3.png +0 -0
  91. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Memory_Stage1_num_head_5.png +0 -0
  92. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Memory_Stage2_num_head_3.png +0 -0
  93. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Memory_Stage2_num_head_5.png +0 -0
  94. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Throughput_Stage1_num_head_3.png +0 -0
  95. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Throughput_Stage1_num_head_5.png +0 -0
  96. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Throughput_Stage2_num_head_3.png +0 -0
  97. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/docs/images/Throughput_Stage2_num_head_5.png +0 -0
  98. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/fsdp/acc-fsdp.conf +0 -0
  99. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/medusa_util.py +0 -0
  100. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/requirements.txt +0 -0
  101. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/scripts/llama3_8b_medusa.sh +0 -0
  102. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/examples/medusa/train.py +0 -0
  103. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/licenses/LICENSE-Apache-2.0 +0 -0
  104. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/licenses/LICENSE-MIT-AutoAWQ +0 -0
  105. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/licenses/LICENSE-MIT-Efficient-Cross-Entropy +0 -0
  106. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/licenses/LICENSE-MIT-llmc +0 -0
  107. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/licenses/LICENSE-MIT-triton +0 -0
  108. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/mkdocs.yml +0 -0
  109. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/setup.cfg +0 -0
  110. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/setup.py +0 -0
  111. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/__init__.py +0 -0
  112. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/README.md +0 -0
  113. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/__init__.py +0 -0
  114. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/cpo_loss.py +0 -0
  115. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/dpo_loss.py +0 -0
  116. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/functional.py +0 -0
  117. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/fused_linear_distillation.py +0 -0
  118. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/fused_linear_ppo.py +0 -0
  119. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/fused_linear_preference.py +0 -0
  120. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/fused_linear_unpaired_preference.py +0 -0
  121. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/grpo_loss.py +0 -0
  122. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/jsd_loss.py +0 -0
  123. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/kto_loss.py +0 -0
  124. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/orpo_loss.py +0 -0
  125. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/chunked_loss/simpo_loss.py +0 -0
  126. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/env_report.py +0 -0
  127. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/__init__.py +0 -0
  128. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/cross_entropy.py +0 -0
  129. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/dyt.py +0 -0
  130. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/experimental/embedding.py +0 -0
  131. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/experimental/mm_int8int2.py +0 -0
  132. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/fused_linear_cross_entropy.py +0 -0
  133. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/fused_linear_jsd.py +0 -0
  134. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/geglu.py +0 -0
  135. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/group_norm.py +0 -0
  136. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/jsd.py +0 -0
  137. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/kl_div.py +0 -0
  138. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/layer_norm.py +0 -0
  139. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/qwen2vl_mrope.py +0 -0
  140. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/rms_norm.py +0 -0
  141. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/rope.py +0 -0
  142. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/swiglu.py +0 -0
  143. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/tvd.py +0 -0
  144. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/ops/utils.py +0 -0
  145. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/auto_model.py +0 -0
  146. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/cross_entropy.py +0 -0
  147. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/dyt.py +0 -0
  148. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/experimental/embedding.py +0 -0
  149. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/functional.py +0 -0
  150. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/fused_linear_cross_entropy.py +0 -0
  151. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/fused_linear_jsd.py +0 -0
  152. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/geglu.py +0 -0
  153. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/gema3_rms.py +0 -0
  154. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/group_norm.py +0 -0
  155. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/jsd.py +0 -0
  156. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/kl_div.py +0 -0
  157. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/layer_norm.py +0 -0
  158. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/__init__.py +0 -0
  159. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/gemma.py +0 -0
  160. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/gemma2.py +0 -0
  161. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/gemma3.py +0 -0
  162. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/llama.py +0 -0
  163. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/llava.py +0 -0
  164. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/loss_utils.py +0 -0
  165. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/mistral.py +0 -0
  166. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/mixtral.py +0 -0
  167. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/mllama.py +0 -0
  168. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/olmo2.py +0 -0
  169. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/paligemma.py +0 -0
  170. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/phi3.py +0 -0
  171. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/qwen2.py +0 -0
  172. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/qwen2_5_vl.py +0 -0
  173. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/model/qwen2_vl.py +0 -0
  174. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/monkey_patch.py +0 -0
  175. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/qwen2vl_mrope.py +0 -0
  176. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/rms_norm.py +0 -0
  177. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/rope.py +0 -0
  178. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/swiglu.py +0 -0
  179. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/trainer/__init__.py +0 -0
  180. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/trainer/orpo_trainer.py +0 -0
  181. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/trainer_integration.py +0 -0
  182. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/transformers/tvd.py +0 -0
  183. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/triton/__init__.py +0 -0
  184. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/triton/monkey_patch.py +0 -0
  185. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel/utils.py +0 -0
  186. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel_nightly.egg-info/SOURCES.txt +0 -0
  187. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel_nightly.egg-info/dependency_links.txt +0 -0
  188. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel_nightly.egg-info/requires.txt +0 -0
  189. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/src/liger_kernel_nightly.egg-info/top_level.txt +0 -0
  190. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/__init__.py +0 -0
  191. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/__init__.py +0 -0
  192. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_cpo_loss.py +0 -0
  193. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_dpo_loss.py +0 -0
  194. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_grpo_loss.py +0 -0
  195. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_jsd_loss.py +0 -0
  196. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_kto_loss.py +0 -0
  197. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_orpo_loss.py +0 -0
  198. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/chunked_loss/test_simpo_loss.py +0 -0
  199. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/conftest.py +0 -0
  200. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/__init__.py +0 -0
  201. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/bf16/__init__.py +0 -0
  202. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/bf16/test_mini_models.py +0 -0
  203. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/bf16/test_mini_models_multimodal.py +0 -0
  204. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/bf16/test_mini_models_with_logits.py +0 -0
  205. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/fp32/__init__.py +0 -0
  206. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/fp32/test_mini_models.py +0 -0
  207. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/fp32/test_mini_models_multimodal.py +0 -0
  208. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/convergence/fp32/test_mini_models_with_logits.py +0 -0
  209. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Google/Gemma3/gemma-3-4b-it/tokenizer_config.json +0 -0
  210. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Google/Paligemma/paligemma-3b-pt-224/tokenizer_config.json +0 -0
  211. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/preprocessor_config.json +0 -0
  212. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/processor_config.json +0 -0
  213. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Llava/llava-1.5-7b-hf/tokenizer_config.json +0 -0
  214. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Qwen/Qwen2-VL-7B-Instruct/tokenizer_config.json +0 -0
  215. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/Qwen/Qwen2.5-VL-7B-Instruct/tokenizer_config.json +0 -0
  216. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/fake_configs/meta-llama/Llama-3.2-11B-Vision-Instruct/tokenizer_config.json +0 -0
  217. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/scripts/generate_tokenized_dataset.py +0 -0
  218. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/tiny_shakespeare.txt +0 -0
  219. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/tiny_shakespeare_tokenized/data-00000-of-00001.arrow +0 -0
  220. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/tiny_shakespeare_tokenized/dataset_info.json +0 -0
  221. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/resources/tiny_shakespeare_tokenized/state.json +0 -0
  222. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_auto_model.py +0 -0
  223. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_cross_entropy.py +0 -0
  224. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_dyt.py +0 -0
  225. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_embedding.py +0 -0
  226. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_flex_attention.py +0 -0
  227. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_fused_linear_cross_entropy.py +0 -0
  228. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_fused_linear_jsd.py +0 -0
  229. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_geglu.py +0 -0
  230. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_group_norm.py +0 -0
  231. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_jsd.py +0 -0
  232. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_kl_div.py +0 -0
  233. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_layer_norm.py +0 -0
  234. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_mm_int8int2.py +0 -0
  235. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_monkey_patch.py +0 -0
  236. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_qwen2vl_mrope.py +0 -0
  237. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_rms_norm.py +0 -0
  238. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_rope.py +0 -0
  239. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_swiglu.py +0 -0
  240. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_trainer_integration.py +0 -0
  241. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_transformers.py +0 -0
  242. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/transformers/test_tvd.py +0 -0
  243. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/triton/test_triton_monkey_patch.py +0 -0
  244. {liger_kernel_nightly-0.5.6.dev20250408182156 → liger_kernel_nightly-0.5.6.dev20250408223717}/test/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.6.dev20250408182156
3
+ Version: 0.5.6.dev20250408223717
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "liger_kernel_nightly"
7
- version = "0.5.6.dev20250408182156"
7
+ version = "0.5.6.dev20250408223717"
8
8
  description = "Efficient Triton kernels for LLM Training"
9
9
  urls = { "Homepage" = "https://github.com/linkedin/Liger-Kernel" }
10
10
  readme = { file = "README.md", content-type = "text/markdown" }
@@ -0,0 +1,145 @@
1
+ import importlib
2
+
3
+ from typing import TYPE_CHECKING
4
+
5
+ # Always-safe imports (independent of 'transformers')
6
+ from liger_kernel.transformers.cross_entropy import LigerCrossEntropyLoss # noqa: F401
7
+ from liger_kernel.transformers.dyt import LigerDyT # noqa: F401
8
+ from liger_kernel.transformers.fused_linear_cross_entropy import LigerFusedLinearCrossEntropyLoss # noqa: F401
9
+ from liger_kernel.transformers.fused_linear_jsd import LigerFusedLinearJSD # noqa: F401
10
+ from liger_kernel.transformers.geglu import LigerGEGLUMLP # noqa: F401
11
+ from liger_kernel.transformers.jsd import LigerJSD # noqa: F401
12
+ from liger_kernel.transformers.layer_norm import LigerLayerNorm # noqa: F401
13
+ from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
14
+ from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
15
+ from liger_kernel.transformers.swiglu import LigerBlockSparseTop2MLP # noqa: F401
16
+ from liger_kernel.transformers.swiglu import LigerPhi3SwiGLUMLP # noqa: F401
17
+ from liger_kernel.transformers.swiglu import LigerSwiGLUMLP # noqa: F401
18
+ from liger_kernel.transformers.tvd import LigerTVDLoss # noqa: F401
19
+
20
+ # Static-only imports for IDEs and type checkers
21
+ if TYPE_CHECKING:
22
+ from liger_kernel.transformers.auto_model import AutoLigerKernelForCausalLM # noqa: F401
23
+ from liger_kernel.transformers.monkey_patch import _apply_liger_kernel # noqa: F401
24
+ from liger_kernel.transformers.monkey_patch import _apply_liger_kernel_to_instance # noqa: F401
25
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma # noqa: F401
26
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma2 # noqa: F401
27
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3 # noqa: F401
28
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3_text # noqa: F401
29
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_granite # noqa: F401
30
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llama # noqa: F401
31
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llava # noqa: F401
32
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mistral # noqa: F401
33
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mixtral # noqa: F401
34
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mllama # noqa: F401
35
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_olmo2 # noqa: F401
36
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_paligemma # noqa: F401
37
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_phi3 # noqa: F401
38
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2 # noqa: F401
39
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_5_vl # noqa: F401
40
+ from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_vl # noqa: F401
41
+
42
+
43
+ # Check if 'transformers' is installed
44
+ try:
45
+ import transformers # noqa: F401
46
+
47
+ _TRANSFORMERS_AVAILABLE = True
48
+ except ImportError:
49
+ _TRANSFORMERS_AVAILABLE = False
50
+
51
+
52
+ def is_transformers_available() -> bool:
53
+ """
54
+ Returns True if the 'transformers' package is available.
55
+ Useful for conditional logic in downstream code.
56
+ """
57
+ return _TRANSFORMERS_AVAILABLE
58
+
59
+
60
+ def __getattr__(name: str):
61
+ """
62
+ Handles lazy access to transformer-dependent attributes.
63
+ If 'transformers' is not installed, raises a user-friendly ImportError.
64
+ """
65
+ if not _TRANSFORMERS_AVAILABLE:
66
+ raise ImportError(
67
+ f"The attribute '{name}' requires the 'transformers' library, which is not installed.\n"
68
+ f"Please install it with `pip install transformers` to use this functionality."
69
+ )
70
+
71
+ if name == "AutoLigerKernelForCausalLM":
72
+ module = importlib.import_module("liger_kernel.transformers.auto_model")
73
+ return getattr(module, name)
74
+
75
+ monkey_patch_symbols = {
76
+ "_apply_liger_kernel",
77
+ "_apply_liger_kernel_to_instance",
78
+ "apply_liger_kernel_to_gemma",
79
+ "apply_liger_kernel_to_gemma2",
80
+ "apply_liger_kernel_to_gemma3",
81
+ "apply_liger_kernel_to_gemma3_text",
82
+ "apply_liger_kernel_to_granite",
83
+ "apply_liger_kernel_to_llama",
84
+ "apply_liger_kernel_to_llava",
85
+ "apply_liger_kernel_to_mistral",
86
+ "apply_liger_kernel_to_mixtral",
87
+ "apply_liger_kernel_to_mllama",
88
+ "apply_liger_kernel_to_olmo2",
89
+ "apply_liger_kernel_to_paligemma",
90
+ "apply_liger_kernel_to_phi3",
91
+ "apply_liger_kernel_to_qwen2",
92
+ "apply_liger_kernel_to_qwen2_5_vl",
93
+ "apply_liger_kernel_to_qwen2_vl",
94
+ }
95
+
96
+ if name in monkey_patch_symbols:
97
+ module = importlib.import_module("liger_kernel.transformers.monkey_patch")
98
+ return getattr(module, name)
99
+
100
+ raise AttributeError(f"module {__name__} has no attribute {name}")
101
+
102
+
103
+ # Shared symbols in all environments
104
+ __all__ = [
105
+ "is_transformers_available",
106
+ "LigerCrossEntropyLoss",
107
+ "LigerDyT",
108
+ "LigerFusedLinearCrossEntropyLoss",
109
+ "LigerFusedLinearJSD",
110
+ "LigerGEGLUMLP",
111
+ "LigerJSD",
112
+ "LigerLayerNorm",
113
+ "LigerRMSNorm",
114
+ "liger_rotary_pos_emb",
115
+ "LigerBlockSparseTop2MLP",
116
+ "LigerPhi3SwiGLUMLP",
117
+ "LigerSwiGLUMLP",
118
+ "LigerTVDLoss",
119
+ ]
120
+
121
+ # Add transformer-dependent symbols only if available
122
+ if _TRANSFORMERS_AVAILABLE:
123
+ __all__.extend(
124
+ [
125
+ "AutoLigerKernelForCausalLM",
126
+ "_apply_liger_kernel",
127
+ "_apply_liger_kernel_to_instance",
128
+ "apply_liger_kernel_to_gemma",
129
+ "apply_liger_kernel_to_gemma2",
130
+ "apply_liger_kernel_to_gemma3",
131
+ "apply_liger_kernel_to_gemma3_text",
132
+ "apply_liger_kernel_to_granite",
133
+ "apply_liger_kernel_to_llama",
134
+ "apply_liger_kernel_to_llava",
135
+ "apply_liger_kernel_to_mistral",
136
+ "apply_liger_kernel_to_mixtral",
137
+ "apply_liger_kernel_to_mllama",
138
+ "apply_liger_kernel_to_olmo2",
139
+ "apply_liger_kernel_to_paligemma",
140
+ "apply_liger_kernel_to_phi3",
141
+ "apply_liger_kernel_to_qwen2",
142
+ "apply_liger_kernel_to_qwen2_5_vl",
143
+ "apply_liger_kernel_to_qwen2_vl",
144
+ ]
145
+ )
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.5.6.dev20250408182156
3
+ Version: 0.5.6.dev20250408223717
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -1,32 +0,0 @@
1
- from liger_kernel.transformers.auto_model import AutoLigerKernelForCausalLM # noqa: F401
2
- from liger_kernel.transformers.cross_entropy import LigerCrossEntropyLoss # noqa: F401
3
- from liger_kernel.transformers.dyt import LigerDyT # noqa: F401
4
- from liger_kernel.transformers.fused_linear_cross_entropy import LigerFusedLinearCrossEntropyLoss # noqa: F401
5
- from liger_kernel.transformers.fused_linear_jsd import LigerFusedLinearJSD # noqa: F401
6
- from liger_kernel.transformers.geglu import LigerGEGLUMLP # noqa: F401
7
- from liger_kernel.transformers.jsd import LigerJSD # noqa: F401
8
- from liger_kernel.transformers.layer_norm import LigerLayerNorm # noqa: F401
9
- from liger_kernel.transformers.monkey_patch import _apply_liger_kernel # noqa: F401
10
- from liger_kernel.transformers.monkey_patch import _apply_liger_kernel_to_instance # noqa: F401
11
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma # noqa: F401
12
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma2 # noqa: F401
13
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3 # noqa: F401
14
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_gemma3_text # noqa: F401
15
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_granite # noqa: F401
16
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llama # noqa: F401
17
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_llava # noqa: F401
18
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mistral # noqa: F401
19
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mixtral # noqa: F401
20
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_mllama # noqa: F401
21
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_olmo2 # noqa: F401
22
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_paligemma # noqa: F401
23
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_phi3 # noqa: F401
24
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2 # noqa: F401
25
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_5_vl # noqa: F401
26
- from liger_kernel.transformers.monkey_patch import apply_liger_kernel_to_qwen2_vl # noqa: F401
27
- from liger_kernel.transformers.rms_norm import LigerRMSNorm # noqa: F401
28
- from liger_kernel.transformers.rope import liger_rotary_pos_emb # noqa: F401
29
- from liger_kernel.transformers.swiglu import LigerBlockSparseTop2MLP # noqa: F401
30
- from liger_kernel.transformers.swiglu import LigerPhi3SwiGLUMLP # noqa: F401
31
- from liger_kernel.transformers.swiglu import LigerSwiGLUMLP # noqa: F401
32
- from liger_kernel.transformers.tvd import LigerTVDLoss # noqa: F401