liger-kernel-nightly 0.6.0.dev20250722231330__py3-none-any.whl → 0.6.0.dev20250724002613__py3-none-any.whl

This diff shows the changes between two publicly available versions of a package, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
@@ -78,8 +78,8 @@ def _patch_rms_norm_module(module, offset=0.0, eps=1e-6, casting_mode="llama", i
78
78
  _bind_method_to_module(module.modules_to_save.default, "extra_repr", LigerRMSNorm.extra_repr)
79
79
  _bind_method_to_module(module.original_module, "forward", LigerRMSNorm.forward)
80
80
  _bind_method_to_module(module.original_module, "extra_repr", LigerRMSNorm.extra_repr)
81
- module.modules_to_save.default.__class__.__name__ = LigerRMSNorm.__name__
82
- module.original_module.__class__.__name__ = LigerRMSNorm.__name__
81
+ _bind_method_to_module(module.modules_to_save.default, "_get_name", lambda self: LigerRMSNorm.__name__)
82
+ _bind_method_to_module(module.original_module, "_get_name", lambda self: LigerRMSNorm.__name__)
83
83
  else:
84
84
  module.offset = offset
85
85
  module.casting_mode = casting_mode
@@ -88,7 +88,7 @@ def _patch_rms_norm_module(module, offset=0.0, eps=1e-6, casting_mode="llama", i
88
88
  module.row_mode = row_mode
89
89
  _bind_method_to_module(module, "forward", LigerRMSNorm.forward)
90
90
  _bind_method_to_module(module, "extra_repr", LigerRMSNorm.extra_repr)
91
- module.__class__.__name__ = LigerRMSNorm.__name__
91
+ _bind_method_to_module(module, "_get_name", lambda self: LigerRMSNorm.__name__)
92
92
 
93
93
 
94
94
  def _patch_layer_norm_module(module, eps=1e-6):
@@ -110,28 +110,28 @@ def _patch_layer_norm_module(module, eps=1e-6):
110
110
  module.original_module.hidden_size = getattr(module, "hidden_size", None) or getattr(
111
111
  module, "normalized_shape", None
112
112
  )
113
- _bind_method_to_module(module.modules_to_save.default, "forward", LigerRMSNorm.forward)
114
- _bind_method_to_module(module.modules_to_save.default, "extra_repr", LigerRMSNorm.extra_repr)
115
- _bind_method_to_module(module.original_module, "forward", LigerRMSNorm.forward)
116
- _bind_method_to_module(module.original_module, "extra_repr", LigerRMSNorm.extra_repr)
117
- module.modules_to_save.default.__class__.__name__ = LigerLayerNorm.__name__
118
- module.original_module.__class__.__name__ = LigerLayerNorm.__name__
113
+ _bind_method_to_module(module.modules_to_save.default, "forward", LigerLayerNorm.forward)
114
+ _bind_method_to_module(module.modules_to_save.default, "extra_repr", LigerLayerNorm.extra_repr)
115
+ _bind_method_to_module(module.original_module, "forward", LigerLayerNorm.forward)
116
+ _bind_method_to_module(module.original_module, "extra_repr", LigerLayerNorm.extra_repr)
117
+ _bind_method_to_module(module.modules_to_save.default, "_get_name", lambda self: LigerLayerNorm.__name__)
118
+ _bind_method_to_module(module.original_module, "_get_name", lambda self: LigerLayerNorm.__name__)
119
119
  else:
120
120
  module.variance_epsilon = getattr(module, "variance_epsilon", None) or getattr(module, "eps", None) or eps
121
121
  module.hidden_size = getattr(module, "hidden_size", None) or getattr(module, "normalized_shape", None)
122
122
  _bind_method_to_module(module, "forward", LigerLayerNorm.forward)
123
123
  _bind_method_to_module(module, "extra_repr", LigerLayerNorm.extra_repr)
124
- module.__class__.__name__ = LigerLayerNorm.__name__
124
+ _bind_method_to_module(module, "_get_name", lambda self: LigerLayerNorm.__name__)
125
125
 
126
126
 
127
127
  def _patch_swiglu_module(module, liger_module):
128
128
  _bind_method_to_module(module, "forward", liger_module.forward)
129
- module.__class__.__name__ = liger_module.__name__
129
+ _bind_method_to_module(module, "_get_name", lambda self: liger_module.__name__)
130
130
 
131
131
 
132
132
  def _patch_geglu_module(module):
133
133
  _bind_method_to_module(module, "forward", LigerGEGLUMLP.forward)
134
- module.__class__.__name__ = LigerGEGLUMLP.__name__
134
+ _bind_method_to_module(module, "_get_name", lambda self: LigerGEGLUMLP.__name__)
135
135
 
136
136
 
137
137
  def apply_liger_kernel_to_granite(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.6.0.dev20250722231330
3
+ Version: 0.6.0.dev20250724002613
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -56,7 +56,7 @@ liger_kernel/transformers/grpo_loss.py,sha256=uAkUNKSnUGEOqa82L9w2e6AI1kcmG8K45-
56
56
  liger_kernel/transformers/jsd.py,sha256=DGqRnxIZxsvxo0_tbbxX3b-sDbDjC_yKufyRIHCcScY,2979
57
57
  liger_kernel/transformers/kl_div.py,sha256=WLffFbh1EExD2Eb1F7lN11fo9JJC-0751WJjZAF1Fj8,409
58
58
  liger_kernel/transformers/layer_norm.py,sha256=c9pk3PEasOKYR0rhe5e5nNrnYKVCEW4VC8S6LpCq9EQ,906
59
- liger_kernel/transformers/monkey_patch.py,sha256=VsN839y5QVEC6BD_-hCiShWLerQM2QDLDoKf2rq02I4,88990
59
+ liger_kernel/transformers/monkey_patch.py,sha256=tXKo4EKVp3szpdqPh051oLZFrlg_hCbWRv0RpSX_kfY,89238
60
60
  liger_kernel/transformers/multi_token_attention.py,sha256=l9VDICK0dfmifUDW668hGscP8AHq2rYcM2oGUa3baRQ,1751
61
61
  liger_kernel/transformers/qwen2vl_mrope.py,sha256=5EwSqrMdsL9MYspeBMXBsNJKvH0MOmRrtJXAJlnnlOI,1047
62
62
  liger_kernel/transformers/rms_norm.py,sha256=vkekcvTeWY8vL4H6hg3t0XeY0Ew_3OFMPHuzqlxPPVw,2719
@@ -92,9 +92,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
92
92
  liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
93
93
  liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
94
94
  liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
95
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
96
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/METADATA,sha256=ouFHoAdiJbPlGWQr5aV5OLKv5X-fXXE6xGay6Jum7eI,24502
97
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
98
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
99
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
100
- liger_kernel_nightly-0.6.0.dev20250722231330.dist-info/RECORD,,
95
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
96
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/METADATA,sha256=Qd-pYi9G6xzToXYSXoT-Nt_eT9YLkEVDp2xBGzGiIhk,24502
97
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
98
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
99
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
100
+ liger_kernel_nightly-0.6.0.dev20250724002613.dist-info/RECORD,,