liger-kernel-nightly 0.6.0.dev20250708194445__py3-none-any.whl → 0.6.0.dev20250709030408__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- liger_kernel/transformers/monkey_patch.py +4 -2
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/METADATA +1 -1
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/RECORD +7 -7
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/WHEEL +0 -0
- {liger_kernel_nightly-0.6.0.dev20250708194445.dist-info → liger_kernel_nightly-0.6.0.dev20250709030408.dist-info}/top_level.txt +0 -0
@@ -1096,7 +1096,9 @@ def apply_liger_kernel_to_paligemma(
|
|
1096
1096
|
# PaliGemma submodules are ['vision_tower', 'multi_modal_projector', 'language_model']
|
1097
1097
|
|
1098
1098
|
from transformers.models.gemma.modeling_gemma import GemmaForCausalLM
|
1099
|
+
from transformers.models.gemma.modeling_gemma import GemmaModel
|
1099
1100
|
from transformers.models.gemma2.modeling_gemma2 import Gemma2ForCausalLM
|
1101
|
+
from transformers.models.gemma2.modeling_gemma2 import Gemma2Model
|
1100
1102
|
from transformers.models.paligemma import modeling_paligemma
|
1101
1103
|
from transformers.models.paligemma.modeling_paligemma import PaliGemmaForConditionalGeneration
|
1102
1104
|
from transformers.models.siglip import modeling_siglip
|
@@ -1155,7 +1157,7 @@ def apply_liger_kernel_to_paligemma(
|
|
1155
1157
|
|
1156
1158
|
language_model = model.language_model
|
1157
1159
|
|
1158
|
-
if isinstance(language_model, GemmaForCausalLM):
|
1160
|
+
if isinstance(language_model, (GemmaForCausalLM, GemmaModel)):
|
1159
1161
|
apply_liger_kernel_to_gemma(
|
1160
1162
|
rope=rope,
|
1161
1163
|
cross_entropy=False,
|
@@ -1165,7 +1167,7 @@ def apply_liger_kernel_to_paligemma(
|
|
1165
1167
|
model=language_model,
|
1166
1168
|
)
|
1167
1169
|
|
1168
|
-
elif isinstance(language_model, Gemma2ForCausalLM):
|
1170
|
+
elif isinstance(language_model, (Gemma2ForCausalLM, Gemma2Model)):
|
1169
1171
|
apply_liger_kernel_to_gemma2(
|
1170
1172
|
rope=rope,
|
1171
1173
|
cross_entropy=False,
|
@@ -54,7 +54,7 @@ liger_kernel/transformers/grpo_loss.py,sha256=uAkUNKSnUGEOqa82L9w2e6AI1kcmG8K45-
|
|
54
54
|
liger_kernel/transformers/jsd.py,sha256=DGqRnxIZxsvxo0_tbbxX3b-sDbDjC_yKufyRIHCcScY,2979
|
55
55
|
liger_kernel/transformers/kl_div.py,sha256=WLffFbh1EExD2Eb1F7lN11fo9JJC-0751WJjZAF1Fj8,409
|
56
56
|
liger_kernel/transformers/layer_norm.py,sha256=c9pk3PEasOKYR0rhe5e5nNrnYKVCEW4VC8S6LpCq9EQ,906
|
57
|
-
liger_kernel/transformers/monkey_patch.py,sha256=
|
57
|
+
liger_kernel/transformers/monkey_patch.py,sha256=kHe6Lmwh0X-ha1dTSYPa0R2h7uT-ytkixK8rl0rcOYQ,85722
|
58
58
|
liger_kernel/transformers/multi_token_attention.py,sha256=l9VDICK0dfmifUDW668hGscP8AHq2rYcM2oGUa3baRQ,1751
|
59
59
|
liger_kernel/transformers/qwen2vl_mrope.py,sha256=5EwSqrMdsL9MYspeBMXBsNJKvH0MOmRrtJXAJlnnlOI,1047
|
60
60
|
liger_kernel/transformers/rms_norm.py,sha256=vkekcvTeWY8vL4H6hg3t0XeY0Ew_3OFMPHuzqlxPPVw,2719
|
@@ -89,9 +89,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
|
|
89
89
|
liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
|
90
90
|
liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
|
91
91
|
liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
|
92
|
-
liger_kernel_nightly-0.6.0.
|
93
|
-
liger_kernel_nightly-0.6.0.
|
94
|
-
liger_kernel_nightly-0.6.0.
|
95
|
-
liger_kernel_nightly-0.6.0.
|
96
|
-
liger_kernel_nightly-0.6.0.
|
97
|
-
liger_kernel_nightly-0.6.0.
|
92
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
93
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/METADATA,sha256=VG7Cv_i2Fkvxidtu9VfPghP5qMi4zMMH9nhesam8ahE,24535
|
94
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
95
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
96
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
97
|
+
liger_kernel_nightly-0.6.0.dev20250709030408.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|