liger-kernel-nightly 0.6.3.dev20251105235313__py3-none-any.whl → 0.6.3.dev20251106220336__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- liger_kernel/transformers/model/glm4v_moe.py +7 -3
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/METADATA +1 -1
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/RECORD +7 -7
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/LICENSE +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/NOTICE +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/WHEEL +0 -0
- {liger_kernel_nightly-0.6.3.dev20251105235313.dist-info → liger_kernel_nightly-0.6.3.dev20251106220336.dist-info}/top_level.txt +0 -0
|
@@ -155,14 +155,18 @@ def lce_forward(
|
|
|
155
155
|
output = output + (token_accuracy,) if token_accuracy is not None else output
|
|
156
156
|
return output
|
|
157
157
|
|
|
158
|
-
#
|
|
159
|
-
|
|
158
|
+
# Build output kwargs and include aux_loss only if present (depends on transformers version)
|
|
159
|
+
output_kwargs = dict(
|
|
160
160
|
loss=loss,
|
|
161
161
|
logits=logits,
|
|
162
162
|
past_key_values=outputs.past_key_values,
|
|
163
163
|
hidden_states=outputs.hidden_states,
|
|
164
164
|
attentions=outputs.attentions,
|
|
165
165
|
rope_deltas=outputs.rope_deltas,
|
|
166
|
-
aux_loss=outputs.aux_loss,
|
|
167
166
|
token_accuracy=token_accuracy,
|
|
168
167
|
)
|
|
168
|
+
if hasattr(outputs, "aux_loss"):
|
|
169
|
+
output_kwargs["aux_loss"] = outputs.aux_loss
|
|
170
|
+
|
|
171
|
+
# Return GLM4V MoE output with accuracy
|
|
172
|
+
return LigerGlm4vMoeCausalLMOutputWithPast(**output_kwargs)
|
|
@@ -79,7 +79,7 @@ liger_kernel/transformers/model/gemma2.py,sha256=qa9Ok42vFojVGNmASTH3Ek566Vu507k
|
|
|
79
79
|
liger_kernel/transformers/model/gemma3.py,sha256=mEV3Kuy-dqfTk_b899Vb-InuD4_DvwH0nm5xgbG-0MM,14911
|
|
80
80
|
liger_kernel/transformers/model/glm4.py,sha256=bSp22iPIjsli4-c_usUOsyh1Bs2gIK8X6ynS0azseUs,5900
|
|
81
81
|
liger_kernel/transformers/model/glm4v.py,sha256=dd-BQpccDCp1SbIxcJ5rG8xcwYQK3KOv1Tgm9TGnZc4,6594
|
|
82
|
-
liger_kernel/transformers/model/glm4v_moe.py,sha256=
|
|
82
|
+
liger_kernel/transformers/model/glm4v_moe.py,sha256=zKhMdOOrRhlrvCSFaeVYfddL1ubpY8edEO91TN81n98,7135
|
|
83
83
|
liger_kernel/transformers/model/internvl.py,sha256=OOutracs9qrPHSU7FVYar08yinvGrHQVPvo39JEws6w,6473
|
|
84
84
|
liger_kernel/transformers/model/llama.py,sha256=kqZeONzwTBzudoChlKMzq1w23BtYGbxWZC1l1V__JTw,13410
|
|
85
85
|
liger_kernel/transformers/model/llama4.py,sha256=PfkynGVI0xxMs3EtyYpCgaALI6stu25OIrTIymE-pvg,4853
|
|
@@ -106,9 +106,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
|
|
|
106
106
|
liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
|
|
107
107
|
liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
|
|
108
108
|
liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
|
|
109
|
-
liger_kernel_nightly-0.6.3.
|
|
110
|
-
liger_kernel_nightly-0.6.3.
|
|
111
|
-
liger_kernel_nightly-0.6.3.
|
|
112
|
-
liger_kernel_nightly-0.6.3.
|
|
113
|
-
liger_kernel_nightly-0.6.3.
|
|
114
|
-
liger_kernel_nightly-0.6.3.
|
|
109
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
|
|
110
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/METADATA,sha256=dy_9atp4YioeU8GBh82zuDxFpz-nYGyfStlvUa4RxwY,24777
|
|
111
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
|
|
112
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
|
113
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
|
|
114
|
+
liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|