liger-kernel-nightly 0.6.3.dev20251105235313__py3-none-any.whl → 0.6.3.dev20251106220336__py3-none-any.whl

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -155,14 +155,18 @@ def lce_forward(
155
155
  output = output + (token_accuracy,) if token_accuracy is not None else output
156
156
  return output
157
157
 
158
- # Return GLM4V MoE output with accuracy (using dict syntax to add extra field)
159
- return LigerGlm4vMoeCausalLMOutputWithPast(
158
+ # Build output kwargs and include aux_loss only if present (depends on transformers version)
159
+ output_kwargs = dict(
160
160
  loss=loss,
161
161
  logits=logits,
162
162
  past_key_values=outputs.past_key_values,
163
163
  hidden_states=outputs.hidden_states,
164
164
  attentions=outputs.attentions,
165
165
  rope_deltas=outputs.rope_deltas,
166
- aux_loss=outputs.aux_loss,
167
166
  token_accuracy=token_accuracy,
168
167
  )
168
+ if hasattr(outputs, "aux_loss"):
169
+ output_kwargs["aux_loss"] = outputs.aux_loss
170
+
171
+ # Return GLM4V MoE output with accuracy
172
+ return LigerGlm4vMoeCausalLMOutputWithPast(**output_kwargs)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: liger_kernel_nightly
3
- Version: 0.6.3.dev20251105235313
3
+ Version: 0.6.3.dev20251106220336
4
4
  Summary: Efficient Triton kernels for LLM Training
5
5
  License: BSD 2-CLAUSE LICENSE
6
6
  Copyright 2024 LinkedIn Corporation
@@ -79,7 +79,7 @@ liger_kernel/transformers/model/gemma2.py,sha256=qa9Ok42vFojVGNmASTH3Ek566Vu507k
79
79
  liger_kernel/transformers/model/gemma3.py,sha256=mEV3Kuy-dqfTk_b899Vb-InuD4_DvwH0nm5xgbG-0MM,14911
80
80
  liger_kernel/transformers/model/glm4.py,sha256=bSp22iPIjsli4-c_usUOsyh1Bs2gIK8X6ynS0azseUs,5900
81
81
  liger_kernel/transformers/model/glm4v.py,sha256=dd-BQpccDCp1SbIxcJ5rG8xcwYQK3KOv1Tgm9TGnZc4,6594
82
- liger_kernel/transformers/model/glm4v_moe.py,sha256=4UH3HGOWFZejfwLzC-bikwD7y2qQYDstYQWSCsWj2mo,6979
82
+ liger_kernel/transformers/model/glm4v_moe.py,sha256=zKhMdOOrRhlrvCSFaeVYfddL1ubpY8edEO91TN81n98,7135
83
83
  liger_kernel/transformers/model/internvl.py,sha256=OOutracs9qrPHSU7FVYar08yinvGrHQVPvo39JEws6w,6473
84
84
  liger_kernel/transformers/model/llama.py,sha256=kqZeONzwTBzudoChlKMzq1w23BtYGbxWZC1l1V__JTw,13410
85
85
  liger_kernel/transformers/model/llama4.py,sha256=PfkynGVI0xxMs3EtyYpCgaALI6stu25OIrTIymE-pvg,4853
@@ -106,9 +106,9 @@ liger_kernel/transformers/trainer/__init__.py,sha256=p7yQfklV8-467qSz_ZMimkbDF7H
106
106
  liger_kernel/transformers/trainer/orpo_trainer.py,sha256=tX0h63aOFe3rNqTmk6JpMf75UPo981yzEa6TghnjS0Q,5370
107
107
  liger_kernel/triton/__init__.py,sha256=qCiCamzCRv6lpV8IqpAc9YMdNKC7GKurClWceQPnlis,92
108
108
  liger_kernel/triton/monkey_patch.py,sha256=Rd0hUHAzDkFfHvnX7-PBaNK5EKnZhtfM_h-fgQH9HPY,1568
109
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
110
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/METADATA,sha256=6KnnAgqnY1JVClGWaYcFr7Q37aHNnKEHRS6RoDD5_ys,24777
111
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
112
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
113
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
114
- liger_kernel_nightly-0.6.3.dev20251105235313.dist-info/RECORD,,
109
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/LICENSE,sha256=OhzLDHJ0to4a8sodVLELZiCFylZ1NAAYLs-HrjPy0ag,1312
110
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/METADATA,sha256=dy_9atp4YioeU8GBh82zuDxFpz-nYGyfStlvUa4RxwY,24777
111
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/NOTICE,sha256=njwnoPZLh9AN8SJQzxvCGLHi-8X__AvWRze6joNXIY8,2066
112
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
113
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/top_level.txt,sha256=2eghu4hA3LnkM7ElW92tQ8zegWKgSbeo-k-aGe1YnvY,13
114
+ liger_kernel_nightly-0.6.3.dev20251106220336.dist-info/RECORD,,