transformers 4.57.2-py3-none-any.whl → 4.57.4-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- transformers/__init__.py +1 -1
- transformers/generation/utils.py +4 -2
- transformers/models/apertus/modeling_apertus.py +1 -1
- transformers/models/arcee/modeling_arcee.py +1 -1
- transformers/models/aria/modeling_aria.py +1 -1
- transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +1 -1
- transformers/models/aya_vision/modeling_aya_vision.py +1 -1
- transformers/models/aya_vision/modular_aya_vision.py +1 -1
- transformers/models/bitnet/modeling_bitnet.py +1 -1
- transformers/models/blip_2/modeling_blip_2.py +1 -1
- transformers/models/blt/modeling_blt.py +2 -2
- transformers/models/blt/modular_blt.py +2 -2
- transformers/models/cohere/modeling_cohere.py +1 -1
- transformers/models/cohere2/modeling_cohere2.py +1 -1
- transformers/models/cohere2_vision/modeling_cohere2_vision.py +2 -2
- transformers/models/cohere2_vision/modular_cohere2_vision.py +2 -2
- transformers/models/csm/modeling_csm.py +2 -2
- transformers/models/csm/modular_csm.py +2 -2
- transformers/models/deepseek_v2/modeling_deepseek_v2.py +1 -1
- transformers/models/deepseek_v3/modeling_deepseek_v3.py +1 -1
- transformers/models/diffllama/modeling_diffllama.py +1 -1
- transformers/models/dinov2/modeling_dinov2.py +1 -1
- transformers/models/dinov2_with_registers/modeling_dinov2_with_registers.py +1 -1
- transformers/models/doge/modeling_doge.py +1 -1
- transformers/models/dots1/modeling_dots1.py +1 -1
- transformers/models/edgetam/modeling_edgetam.py +2 -2
- transformers/models/edgetam/modular_edgetam.py +1 -1
- transformers/models/efficientloftr/modeling_efficientloftr.py +1 -1
- transformers/models/emu3/modeling_emu3.py +1 -1
- transformers/models/eomt/modeling_eomt.py +1 -1
- transformers/models/eomt/modular_eomt.py +1 -1
- transformers/models/ernie4_5/modeling_ernie4_5.py +1 -1
- transformers/models/ernie4_5_moe/modeling_ernie4_5_moe.py +1 -1
- transformers/models/ernie4_5_moe/modular_ernie4_5_moe.py +1 -1
- transformers/models/esm/modeling_esm.py +1 -1
- transformers/models/evolla/modeling_evolla.py +2 -2
- transformers/models/evolla/modular_evolla.py +2 -2
- transformers/models/exaone4/modeling_exaone4.py +1 -1
- transformers/models/exaone4/modular_exaone4.py +1 -1
- transformers/models/flex_olmo/modeling_flex_olmo.py +1 -1
- transformers/models/flex_olmo/modular_flex_olmo.py +1 -1
- transformers/models/gemma/modeling_gemma.py +1 -1
- transformers/models/gemma2/modeling_gemma2.py +1 -1
- transformers/models/gemma3/modeling_gemma3.py +1 -1
- transformers/models/glm/modeling_glm.py +1 -1
- transformers/models/glm4/modeling_glm4.py +1 -1
- transformers/models/glm4_moe/modeling_glm4_moe.py +1 -1
- transformers/models/glm4v/modeling_glm4v.py +1 -1
- transformers/models/glm4v/modular_glm4v.py +1 -1
- transformers/models/glm4v_moe/modeling_glm4v_moe.py +1 -1
- transformers/models/gpt_neox/modeling_gpt_neox.py +1 -1
- transformers/models/gpt_oss/modeling_gpt_oss.py +1 -1
- transformers/models/gpt_oss/modular_gpt_oss.py +1 -1
- transformers/models/granite/modeling_granite.py +1 -1
- transformers/models/helium/modeling_helium.py +1 -1
- transformers/models/hunyuan_v1_dense/modeling_hunyuan_v1_dense.py +1 -1
- transformers/models/hunyuan_v1_moe/modeling_hunyuan_v1_moe.py +1 -1
- transformers/models/idefics/modeling_idefics.py +1 -1
- transformers/models/instructblip/modeling_instructblip.py +1 -1
- transformers/models/instructblipvideo/modeling_instructblipvideo.py +1 -1
- transformers/models/lfm2/modeling_lfm2.py +1 -1
- transformers/models/llama/modeling_llama.py +1 -1
- transformers/models/llama4/modeling_llama4.py +1 -1
- transformers/models/longcat_flash/modeling_longcat_flash.py +1 -1
- transformers/models/minimax/modeling_minimax.py +1 -1
- transformers/models/minimax/modular_minimax.py +1 -1
- transformers/models/ministral/modeling_ministral.py +1 -1
- transformers/models/ministral/modular_ministral.py +1 -1
- transformers/models/mistral/modeling_mistral.py +1 -1
- transformers/models/mistral/modular_mistral.py +1 -1
- transformers/models/mixtral/modeling_mixtral.py +1 -1
- transformers/models/mllama/modeling_mllama.py +3 -3
- transformers/models/modernbert_decoder/modeling_modernbert_decoder.py +1 -1
- transformers/models/modernbert_decoder/modular_modernbert_decoder.py +1 -1
- transformers/models/moonshine/modeling_moonshine.py +2 -2
- transformers/models/moonshine/modular_moonshine.py +2 -2
- transformers/models/olmo/modeling_olmo.py +1 -1
- transformers/models/olmo2/modeling_olmo2.py +1 -1
- transformers/models/olmo3/modeling_olmo3.py +1 -1
- transformers/models/parakeet/modeling_parakeet.py +1 -1
- transformers/models/parakeet/modular_parakeet.py +1 -1
- transformers/models/phi/modeling_phi.py +1 -1
- transformers/models/phi3/modeling_phi3.py +1 -1
- transformers/models/phi4_multimodal/modeling_phi4_multimodal.py +1 -1
- transformers/models/phi4_multimodal/modular_phi4_multimodal.py +1 -1
- transformers/models/qwen2/modeling_qwen2.py +1 -1
- transformers/models/qwen2/modular_qwen2.py +1 -1
- transformers/models/qwen3/modeling_qwen3.py +1 -1
- transformers/models/qwen3_moe/modeling_qwen3_moe.py +1 -1
- transformers/models/qwen3_next/modeling_qwen3_next.py +1 -1
- transformers/models/qwen3_next/modular_qwen3_next.py +1 -1
- transformers/models/qwen3_omni_moe/modeling_qwen3_omni_moe.py +4 -4
- transformers/models/qwen3_omni_moe/modular_qwen3_omni_moe.py +1 -1
- transformers/models/qwen3_vl/modeling_qwen3_vl.py +3 -3
- transformers/models/qwen3_vl/modular_qwen3_vl.py +3 -3
- transformers/models/qwen3_vl_moe/modeling_qwen3_vl_moe.py +3 -3
- transformers/models/sam/modeling_sam.py +1 -1
- transformers/models/sam2/modeling_sam2.py +3 -3
- transformers/models/sam2/modular_sam2.py +3 -3
- transformers/models/sam_hq/modeling_sam_hq.py +1 -1
- transformers/models/seed_oss/modeling_seed_oss.py +1 -1
- transformers/models/siglip/modeling_siglip.py +1 -1
- transformers/models/siglip2/modeling_siglip2.py +1 -1
- transformers/models/smollm3/modeling_smollm3.py +1 -1
- transformers/models/starcoder2/modeling_starcoder2.py +1 -1
- transformers/models/starcoder2/modular_starcoder2.py +1 -1
- transformers/models/t5gemma/modeling_t5gemma.py +2 -2
- transformers/models/t5gemma/modular_t5gemma.py +2 -2
- transformers/models/vaultgemma/modeling_vaultgemma.py +1 -1
- transformers/models/voxtral/modeling_voxtral.py +1 -1
- transformers/models/voxtral/modular_voxtral.py +1 -1
- transformers/tokenization_utils_base.py +88 -32
- transformers/utils/generic.py +3 -1
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/METADATA +1 -1
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/RECORD +119 -119
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/WHEEL +0 -0
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/entry_points.txt +0 -0
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/licenses/LICENSE +0 -0
- {transformers-4.57.2.dist-info → transformers-4.57.4.dist-info}/top_level.txt +0 -0
@@ -943,7 +943,7 @@ class IdeficsModel(IdeficsPreTrainedModel):
     def freeze_vision_layers(self, module_exceptions=[]):
         freeze_model(self.vision_model, module_exceptions=module_exceptions)

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -915,7 +915,7 @@ class InstructBlipQFormerModel(InstructBlipPreTrainedModel):
         extended_attention_mask = (1.0 - extended_attention_mask) * -10000.0
         return extended_attention_mask

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -877,7 +877,7 @@ class InstructBlipVideoQFormerModel(InstructBlipVideoPreTrainedModel):
         extended_attention_mask = (1.0 - extended_attention_mask) * -10000.0
         return extended_attention_mask

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -993,7 +993,7 @@ class MllamaVisionModel(MllamaPreTrainedModel):
         hidden_state = torch.cat([class_embedding, hidden_state], dim=1)
         return hidden_state

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self, pixel_values: torch.Tensor, aspect_ratio_ids: torch.Tensor, aspect_ratio_mask: torch.Tensor, **kwargs
@@ -1161,7 +1161,7 @@ class MllamaTextModel(MllamaPreTrainedModel):
         self.gradient_checkpointing = False
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @can_return_tuple
     @auto_docstring
     def forward(
@@ -1429,7 +1429,7 @@ class MllamaModel(MllamaPreTrainedModel):
     def get_decoder(self):
         return self.language_model

-    @check_model_inputs
+    @check_model_inputs
     @can_return_tuple
     @auto_docstring
     def forward(
@@ -520,7 +520,7 @@ class MoonshineEncoder(MoonshinePreTrainedModel):
     def set_input_embeddings(self, value: nn.Module):
         self.conv1 = value

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_values: torch.FloatTensor,
@@ -605,7 +605,7 @@ class MoonshineDecoder(MoonshinePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -552,7 +552,7 @@ class MoonshineEncoder(MoonshinePreTrainedModel):
     def set_input_embeddings(self, value: nn.Module):
         self.conv1 = value

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_values: torch.FloatTensor,
@@ -627,7 +627,7 @@ class MoonshineDecoder(LlamaModel):
             [MoonshineDecoderLayer(config, idx) for idx in range(config.decoder_num_hidden_layers)]
         )

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -1562,7 +1562,7 @@ class Phi4MultimodalModel(Phi4MultimodalPreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -1472,7 +1472,7 @@ class Phi4MultimodalModel(Phi3Model):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -1628,7 +1628,7 @@ class Qwen3OmniMoeThinkerTextModel(Qwen3OmniMoePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -2480,7 +2480,7 @@ class Qwen3OmniMoeTalkerCodePredictorModel(Qwen3OmniMoePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -2852,7 +2852,7 @@ class Qwen3OmniMoeTalkerModel(Qwen3OmniMoePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -3542,7 +3542,7 @@ class Qwen3OmniMoeCode2WavTransformerModel(Qwen3OmniMoePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -779,7 +779,7 @@ class Qwen3VLTextModel(Qwen3VLPreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -1104,7 +1104,7 @@ class Qwen3VLModel(Qwen3VLPreTrainedModel):
         return special_image_mask, special_video_mask

     @auto_docstring
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -1311,7 +1311,7 @@ class Qwen3VLForConditionalGeneration(Qwen3VLPreTrainedModel, GenerationMixin):
     def visual(self):
         return self.model.visual

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -749,7 +749,7 @@ class Qwen3VLTextModel(Qwen3VLPreTrainedModel, Qwen3Model):
         hidden_states[visual_pos_masks, :] = local_this
         return hidden_states

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -1006,7 +1006,7 @@ class Qwen3VLModel(Qwen2_5_VLModel):
         return self.get_image_features(pixel_values_videos, video_grid_thw)

     @auto_docstring
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -1149,7 +1149,7 @@ class Qwen3VLForConditionalGeneration(Qwen2_5_VLForConditionalGeneration):
     config: Qwen3VLConfig
     _checkpoint_conversion_mapping = {}

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -891,7 +891,7 @@ class Qwen3VLMoeTextModel(Qwen3VLMoePreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -1270,7 +1270,7 @@ class Qwen3VLMoeModel(Qwen3VLMoePreTrainedModel):
         return special_image_mask, special_video_mask

     @auto_docstring
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -1530,7 +1530,7 @@ class Qwen3VLMoeForConditionalGeneration(Qwen3VLMoePreTrainedModel, GenerationMixin):
     def visual(self):
         return self.model.visual

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: torch.LongTensor = None,
@@ -618,7 +618,7 @@ class Sam2HieraDetModel(Sam2PreTrainedModel):
         pos_embed = pos_embed.permute(0, 2, 3, 1)
         return pos_embed

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         pixel_values: Optional[torch.FloatTensor] = None,
@@ -670,7 +670,7 @@ class Sam2VisionModel(Sam2PreTrainedModel):
     def get_input_embeddings(self):
         return self.backbone.get_input_embeddings()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         pixel_values: Optional[torch.FloatTensor] = None,
@@ -1387,7 +1387,7 @@ class Sam2Model(Sam2PreTrainedModel):
         )
         return prompt_output

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -726,7 +726,7 @@ class Sam2HieraDetModel(Sam2PreTrainedModel):
         pos_embed = pos_embed.permute(0, 2, 3, 1)
         return pos_embed

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         pixel_values: Optional[torch.FloatTensor] = None,
@@ -778,7 +778,7 @@ class Sam2VisionModel(Sam2PreTrainedModel):
     def get_input_embeddings(self):
         return self.backbone.get_input_embeddings()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         pixel_values: Optional[torch.FloatTensor] = None,
@@ -1280,7 +1280,7 @@ class Sam2Model(SamModel):

         return feature_maps, feature_maps_position_embeddings, vision_outputs.hidden_states, vision_outputs.attentions

-    @check_model_inputs
+    @check_model_inputs
     @auto_docstring
     def forward(
         self,
@@ -325,7 +325,7 @@ class Starcoder2Model(Starcoder2PreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()

-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,