transformers 4.57.3__py3-none-any.whl → 4.57.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- transformers/__init__.py +1 -1
- transformers/generation/utils.py +4 -2
- transformers/models/apertus/modeling_apertus.py +1 -1
- transformers/models/arcee/modeling_arcee.py +1 -1
- transformers/models/aria/modeling_aria.py +1 -1
- transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +1 -1
- transformers/models/aya_vision/modeling_aya_vision.py +1 -1
- transformers/models/aya_vision/modular_aya_vision.py +1 -1
- transformers/models/bitnet/modeling_bitnet.py +1 -1
- transformers/models/blip_2/modeling_blip_2.py +1 -1
- transformers/models/blt/modeling_blt.py +2 -2
- transformers/models/blt/modular_blt.py +2 -2
- transformers/models/cohere/modeling_cohere.py +1 -1
- transformers/models/cohere2/modeling_cohere2.py +1 -1
- transformers/models/cohere2_vision/modeling_cohere2_vision.py +2 -2
- transformers/models/cohere2_vision/modular_cohere2_vision.py +2 -2
- transformers/models/csm/modeling_csm.py +2 -2
- transformers/models/csm/modular_csm.py +2 -2
- transformers/models/deepseek_v2/modeling_deepseek_v2.py +1 -1
- transformers/models/deepseek_v3/modeling_deepseek_v3.py +1 -1
- transformers/models/diffllama/modeling_diffllama.py +1 -1
- transformers/models/dinov2/modeling_dinov2.py +1 -1
- transformers/models/dinov2_with_registers/modeling_dinov2_with_registers.py +1 -1
- transformers/models/doge/modeling_doge.py +1 -1
- transformers/models/dots1/modeling_dots1.py +1 -1
- transformers/models/edgetam/modeling_edgetam.py +2 -2
- transformers/models/edgetam/modular_edgetam.py +1 -1
- transformers/models/efficientloftr/modeling_efficientloftr.py +1 -1
- transformers/models/emu3/modeling_emu3.py +1 -1
- transformers/models/eomt/modeling_eomt.py +1 -1
- transformers/models/eomt/modular_eomt.py +1 -1
- transformers/models/ernie4_5/modeling_ernie4_5.py +1 -1
- transformers/models/ernie4_5_moe/modeling_ernie4_5_moe.py +1 -1
- transformers/models/ernie4_5_moe/modular_ernie4_5_moe.py +1 -1
- transformers/models/esm/modeling_esm.py +1 -1
- transformers/models/evolla/modeling_evolla.py +2 -2
- transformers/models/evolla/modular_evolla.py +2 -2
- transformers/models/exaone4/modeling_exaone4.py +1 -1
- transformers/models/exaone4/modular_exaone4.py +1 -1
- transformers/models/flex_olmo/modeling_flex_olmo.py +1 -1
- transformers/models/flex_olmo/modular_flex_olmo.py +1 -1
- transformers/models/gemma/modeling_gemma.py +1 -1
- transformers/models/gemma2/modeling_gemma2.py +1 -1
- transformers/models/gemma3/modeling_gemma3.py +1 -1
- transformers/models/glm/modeling_glm.py +1 -1
- transformers/models/glm4/modeling_glm4.py +1 -1
- transformers/models/glm4_moe/modeling_glm4_moe.py +1 -1
- transformers/models/glm4v/modeling_glm4v.py +1 -1
- transformers/models/glm4v/modular_glm4v.py +1 -1
- transformers/models/glm4v_moe/modeling_glm4v_moe.py +1 -1
- transformers/models/gpt_neox/modeling_gpt_neox.py +1 -1
- transformers/models/gpt_oss/modeling_gpt_oss.py +1 -1
- transformers/models/gpt_oss/modular_gpt_oss.py +1 -1
- transformers/models/granite/modeling_granite.py +1 -1
- transformers/models/helium/modeling_helium.py +1 -1
- transformers/models/hunyuan_v1_dense/modeling_hunyuan_v1_dense.py +1 -1
- transformers/models/hunyuan_v1_moe/modeling_hunyuan_v1_moe.py +1 -1
- transformers/models/idefics/modeling_idefics.py +1 -1
- transformers/models/instructblip/modeling_instructblip.py +1 -1
- transformers/models/instructblipvideo/modeling_instructblipvideo.py +1 -1
- transformers/models/lfm2/modeling_lfm2.py +1 -1
- transformers/models/llama/modeling_llama.py +1 -1
- transformers/models/llama4/modeling_llama4.py +1 -1
- transformers/models/longcat_flash/modeling_longcat_flash.py +1 -1
- transformers/models/minimax/modeling_minimax.py +1 -1
- transformers/models/minimax/modular_minimax.py +1 -1
- transformers/models/ministral/modeling_ministral.py +1 -1
- transformers/models/ministral/modular_ministral.py +1 -1
- transformers/models/mistral/modeling_mistral.py +1 -1
- transformers/models/mistral/modular_mistral.py +1 -1
- transformers/models/mixtral/modeling_mixtral.py +1 -1
- transformers/models/mllama/modeling_mllama.py +3 -3
- transformers/models/modernbert_decoder/modeling_modernbert_decoder.py +1 -1
- transformers/models/modernbert_decoder/modular_modernbert_decoder.py +1 -1
- transformers/models/moonshine/modeling_moonshine.py +2 -2
- transformers/models/moonshine/modular_moonshine.py +2 -2
- transformers/models/olmo/modeling_olmo.py +1 -1
- transformers/models/olmo2/modeling_olmo2.py +1 -1
- transformers/models/olmo3/modeling_olmo3.py +1 -1
- transformers/models/parakeet/modeling_parakeet.py +1 -1
- transformers/models/parakeet/modular_parakeet.py +1 -1
- transformers/models/phi/modeling_phi.py +1 -1
- transformers/models/phi3/modeling_phi3.py +1 -1
- transformers/models/phi4_multimodal/modeling_phi4_multimodal.py +1 -1
- transformers/models/phi4_multimodal/modular_phi4_multimodal.py +1 -1
- transformers/models/qwen2/modeling_qwen2.py +1 -1
- transformers/models/qwen2/modular_qwen2.py +1 -1
- transformers/models/qwen3/modeling_qwen3.py +1 -1
- transformers/models/qwen3_moe/modeling_qwen3_moe.py +1 -1
- transformers/models/qwen3_next/modeling_qwen3_next.py +1 -1
- transformers/models/qwen3_next/modular_qwen3_next.py +1 -1
- transformers/models/qwen3_omni_moe/modeling_qwen3_omni_moe.py +4 -4
- transformers/models/qwen3_omni_moe/modular_qwen3_omni_moe.py +1 -1
- transformers/models/qwen3_vl/modeling_qwen3_vl.py +3 -3
- transformers/models/qwen3_vl/modular_qwen3_vl.py +3 -3
- transformers/models/qwen3_vl_moe/modeling_qwen3_vl_moe.py +3 -3
- transformers/models/sam/modeling_sam.py +1 -1
- transformers/models/sam2/modeling_sam2.py +3 -3
- transformers/models/sam2/modular_sam2.py +3 -3
- transformers/models/sam_hq/modeling_sam_hq.py +1 -1
- transformers/models/seed_oss/modeling_seed_oss.py +1 -1
- transformers/models/siglip/modeling_siglip.py +1 -1
- transformers/models/siglip2/modeling_siglip2.py +1 -1
- transformers/models/smollm3/modeling_smollm3.py +1 -1
- transformers/models/starcoder2/modeling_starcoder2.py +1 -1
- transformers/models/starcoder2/modular_starcoder2.py +1 -1
- transformers/models/t5gemma/modeling_t5gemma.py +2 -2
- transformers/models/t5gemma/modular_t5gemma.py +2 -2
- transformers/models/vaultgemma/modeling_vaultgemma.py +1 -1
- transformers/models/voxtral/modeling_voxtral.py +1 -1
- transformers/models/voxtral/modular_voxtral.py +1 -1
- transformers/tokenization_utils_base.py +6 -1
- transformers/utils/generic.py +3 -1
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/METADATA +1 -1
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/RECORD +119 -119
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/WHEEL +0 -0
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/entry_points.txt +0 -0
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/licenses/LICENSE +0 -0
- {transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/top_level.txt +0 -0
transformers/models/starcoder2/modular_starcoder2.py CHANGED

```diff
@@ -150,7 +150,7 @@ class Starcoder2Model(MistralModel):
         self.norm = nn.LayerNorm(config.hidden_size, eps=config.norm_epsilon)
         self.embedding_dropout = config.embedding_dropout
 
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
```
transformers/models/t5gemma/modeling_t5gemma.py CHANGED

```diff
@@ -707,7 +707,7 @@ class T5GemmaEncoder(T5GemmaPreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()
 
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -791,7 +791,7 @@ class T5GemmaDecoder(T5GemmaEncoder):
 
         self.post_init()
 
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
```
transformers/models/t5gemma/modular_t5gemma.py CHANGED

```diff
@@ -559,7 +559,7 @@ class T5GemmaEncoder(T5GemmaPreTrainedModel):
         # Initialize weights and apply final processing
         self.post_init()
 
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
@@ -643,7 +643,7 @@ class T5GemmaDecoder(T5GemmaEncoder):
 
         self.post_init()
 
-    @check_model_inputs
+    @check_model_inputs
     def forward(
         self,
         input_ids: Optional[torch.LongTensor] = None,
```
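The model-file hunks above all center on the `@check_model_inputs` decorator line that sits directly above `forward`. As orientation, here is a simplified stand-in for a decorator in that position (not the implementation in `transformers/utils/generic.py`, which additionally records intermediate layer outputs without forward hooks): it wraps `forward` and normalizes recording flags such as `output_hidden_states` before the call.

```python
# Simplified stand-in for a check_model_inputs-style decorator; the real one
# in transformers/utils/generic.py also intercepts layer outputs without
# registering forward hooks.
import functools

def intercept_inputs(forward):
    @functools.wraps(forward)
    def wrapper(self, *args, **kwargs):
        # Fall back to the model config when the caller did not pass the flag,
        # so the wrapped forward() always sees an explicit value.
        flag = kwargs.pop("output_hidden_states", None)
        if flag is None:
            flag = getattr(self.config, "output_hidden_states", False)
        return forward(self, *args, output_hidden_states=flag, **kwargs)

    return wrapper

class ToyModel:
    class config:
        output_hidden_states = True

    @intercept_inputs  # bare decorator usage, as in the hunks above
    def forward(self, x, output_hidden_states=False):
        return {"last_hidden_state": x, "output_hidden_states": output_hidden_states}

print(ToyModel().forward("hi"))  # flag filled in from the config
```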
transformers/tokenization_utils_base.py CHANGED

```diff
@@ -2435,7 +2435,12 @@ class PreTrainedTokenizerBase(SpecialTokensMixin, PushToHubMixin):
                 return True
             return False
 
-        if
+        if is_offline_mode():
+            _is_local = True
+
+        if pretrained_model_name_or_path is not None and (
+            _is_local or (not _is_local and is_base_mistral(pretrained_model_name_or_path))
+        ):
             _config_file = cached_file(
                 pretrained_model_name_or_path,
                 "config.json",
```
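For context, `is_offline_mode()` is an existing helper in `transformers.utils` that reports whether offline mode was requested through the `HF_HUB_OFFLINE` (or legacy `TRANSFORMERS_OFFLINE`) environment variable; the new lines use it to short-circuit the `is_base_mistral(...)` check when no network access is expected. A minimal sketch of that guard pattern, assuming the flag is set before the library is imported (it is read at import time):

```python
# Minimal sketch of the offline-mode guard added above. Set the environment
# variable before importing transformers: the flag is captured at import time.
import os

os.environ["HF_HUB_OFFLINE"] = "1"

from transformers.utils import is_offline_mode

_is_local = False
if is_offline_mode():
    # Offline: treat the target as local so no hub lookup is attempted and
    # resolution falls back to files already on disk or in the local cache.
    _is_local = True

print(_is_local)  # True under HF_HUB_OFFLINE=1
```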
transformers/utils/generic.py CHANGED

```diff
@@ -944,7 +944,7 @@ class OutputRecorder:
     class_name: Optional[str] = None
 
 
-def check_model_inputs(tie_last_hidden_states=True):
+def check_model_inputs(func=None, *, tie_last_hidden_states=True):
     """
     Decorator to intercept specific layer outputs without using hooks.
     Compatible with torch.compile (Dynamo tracing).
@@ -1115,6 +1115,8 @@ def check_model_inputs(tie_last_hidden_states=True):
 
         return wrapper
 
+    if func is not None:
+        return wrapped_fn(func)
     return wrapped_fn
 
 
```
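This signature change is the standard optional-argument decorator pattern: taking the decorated function as an optional first positional argument lets the same decorator work both bare (`@check_model_inputs`, as in the modeling hunks above) and with keyword arguments (e.g. `@check_model_inputs(tie_last_hidden_states=False)`). A self-contained sketch of the pattern with toy names:

```python
# Generic sketch of the func=None decorator pattern from the fix above;
# `traced` and `label` are toy names, not transformers code.
import functools

def traced(func=None, *, label="call"):
    def wrapped_fn(f):
        @functools.wraps(f)
        def wrapper(*args, **kwargs):
            print(f"{label}: entering {f.__name__}")
            return f(*args, **kwargs)
        return wrapper

    # Bare usage (@traced): Python passes the function itself as `func`,
    # so apply the real decorator immediately.
    if func is not None:
        return wrapped_fn(func)
    # Parenthesized usage (@traced(...)): return the decorator to be applied.
    return wrapped_fn

@traced
def f():
    return 1

@traced(label="timed")
def g():
    return 2

f()  # prints "call: entering f"
g()  # prints "timed: entering g"
```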
{transformers-4.57.3.dist-info → transformers-4.57.4.dist-info}/METADATA CHANGED

```diff
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: transformers
-Version: 4.57.3
+Version: 4.57.4
 Summary: State-of-the-art Machine Learning for JAX, PyTorch and TensorFlow
 Home-page: https://github.com/huggingface/transformers
 Author: The Hugging Face team (past and future) with the help of all our contributors (https://github.com/huggingface/transformers/graphs/contributors)
```