PyPI - keras-hub-nightly - Versions diffs - 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl - Mend

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (198) hide show

keras_hub/__init__.py +0 -6
keras_hub/api/__init__.py +2 -0
keras_hub/api/bounding_box/__init__.py +36 -0
keras_hub/api/layers/__init__.py +14 -0
keras_hub/api/models/__init__.py +97 -48
keras_hub/api/tokenizers/__init__.py +30 -0
keras_hub/api/utils/__init__.py +22 -0
keras_hub/src/api_export.py +15 -9
keras_hub/src/bounding_box/__init__.py +13 -0
keras_hub/src/bounding_box/converters.py +529 -0
keras_hub/src/bounding_box/formats.py +162 -0
keras_hub/src/bounding_box/iou.py +263 -0
keras_hub/src/bounding_box/to_dense.py +95 -0
keras_hub/src/bounding_box/to_ragged.py +99 -0
keras_hub/src/bounding_box/utils.py +194 -0
keras_hub/src/bounding_box/validate_format.py +99 -0
keras_hub/src/layers/preprocessing/audio_converter.py +121 -0
keras_hub/src/layers/preprocessing/image_converter.py +130 -0
keras_hub/src/layers/preprocessing/masked_lm_mask_generator.py +2 -0
keras_hub/src/layers/preprocessing/multi_segment_packer.py +9 -8
keras_hub/src/layers/preprocessing/preprocessing_layer.py +2 -29
keras_hub/src/layers/preprocessing/random_deletion.py +33 -31
keras_hub/src/layers/preprocessing/random_swap.py +33 -31
keras_hub/src/layers/preprocessing/resizing_image_converter.py +101 -0
keras_hub/src/layers/preprocessing/start_end_packer.py +3 -2
keras_hub/src/models/albert/__init__.py +1 -2
keras_hub/src/models/albert/albert_masked_lm_preprocessor.py +6 -86
keras_hub/src/models/albert/{albert_classifier.py → albert_text_classifier.py} +34 -10
keras_hub/src/models/albert/{albert_preprocessor.py → albert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/albert/albert_tokenizer.py +17 -36
keras_hub/src/models/backbone.py +12 -34
keras_hub/src/models/bart/__init__.py +1 -2
keras_hub/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +21 -148
keras_hub/src/models/bart/bart_tokenizer.py +12 -39
keras_hub/src/models/bert/__init__.py +1 -5
keras_hub/src/models/bert/bert_masked_lm_preprocessor.py +6 -87
keras_hub/src/models/bert/bert_presets.py +1 -4
keras_hub/src/models/bert/{bert_classifier.py → bert_text_classifier.py} +19 -12
keras_hub/src/models/bert/{bert_preprocessor.py → bert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/bert/bert_tokenizer.py +17 -35
keras_hub/src/models/bloom/__init__.py +1 -2
keras_hub/src/models/bloom/bloom_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/bloom/bloom_tokenizer.py +12 -41
keras_hub/src/models/causal_lm.py +10 -29
keras_hub/src/models/causal_lm_preprocessor.py +195 -0
keras_hub/src/models/csp_darknet/csp_darknet_backbone.py +54 -15
keras_hub/src/models/deberta_v3/__init__.py +1 -4
keras_hub/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +14 -77
keras_hub/src/models/deberta_v3/{deberta_v3_classifier.py → deberta_v3_text_classifier.py} +16 -11
keras_hub/src/models/deberta_v3/{deberta_v3_preprocessor.py → deberta_v3_text_classifier_preprocessor.py} +23 -64
keras_hub/src/models/deberta_v3/deberta_v3_tokenizer.py +30 -25
keras_hub/src/models/densenet/densenet_backbone.py +46 -22
keras_hub/src/models/distil_bert/__init__.py +1 -4
keras_hub/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +14 -76
keras_hub/src/models/distil_bert/{distil_bert_classifier.py → distil_bert_text_classifier.py} +17 -12
keras_hub/src/models/distil_bert/{distil_bert_preprocessor.py → distil_bert_text_classifier_preprocessor.py} +23 -63
keras_hub/src/models/distil_bert/distil_bert_tokenizer.py +19 -35
keras_hub/src/models/efficientnet/__init__.py +13 -0
keras_hub/src/models/efficientnet/efficientnet_backbone.py +569 -0
keras_hub/src/models/efficientnet/fusedmbconv.py +229 -0
keras_hub/src/models/efficientnet/mbconv.py +238 -0
keras_hub/src/models/electra/__init__.py +1 -2
keras_hub/src/models/electra/electra_tokenizer.py +17 -32
keras_hub/src/models/f_net/__init__.py +1 -2
keras_hub/src/models/f_net/f_net_masked_lm_preprocessor.py +12 -78
keras_hub/src/models/f_net/{f_net_classifier.py → f_net_text_classifier.py} +17 -10
keras_hub/src/models/f_net/{f_net_preprocessor.py → f_net_text_classifier_preprocessor.py} +19 -63
keras_hub/src/models/f_net/f_net_tokenizer.py +17 -35
keras_hub/src/models/falcon/__init__.py +1 -2
keras_hub/src/models/falcon/falcon_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/falcon/falcon_tokenizer.py +12 -35
keras_hub/src/models/gemma/__init__.py +1 -2
keras_hub/src/models/gemma/gemma_causal_lm_preprocessor.py +6 -90
keras_hub/src/models/gemma/gemma_decoder_block.py +1 -1
keras_hub/src/models/gemma/gemma_tokenizer.py +12 -23
keras_hub/src/models/gpt2/__init__.py +1 -2
keras_hub/src/models/gpt2/gpt2_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/gpt2/gpt2_preprocessor.py +12 -90
keras_hub/src/models/gpt2/gpt2_tokenizer.py +12 -34
keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +12 -34
keras_hub/src/models/image_classifier.py +0 -5
keras_hub/src/models/image_classifier_preprocessor.py +83 -0
keras_hub/src/models/llama/__init__.py +1 -2
keras_hub/src/models/llama/llama_causal_lm_preprocessor.py +6 -85
keras_hub/src/models/llama/llama_tokenizer.py +12 -25
keras_hub/src/models/llama3/__init__.py +1 -2
keras_hub/src/models/llama3/llama3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/llama3/llama3_tokenizer.py +12 -33
keras_hub/src/models/masked_lm.py +0 -2
keras_hub/src/models/masked_lm_preprocessor.py +156 -0
keras_hub/src/models/mistral/__init__.py +1 -2
keras_hub/src/models/mistral/mistral_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/mistral/mistral_tokenizer.py +12 -23
keras_hub/src/models/mix_transformer/mix_transformer_backbone.py +2 -2
keras_hub/src/models/mobilenet/__init__.py +13 -0
keras_hub/src/models/mobilenet/mobilenet_backbone.py +530 -0
keras_hub/src/models/mobilenet/mobilenet_image_classifier.py +114 -0
keras_hub/src/models/opt/__init__.py +1 -2
keras_hub/src/models/opt/opt_causal_lm_preprocessor.py +6 -93
keras_hub/src/models/opt/opt_tokenizer.py +12 -41
keras_hub/src/models/pali_gemma/__init__.py +1 -4
keras_hub/src/models/pali_gemma/pali_gemma_causal_lm_preprocessor.py +28 -28
keras_hub/src/models/pali_gemma/pali_gemma_image_converter.py +25 -0
keras_hub/src/models/pali_gemma/pali_gemma_presets.py +5 -5
keras_hub/src/models/pali_gemma/pali_gemma_tokenizer.py +11 -3
keras_hub/src/models/phi3/__init__.py +1 -2
keras_hub/src/models/phi3/phi3_causal_lm.py +3 -9
keras_hub/src/models/phi3/phi3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/phi3/phi3_tokenizer.py +12 -36
keras_hub/src/models/preprocessor.py +72 -83
keras_hub/src/models/resnet/__init__.py +6 -0
keras_hub/src/models/resnet/resnet_backbone.py +390 -42
keras_hub/src/models/resnet/resnet_image_classifier.py +33 -6
keras_hub/src/models/resnet/resnet_image_classifier_preprocessor.py +28 -0
keras_hub/src/models/{llama3/llama3_preprocessor.py → resnet/resnet_image_converter.py} +7 -5
keras_hub/src/models/resnet/resnet_presets.py +95 -0
keras_hub/src/models/retinanet/__init__.py +13 -0
keras_hub/src/models/retinanet/anchor_generator.py +175 -0
keras_hub/src/models/retinanet/box_matcher.py +259 -0
keras_hub/src/models/retinanet/non_max_supression.py +578 -0
keras_hub/src/models/roberta/__init__.py +1 -2
keras_hub/src/models/roberta/roberta_masked_lm_preprocessor.py +22 -74
keras_hub/src/models/roberta/{roberta_classifier.py → roberta_text_classifier.py} +16 -11
keras_hub/src/models/roberta/{roberta_preprocessor.py → roberta_text_classifier_preprocessor.py} +21 -53
keras_hub/src/models/roberta/roberta_tokenizer.py +13 -52
keras_hub/src/models/seq_2_seq_lm_preprocessor.py +269 -0
keras_hub/src/models/stable_diffusion_v3/__init__.py +13 -0
keras_hub/src/models/stable_diffusion_v3/clip_encoder_block.py +103 -0
keras_hub/src/models/stable_diffusion_v3/clip_preprocessor.py +93 -0
keras_hub/src/models/stable_diffusion_v3/clip_text_encoder.py +149 -0
keras_hub/src/models/stable_diffusion_v3/clip_tokenizer.py +167 -0
keras_hub/src/models/stable_diffusion_v3/mmdit.py +427 -0
keras_hub/src/models/stable_diffusion_v3/mmdit_block.py +317 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_preprocessor.py +74 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_text_encoder.py +155 -0
keras_hub/src/models/stable_diffusion_v3/vae_attention.py +126 -0
keras_hub/src/models/stable_diffusion_v3/vae_image_decoder.py +186 -0
keras_hub/src/models/t5/__init__.py +1 -2
keras_hub/src/models/t5/t5_tokenizer.py +13 -23
keras_hub/src/models/task.py +71 -116
keras_hub/src/models/{classifier.py → text_classifier.py} +19 -13
keras_hub/src/models/text_classifier_preprocessor.py +138 -0
keras_hub/src/models/whisper/__init__.py +1 -2
keras_hub/src/models/whisper/{whisper_audio_feature_extractor.py → whisper_audio_converter.py} +20 -18
keras_hub/src/models/whisper/whisper_backbone.py +0 -3
keras_hub/src/models/whisper/whisper_presets.py +10 -10
keras_hub/src/models/whisper/whisper_tokenizer.py +20 -16
keras_hub/src/models/xlm_roberta/__init__.py +1 -4
keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +26 -72
keras_hub/src/models/xlm_roberta/{xlm_roberta_classifier.py → xlm_roberta_text_classifier.py} +16 -11
keras_hub/src/models/xlm_roberta/{xlm_roberta_preprocessor.py → xlm_roberta_text_classifier_preprocessor.py} +26 -53
keras_hub/src/models/xlm_roberta/xlm_roberta_tokenizer.py +25 -10
keras_hub/src/tests/test_case.py +46 -0
keras_hub/src/tokenizers/byte_pair_tokenizer.py +30 -17
keras_hub/src/tokenizers/byte_tokenizer.py +14 -15
keras_hub/src/tokenizers/sentence_piece_tokenizer.py +20 -7
keras_hub/src/tokenizers/tokenizer.py +67 -32
keras_hub/src/tokenizers/unicode_codepoint_tokenizer.py +14 -15
keras_hub/src/tokenizers/word_piece_tokenizer.py +34 -47
keras_hub/src/utils/imagenet/__init__.py +13 -0
keras_hub/src/utils/imagenet/imagenet_utils.py +1067 -0
keras_hub/src/utils/keras_utils.py +0 -50
keras_hub/src/utils/preset_utils.py +230 -68
keras_hub/src/utils/tensor_utils.py +187 -69
keras_hub/src/utils/timm/convert_resnet.py +19 -16
keras_hub/src/utils/timm/preset_loader.py +66 -0
keras_hub/src/utils/transformers/convert_albert.py +193 -0
keras_hub/src/utils/transformers/convert_bart.py +373 -0
keras_hub/src/utils/transformers/convert_bert.py +7 -17
keras_hub/src/utils/transformers/convert_distilbert.py +10 -20
keras_hub/src/utils/transformers/convert_gemma.py +5 -19
keras_hub/src/utils/transformers/convert_gpt2.py +5 -18
keras_hub/src/utils/transformers/convert_llama3.py +7 -18
keras_hub/src/utils/transformers/convert_mistral.py +129 -0
keras_hub/src/utils/transformers/convert_pali_gemma.py +7 -29
keras_hub/src/utils/transformers/preset_loader.py +77 -0
keras_hub/src/utils/transformers/safetensor_utils.py +2 -2
keras_hub/src/version_utils.py +1 -1
keras_hub_nightly-0.16.0.dev2024092017.dist-info/METADATA +202 -0
keras_hub_nightly-0.16.0.dev2024092017.dist-info/RECORD +334 -0
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/WHEEL +1 -1
keras_hub/src/models/bart/bart_preprocessor.py +0 -276
keras_hub/src/models/bloom/bloom_preprocessor.py +0 -185
keras_hub/src/models/electra/electra_preprocessor.py +0 -154
keras_hub/src/models/falcon/falcon_preprocessor.py +0 -187
keras_hub/src/models/gemma/gemma_preprocessor.py +0 -191
keras_hub/src/models/gpt_neo_x/gpt_neo_x_preprocessor.py +0 -145
keras_hub/src/models/llama/llama_preprocessor.py +0 -189
keras_hub/src/models/mistral/mistral_preprocessor.py +0 -190
keras_hub/src/models/opt/opt_preprocessor.py +0 -188
keras_hub/src/models/phi3/phi3_preprocessor.py +0 -190
keras_hub/src/models/whisper/whisper_preprocessor.py +0 -326
keras_hub/src/utils/timm/convert.py +0 -37
keras_hub/src/utils/transformers/convert.py +0 -101
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/METADATA +0 -34
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/RECORD +0 -297
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/top_level.txt +0 -0

keras_hub/src/utils/tensor_utils.py CHANGED Viewed

@@ -12,7 +12,13 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
+import contextlib
+import functools
+import inspect
+import threading
 import keras
+import numpy as np
 from keras import ops
 try:
@@ -23,6 +29,181 @@ except ImportError:
     tf_text = None
+# Per-thread nesting depth used by `no_convert_scope`. The `count` attribute
+# is created lazily, so readers fall back to 0 when it is missing.
+NO_CONVERT_COUNTER = threading.local()
+@contextlib.contextmanager
+def no_convert_scope():
+    """Disable preprocessing tensor conversion on this thread for the `with` body.
+    The thread-local `NO_CONVERT_COUNTER.count` is incremented on entry and
+    decremented on exit, including when the body raises, so scopes may be
+    nested safely.
+    """
+    counter = NO_CONVERT_COUNTER
+    try:
+        depth = getattr(counter, "count", 0)
+        counter.count = depth + 1
+        yield
+    finally:
+        depth = getattr(counter, "count", 0)
+        counter.count = depth - 1
+def in_no_convert_scope():
+    """Return `True` if the current thread's no-convert depth is above zero."""
+    depth = getattr(NO_CONVERT_COUNTER, "count", 0)
+    return depth > 0
+def preprocessing_function(fn):
+    """Wraps a preprocessing function to handle tf tensor conversion.
+    The returned wrapper runs under `tf.device("cpu")`. It converts its
+    inputs with `convert_preprocessing_inputs`, calls `fn` inside a
+    `no_convert_scope`, and converts the result with
+    `convert_preprocessing_outputs`.
+    Args:
+        fn: A method taking `self` and `x`. If its signature names all of
+            `x`, `y` and `sample_weight`, the wrapper also accepts `y` and
+            `sample_weight` and forwards them to `fn` as keywords.
+    Returns:
+        The wrapped method, or `fn` itself when `tf` is `None`.
+    """
+    if tf is None:
+        return fn
+    params = inspect.signature(fn).parameters
+    # Labels are only forwarded when `fn` declares all three parameters.
+    accepts_labels = all(k in params for k in ("x", "y", "sample_weight"))
+    if not accepts_labels:
+        @functools.wraps(fn)
+        def wrapper(self, x, **kwargs):
+            with tf.device("cpu"):
+                x = convert_preprocessing_inputs(x)
+                # While this scope is active the convert_* helpers return
+                # their input unchanged, so calls made by `fn` do not convert.
+                with no_convert_scope():
+                    x = fn(self, x, **kwargs)
+                return convert_preprocessing_outputs(x)
+    else:
+        @functools.wraps(fn)
+        def wrapper(self, x, y=None, sample_weight=None, **kwargs):
+            with tf.device("cpu"):
+                # The tuple is converted element-wise, one entry per input.
+                x, y, sample_weight = convert_preprocessing_inputs(
+                    (x, y, sample_weight)
+                )
+                # While this scope is active the convert_* helpers return
+                # their input unchanged, so calls made by `fn` do not convert.
+                with no_convert_scope():
+                    x = fn(self, x, y=y, sample_weight=sample_weight, **kwargs)
+                return convert_preprocessing_outputs(x)
+    return wrapper
+def convert_preprocessing_inputs(x):
+    """Convert raw inputs for preprocessing.
+    This function is used to convert raw inputs (strings, lists, `np.ndarray`s,
+    `jax.Array`s, `torch.Tensor`s, etc) to a canonical format for
+    preprocessing layers. All inputs will be converted to backend tensors if
+    possible, except ragged inputs and string inputs which will be converted
+    to tf tensors regardless of backend.
+    `tuple` and `list` elements are handled differently by this function. A
+    `tuple` is assumed to enumerate separate inputs, and a `list` is assumed to
+    enumerate elements in a single array-like input. This makes it possible to
+    represent ragged and string inputs in a multi-backend format, as shown in
+    the examples below.
+    Args:
+        x: A raw input, or a `dict` / `tuple` structure of raw inputs.
+    Returns:
+        The same structure with its leaves converted. `x` is returned
+        unchanged when not executing eagerly or when called inside a
+        `no_convert_scope`.
+    Raises:
+        ValueError: If a `list` can be converted neither to a numpy array nor
+            to a ragged tensor. The original numpy error is re-raised.
+    Examples:
+    ```python
+    # Two ragged arrays of token ids.
+    x = ([[1, 2, 3], [4, 5]], [[1, 2], [3, 4, 5]])
+    keras_hub.utils.convert_preprocessing_inputs(x)
+    # A batch of three samples each with two string segments.
+    x = (["hi", "hello", "hey"], ["bye", "later", "so long"])
+    keras_hub.utils.convert_preprocessing_inputs(x)
+    # A batch of features in a dictionary.
+    x = {
+        "text": ["hi", "hello", "hey"],
+        "images": np.ones((3, 64, 64, 3)),
+        "labels": [1, 0, 1],
+    }
+    keras_hub.utils.convert_preprocessing_inputs(x)
+    ```
+    """
+    if not tf.executing_eagerly() or in_no_convert_scope():
+        return x
+    if isinstance(x, dict):
+        return {k: convert_preprocessing_inputs(v) for k, v in x.items()}
+    if isinstance(x, tuple):
+        return tuple(convert_preprocessing_inputs(v) for v in x)
+    if isinstance(x, (str, bytes)):
+        return tf.constant(x)
+    if isinstance(x, list):
+        try:
+            numpy_x = np.array(x)
+        except ValueError as e:
+            # If numpy conversion failed, try converting to a ragged array.
+            try:
+                return tf.ragged.constant(x)
+            except ValueError:
+                # If ragged conversion failed return to the numpy error.
+                raise e
+        # If we have a string input, use tf.tensor.
+        if numpy_x.dtype.type in (np.str_, np.bytes_):
+            return tf.convert_to_tensor(x)
+        # Numpy will default to int64, int32 works with more ops.
+        if numpy_x.dtype == np.int64:
+            numpy_x = numpy_x.astype(np.int32)
+        # We have non-ragged, non-string input. Use backend type.
+        x = ops.convert_to_tensor(numpy_x)
+        # Torch will complain about device placement for GPU tensors.
+        if keras.config.backend() == "torch":
+            x = x.cpu()
+        return x
+    if is_tensor_type(x):
+        # String or ragged types we keep as tf.
+        if isinstance(x, tf.RaggedTensor) or x.dtype == tf.string:
+            return x
+        # Numpy string arrays (unicode or bytes, matching the list branch
+        # above) have no backend equivalent, so use tf.tensor.
+        if isinstance(x, np.ndarray) and x.dtype.type in (np.str_, np.bytes_):
+            return tf.convert_to_tensor(x)
+        x = ops.convert_to_tensor(x)
+        # Torch will complain about device placement for GPU tensors.
+        if keras.config.backend() == "torch":
+            x = x.cpu()
+        return x
+    return x
+def convert_preprocessing_outputs(x):
+    """Convert preprocessing outputs to a backend agnostic format.
+    Every leaf of `x` that is a `tf.Tensor` or `tf.RaggedTensor` produced by
+    a preprocessing layer is converted to either:
+    - The tensor type of the active Keras backend framework.
+    - Python lists, in the case of ragged and string data.
+    This is called automatically on the output of preprocessing layers or
+    `keras_hub.models.Task`s with preprocessing included. It can also be
+    used directly to convert a `tf.data.Dataset` output to a backend agnostic
+    type. `None` leaves are passed through, and `x` is returned unchanged
+    when not executing eagerly or when called inside a `no_convert_scope`.
+    Examples:
+    ```python
+    # A ragged array of token ids.
+    x = tf.ragged.constant([[1, 2, 3], [4, 5]])
+    keras_hub.utils.convert_preprocessing_outputs(x)
+    # A batch of three samples each with two string segments.
+    x = (tf.constant(["hi", "yo", "hey"]), tf.constant(["bye", "ciao", ""]))
+    keras_hub.utils.convert_preprocessing_outputs(x)
+    # A batch of features in a dictionary.
+    x = {
+        "text": tf.constant(["hi", "hello", "hey"]),
+        "images": tf.ones((3, 64, 64, 3)),
+        "labels": tf.constant([1, 0, 1]),
+    }
+    keras_hub.utils.convert_preprocessing_outputs(x)
+    ```
+    """
+    skip_conversion = not tf.executing_eagerly() or in_no_convert_scope()
+    if skip_conversion:
+        return x
+    def _to_backend(value):
+        if value is None:
+            return value
+        is_ragged = isinstance(value, tf.RaggedTensor)
+        if is_ragged or value.dtype == tf.string:
+            # No backend-neutral ragged/string tensor type; use Python lists.
+            return tensor_to_list(value)
+        return ops.convert_to_tensor(
+            value, dtype=keras.backend.standardize_dtype(value.dtype)
+        )
+    return keras.tree.map_structure(_to_backend, x)
 def _decode_strings_to_utf8(inputs):
     """Recursively decodes to list of strings with 'utf-8' encoding."""
     if isinstance(inputs, bytes):
@@ -52,75 +233,15 @@ def tensor_to_list(inputs):
     return list_outputs
-def convert_to_backend_tensor_or_python_list(x):
-    """
-    Convert a tensor to the backend friendly representation of the data.
-    This wraps `ops.convert_to_tensor` to account for the fact that torch and
-    jax both lack native types for ragged and string data.
-    If we encounter one of these types in torch or jax, we will instead covert
-    the tensor to simple pythonic types (lists of strings).
-    """
-    if isinstance(x, tf.RaggedTensor) or getattr(x, "dtype", None) == tf.string:
-        return tensor_to_list(x)
-    dtype = getattr(x, "dtype", "float32")
-    dtype = keras.backend.standardize_dtype(dtype)
-    return ops.convert_to_tensor(x, dtype=dtype)
 def convert_to_ragged_batch(inputs):
-    """Convert pythonic or numpy-like input to a 2-D `tf.RaggedTensor`.
-    This is useful for text preprocessing layers which deal with already
-    tokenized or split text.
-    Args:
-        inputs: A pythonic or numpy-like input to covert. This input should
-            represent a possibly batched list of token sequences.
-    Returns:
-        An `(inputs, unbatched, rectangular)` tuple, where `inputs` is a
-        2-D `tf.RaggedTensor`, `unbatched` is `True` if the inputs were
-        origianlly rank 1, and `rectangular` is `True` if the inputs rows are
-        all of equal lengths.
-    """
-    # `tf.keras.layers.Layer` does a weird conversion in __call__, where a list
-    # of lists of ints will become a list of list of scalar tensors. We could
-    # clean this up if we no longer need to care about that case.
-    if isinstance(inputs, (list, tuple)):
-        if isinstance(inputs[0], (list, tuple)):
-            rectangular = len(set([len(row) for row in inputs])) == 1
-            rows = [
-                tf.convert_to_tensor(row, dtype_hint="int32") for row in inputs
-            ]
-            inputs = tf.ragged.stack(rows).with_row_splits_dtype("int64")
-        else:
-            inputs = tf.convert_to_tensor(inputs)
-            rectangular = True
-    elif isinstance(inputs, tf.Tensor):
-        rectangular = True
-    elif isinstance(inputs, tf.RaggedTensor):
-        rectangular = False
-    elif hasattr(inputs, "__array__"):
-        inputs = tf.convert_to_tensor(ops.convert_to_numpy(inputs))
-        rectangular = True
-    else:
-        raise ValueError(
-            f"Unknown tensor type. Tensor input can be passed as "
-            "tensors, numpy arrays, or python lists. Received: "
-            f"`type(inputs)={type(inputs)}`"
-        )
-    if inputs.shape.rank < 1 or inputs.shape.rank > 2:
-        raise ValueError(
-            f"Tokenized tensor input should be rank 1 (unbatched) or "
-            f"rank 2 (batched). Received: `inputs.shape={input.shape}`"
-        )
+    """Ensure a tf.Tensor is a ragged rank 2 tensor."""
+    if not isinstance(inputs, (tf.RaggedTensor, tf.Tensor)):
+        inputs = tf.convert_to_tensor(inputs)
     unbatched = inputs.shape.rank == 1
-    rectangular = rectangular or unbatched
+    rectangular = isinstance(inputs, tf.Tensor)
     if unbatched:
         inputs = tf.expand_dims(inputs, 0)
-    if isinstance(inputs, tf.Tensor):
+    if rectangular:
         inputs = tf.RaggedTensor.from_tensor(inputs)
     return inputs, unbatched, rectangular
@@ -135,10 +256,7 @@ def truncate_at_token(inputs, token, mask):
 def strip_to_ragged(token_ids, mask, ids_to_strip):
     """Remove masked and special tokens from a sequence before detokenizing."""
-    token_ids = ops.convert_to_numpy(token_ids)
-    token_ids = token_ids.astype("int32")
-    mask = ops.convert_to_numpy(mask)
-    mask = mask.astype("bool")
+    mask = tf.cast(mask, "bool")
     for id in ids_to_strip:
         mask = mask & (token_ids != id)
     return tf.ragged.boolean_mask(token_ids, mask)

keras_hub/src/utils/timm/convert_resnet.py CHANGED Viewed

@@ -13,10 +13,9 @@
 # limitations under the License.
 import numpy as np
-from keras_hub.src.utils.preset_utils import HF_CONFIG_FILE
-from keras_hub.src.utils.preset_utils import jax_memory_cleanup
-from keras_hub.src.utils.preset_utils import load_config
-from keras_hub.src.utils.transformers.safetensor_utils import SafetensorLoader
+from keras_hub.src.models.resnet.resnet_backbone import ResNetBackbone
+# Backbone class associated with this converter module; preset loaders read
+# it through the module attribute `backbone_cls`.
+backbone_cls = ResNetBackbone
 def convert_backbone_config(timm_config):
@@ -56,6 +55,8 @@ def convert_backbone_config(timm_config):
         stackwise_num_strides=[1, 2, 2, 2],
         block_type=block_type,
         use_pre_activation=use_pre_activation,
+        input_conv_filters=[64],
+        input_conv_kernel_sizes=[7],
     )
@@ -100,10 +101,10 @@ def convert_weights(backbone, loader, timm_config):
     for stack_index in range(num_stacks):
         for block_idx in range(backbone.stackwise_num_blocks[stack_index]):
             if version == "v1":
-                keras_name = f"v1_stack{stack_index}_block{block_idx}"
+                keras_name = f"stack{stack_index}_block{block_idx}"
                 hf_name = f"layer{stack_index+1}.{block_idx}"
             else:
-                keras_name = f"v2_stack{stack_index}_block{block_idx}"
+                keras_name = f"stack{stack_index}_block{block_idx}"
                 hf_name = f"stages.{stack_index}.blocks.{block_idx}"
             if version == "v1":
@@ -159,13 +160,15 @@ def convert_weights(backbone, loader, timm_config):
     normalization_layer.build(normalization_layer._build_input_shape)
-def load_resnet_backbone(cls, preset, load_weights, **kwargs):
-    timm_config = load_config(preset, HF_CONFIG_FILE)
-    keras_config = convert_backbone_config(timm_config)
-    backbone = cls(**keras_config, **kwargs)
-    if load_weights:
-        jax_memory_cleanup(backbone)
-        # Use prefix="" to avoid using `get_prefixed_key`.
-        with SafetensorLoader(preset, prefix="") as loader:
-            convert_weights(backbone, loader, timm_config)
-    return backbone
+def convert_head(task, loader, timm_config):
+    """Port the classification head weights into `task.output_dense`.
+    Args:
+        task: Object exposing `output_dense.kernel` and `output_dense.bias`.
+        loader: Weight loader providing `port_weight`.
+        timm_config: timm config dict; its `"architecture"` entry selects the
+            checkpoint key prefix (`"head.fc."` when it contains
+            `"resnetv2_"`, otherwise `"fc."`).
+    """
+    if "resnetv2_" in timm_config["architecture"]:
+        prefix = "head.fc."
+    else:
+        prefix = "fc."
+    kernel_key = prefix + "weight"
+    bias_key = prefix + "bias"
+    # The stored kernel is squeezed and transposed before being assigned.
+    loader.port_weight(
+        task.output_dense.kernel,
+        hf_weight_key=kernel_key,
+        hook_fn=lambda x, _: np.transpose(np.squeeze(x)),
+    )
+    loader.port_weight(task.output_dense.bias, hf_weight_key=bias_key)

keras_hub/src/utils/timm/preset_loader.py ADDED Viewed

@@ -0,0 +1,66 @@
+# Copyright 2024 The KerasHub Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Convert timm models to KerasHub."""
+from keras_hub.src.models.image_classifier import ImageClassifier
+from keras_hub.src.utils.preset_utils import PresetLoader
+from keras_hub.src.utils.preset_utils import jax_memory_cleanup
+from keras_hub.src.utils.timm import convert_resnet
+from keras_hub.src.utils.transformers.safetensor_utils import SafetensorLoader
+class TimmPresetLoader(PresetLoader):
+    """Preset loader that builds KerasHub objects from a timm preset.
+    The `"architecture"` entry of the timm config selects the converter
+    module. Only architectures containing `"resnet"` are supported.
+    """
+    def __init__(self, preset, config):
+        """Select the converter module for `config["architecture"]`.
+        Raises:
+            ValueError: If no converter exists for the architecture.
+        """
+        super().__init__(preset, config)
+        architecture = self.config["architecture"]
+        if "resnet" in architecture:
+            self.converter = convert_resnet
+        else:
+            raise ValueError(
+                "KerasHub has no converter for timm models "
+                f"with architecture `'{architecture}'`."
+            )
+    def check_backbone_class(self):
+        """Return the backbone class declared by the selected converter."""
+        return self.converter.backbone_cls
+    def load_backbone(self, cls, load_weights, **kwargs):
+        """Build a `cls` backbone from the converted config.
+        `kwargs` override converted config entries of the same name. Weights
+        are ported from the preset's safetensors only when `load_weights`
+        is truthy.
+        """
+        keras_config = self.converter.convert_backbone_config(self.config)
+        backbone = cls(**{**keras_config, **kwargs})
+        if load_weights:
+            jax_memory_cleanup(backbone)
+            # Use prefix="" to avoid using `get_prefixed_key`.
+            with SafetensorLoader(self.preset, prefix="") as loader:
+                self.converter.convert_weights(backbone, loader, self.config)
+        return backbone
+    def load_task(self, cls, load_weights, load_task_weights, **kwargs):
+        """Build a `cls` task, porting the classifier head when requested.
+        The head is only ported when `load_task_weights` is truthy and `cls`
+        is an `ImageClassifier` subclass; otherwise the base loader is used
+        unchanged.
+        """
+        if not load_task_weights or not issubclass(cls, ImageClassifier):
+            return super().load_task(
+                cls, load_weights, load_task_weights, **kwargs
+            )
+        # Support loading the classification head for classifier models.
+        kwargs["num_classes"] = self.config["num_classes"]
+        task = super().load_task(cls, load_weights, load_task_weights, **kwargs)
+        # `load_task_weights` is known to be truthy past the guard above, so
+        # the head is always ported here.
+        with SafetensorLoader(self.preset, prefix="") as loader:
+            self.converter.convert_head(task, loader, self.config)
+        return task
+    def load_image_converter(self, cls, **kwargs):
+        """Build a `cls` image converter sized from the timm `pretrained_cfg`.
+        Returns `None` when the config has no `pretrained_cfg` or it lacks
+        an `"input_size"` entry.
+        """
+        pretrained_cfg = self.config.get("pretrained_cfg", None)
+        if not pretrained_cfg or "input_size" not in pretrained_cfg:
+            return None
+        # timm stores `input_size` as (channels, height, width), so index 1
+        # is the height and index 2 is the width.
+        input_size = pretrained_cfg["input_size"]
+        return cls(height=input_size[1], width=input_size[2])

keras_hub/src/utils/transformers/convert_albert.py ADDED Viewed

@@ -0,0 +1,193 @@
+# Copyright 2024 The KerasHub Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import numpy as np
+from keras_hub.src.models.albert.albert_backbone import AlbertBackbone
+from keras_hub.src.utils.preset_utils import get_file
+# Backbone class exposed by this converter module.
+backbone_cls = AlbertBackbone
+def convert_backbone_config(transformers_config):
+    """Map Hugging Face ALBERT config entries onto Keras-style argument names.
+
+    Args:
+        transformers_config: Mapping holding the Hugging Face config. Every
+            key listed below is read with plain indexing, so all of them must
+            be present.
+
+    Returns:
+        A new dict keyed by the Keras argument names, in the order listed.
+    """
+    # (Keras argument name, Hugging Face config key)
+    key_pairs = (
+        ("vocabulary_size", "vocab_size"),
+        ("num_layers", "num_hidden_layers"),
+        ("num_heads", "num_attention_heads"),
+        ("embedding_dim", "embedding_size"),
+        ("hidden_dim", "hidden_size"),
+        ("intermediate_dim", "intermediate_size"),
+        ("num_groups", "num_hidden_groups"),
+        ("num_inner_repetitions", "inner_group_num"),
+        ("dropout", "attention_probs_dropout_prob"),
+        ("max_sequence_length", "max_position_embeddings"),
+        ("num_segments", "type_vocab_size"),
+    )
+    return {
+        keras_name: transformers_config[hf_name]
+        for keras_name, hf_name in key_pairs
+    }
+def convert_weights(backbone, loader, transformers_config):
+    """Port Hugging Face ALBERT weights into the given Keras backbone.
+
+    Each Keras variable is paired with its Hugging Face weight key and handed
+    to `loader.port_weight`, with a hook wherever the tensor has to be
+    transposed and/or reshaped first.
+
+    Args:
+        backbone: Keras backbone whose variables receive the weights.
+        loader: Object exposing `port_weight(keras_variable=, hf_weight_key=,
+            hook_fn=)`.
+        transformers_config: Hugging Face config; not read by this function.
+    """
+
+    def swap_axes(hf_tensor, _):
+        # Dense kernels: swap the two axes.
+        return np.transpose(hf_tensor, axes=(1, 0))
+
+    def transpose_then_reshape(hf_tensor, keras_shape):
+        # Attention kernels: transpose, then reshape to `keras_shape`.
+        return np.reshape(np.transpose(hf_tensor), keras_shape)
+
+    def reshape_only(hf_tensor, keras_shape):
+        # Attention biases: reshape to `keras_shape`.
+        return np.reshape(hf_tensor, keras_shape)
+
+    def port(variable, key, **hook):
+        # Thin keyword-argument wrapper around `loader.port_weight`.
+        loader.port_weight(keras_variable=variable, hf_weight_key=key, **hook)
+
+    # (Keras sub-layer attribute, Hugging Face projection name)
+    attention_projections = (
+        ("query_dense", "query"),
+        ("key_dense", "key"),
+        ("value_dense", "value"),
+        ("output_dense", "dense"),
+    )
+
+    # Embeddings
+    port(
+        backbone.token_embedding.embeddings,
+        "albert.embeddings.word_embeddings.weight",
+    )
+    port(
+        backbone.position_embedding.position_embeddings,
+        "albert.embeddings.position_embeddings.weight",
+    )
+    port(
+        backbone.segment_embedding.embeddings,
+        "albert.embeddings.token_type_embeddings.weight",
+    )
+    # Normalization
+    port(
+        backbone.embeddings_layer_norm.gamma,
+        "albert.embeddings.LayerNorm.weight",
+    )
+    port(
+        backbone.embeddings_layer_norm.beta,
+        "albert.embeddings.LayerNorm.bias",
+    )
+    # Encoder Embeddings
+    port(
+        backbone.embeddings_projection.kernel,
+        "albert.encoder.embedding_hidden_mapping_in.weight",
+        hook_fn=swap_axes,
+    )
+    port(
+        backbone.embeddings_projection.bias,
+        "albert.encoder.embedding_hidden_mapping_in.bias",
+    )
+    # Encoder Group Layers
+    for group in range(backbone.num_groups):
+        for rep in range(backbone.num_inner_repetitions):
+            layer = backbone.get_layer(f"group_{group}_inner_layer_{rep}")
+            prefix = (
+                f"albert.encoder.albert_layer_groups.{group}"
+                f".albert_layers.{rep}."
+            )
+            # Attention projections: kernel first, then bias, for each of
+            # query / key / value / output.
+            attention = layer._self_attention_layer
+            for dense_name, hf_name in attention_projections:
+                dense = getattr(attention, dense_name)
+                port(
+                    dense.kernel,
+                    f"{prefix}attention.{hf_name}.weight",
+                    hook_fn=transpose_then_reshape,
+                )
+                port(
+                    dense.bias,
+                    f"{prefix}attention.{hf_name}.bias",
+                    hook_fn=reshape_only,
+                )
+            # Attention layer norm
+            port(
+                layer._self_attention_layer_norm.gamma,
+                f"{prefix}attention.LayerNorm.weight",
+            )
+            port(
+                layer._self_attention_layer_norm.beta,
+                f"{prefix}attention.LayerNorm.bias",
+            )
+            # Feedforward
+            port(
+                layer._feedforward_intermediate_dense.kernel,
+                f"{prefix}ffn.weight",
+                hook_fn=swap_axes,
+            )
+            port(
+                layer._feedforward_intermediate_dense.bias,
+                f"{prefix}ffn.bias",
+            )
+            port(
+                layer._feedforward_output_dense.kernel,
+                f"{prefix}ffn_output.weight",
+                hook_fn=swap_axes,
+            )
+            port(
+                layer._feedforward_output_dense.bias,
+                f"{prefix}ffn_output.bias",
+            )
+            # Feedforward layer norm
+            port(
+                layer._feedforward_layer_norm.gamma,
+                f"{prefix}full_layer_layer_norm.weight",
+            )
+            port(
+                layer._feedforward_layer_norm.beta,
+                f"{prefix}full_layer_layer_norm.bias",
+            )
+    # Pooler
+    port(
+        backbone.pooled_dense.kernel,
+        "albert.pooler.weight",
+        hook_fn=swap_axes,
+    )
+    port(backbone.pooled_dense.bias, "albert.pooler.bias")
+def convert_tokenizer(cls, preset, **kwargs):
+    """Build `cls` from the preset's `spiece.model` file.
+
+    The result of `get_file(preset, "spiece.model")` is passed as the first
+    positional argument, followed by any extra keyword arguments.
+    """
+    spiece_file = get_file(preset, "spiece.model")
+    return cls(spiece_file, **kwargs)

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl