PyPI - keras-hub-nightly - Versions diffs - 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl - Mend

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (198) hide show

keras_hub/__init__.py +0 -6
keras_hub/api/__init__.py +2 -0
keras_hub/api/bounding_box/__init__.py +36 -0
keras_hub/api/layers/__init__.py +14 -0
keras_hub/api/models/__init__.py +97 -48
keras_hub/api/tokenizers/__init__.py +30 -0
keras_hub/api/utils/__init__.py +22 -0
keras_hub/src/api_export.py +15 -9
keras_hub/src/bounding_box/__init__.py +13 -0
keras_hub/src/bounding_box/converters.py +529 -0
keras_hub/src/bounding_box/formats.py +162 -0
keras_hub/src/bounding_box/iou.py +263 -0
keras_hub/src/bounding_box/to_dense.py +95 -0
keras_hub/src/bounding_box/to_ragged.py +99 -0
keras_hub/src/bounding_box/utils.py +194 -0
keras_hub/src/bounding_box/validate_format.py +99 -0
keras_hub/src/layers/preprocessing/audio_converter.py +121 -0
keras_hub/src/layers/preprocessing/image_converter.py +130 -0
keras_hub/src/layers/preprocessing/masked_lm_mask_generator.py +2 -0
keras_hub/src/layers/preprocessing/multi_segment_packer.py +9 -8
keras_hub/src/layers/preprocessing/preprocessing_layer.py +2 -29
keras_hub/src/layers/preprocessing/random_deletion.py +33 -31
keras_hub/src/layers/preprocessing/random_swap.py +33 -31
keras_hub/src/layers/preprocessing/resizing_image_converter.py +101 -0
keras_hub/src/layers/preprocessing/start_end_packer.py +3 -2
keras_hub/src/models/albert/__init__.py +1 -2
keras_hub/src/models/albert/albert_masked_lm_preprocessor.py +6 -86
keras_hub/src/models/albert/{albert_classifier.py → albert_text_classifier.py} +34 -10
keras_hub/src/models/albert/{albert_preprocessor.py → albert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/albert/albert_tokenizer.py +17 -36
keras_hub/src/models/backbone.py +12 -34
keras_hub/src/models/bart/__init__.py +1 -2
keras_hub/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +21 -148
keras_hub/src/models/bart/bart_tokenizer.py +12 -39
keras_hub/src/models/bert/__init__.py +1 -5
keras_hub/src/models/bert/bert_masked_lm_preprocessor.py +6 -87
keras_hub/src/models/bert/bert_presets.py +1 -4
keras_hub/src/models/bert/{bert_classifier.py → bert_text_classifier.py} +19 -12
keras_hub/src/models/bert/{bert_preprocessor.py → bert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/bert/bert_tokenizer.py +17 -35
keras_hub/src/models/bloom/__init__.py +1 -2
keras_hub/src/models/bloom/bloom_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/bloom/bloom_tokenizer.py +12 -41
keras_hub/src/models/causal_lm.py +10 -29
keras_hub/src/models/causal_lm_preprocessor.py +195 -0
keras_hub/src/models/csp_darknet/csp_darknet_backbone.py +54 -15
keras_hub/src/models/deberta_v3/__init__.py +1 -4
keras_hub/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +14 -77
keras_hub/src/models/deberta_v3/{deberta_v3_classifier.py → deberta_v3_text_classifier.py} +16 -11
keras_hub/src/models/deberta_v3/{deberta_v3_preprocessor.py → deberta_v3_text_classifier_preprocessor.py} +23 -64
keras_hub/src/models/deberta_v3/deberta_v3_tokenizer.py +30 -25
keras_hub/src/models/densenet/densenet_backbone.py +46 -22
keras_hub/src/models/distil_bert/__init__.py +1 -4
keras_hub/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +14 -76
keras_hub/src/models/distil_bert/{distil_bert_classifier.py → distil_bert_text_classifier.py} +17 -12
keras_hub/src/models/distil_bert/{distil_bert_preprocessor.py → distil_bert_text_classifier_preprocessor.py} +23 -63
keras_hub/src/models/distil_bert/distil_bert_tokenizer.py +19 -35
keras_hub/src/models/efficientnet/__init__.py +13 -0
keras_hub/src/models/efficientnet/efficientnet_backbone.py +569 -0
keras_hub/src/models/efficientnet/fusedmbconv.py +229 -0
keras_hub/src/models/efficientnet/mbconv.py +238 -0
keras_hub/src/models/electra/__init__.py +1 -2
keras_hub/src/models/electra/electra_tokenizer.py +17 -32
keras_hub/src/models/f_net/__init__.py +1 -2
keras_hub/src/models/f_net/f_net_masked_lm_preprocessor.py +12 -78
keras_hub/src/models/f_net/{f_net_classifier.py → f_net_text_classifier.py} +17 -10
keras_hub/src/models/f_net/{f_net_preprocessor.py → f_net_text_classifier_preprocessor.py} +19 -63
keras_hub/src/models/f_net/f_net_tokenizer.py +17 -35
keras_hub/src/models/falcon/__init__.py +1 -2
keras_hub/src/models/falcon/falcon_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/falcon/falcon_tokenizer.py +12 -35
keras_hub/src/models/gemma/__init__.py +1 -2
keras_hub/src/models/gemma/gemma_causal_lm_preprocessor.py +6 -90
keras_hub/src/models/gemma/gemma_decoder_block.py +1 -1
keras_hub/src/models/gemma/gemma_tokenizer.py +12 -23
keras_hub/src/models/gpt2/__init__.py +1 -2
keras_hub/src/models/gpt2/gpt2_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/gpt2/gpt2_preprocessor.py +12 -90
keras_hub/src/models/gpt2/gpt2_tokenizer.py +12 -34
keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +12 -34
keras_hub/src/models/image_classifier.py +0 -5
keras_hub/src/models/image_classifier_preprocessor.py +83 -0
keras_hub/src/models/llama/__init__.py +1 -2
keras_hub/src/models/llama/llama_causal_lm_preprocessor.py +6 -85
keras_hub/src/models/llama/llama_tokenizer.py +12 -25
keras_hub/src/models/llama3/__init__.py +1 -2
keras_hub/src/models/llama3/llama3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/llama3/llama3_tokenizer.py +12 -33
keras_hub/src/models/masked_lm.py +0 -2
keras_hub/src/models/masked_lm_preprocessor.py +156 -0
keras_hub/src/models/mistral/__init__.py +1 -2
keras_hub/src/models/mistral/mistral_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/mistral/mistral_tokenizer.py +12 -23
keras_hub/src/models/mix_transformer/mix_transformer_backbone.py +2 -2
keras_hub/src/models/mobilenet/__init__.py +13 -0
keras_hub/src/models/mobilenet/mobilenet_backbone.py +530 -0
keras_hub/src/models/mobilenet/mobilenet_image_classifier.py +114 -0
keras_hub/src/models/opt/__init__.py +1 -2
keras_hub/src/models/opt/opt_causal_lm_preprocessor.py +6 -93
keras_hub/src/models/opt/opt_tokenizer.py +12 -41
keras_hub/src/models/pali_gemma/__init__.py +1 -4
keras_hub/src/models/pali_gemma/pali_gemma_causal_lm_preprocessor.py +28 -28
keras_hub/src/models/pali_gemma/pali_gemma_image_converter.py +25 -0
keras_hub/src/models/pali_gemma/pali_gemma_presets.py +5 -5
keras_hub/src/models/pali_gemma/pali_gemma_tokenizer.py +11 -3
keras_hub/src/models/phi3/__init__.py +1 -2
keras_hub/src/models/phi3/phi3_causal_lm.py +3 -9
keras_hub/src/models/phi3/phi3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/phi3/phi3_tokenizer.py +12 -36
keras_hub/src/models/preprocessor.py +72 -83
keras_hub/src/models/resnet/__init__.py +6 -0
keras_hub/src/models/resnet/resnet_backbone.py +390 -42
keras_hub/src/models/resnet/resnet_image_classifier.py +33 -6
keras_hub/src/models/resnet/resnet_image_classifier_preprocessor.py +28 -0
keras_hub/src/models/{llama3/llama3_preprocessor.py → resnet/resnet_image_converter.py} +7 -5
keras_hub/src/models/resnet/resnet_presets.py +95 -0
keras_hub/src/models/retinanet/__init__.py +13 -0
keras_hub/src/models/retinanet/anchor_generator.py +175 -0
keras_hub/src/models/retinanet/box_matcher.py +259 -0
keras_hub/src/models/retinanet/non_max_supression.py +578 -0
keras_hub/src/models/roberta/__init__.py +1 -2
keras_hub/src/models/roberta/roberta_masked_lm_preprocessor.py +22 -74
keras_hub/src/models/roberta/{roberta_classifier.py → roberta_text_classifier.py} +16 -11
keras_hub/src/models/roberta/{roberta_preprocessor.py → roberta_text_classifier_preprocessor.py} +21 -53
keras_hub/src/models/roberta/roberta_tokenizer.py +13 -52
keras_hub/src/models/seq_2_seq_lm_preprocessor.py +269 -0
keras_hub/src/models/stable_diffusion_v3/__init__.py +13 -0
keras_hub/src/models/stable_diffusion_v3/clip_encoder_block.py +103 -0
keras_hub/src/models/stable_diffusion_v3/clip_preprocessor.py +93 -0
keras_hub/src/models/stable_diffusion_v3/clip_text_encoder.py +149 -0
keras_hub/src/models/stable_diffusion_v3/clip_tokenizer.py +167 -0
keras_hub/src/models/stable_diffusion_v3/mmdit.py +427 -0
keras_hub/src/models/stable_diffusion_v3/mmdit_block.py +317 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_preprocessor.py +74 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_text_encoder.py +155 -0
keras_hub/src/models/stable_diffusion_v3/vae_attention.py +126 -0
keras_hub/src/models/stable_diffusion_v3/vae_image_decoder.py +186 -0
keras_hub/src/models/t5/__init__.py +1 -2
keras_hub/src/models/t5/t5_tokenizer.py +13 -23
keras_hub/src/models/task.py +71 -116
keras_hub/src/models/{classifier.py → text_classifier.py} +19 -13
keras_hub/src/models/text_classifier_preprocessor.py +138 -0
keras_hub/src/models/whisper/__init__.py +1 -2
keras_hub/src/models/whisper/{whisper_audio_feature_extractor.py → whisper_audio_converter.py} +20 -18
keras_hub/src/models/whisper/whisper_backbone.py +0 -3
keras_hub/src/models/whisper/whisper_presets.py +10 -10
keras_hub/src/models/whisper/whisper_tokenizer.py +20 -16
keras_hub/src/models/xlm_roberta/__init__.py +1 -4
keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +26 -72
keras_hub/src/models/xlm_roberta/{xlm_roberta_classifier.py → xlm_roberta_text_classifier.py} +16 -11
keras_hub/src/models/xlm_roberta/{xlm_roberta_preprocessor.py → xlm_roberta_text_classifier_preprocessor.py} +26 -53
keras_hub/src/models/xlm_roberta/xlm_roberta_tokenizer.py +25 -10
keras_hub/src/tests/test_case.py +46 -0
keras_hub/src/tokenizers/byte_pair_tokenizer.py +30 -17
keras_hub/src/tokenizers/byte_tokenizer.py +14 -15
keras_hub/src/tokenizers/sentence_piece_tokenizer.py +20 -7
keras_hub/src/tokenizers/tokenizer.py +67 -32
keras_hub/src/tokenizers/unicode_codepoint_tokenizer.py +14 -15
keras_hub/src/tokenizers/word_piece_tokenizer.py +34 -47
keras_hub/src/utils/imagenet/__init__.py +13 -0
keras_hub/src/utils/imagenet/imagenet_utils.py +1067 -0
keras_hub/src/utils/keras_utils.py +0 -50
keras_hub/src/utils/preset_utils.py +230 -68
keras_hub/src/utils/tensor_utils.py +187 -69
keras_hub/src/utils/timm/convert_resnet.py +19 -16
keras_hub/src/utils/timm/preset_loader.py +66 -0
keras_hub/src/utils/transformers/convert_albert.py +193 -0
keras_hub/src/utils/transformers/convert_bart.py +373 -0
keras_hub/src/utils/transformers/convert_bert.py +7 -17
keras_hub/src/utils/transformers/convert_distilbert.py +10 -20
keras_hub/src/utils/transformers/convert_gemma.py +5 -19
keras_hub/src/utils/transformers/convert_gpt2.py +5 -18
keras_hub/src/utils/transformers/convert_llama3.py +7 -18
keras_hub/src/utils/transformers/convert_mistral.py +129 -0
keras_hub/src/utils/transformers/convert_pali_gemma.py +7 -29
keras_hub/src/utils/transformers/preset_loader.py +77 -0
keras_hub/src/utils/transformers/safetensor_utils.py +2 -2
keras_hub/src/version_utils.py +1 -1
keras_hub_nightly-0.16.0.dev2024092017.dist-info/METADATA +202 -0
keras_hub_nightly-0.16.0.dev2024092017.dist-info/RECORD +334 -0
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/WHEEL +1 -1
keras_hub/src/models/bart/bart_preprocessor.py +0 -276
keras_hub/src/models/bloom/bloom_preprocessor.py +0 -185
keras_hub/src/models/electra/electra_preprocessor.py +0 -154
keras_hub/src/models/falcon/falcon_preprocessor.py +0 -187
keras_hub/src/models/gemma/gemma_preprocessor.py +0 -191
keras_hub/src/models/gpt_neo_x/gpt_neo_x_preprocessor.py +0 -145
keras_hub/src/models/llama/llama_preprocessor.py +0 -189
keras_hub/src/models/mistral/mistral_preprocessor.py +0 -190
keras_hub/src/models/opt/opt_preprocessor.py +0 -188
keras_hub/src/models/phi3/phi3_preprocessor.py +0 -190
keras_hub/src/models/whisper/whisper_preprocessor.py +0 -326
keras_hub/src/utils/timm/convert.py +0 -37
keras_hub/src/utils/transformers/convert.py +0 -101
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/METADATA +0 -34
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/RECORD +0 -297
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/top_level.txt +0 -0

keras_hub/src/models/text_classifier_preprocessor.py ADDED Viewed

@@ -0,0 +1,138 @@
+# Copyright 2024 The KerasHub Authors
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import keras
+from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.layers.preprocessing.multi_segment_packer import (
+    MultiSegmentPacker,
+)
+from keras_hub.src.models.preprocessor import Preprocessor
+from keras_hub.src.utils.tensor_utils import preprocessing_function
+@keras_hub_export("keras_hub.models.TextClassifierPreprocessor")
+class TextClassifierPreprocessor(Preprocessor):
+    """Base class for text classification preprocessing layers.
+    `TextClassifierPreprocessor` tasks wrap a `keras_hub.tokenizers.Tokenizer`
+    to create a preprocessing layer for text classification tasks. It is
+    intended to be paired with a `keras_hub.models.TextClassifier` task.
+    All `TextClassifierPreprocessor` layers take three ordered inputs, `x`, `y`,
+    and `sample_weight`. `x`, the first input, should always be included. It can
+    be a single string, a batch of strings, or a tuple of batches of string
+    segments that should be combined into a single sequence. See examples below.
+    `y` and `sample_weight` are optional inputs that will be passed through
+    unaltered. Usually, `y` will be the classification label, and
+    `sample_weight` will not be provided.
+    The layer will output either `x`, an `(x, y)` tuple if labels were provided,
+    or an `(x, y, sample_weight)` tuple if labels and sample weight were
+    provided. `x` will be a dictionary with tokenized input, the exact contents
+    of the dictionary will depend on the model being used.
+    All `TextClassifierPreprocessor` tasks include a `from_preset()` constructor
+    which can be used to load a pre-trained config and vocabularies. You can
+    call the `from_preset()` constructor directly on this base class, in which
+    case the correct class for your model will be automatically instantiated.
+    Examples.
+    ```python
+    preprocessor = keras_hub.models.TextClassifierPreprocessor.from_preset(
+        "bert_base_en_uncased",
+        sequence_length=256, # Optional.
+    )
+    # Tokenize and pad/truncate a single sentence.
+    x = "The quick brown fox jumped."
+    x = preprocessor(x)
+    # Tokenize and pad/truncate a labeled sentence.
+    x, y = "The quick brown fox jumped.", 1
+    x, y = preprocessor(x, y)
+    # Tokenize and pad/truncate a batch of labeled sentences.
+    x, y = ["The quick brown fox jumped.", "Call me Ishmael."], [1, 0]
+    x, y = preprocessor(x, y)
+    # Tokenize and combine a batch of labeled sentence pairs.
+    first = ["The quick brown fox jumped.", "Call me Ishmael."]
+    second = ["The fox tripped.", "Oh look, a whale."]
+    labels = [1, 0]
+    x, y = (first, second), labels
+    x, y = preprocessor(x, y)
+    # Use a `tf.data.Dataset`.
+    ds = tf.data.Dataset.from_tensor_slices(((first, second), labels))
+    ds = ds.map(preprocessor, num_parallel_calls=tf.data.AUTOTUNE)
+    ```
+    """
+    def __init__(
+        self,
+        tokenizer,
+        sequence_length=512,
+        truncate="round_robin",
+        **kwargs,
+    ):
+        super().__init__(**kwargs)
+        self.tokenizer = tokenizer
+        self.packer = None
+        self.sequence_length = sequence_length
+        self.truncate = truncate
+    def build(self, input_shape):
+        super().build(input_shape)
+        # Defer packer creation to `build()` so that we can be sure tokenizer
+        # assets have loaded when restoring a saved model.
+        self.packer = MultiSegmentPacker(
+            start_value=self.tokenizer.start_token_id,
+            end_value=self.tokenizer.end_token_id,
+            pad_value=self.tokenizer.pad_token_id,
+            truncate=self.truncate,
+            sequence_length=self.sequence_length,
+        )
+    @preprocessing_function
+    def call(self, x, y=None, sample_weight=None):
+        x = x if isinstance(x, tuple) else (x,)
+        x = tuple(self.tokenizer(segment) for segment in x)
+        token_ids, segment_ids = self.packer(x)
+        x = {
+            "token_ids": token_ids,
+            "padding_mask": token_ids != self.tokenizer.pad_token_id,
+            "segment_ids": segment_ids,
+        }
+        return keras.utils.pack_x_y_sample_weight(x, y, sample_weight)
+    def get_config(self):
+        config = super().get_config()
+        config.update(
+            {
+                "sequence_length": self.sequence_length,
+                "truncate": self.truncate,
+            }
+        )
+        return config
+    @property
+    def sequence_length(self):
+        """The padded length of model input sequences."""
+        return self._sequence_length
+    @sequence_length.setter
+    def sequence_length(self, value):
+        self._sequence_length = value
+        if self.packer is not None:
+            self.packer.sequence_length = value

keras_hub/src/models/whisper/__init__.py CHANGED Viewed

@@ -14,7 +14,6 @@
 from keras_hub.src.models.whisper.whisper_backbone import WhisperBackbone
 from keras_hub.src.models.whisper.whisper_presets import backbone_presets
-from keras_hub.src.models.whisper.whisper_tokenizer import WhisperTokenizer
 from keras_hub.src.utils.preset_utils import register_presets
-register_presets(backbone_presets, (WhisperBackbone, WhisperTokenizer))
+register_presets(backbone_presets, WhisperBackbone)

keras_hub/src/models/whisper/{whisper_audio_feature_extractor.py → whisper_audio_converter.py} RENAMED Viewed

@@ -15,24 +15,19 @@
 import numpy as np
+from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.layers.preprocessing.audio_converter import AudioConverter
+from keras_hub.src.models.whisper.whisper_backbone import WhisperBackbone
 try:
     import tensorflow as tf
 except ImportError:
-    raise ImportError(
-        "To use `keras_hub`, please install Tensorflow: `pip install tensorflow`. "
-        "The TensorFlow package is required for data preprocessing with any backend."
-    )
-from keras_hub.src.api_export import keras_hub_export
-from keras_hub.src.layers.preprocessing.preprocessing_layer import (
-    PreprocessingLayer,
-)
+    tf = None
-@keras_hub_export("keras_hub.models.WhisperAudioFeatureExtractor")
-class WhisperAudioFeatureExtractor(PreprocessingLayer):
-    """
-    Whisper audio feature extractor layer.
+@keras_hub_export("keras_hub.layers.WhisperAudioConverter")
+class WhisperAudioConverter(AudioConverter):
+    """Whisper audio converter layer.
     This layer takes in a batch of audio tensors, and computes the log-mel
     spectrogram features for each audio tensor.
@@ -55,22 +50,25 @@ class WhisperAudioFeatureExtractor(PreprocessingLayer):
             `max_audio_length * sampling_rate`. Defaults to `30`.
     Examples:
     ```python
     audio_tensor = tf.ones((8000,), dtype="float32")
     # Compute the log-mel spectrogram.
-    whisper_audio_feature_extractor = keras_hub.models.WhisperAudioFeatureExtractor()
-    whisper_audio_feature_extractor(audio_tensor)
+    audio_converter = keras_hub.layers.WhisperAudioConverter.from_preset(
+        "whisper_base_en",
+    )
+    audio_converter(audio_tensor)
     # Compute the log-mel spectrogram for a batch of audio tensors.
     audio_tensor_1 = tf.ones((8000,), dtype="float32")
-    audio_tensor_2 = tf.ones((10000,), dtype="float32"
+    audio_tensor_2 = tf.ones((10000,), dtype="float32")
     audio_tensor = tf.ragged.stack([audio_tensor_1, audio_tensor_2], axis=0)
-    whisper_audio_feature_extractor(audio_tensor)
+    audio_converter(audio_tensor)
     ```
     """
+    backbone_cls = WhisperBackbone
     def __init__(
         self,
         num_mels=80,
@@ -97,6 +95,10 @@ class WhisperAudioFeatureExtractor(PreprocessingLayer):
         # `(num_fft_bins // 2 + 1, num_mels).`
         self.mel_filters = self._get_mel_filters()
+    def audio_shape(self):
+        """Returns the preprocessed size of a single audio sample."""
+        return (self.max_audio_length, self.num_mels)
     def _get_mel_filters(self):
         """
         Adapted from Hugging Face

keras_hub/src/models/whisper/whisper_backbone.py CHANGED Viewed

@@ -24,7 +24,6 @@ from keras_hub.src.layers.modeling.token_and_position_embedding import (
 from keras_hub.src.models.backbone import Backbone
 from keras_hub.src.models.whisper.whisper_decoder import WhisperDecoder
 from keras_hub.src.models.whisper.whisper_encoder import WhisperEncoder
-from keras_hub.src.utils.tensor_utils import assert_tf_backend
 def whisper_kernel_initializer(stddev=0.02):
@@ -117,8 +116,6 @@ class WhisperBackbone(Backbone):
         dtype=None,
         **kwargs,
     ):
-        assert_tf_backend(self.__class__.__name__)
         # === Layers ===
         self.encoder_conv_layer_1 = keras.layers.Conv1D(
             filters=hidden_dim,

keras_hub/src/models/whisper/whisper_presets.py CHANGED Viewed

@@ -25,7 +25,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_en/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_en/3",
     },
     "whisper_base_en": {
         "metadata": {
@@ -38,7 +38,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_en/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_en/3",
     },
     "whisper_small_en": {
         "metadata": {
@@ -51,7 +51,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_en/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_en/3",
     },
     "whisper_medium_en": {
         "metadata": {
@@ -64,7 +64,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_en/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_en/3",
     },
     "whisper_tiny_multi": {
         "metadata": {
@@ -77,7 +77,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_multi/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_multi/3",
     },
     "whisper_base_multi": {
         "metadata": {
@@ -90,7 +90,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_multi/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_multi/3",
     },
     "whisper_small_multi": {
         "metadata": {
@@ -103,7 +103,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_multi/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_multi/3",
     },
     "whisper_medium_multi": {
         "metadata": {
@@ -116,7 +116,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_multi/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_multi/3",
     },
     "whisper_large_multi": {
         "metadata": {
@@ -129,7 +129,7 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi/3",
     },
     "whisper_large_multi_v2": {
         "metadata": {
@@ -143,6 +143,6 @@ backbone_presets = {
             "path": "whisper",
             "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
-        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi_v2/2",
+        "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi_v2/3",
     },
 }

keras_hub/src/models/whisper/whisper_tokenizer.py CHANGED Viewed

@@ -15,6 +15,7 @@
 import json
 from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.models.whisper.whisper_backbone import WhisperBackbone
 from keras_hub.src.tokenizers.byte_pair_tokenizer import BytePairTokenizer
@@ -25,7 +26,12 @@ def _load_dict(dict_or_path):
     return dict_or_path
-@keras_hub_export("keras_hub.models.WhisperTokenizer")
+@keras_hub_export(
+    [
+        "keras_hub.tokenizers.WhisperTokenizer",
+        "keras_hub.models.WhisperTokenizer",
+    ]
+)
 class WhisperTokenizer(BytePairTokenizer):
     """Whisper text tokenizer using Byte-Pair Encoding subword segmentation.
@@ -47,6 +53,8 @@ class WhisperTokenizer(BytePairTokenizer):
             tokenizer.
     """
+    backbone_cls = WhisperBackbone
     def __init__(
         self,
         vocabulary=None,
@@ -94,20 +102,22 @@ class WhisperTokenizer(BytePairTokenizer):
         self.translate_token_id = special_tokens[self.translate_token]
         self.transcribe_token_id = special_tokens[self.transcribe_token]
-        self.special_tokens = special_tokens
+        self._special_token_dict = special_tokens
         self.language_tokens = language_tokens
-        # TODO: Add language tokens to `unsplittable_tokens` once we figure
-        # out the performance issue with a large list.
-        unsplittable_tokens = list(special_tokens.keys())
         super().__init__(
             vocabulary=vocabulary,
             merges=merges,
-            unsplittable_tokens=unsplittable_tokens,
             **kwargs,
         )
+    @property
+    def special_tokens(self):
+        return list(self._special_token_dict.keys())
+    @property
+    def special_token_ids(self):
+        return list(self._special_token_dict.values())
     def save_assets(self, dir_path):
         # TODO: whisper is currently mutating its vocabulary before passing
         # it to the super class, so we need to restore the unmutated vocabulary
@@ -140,7 +150,7 @@ class WhisperTokenizer(BytePairTokenizer):
                 self.translate_token,
                 self.transcribe_token,
             ]:
-                vocabulary[token] = self.special_tokens[token]
+                vocabulary[token] = self._special_token_dict[token]
         else:
             self._initial_vocabulary = None
@@ -148,15 +158,9 @@ class WhisperTokenizer(BytePairTokenizer):
     def get_config(self):
         config = super().get_config()
-        # In the constructor, we pass the list of special tokens to the
-        # `unsplittable_tokens` arg of the superclass' constructor. Hence, we
-        # delete it from the config here.
-        del config["unsplittable_tokens"]
         config.update(
             {
-                "special_tokens": self.special_tokens,
+                "special_tokens": self._special_token_dict,
                 "language_tokens": self.language_tokens,
             }
         )

keras_hub/src/models/xlm_roberta/__init__.py CHANGED Viewed

@@ -18,9 +18,6 @@ from keras_hub.src.models.xlm_roberta.xlm_roberta_backbone import (
 from keras_hub.src.models.xlm_roberta.xlm_roberta_presets import (
     backbone_presets,
 )
-from keras_hub.src.models.xlm_roberta.xlm_roberta_tokenizer import (
-    XLMRobertaTokenizer,
-)
 from keras_hub.src.utils.preset_utils import register_presets
-register_presets(backbone_presets, (XLMRobertaBackbone, XLMRobertaTokenizer))
+register_presets(backbone_presets, XLMRobertaBackbone)

keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py CHANGED Viewed

@@ -13,19 +13,23 @@
 # limitations under the License.
 import keras
-from absl import logging
 from keras_hub.src.api_export import keras_hub_export
-from keras_hub.src.layers.preprocessing.masked_lm_mask_generator import (
-    MaskedLMMaskGenerator,
+from keras_hub.src.layers.preprocessing.multi_segment_packer import (
+    MultiSegmentPacker,
 )
-from keras_hub.src.models.xlm_roberta.xlm_roberta_preprocessor import (
-    XLMRobertaPreprocessor,
+from keras_hub.src.models.masked_lm_preprocessor import MaskedLMPreprocessor
+from keras_hub.src.models.xlm_roberta.xlm_roberta_backbone import (
+    XLMRobertaBackbone,
 )
+from keras_hub.src.models.xlm_roberta.xlm_roberta_tokenizer import (
+    XLMRobertaTokenizer,
+)
+from keras_hub.src.utils.tensor_utils import preprocessing_function
 @keras_hub_export("keras_hub.models.XLMRobertaMaskedLMPreprocessor")
-class XLMRobertaMaskedLMPreprocessor(XLMRobertaPreprocessor):
+class XLMRobertaMaskedLMPreprocessor(MaskedLMPreprocessor):
     """XLM-RoBERTa preprocessing for the masked language modeling task.
     This preprocessing layer will prepare inputs for a masked language modeling
@@ -120,76 +124,26 @@ class XLMRobertaMaskedLMPreprocessor(XLMRobertaPreprocessor):
     ```
     """
-    def __init__(
-        self,
-        tokenizer,
-        sequence_length=512,
-        truncate="round_robin",
-        mask_selection_rate=0.15,
-        mask_selection_length=96,
-        mask_token_rate=0.8,
-        random_token_rate=0.1,
-        **kwargs,
-    ):
-        super().__init__(
-            tokenizer,
-            sequence_length=sequence_length,
-            truncate=truncate,
-            **kwargs,
-        )
-        self.mask_selection_rate = mask_selection_rate
-        self.mask_selection_length = mask_selection_length
-        self.mask_token_rate = mask_token_rate
-        self.random_token_rate = random_token_rate
-        self.masker = None
+    backbone_cls = XLMRobertaBackbone
+    tokenizer_cls = XLMRobertaTokenizer
     def build(self, input_shape):
         super().build(input_shape)
-        # Defer masker creation to `build()` so that we can be sure tokenizer
-        # assets have loaded when restoring a saved model.
-        self.masker = MaskedLMMaskGenerator(
-            mask_selection_rate=self.mask_selection_rate,
-            mask_selection_length=self.mask_selection_length,
-            mask_token_rate=self.mask_token_rate,
-            random_token_rate=self.random_token_rate,
-            vocabulary_size=self.tokenizer.vocabulary_size(),
-            mask_token_id=self.tokenizer.mask_token_id,
-            unselectable_token_ids=[
-                self.tokenizer.start_token_id,
-                self.tokenizer.end_token_id,
-                self.tokenizer.pad_token_id,
-            ],
-        )
-    def get_config(self):
-        config = super().get_config()
-        config.update(
-            {
-                "mask_selection_rate": self.mask_selection_rate,
-                "mask_selection_length": self.mask_selection_length,
-                "mask_token_rate": self.mask_token_rate,
-                "random_token_rate": self.random_token_rate,
-            }
+        # RoBERTa doubles up the sep token, so we override build.
+        self.packer = MultiSegmentPacker(
+            start_value=self.tokenizer.start_token_id,
+            end_value=self.tokenizer.end_token_id,
+            sep_value=[self.tokenizer.end_token_id] * 2,
+            pad_value=self.tokenizer.pad_token_id,
+            truncate=self.truncate,
+            sequence_length=self.sequence_length,
         )
-        return config
+        self.built = True
+    @preprocessing_function
     def call(self, x, y=None, sample_weight=None):
-        if y is not None or sample_weight is not None:
-            logging.warning(
-                f"{self.__class__.__name__} generates `y` and `sample_weight` "
-                "based on your input data, but your data already contains `y` "
-                "or `sample_weight`. Your `y` and `sample_weight` will be "
-                "ignored."
-            )
-        x = super().call(x)
-        token_ids, padding_mask = x["token_ids"], x["padding_mask"]
-        masker_outputs = self.masker(token_ids)
-        x = {
-            "token_ids": masker_outputs["token_ids"],
-            "padding_mask": padding_mask,
-            "mask_positions": masker_outputs["mask_positions"],
-        }
-        y = masker_outputs["mask_ids"]
-        sample_weight = masker_outputs["mask_weights"]
+        output = super().call(x, y=y, sample_weight=sample_weight)
+        x, y, sample_weight = keras.utils.unpack_x_y_sample_weight(output)
+        # Backbone has no segment ID input.
+        del x["segment_ids"]
         return keras.utils.pack_x_y_sample_weight(x, y, sample_weight)

keras_hub/src/models/xlm_roberta/{xlm_roberta_classifier.py → xlm_roberta_text_classifier.py} RENAMED Viewed

@@ -16,20 +16,25 @@
 import keras
 from keras_hub.src.api_export import keras_hub_export
-from keras_hub.src.models.classifier import Classifier
 from keras_hub.src.models.roberta.roberta_backbone import (
     roberta_kernel_initializer,
 )
+from keras_hub.src.models.text_classifier import TextClassifier
 from keras_hub.src.models.xlm_roberta.xlm_roberta_backbone import (
     XLMRobertaBackbone,
 )
-from keras_hub.src.models.xlm_roberta.xlm_roberta_preprocessor import (
-    XLMRobertaPreprocessor,
+from keras_hub.src.models.xlm_roberta.xlm_roberta_text_classifier_preprocessor import (
+    XLMRobertaTextClassifierPreprocessor,
 )
-@keras_hub_export("keras_hub.models.XLMRobertaClassifier")
-class XLMRobertaClassifier(Classifier):
+@keras_hub_export(
+    [
+        "keras_hub.models.XLMRobertaTextClassifier",
+        "keras_hub.models.XLMRobertaClassifier",
+    ]
+)
+class XLMRobertaTextClassifier(TextClassifier):
     """An end-to-end XLM-RoBERTa model for classification tasks.
     This model attaches a classification head to a
@@ -50,7 +55,7 @@ class XLMRobertaClassifier(Classifier):
     Args:
         backbone: A `keras_hub.models.XLMRobertaBackbone` instance.
         num_classes: int. Number of classes to predict.
-        preprocessor: A `keras_hub.models.XLMRobertaPreprocessor` or `None`. If
+        preprocessor: A `keras_hub.models.XLMRobertaTextClassifierPreprocessor` or `None`. If
             `None`, this model will not apply preprocessing, and inputs should
             be preprocessed before calling the model.
         activation: Optional `str` or callable. The activation function to use
@@ -68,7 +73,7 @@ class XLMRobertaClassifier(Classifier):
     labels = [0, 3]
     # Pretrained classifier.
-    classifier = keras_hub.models.XLMRobertaClassifier.from_preset(
+    classifier = keras_hub.models.XLMRobertaTextClassifier.from_preset(
         "xlm_roberta_base_multi",
         num_classes=4,
     )
@@ -96,7 +101,7 @@ class XLMRobertaClassifier(Classifier):
     labels = [0, 3]
     # Pretrained classifier without preprocessing.
-    classifier = keras_hub.models.XLMRobertaClassifier.from_preset(
+    classifier = keras_hub.models.XLMRobertaTextClassifier.from_preset(
         "xlm_roberta_base_multi",
         num_classes=4,
         preprocessor=None,
@@ -128,7 +133,7 @@ class XLMRobertaClassifier(Classifier):
     tokenizer = keras_hub.models.XLMRobertaTokenizer(
         proto=proto
     )
-    preprocessor = keras_hub.models.XLMRobertaPreprocessor(
+    preprocessor = keras_hub.models.XLMRobertaTextClassifierPreprocessor(
         tokenizer,
         sequence_length=128,
     )
@@ -140,7 +145,7 @@ class XLMRobertaClassifier(Classifier):
         intermediate_dim=512,
         max_sequence_length=128,
     )
-    classifier = keras_hub.models.XLMRobertaClassifier(
+    classifier = keras_hub.models.XLMRobertaTextClassifier(
         backbone=backbone,
         preprocessor=preprocessor,
         num_classes=4,
@@ -150,7 +155,7 @@ class XLMRobertaClassifier(Classifier):
     """
     backbone_cls = XLMRobertaBackbone
-    preprocessor_cls = XLMRobertaPreprocessor
+    preprocessor_cls = XLMRobertaTextClassifierPreprocessor
     def __init__(
         self,

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl