PyPI - keras-hub-nightly - Versions diffs - 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl - Mend

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (198) hide show

keras_hub/__init__.py +0 -6
keras_hub/api/__init__.py +2 -0
keras_hub/api/bounding_box/__init__.py +36 -0
keras_hub/api/layers/__init__.py +14 -0
keras_hub/api/models/__init__.py +97 -48
keras_hub/api/tokenizers/__init__.py +30 -0
keras_hub/api/utils/__init__.py +22 -0
keras_hub/src/api_export.py +15 -9
keras_hub/src/bounding_box/__init__.py +13 -0
keras_hub/src/bounding_box/converters.py +529 -0
keras_hub/src/bounding_box/formats.py +162 -0
keras_hub/src/bounding_box/iou.py +263 -0
keras_hub/src/bounding_box/to_dense.py +95 -0
keras_hub/src/bounding_box/to_ragged.py +99 -0
keras_hub/src/bounding_box/utils.py +194 -0
keras_hub/src/bounding_box/validate_format.py +99 -0
keras_hub/src/layers/preprocessing/audio_converter.py +121 -0
keras_hub/src/layers/preprocessing/image_converter.py +130 -0
keras_hub/src/layers/preprocessing/masked_lm_mask_generator.py +2 -0
keras_hub/src/layers/preprocessing/multi_segment_packer.py +9 -8
keras_hub/src/layers/preprocessing/preprocessing_layer.py +2 -29
keras_hub/src/layers/preprocessing/random_deletion.py +33 -31
keras_hub/src/layers/preprocessing/random_swap.py +33 -31
keras_hub/src/layers/preprocessing/resizing_image_converter.py +101 -0
keras_hub/src/layers/preprocessing/start_end_packer.py +3 -2
keras_hub/src/models/albert/__init__.py +1 -2
keras_hub/src/models/albert/albert_masked_lm_preprocessor.py +6 -86
keras_hub/src/models/albert/{albert_classifier.py → albert_text_classifier.py} +34 -10
keras_hub/src/models/albert/{albert_preprocessor.py → albert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/albert/albert_tokenizer.py +17 -36
keras_hub/src/models/backbone.py +12 -34
keras_hub/src/models/bart/__init__.py +1 -2
keras_hub/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +21 -148
keras_hub/src/models/bart/bart_tokenizer.py +12 -39
keras_hub/src/models/bert/__init__.py +1 -5
keras_hub/src/models/bert/bert_masked_lm_preprocessor.py +6 -87
keras_hub/src/models/bert/bert_presets.py +1 -4
keras_hub/src/models/bert/{bert_classifier.py → bert_text_classifier.py} +19 -12
keras_hub/src/models/bert/{bert_preprocessor.py → bert_text_classifier_preprocessor.py} +14 -70
keras_hub/src/models/bert/bert_tokenizer.py +17 -35
keras_hub/src/models/bloom/__init__.py +1 -2
keras_hub/src/models/bloom/bloom_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/bloom/bloom_tokenizer.py +12 -41
keras_hub/src/models/causal_lm.py +10 -29
keras_hub/src/models/causal_lm_preprocessor.py +195 -0
keras_hub/src/models/csp_darknet/csp_darknet_backbone.py +54 -15
keras_hub/src/models/deberta_v3/__init__.py +1 -4
keras_hub/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +14 -77
keras_hub/src/models/deberta_v3/{deberta_v3_classifier.py → deberta_v3_text_classifier.py} +16 -11
keras_hub/src/models/deberta_v3/{deberta_v3_preprocessor.py → deberta_v3_text_classifier_preprocessor.py} +23 -64
keras_hub/src/models/deberta_v3/deberta_v3_tokenizer.py +30 -25
keras_hub/src/models/densenet/densenet_backbone.py +46 -22
keras_hub/src/models/distil_bert/__init__.py +1 -4
keras_hub/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +14 -76
keras_hub/src/models/distil_bert/{distil_bert_classifier.py → distil_bert_text_classifier.py} +17 -12
keras_hub/src/models/distil_bert/{distil_bert_preprocessor.py → distil_bert_text_classifier_preprocessor.py} +23 -63
keras_hub/src/models/distil_bert/distil_bert_tokenizer.py +19 -35
keras_hub/src/models/efficientnet/__init__.py +13 -0
keras_hub/src/models/efficientnet/efficientnet_backbone.py +569 -0
keras_hub/src/models/efficientnet/fusedmbconv.py +229 -0
keras_hub/src/models/efficientnet/mbconv.py +238 -0
keras_hub/src/models/electra/__init__.py +1 -2
keras_hub/src/models/electra/electra_tokenizer.py +17 -32
keras_hub/src/models/f_net/__init__.py +1 -2
keras_hub/src/models/f_net/f_net_masked_lm_preprocessor.py +12 -78
keras_hub/src/models/f_net/{f_net_classifier.py → f_net_text_classifier.py} +17 -10
keras_hub/src/models/f_net/{f_net_preprocessor.py → f_net_text_classifier_preprocessor.py} +19 -63
keras_hub/src/models/f_net/f_net_tokenizer.py +17 -35
keras_hub/src/models/falcon/__init__.py +1 -2
keras_hub/src/models/falcon/falcon_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/falcon/falcon_tokenizer.py +12 -35
keras_hub/src/models/gemma/__init__.py +1 -2
keras_hub/src/models/gemma/gemma_causal_lm_preprocessor.py +6 -90
keras_hub/src/models/gemma/gemma_decoder_block.py +1 -1
keras_hub/src/models/gemma/gemma_tokenizer.py +12 -23
keras_hub/src/models/gpt2/__init__.py +1 -2
keras_hub/src/models/gpt2/gpt2_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/gpt2/gpt2_preprocessor.py +12 -90
keras_hub/src/models/gpt2/gpt2_tokenizer.py +12 -34
keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +12 -34
keras_hub/src/models/image_classifier.py +0 -5
keras_hub/src/models/image_classifier_preprocessor.py +83 -0
keras_hub/src/models/llama/__init__.py +1 -2
keras_hub/src/models/llama/llama_causal_lm_preprocessor.py +6 -85
keras_hub/src/models/llama/llama_tokenizer.py +12 -25
keras_hub/src/models/llama3/__init__.py +1 -2
keras_hub/src/models/llama3/llama3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/llama3/llama3_tokenizer.py +12 -33
keras_hub/src/models/masked_lm.py +0 -2
keras_hub/src/models/masked_lm_preprocessor.py +156 -0
keras_hub/src/models/mistral/__init__.py +1 -2
keras_hub/src/models/mistral/mistral_causal_lm_preprocessor.py +6 -91
keras_hub/src/models/mistral/mistral_tokenizer.py +12 -23
keras_hub/src/models/mix_transformer/mix_transformer_backbone.py +2 -2
keras_hub/src/models/mobilenet/__init__.py +13 -0
keras_hub/src/models/mobilenet/mobilenet_backbone.py +530 -0
keras_hub/src/models/mobilenet/mobilenet_image_classifier.py +114 -0
keras_hub/src/models/opt/__init__.py +1 -2
keras_hub/src/models/opt/opt_causal_lm_preprocessor.py +6 -93
keras_hub/src/models/opt/opt_tokenizer.py +12 -41
keras_hub/src/models/pali_gemma/__init__.py +1 -4
keras_hub/src/models/pali_gemma/pali_gemma_causal_lm_preprocessor.py +28 -28
keras_hub/src/models/pali_gemma/pali_gemma_image_converter.py +25 -0
keras_hub/src/models/pali_gemma/pali_gemma_presets.py +5 -5
keras_hub/src/models/pali_gemma/pali_gemma_tokenizer.py +11 -3
keras_hub/src/models/phi3/__init__.py +1 -2
keras_hub/src/models/phi3/phi3_causal_lm.py +3 -9
keras_hub/src/models/phi3/phi3_causal_lm_preprocessor.py +6 -89
keras_hub/src/models/phi3/phi3_tokenizer.py +12 -36
keras_hub/src/models/preprocessor.py +72 -83
keras_hub/src/models/resnet/__init__.py +6 -0
keras_hub/src/models/resnet/resnet_backbone.py +390 -42
keras_hub/src/models/resnet/resnet_image_classifier.py +33 -6
keras_hub/src/models/resnet/resnet_image_classifier_preprocessor.py +28 -0
keras_hub/src/models/{llama3/llama3_preprocessor.py → resnet/resnet_image_converter.py} +7 -5
keras_hub/src/models/resnet/resnet_presets.py +95 -0
keras_hub/src/models/retinanet/__init__.py +13 -0
keras_hub/src/models/retinanet/anchor_generator.py +175 -0
keras_hub/src/models/retinanet/box_matcher.py +259 -0
keras_hub/src/models/retinanet/non_max_supression.py +578 -0
keras_hub/src/models/roberta/__init__.py +1 -2
keras_hub/src/models/roberta/roberta_masked_lm_preprocessor.py +22 -74
keras_hub/src/models/roberta/{roberta_classifier.py → roberta_text_classifier.py} +16 -11
keras_hub/src/models/roberta/{roberta_preprocessor.py → roberta_text_classifier_preprocessor.py} +21 -53
keras_hub/src/models/roberta/roberta_tokenizer.py +13 -52
keras_hub/src/models/seq_2_seq_lm_preprocessor.py +269 -0
keras_hub/src/models/stable_diffusion_v3/__init__.py +13 -0
keras_hub/src/models/stable_diffusion_v3/clip_encoder_block.py +103 -0
keras_hub/src/models/stable_diffusion_v3/clip_preprocessor.py +93 -0
keras_hub/src/models/stable_diffusion_v3/clip_text_encoder.py +149 -0
keras_hub/src/models/stable_diffusion_v3/clip_tokenizer.py +167 -0
keras_hub/src/models/stable_diffusion_v3/mmdit.py +427 -0
keras_hub/src/models/stable_diffusion_v3/mmdit_block.py +317 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_preprocessor.py +74 -0
keras_hub/src/models/stable_diffusion_v3/t5_xxl_text_encoder.py +155 -0
keras_hub/src/models/stable_diffusion_v3/vae_attention.py +126 -0
keras_hub/src/models/stable_diffusion_v3/vae_image_decoder.py +186 -0
keras_hub/src/models/t5/__init__.py +1 -2
keras_hub/src/models/t5/t5_tokenizer.py +13 -23
keras_hub/src/models/task.py +71 -116
keras_hub/src/models/{classifier.py → text_classifier.py} +19 -13
keras_hub/src/models/text_classifier_preprocessor.py +138 -0
keras_hub/src/models/whisper/__init__.py +1 -2
keras_hub/src/models/whisper/{whisper_audio_feature_extractor.py → whisper_audio_converter.py} +20 -18
keras_hub/src/models/whisper/whisper_backbone.py +0 -3
keras_hub/src/models/whisper/whisper_presets.py +10 -10
keras_hub/src/models/whisper/whisper_tokenizer.py +20 -16
keras_hub/src/models/xlm_roberta/__init__.py +1 -4
keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +26 -72
keras_hub/src/models/xlm_roberta/{xlm_roberta_classifier.py → xlm_roberta_text_classifier.py} +16 -11
keras_hub/src/models/xlm_roberta/{xlm_roberta_preprocessor.py → xlm_roberta_text_classifier_preprocessor.py} +26 -53
keras_hub/src/models/xlm_roberta/xlm_roberta_tokenizer.py +25 -10
keras_hub/src/tests/test_case.py +46 -0
keras_hub/src/tokenizers/byte_pair_tokenizer.py +30 -17
keras_hub/src/tokenizers/byte_tokenizer.py +14 -15
keras_hub/src/tokenizers/sentence_piece_tokenizer.py +20 -7
keras_hub/src/tokenizers/tokenizer.py +67 -32
keras_hub/src/tokenizers/unicode_codepoint_tokenizer.py +14 -15
keras_hub/src/tokenizers/word_piece_tokenizer.py +34 -47
keras_hub/src/utils/imagenet/__init__.py +13 -0
keras_hub/src/utils/imagenet/imagenet_utils.py +1067 -0
keras_hub/src/utils/keras_utils.py +0 -50
keras_hub/src/utils/preset_utils.py +230 -68
keras_hub/src/utils/tensor_utils.py +187 -69
keras_hub/src/utils/timm/convert_resnet.py +19 -16
keras_hub/src/utils/timm/preset_loader.py +66 -0
keras_hub/src/utils/transformers/convert_albert.py +193 -0
keras_hub/src/utils/transformers/convert_bart.py +373 -0
keras_hub/src/utils/transformers/convert_bert.py +7 -17
keras_hub/src/utils/transformers/convert_distilbert.py +10 -20
keras_hub/src/utils/transformers/convert_gemma.py +5 -19
keras_hub/src/utils/transformers/convert_gpt2.py +5 -18
keras_hub/src/utils/transformers/convert_llama3.py +7 -18
keras_hub/src/utils/transformers/convert_mistral.py +129 -0
keras_hub/src/utils/transformers/convert_pali_gemma.py +7 -29
keras_hub/src/utils/transformers/preset_loader.py +77 -0
keras_hub/src/utils/transformers/safetensor_utils.py +2 -2
keras_hub/src/version_utils.py +1 -1
keras_hub_nightly-0.16.0.dev2024092017.dist-info/METADATA +202 -0
keras_hub_nightly-0.16.0.dev2024092017.dist-info/RECORD +334 -0
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/WHEEL +1 -1
keras_hub/src/models/bart/bart_preprocessor.py +0 -276
keras_hub/src/models/bloom/bloom_preprocessor.py +0 -185
keras_hub/src/models/electra/electra_preprocessor.py +0 -154
keras_hub/src/models/falcon/falcon_preprocessor.py +0 -187
keras_hub/src/models/gemma/gemma_preprocessor.py +0 -191
keras_hub/src/models/gpt_neo_x/gpt_neo_x_preprocessor.py +0 -145
keras_hub/src/models/llama/llama_preprocessor.py +0 -189
keras_hub/src/models/mistral/mistral_preprocessor.py +0 -190
keras_hub/src/models/opt/opt_preprocessor.py +0 -188
keras_hub/src/models/phi3/phi3_preprocessor.py +0 -190
keras_hub/src/models/whisper/whisper_preprocessor.py +0 -326
keras_hub/src/utils/timm/convert.py +0 -37
keras_hub/src/utils/transformers/convert.py +0 -101
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/METADATA +0 -34
keras_hub_nightly-0.15.0.dev20240823171555.dist-info/RECORD +0 -297
{keras_hub_nightly-0.15.0.dev20240823171555.dist-info → keras_hub_nightly-0.16.0.dev2024092017.dist-info}/top_level.txt +0 -0

keras_hub/src/models/whisper/whisper_preprocessor.py DELETED Viewed

@@ -1,326 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import keras
-from absl import logging
-from keras_hub.src.api_export import keras_hub_export
-from keras_hub.src.layers.preprocessing.start_end_packer import StartEndPacker
-from keras_hub.src.models.preprocessor import Preprocessor
-from keras_hub.src.models.whisper.whisper_audio_feature_extractor import (
-    WhisperAudioFeatureExtractor,
-)
-from keras_hub.src.models.whisper.whisper_tokenizer import WhisperTokenizer
-from keras_hub.src.utils.keras_utils import (
-    convert_inputs_to_list_of_tensor_segments,
-)
-@keras_hub_export("keras_hub.models.WhisperPreprocessor")
-class WhisperPreprocessor(Preprocessor):
-    """A Whisper preprocessing layer which handles audio and text input.
-    This preprocessing layer will do three things:
-     1. Compute the log-mel spectrogram of the audio tensor inputs using
-        `audio_feature_extractor`.
-     2. Tokenize decoder inputs using the `tokenizer`.
-     2. Add the appropriate special tokens - `"<|startoftranscript|>", task
-        token, language token, `"<|endoftext|>"`, etc.
-     3. Construct a dictionary with keys `"encoder_features"`,
-        `"decoder_token_ids"`, `"decoder_padding_mask"` that can be passed
-        directly to a Whisper model.
-    Args:
-        tokenizer: A `keras_hub.models.WhisperTokenizer` instance.
-        audio_feature_extractor: A
-            `keras_hub.models.WhisperAudioFeatureExtractor` instance or `None`.
-            If `None` a feature extractor with default parameters will be
-            created.
-        decoder_sequence_length: The length of the packed decoder inputs.
-        language: string, language token. Should only be passed if your
-            tokenizer is multilingual.
-        task: string, task name. One of `"transcribe"`, `"translate"`. Should
-            only be passed if your tokenizer is multilingual.
-        no_timestamps: bool. If True, `"<|no_timestamps|>"` will be added as a
-            special token to your input.
-    Call arguments:
-        x: A dictionary with `"encoder_audio"` and `"decoder_text"` as its keys.
-            `"encoder_audio"` should correspond to the input audio tensor.
-            `"decoder_text"` should be a tensor of single string sequences.
-            Inputs may be batched or unbatched. Raw python inputs will be
-            converted to tensors.
-        y: Any label data. Will be passed through unaltered.
-        sample_weight: Any label weight data. Will be passed through unaltered.
-    Examples:
-    Directly calling the layer on data.
-    ```python
-    preprocessor = keras_hub.models.WhisperPreprocessor.from_preset(
-        "whisper_tiny_en",
-    )
-    # Preprocess unbatched inputs.
-    input_data = {
-        "encoder_audio": tf.ones((200,)),
-        "decoder_text": "The quick brown fox jumped.",
-    }
-    preprocessor(input_data)
-    # Preprocess batched inputs.
-    input_data = {
-        "encoder_audio": tf.ones((2, 200)),
-        "decoder_text": ["The quick brown fox jumped.", "Call me Ishmael."],
-    }
-    preprocessor(input_data)
-    # Custom audio feature extractor and vocabulary.
-    audio_feature_extractor = keras_hub.models.WhisperAudioFeatureExtractor(
-        num_mels=80,
-        num_fft_bins=400,
-        stride=100,
-        sampling_rate=100,
-        max_audio_length=5,
-    )
-    features = ["a quick fox.", "a fox quick."]
-    vocab = {"<|endoftext|>": 0, "a": 4, "Ġquick": 5, "Ġfox": 6}
-    merges = ["Ġ q", "u i", "c k", "ui ck", "Ġq uick"]
-    merges += ["Ġ f", "o x", "Ġf ox"]
-    special_tokens = {
-        "<|startoftranscript|>": 9,
-        "<|endoftext|>": 10,
-        "<|notimestamps|>": 11,
-        "<|transcribe|>": 12,
-        "<|translate|>": 13,
-    }
-    tokenizer = keras_hub.models.WhisperTokenizer(
-        vocabulary=vocab,
-        merges=merges,
-        special_tokens=special_tokens,
-    )
-    preprocessor = keras_hub.models.WhisperPreprocessor(
-        audio_feature_extractor=audio_feature_extractor,
-        tokenizer=tokenizer,
-    )
-    input_data = {
-        "encoder_audio": tf.ones((200,)),
-        "decoder_text": "The quick brown fox jumped.",
-    }
-    preprocessor(input_data)
-    ```
-    Mapping with `tf.data.Dataset`.
-    ```python
-    preprocessor = keras_hub.models.WhisperPreprocessor.from_preset(
-        "whisper_tiny_en")
-    # Map labeled single sentences.
-    features = {
-        "encoder_audio": tf.ones((2, 200)),
-        "decoder_text": ["The quick brown fox jumped.", "Call me Ishmael."],
-    }
-    labels = tf.constant(["True", "False"])
-    ds = tf.data.Dataset.from_tensor_slices((features, labels))
-    ds = ds.map(preprocessor, num_parallel_calls=tf.data.AUTOTUNE)
-    # Map unlabeled single sentences.
-    features = {
-        "encoder_audio": tf.ones((2, 200)),
-        "decoder_text": ["The quick brown fox jumped.", "Call me Ishmael."],
-    }
-    ds = tf.data.Dataset.from_tensor_slices(features)
-    ds = ds.map(preprocessor, num_parallel_calls=tf.data.AUTOTUNE)
-    ```
-    """
-    tokenizer_cls = WhisperTokenizer
-    def __init__(
-        self,
-        tokenizer,
-        audio_feature_extractor=None,
-        decoder_sequence_length=448,
-        language=None,
-        task=None,
-        no_timestamps=True,
-        **kwargs,
-    ):
-        super().__init__(**kwargs)
-        if audio_feature_extractor is None:
-            audio_feature_extractor = WhisperAudioFeatureExtractor()
-        self.audio_feature_extractor = audio_feature_extractor
-        self.tokenizer = tokenizer
-        self.decoder_packer = None
-        self.decoder_sequence_length = decoder_sequence_length
-        self.language = language
-        self.task = task
-        self.no_timestamps = no_timestamps
-    def build(self, input_shape):
-        # Defer packer creation to `build()` so that we can be sure tokenizer
-        # assets have loaded when restoring a saved model.
-        # Create list of tokens to be prepended to decoder inputs.
-        bos_tokens = [self.tokenizer.bos_token_id]
-        if self.tokenizer.language_tokens is not None:
-            if (
-                self.language is None
-                or self.language not in self.tokenizer.language_tokens
-            ):
-                raise ValueError(
-                    "You must pass a non-None value for `language` when using "
-                    "a multilingual tokenizer. The value must be one of "
-                    f'{",".join(self.tokenizer.language_tokens.keys())}. '
-                    f"Received: language={self.language}."
-                )
-            if self.task is None or self.task not in [
-                "transcribe",
-                "translate",
-            ]:
-                raise ValueError(
-                    "You must pass a non-None value for `task` when using "
-                    "a multilingual tokenizer. The value must be one of "
-                    '`"transcribe"`, `"translate"`. '
-                    f"Received: task={self.task}."
-                )
-            bos_tokens += [self.tokenizer.language_tokens[self.language]]
-            if self.task == "transcribe":
-                bos_tokens += [self.tokenizer.special_tokens["<|transcribe|>"]]
-            elif self.task == "translate":
-                bos_tokens += [self.tokenizer.special_tokens["<|translate|>"]]
-        else:
-            if self.language is not None:
-                logging.info(
-                    "`tokenizer` is monolingual, and `language` has a "
-                    "non-`None` value. Setting `language` to `None`."
-                )
-                self.language = None
-            if self.task is not None:
-                logging.info(
-                    "`tokenizer` is monolingual, and `task` has a "
-                    "non-`None` value. Setting `task` to `None`."
-                )
-                self.task = None
-        if self.no_timestamps:
-            bos_tokens += [self.tokenizer.no_timestamps_token_id]
-        # TODO: Use `MultiSegmentPacker` instead of `StartEndPacker` once we
-        # want to move to multi-segment packing and have improved
-        # `MultiSegmentPacker`'s performance.
-        self.decoder_packer = StartEndPacker(
-            start_value=bos_tokens,
-            end_value=self.tokenizer.eos_token_id,
-            pad_value=self.tokenizer.pad_token_id,
-            sequence_length=self.decoder_sequence_length,
-            return_padding_mask=True,
-        )
-    def call(self, x, y=None, sample_weight=None, decoder_sequence_length=None):
-        if not (
-            isinstance(x, dict)
-            and ["encoder_audio", "decoder_text"] == list(x.keys())
-        ):
-            raise ValueError(
-                '`x` must be a dictionary, containing the keys `"encoder_audio"`'
-                f' and `"decoder_text"`. Received x={x}.'
-            )
-        encoder_audio = x["encoder_audio"]
-        decoder_text = x["decoder_text"]
-        encoder_audio = convert_inputs_to_list_of_tensor_segments(encoder_audio)
-        decoder_text = convert_inputs_to_list_of_tensor_segments(decoder_text)
-        if len(encoder_audio) > 1 or len(decoder_text) > 1:
-            raise ValueError(
-                '`WhisperPreprocessor` requires both `"encoder_audio"` and '
-                f'`"decoder_text"` to contain only one segment, but received '
-                f"{len(encoder_audio)} and {len(decoder_text)}, respectively."
-            )
-        encoder_features = self.audio_feature_extractor(encoder_audio[0])
-        decoder_sequence_length = (
-            decoder_sequence_length or self.decoder_sequence_length
-        )
-        decoder_inputs = self.tokenizer(decoder_text[0])
-        decoder_token_ids, decoder_padding_mask = self.decoder_packer(
-            decoder_inputs,
-            sequence_length=decoder_sequence_length,
-        )
-        x = {
-            "encoder_features": encoder_features,
-            "decoder_token_ids": decoder_token_ids,
-            "decoder_padding_mask": decoder_padding_mask,
-        }
-        return keras.utils.pack_x_y_sample_weight(x, y, sample_weight)
-    def get_config(self):
-        config = super().get_config()
-        config.update(
-            {
-                "audio_feature_extractor": keras.layers.serialize(
-                    self.audio_feature_extractor
-                ),
-                "decoder_sequence_length": self.decoder_sequence_length,
-                "language": self.language,
-                "task": self.task,
-                "no_timestamps": self.no_timestamps,
-            }
-        )
-        return config
-    @classmethod
-    def from_config(cls, config):
-        if "tokenizer" in config and isinstance(config["tokenizer"], dict):
-            config["tokenizer"] = keras.layers.deserialize(config["tokenizer"])
-        if "audio_feature_extractor" in config and isinstance(
-            config["audio_feature_extractor"], dict
-        ):
-            config["audio_feature_extractor"] = keras.layers.deserialize(
-                config["audio_feature_extractor"]
-            )
-        return cls(**config)
-    @property
-    def decoder_sequence_length(self):
-        """The padded length of decoder input sequences."""
-        return self._decoder_sequence_length
-    @decoder_sequence_length.setter
-    def decoder_sequence_length(self, value):
-        self._decoder_sequence_length = value
-        if self.decoder_packer is not None:
-            self.decoder_packer.sequence_length = value
-    @property
-    def sequence_length(self):
-        """Alias for `decoder_sequence_length`."""
-        return self.decoder_sequence_length
-    @sequence_length.setter
-    def sequence_length(self, value):
-        self.decoder_sequence_length = value

keras_hub/src/utils/timm/convert.py DELETED Viewed

@@ -1,37 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""Convert timm models to KerasHub."""
-from keras_hub.src.utils.timm.convert_resnet import load_resnet_backbone
-def load_timm_backbone(cls, preset, load_weights, **kwargs):
-    """Load a timm model config and weights as a KerasHub backbone.
-    Args:
-        cls (class): Keras model class.
-        preset (str): Preset configuration name.
-        load_weights (bool): Whether to load the weights.
-    Returns:
-        backbone: Initialized Keras model backbone.
-    """
-    if cls is None:
-        raise ValueError("Backbone class is None")
-    if cls.__name__ == "ResNetBackbone":
-        return load_resnet_backbone(cls, preset, load_weights, **kwargs)
-    raise ValueError(
-        f"{cls} has not been ported from the Hugging Face format yet. "
-        "Please check Hugging Face Hub for the Keras model. "
-    )

keras_hub/src/utils/transformers/convert.py DELETED Viewed

@@ -1,101 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""Convert huggingface models to KerasHub."""
-from keras_hub.src.utils.transformers.convert_bert import load_bert_backbone
-from keras_hub.src.utils.transformers.convert_bert import load_bert_tokenizer
-from keras_hub.src.utils.transformers.convert_distilbert import (
-    load_distilbert_backbone,
-)
-from keras_hub.src.utils.transformers.convert_distilbert import (
-    load_distilbert_tokenizer,
-)
-from keras_hub.src.utils.transformers.convert_gemma import load_gemma_backbone
-from keras_hub.src.utils.transformers.convert_gemma import load_gemma_tokenizer
-from keras_hub.src.utils.transformers.convert_gpt2 import load_gpt2_backbone
-from keras_hub.src.utils.transformers.convert_gpt2 import load_gpt2_tokenizer
-from keras_hub.src.utils.transformers.convert_llama3 import load_llama3_backbone
-from keras_hub.src.utils.transformers.convert_llama3 import (
-    load_llama3_tokenizer,
-)
-from keras_hub.src.utils.transformers.convert_pali_gemma import (
-    load_pali_gemma_backbone,
-)
-from keras_hub.src.utils.transformers.convert_pali_gemma import (
-    load_pali_gemma_tokenizer,
-)
-def load_transformers_backbone(cls, preset, load_weights):
-    """
-    Load a Transformer model config and weights as a KerasHub backbone.
-    Args:
-        cls (class): Keras model class.
-        preset (str): Preset configuration name.
-        load_weights (bool): Whether to load the weights.
-    Returns:
-        backbone: Initialized Keras model backbone.
-    """
-    if cls is None:
-        raise ValueError("Backbone class is None")
-    if cls.__name__ == "BertBackbone":
-        return load_bert_backbone(cls, preset, load_weights)
-    if cls.__name__ == "GemmaBackbone":
-        return load_gemma_backbone(cls, preset, load_weights)
-    if cls.__name__ == "Llama3Backbone":
-        return load_llama3_backbone(cls, preset, load_weights)
-    if cls.__name__ == "PaliGemmaBackbone":
-        return load_pali_gemma_backbone(cls, preset, load_weights)
-    if cls.__name__ == "GPT2Backbone":
-        return load_gpt2_backbone(cls, preset, load_weights)
-    if cls.__name__ == "DistilBertBackbone":
-        return load_distilbert_backbone(cls, preset, load_weights)
-    raise ValueError(
-        f"{cls} has not been ported from the Hugging Face format yet. "
-        "Please check Hugging Face Hub for the Keras model. "
-    )
-def load_transformers_tokenizer(cls, preset):
-    """
-    Load a Transformer tokenizer assets as a KerasHub tokenizer.
-    Args:
-        cls (class): Tokenizer class.
-        preset (str): Preset configuration name.
-    Returns:
-        tokenizer: Initialized tokenizer.
-    """
-    if cls is None:
-        raise ValueError("Tokenizer class is None")
-    if cls.__name__ == "BertTokenizer":
-        return load_bert_tokenizer(cls, preset)
-    if cls.__name__ == "GemmaTokenizer":
-        return load_gemma_tokenizer(cls, preset)
-    if cls.__name__ == "Llama3Tokenizer":
-        return load_llama3_tokenizer(cls, preset)
-    if cls.__name__ == "PaliGemmaTokenizer":
-        return load_pali_gemma_tokenizer(cls, preset)
-    if cls.__name__ == "GPT2Tokenizer":
-        return load_gpt2_tokenizer(cls, preset)
-    if cls.__name__ == "DistilBertTokenizer":
-        return load_distilbert_tokenizer(cls, preset)
-    raise ValueError(
-        f"{cls} has not been ported from the Hugging Face format yet. "
-        "Please check Hugging Face Hub for the Keras model. "
-    )

keras_hub_nightly-0.15.0.dev20240823171555.dist-info/METADATA DELETED Viewed

@@ -1,34 +0,0 @@
-Metadata-Version: 2.1
-Name: keras-hub-nightly
-Version: 0.15.0.dev20240823171555
-Summary: 🚧🚧🚧 Work in progress. 🚧🚧🚧 More details soon!
-Home-page: https://github.com/keras-team/keras-hub
-Author: Keras team
-Author-email: keras-hub@google.com
-License: Apache License 2.0
-Classifier: Development Status :: 3 - Alpha
-Classifier: Programming Language :: Python :: 3
-Classifier: Programming Language :: Python :: 3.8
-Classifier: Programming Language :: Python :: 3.9
-Classifier: Programming Language :: Python :: 3.10
-Classifier: Programming Language :: Python :: 3.11
-Classifier: Programming Language :: Python :: 3 :: Only
-Classifier: Operating System :: Unix
-Classifier: Operating System :: Microsoft :: Windows
-Classifier: Operating System :: MacOS
-Classifier: Intended Audience :: Science/Research
-Classifier: Topic :: Scientific/Engineering
-Classifier: Topic :: Software Development
-Requires-Python: >=3.9
-Requires-Dist: absl-py
-Requires-Dist: numpy
-Requires-Dist: packaging
-Requires-Dist: regex
-Requires-Dist: rich
-Requires-Dist: kagglehub
-Requires-Dist: tensorflow-text ; platform_system != "Darwin"
-Provides-Extra: extras
-Requires-Dist: rouge-score ; extra == 'extras'
-Requires-Dist: sentencepiece ; extra == 'extras'
-🚧🚧🚧 Work in progress. 🚧🚧🚧 More details soon!

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl

keras-hub-nightly 0.15.0.dev20240823171555__py3-none-any.whl → 0.16.0.dev2024092017__py3-none-any.whl