keras-hub-nightly 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as published to their public registry. It is provided for informational purposes only.
- keras_hub/api/layers/__init__.py +12 -0
- keras_hub/api/models/__init__.py +32 -0
- keras_hub/src/bounding_box/__init__.py +2 -0
- keras_hub/src/bounding_box/converters.py +102 -12
- keras_hub/src/layers/modeling/rms_normalization.py +34 -0
- keras_hub/src/layers/modeling/transformer_encoder.py +27 -7
- keras_hub/src/layers/preprocessing/image_converter.py +5 -0
- keras_hub/src/models/albert/albert_presets.py +0 -8
- keras_hub/src/models/bart/bart_presets.py +0 -6
- keras_hub/src/models/bert/bert_presets.py +0 -20
- keras_hub/src/models/bloom/bloom_presets.py +0 -16
- keras_hub/src/models/clip/__init__.py +5 -0
- keras_hub/src/models/clip/clip_backbone.py +286 -0
- keras_hub/src/models/clip/clip_encoder_block.py +19 -4
- keras_hub/src/models/clip/clip_image_converter.py +8 -0
- keras_hub/src/models/clip/clip_presets.py +93 -0
- keras_hub/src/models/clip/clip_text_encoder.py +4 -1
- keras_hub/src/models/clip/clip_tokenizer.py +18 -3
- keras_hub/src/models/clip/clip_vision_embedding.py +101 -0
- keras_hub/src/models/clip/clip_vision_encoder.py +159 -0
- keras_hub/src/models/deberta_v3/deberta_v3_presets.py +0 -10
- keras_hub/src/models/deeplab_v3/deeplab_v3_presets.py +0 -2
- keras_hub/src/models/deeplab_v3/deeplab_v3_segmenter.py +5 -3
- keras_hub/src/models/densenet/densenet_backbone.py +1 -1
- keras_hub/src/models/densenet/densenet_presets.py +0 -6
- keras_hub/src/models/distil_bert/distil_bert_presets.py +0 -6
- keras_hub/src/models/efficientnet/__init__.py +9 -0
- keras_hub/src/models/efficientnet/cba.py +141 -0
- keras_hub/src/models/efficientnet/efficientnet_backbone.py +139 -56
- keras_hub/src/models/efficientnet/efficientnet_image_classifier.py +14 -0
- keras_hub/src/models/efficientnet/efficientnet_image_classifier_preprocessor.py +16 -0
- keras_hub/src/models/efficientnet/efficientnet_image_converter.py +10 -0
- keras_hub/src/models/efficientnet/efficientnet_presets.py +192 -0
- keras_hub/src/models/efficientnet/fusedmbconv.py +81 -36
- keras_hub/src/models/efficientnet/mbconv.py +52 -21
- keras_hub/src/models/electra/electra_presets.py +0 -12
- keras_hub/src/models/f_net/f_net_presets.py +0 -4
- keras_hub/src/models/falcon/falcon_presets.py +0 -2
- keras_hub/src/models/flux/__init__.py +5 -0
- keras_hub/src/models/flux/flux_layers.py +494 -0
- keras_hub/src/models/flux/flux_maths.py +218 -0
- keras_hub/src/models/flux/flux_model.py +231 -0
- keras_hub/src/models/flux/flux_presets.py +14 -0
- keras_hub/src/models/flux/flux_text_to_image.py +142 -0
- keras_hub/src/models/flux/flux_text_to_image_preprocessor.py +73 -0
- keras_hub/src/models/gemma/gemma_presets.py +0 -40
- keras_hub/src/models/gpt2/gpt2_presets.py +0 -9
- keras_hub/src/models/image_object_detector.py +87 -0
- keras_hub/src/models/image_object_detector_preprocessor.py +57 -0
- keras_hub/src/models/image_to_image.py +16 -10
- keras_hub/src/models/inpaint.py +20 -13
- keras_hub/src/models/llama/llama_backbone.py +1 -1
- keras_hub/src/models/llama/llama_presets.py +5 -15
- keras_hub/src/models/llama3/llama3_presets.py +0 -8
- keras_hub/src/models/mistral/mistral_presets.py +0 -6
- keras_hub/src/models/mit/mit_backbone.py +41 -27
- keras_hub/src/models/mit/mit_layers.py +9 -7
- keras_hub/src/models/mit/mit_presets.py +12 -24
- keras_hub/src/models/opt/opt_presets.py +0 -8
- keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +61 -11
- keras_hub/src/models/pali_gemma/pali_gemma_decoder_block.py +21 -23
- keras_hub/src/models/pali_gemma/pali_gemma_presets.py +166 -10
- keras_hub/src/models/pali_gemma/pali_gemma_vit.py +12 -11
- keras_hub/src/models/phi3/phi3_presets.py +0 -4
- keras_hub/src/models/resnet/resnet_presets.py +10 -42
- keras_hub/src/models/retinanet/__init__.py +5 -0
- keras_hub/src/models/retinanet/anchor_generator.py +52 -53
- keras_hub/src/models/retinanet/feature_pyramid.py +99 -36
- keras_hub/src/models/retinanet/non_max_supression.py +1 -0
- keras_hub/src/models/retinanet/prediction_head.py +192 -0
- keras_hub/src/models/retinanet/retinanet_backbone.py +146 -0
- keras_hub/src/models/retinanet/retinanet_image_converter.py +53 -0
- keras_hub/src/models/retinanet/retinanet_label_encoder.py +49 -51
- keras_hub/src/models/retinanet/retinanet_object_detector.py +382 -0
- keras_hub/src/models/retinanet/retinanet_object_detector_preprocessor.py +14 -0
- keras_hub/src/models/retinanet/retinanet_presets.py +15 -0
- keras_hub/src/models/roberta/roberta_presets.py +0 -4
- keras_hub/src/models/sam/sam_backbone.py +0 -1
- keras_hub/src/models/sam/sam_image_segmenter.py +9 -10
- keras_hub/src/models/sam/sam_presets.py +0 -6
- keras_hub/src/models/segformer/__init__.py +8 -0
- keras_hub/src/models/segformer/segformer_backbone.py +163 -0
- keras_hub/src/models/segformer/segformer_image_converter.py +8 -0
- keras_hub/src/models/segformer/segformer_image_segmenter.py +171 -0
- keras_hub/src/models/segformer/segformer_image_segmenter_preprocessor.py +31 -0
- keras_hub/src/models/segformer/segformer_presets.py +124 -0
- keras_hub/src/models/stable_diffusion_3/mmdit.py +41 -0
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +38 -21
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_image_to_image.py +3 -3
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_inpaint.py +3 -3
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_presets.py +28 -4
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +1 -1
- keras_hub/src/models/t5/t5_backbone.py +5 -4
- keras_hub/src/models/t5/t5_presets.py +41 -13
- keras_hub/src/models/text_to_image.py +13 -5
- keras_hub/src/models/vgg/vgg_backbone.py +1 -1
- keras_hub/src/models/vgg/vgg_presets.py +0 -8
- keras_hub/src/models/whisper/whisper_audio_converter.py +1 -1
- keras_hub/src/models/whisper/whisper_presets.py +0 -20
- keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py +0 -4
- keras_hub/src/tests/test_case.py +25 -0
- keras_hub/src/utils/preset_utils.py +17 -4
- keras_hub/src/utils/timm/convert_efficientnet.py +449 -0
- keras_hub/src/utils/timm/preset_loader.py +3 -0
- keras_hub/src/version_utils.py +1 -1
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/METADATA +15 -26
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/RECORD +109 -76
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/WHEEL +1 -1
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/top_level.txt +0 -0
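The version bump itself is visible in `keras_hub/src/version_utils.py` (+1 -1) and in the renamed `.dist-info` directories. For orientation, a minimal sketch of confirming which nightly build is active after installing the newer wheel; it assumes `keras_hub.version()` is the accessor exported by `version_utils.py`.

# Assumed check, not part of the diff: confirm the installed nightly version.
# pip install keras-hub-nightly==0.19.0.dev202412070351
import keras_hub

print(keras_hub.version())  # expected to print "0.19.0.dev202412070351"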
keras_hub/src/models/gemma/gemma_presets.py
CHANGED
@@ -6,9 +6,7 @@ backbone_presets = {
         "metadata": {
             "description": "2 billion parameter, 18-layer, base Gemma model.",
             "params": 2506172416,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_2b_en/2",
     },
@@ -18,9 +16,7 @@ backbone_presets = {
                 "2 billion parameter, 18-layer, instruction tuned Gemma model."
             ),
             "params": 2506172416,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_instruct_2b_en/2",
     },
@@ -31,9 +27,7 @@ backbone_presets = {
                 "The 1.1 update improves model quality."
             ),
             "params": 2506172416,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_1.1_instruct_2b_en/3",
     },
@@ -45,9 +39,7 @@ backbone_presets = {
                 "completion. The 1.1 update improves model quality."
             ),
             "params": 2506172416,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_1.1_2b_en/1",
     },
@@ -59,9 +51,7 @@ backbone_presets = {
                 "completion."
             ),
             "params": 2506172416,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_2b_en/1",
     },
@@ -69,9 +59,7 @@ backbone_presets = {
         "metadata": {
             "description": "7 billion parameter, 28-layer, base Gemma model.",
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_7b_en/2",
     },
@@ -81,9 +69,7 @@ backbone_presets = {
                 "7 billion parameter, 28-layer, instruction tuned Gemma model."
             ),
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_instruct_7b_en/2",
     },
@@ -94,9 +80,7 @@ backbone_presets = {
                 "The 1.1 update improves model quality."
             ),
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma/keras/gemma_1.1_instruct_7b_en/3",
     },
@@ -108,9 +92,7 @@ backbone_presets = {
                 "completion."
             ),
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_7b_en/1",
     },
@@ -122,9 +104,7 @@ backbone_presets = {
                 "to code."
             ),
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_instruct_7b_en/1",
     },
@@ -136,9 +116,7 @@ backbone_presets = {
                 "to code. The 1.1 update improves model quality."
             ),
             "params": 8537680896,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_1.1_instruct_7b_en/1",
     },
@@ -146,9 +124,7 @@ backbone_presets = {
         "metadata": {
             "description": "2 billion parameter, 26-layer, base Gemma model.",
             "params": 2614341888,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_2b_en/1",
     },
@@ -156,9 +132,7 @@ backbone_presets = {
         "metadata": {
             "description": "2 billion parameter, 26-layer, instruction tuned Gemma model.",
             "params": 2614341888,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_instruct_2b_en/1",
     },
@@ -166,9 +140,7 @@ backbone_presets = {
         "metadata": {
             "description": "9 billion parameter, 42-layer, base Gemma model.",
             "params": 9241705984,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_9b_en/2",
     },
@@ -176,9 +148,7 @@ backbone_presets = {
         "metadata": {
             "description": "9 billion parameter, 42-layer, instruction tuned Gemma model.",
             "params": 9241705984,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_instruct_9b_en/2",
     },
@@ -186,9 +156,7 @@ backbone_presets = {
         "metadata": {
             "description": "27 billion parameter, 42-layer, base Gemma model.",
             "params": 27227128320,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_27b_en/1",
     },
@@ -196,9 +164,7 @@ backbone_presets = {
         "metadata": {
             "description": "27 billion parameter, 42-layer, instruction tuned Gemma model.",
             "params": 27227128320,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://keras/gemma2/keras/gemma2_instruct_27b_en/1",
     },
@@ -206,9 +172,7 @@ backbone_presets = {
         "metadata": {
             "description": "2 billion parameter, 26-layer, ShieldGemma model.",
             "params": 2614341888,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://google/shieldgemma/keras/shieldgemma_2b_en/1",
     },
@@ -216,9 +180,7 @@ backbone_presets = {
         "metadata": {
             "description": "9 billion parameter, 42-layer, ShieldGemma model.",
             "params": 9241705984,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://google/shieldgemma/keras/shieldgemma_9b_en/1",
     },
@@ -226,9 +188,7 @@ backbone_presets = {
         "metadata": {
             "description": "27 billion parameter, 42-layer, ShieldGemma model.",
             "params": 27227128320,
-            "official_name": "Gemma",
             "path": "gemma",
-            "model_card": "https://www.kaggle.com/models/google/gemma",
         },
         "kaggle_handle": "kaggle://google/shieldgemma/keras/shieldgemma_27b_en/1",
     },
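The hunks above drop the `official_name` and `model_card` keys from every Gemma preset, leaving only `description`, `params`, and `path` in each `metadata` dict; the same trim is applied to the GPT-2, Llama, and Llama 3 preset files below. A small sketch of inspecting the slimmed metadata, assuming the `presets` class property on `GemmaBackbone` still exposes these dicts unchanged:

# Hedged sketch: iterate the built-in Gemma presets and print the remaining
# metadata fields. Assumes `GemmaBackbone.presets` maps preset names to the
# dicts shown in the diff above.
import keras_hub

for name, config in keras_hub.models.GemmaBackbone.presets.items():
    meta = config["metadata"]
    print(name, meta["description"], meta["params"], meta["path"])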
keras_hub/src/models/gpt2/gpt2_presets.py
CHANGED
@@ -9,9 +9,7 @@ backbone_presets = {
                 "Trained on WebText."
             ),
             "params": 124439808,
-            "official_name": "GPT-2",
             "path": "gpt2",
-            "model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
         },
         "kaggle_handle": "kaggle://keras/gpt2/keras/gpt2_base_en/2",
     },
@@ -22,9 +20,7 @@ backbone_presets = {
                 "Trained on WebText."
             ),
             "params": 354823168,
-            "official_name": "GPT-2",
             "path": "gpt2",
-            "model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
         },
         "kaggle_handle": "kaggle://keras/gpt2/keras/gpt2_medium_en/2",
     },
@@ -35,9 +31,7 @@ backbone_presets = {
                 "Trained on WebText."
             ),
             "params": 774030080,
-            "official_name": "GPT-2",
             "path": "gpt2",
-            "model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
         },
         "kaggle_handle": "kaggle://keras/gpt2/keras/gpt2_large_en/2",
     },
@@ -48,9 +42,7 @@ backbone_presets = {
                 "Trained on WebText."
             ),
             "params": 1557611200,
-            "official_name": "GPT-2",
             "path": "gpt2",
-            "model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
         },
         "kaggle_handle": "kaggle://keras/gpt2/keras/gpt2_extra_large_en/2",
     },
@@ -61,7 +53,6 @@ backbone_presets = {
                 "Finetuned on the CNN/DailyMail summarization dataset."
             ),
             "params": 124439808,
-            "official_name": "GPT-2",
             "path": "gpt2",
         },
         "kaggle_handle": "kaggle://keras/gpt2/keras/gpt2_base_en_cnn_dailymail/2",
keras_hub/src/models/image_object_detector.py
ADDED
@@ -0,0 +1,87 @@
+import keras
+
+from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.models.task import Task
+
+
+@keras_hub_export("keras_hub.models.ImageObjectDetector")
+class ImageObjectDetector(Task):
+    """Base class for all image object detection tasks.
+
+    The `ImageObjectDetector` tasks wrap a `keras_hub.models.Backbone` and
+    a `keras_hub.models.Preprocessor` to create a model that can be used for
+    object detection. `ImageObjectDetector` tasks take an additional
+    `num_classes` argument, controlling the number of predicted output classes.
+
+    To fine-tune with `fit()`, pass a dataset containing tuples of `(x, y)`
+    labels where `x` is a string and `y` is dictionary with `boxes` and
+    `classes`.
+
+    All `ImageObjectDetector` tasks include a `from_preset()` constructor which
+    can be used to load a pre-trained config and weights.
+    """
+
+    def compile(
+        self,
+        optimizer="auto",
+        box_loss="auto",
+        classification_loss="auto",
+        metrics=None,
+        **kwargs,
+    ):
+        """Configures the `ImageObjectDetector` task for training.
+
+        The `ImageObjectDetector` task extends the default compilation signature of
+        `keras.Model.compile` with defaults for `optimizer`, `loss`, and
+        `metrics`. To override these defaults, pass any value
+        to these arguments during compilation.
+
+        Args:
+            optimizer: `"auto"`, an optimizer name, or a `keras.Optimizer`
+                instance. Defaults to `"auto"`, which uses the default optimizer
+                for the given model and task. See `keras.Model.compile` and
+                `keras.optimizers` for more info on possible `optimizer` values.
+            box_loss: `"auto"`, a loss name, or a `keras.losses.Loss` instance.
+                Defaults to `"auto"`, where a
+                `keras.losses.Huber` loss will be
+                applied for the object detector task. See
+                `keras.Model.compile` and `keras.losses` for more info on
+                possible `loss` values.
+            classification_loss: `"auto"`, a loss name, or a `keras.losses.Loss`
+                instance. Defaults to `"auto"`, where a
+                `keras.losses.BinaryFocalCrossentropy` loss will be
+                applied for the object detector task. See
+                `keras.Model.compile` and `keras.losses` for more info on
+                possible `loss` values.
+            metrics: `a list of metrics to be evaluated by
+                the model during training and testing. Defaults to `None`.
+                See `keras.Model.compile` and `keras.metrics` for
+                more info on possible `metrics` values.
+            **kwargs: See `keras.Model.compile` for a full list of arguments
+                supported by the compile method.
+        """
+        if optimizer == "auto":
+            optimizer = keras.optimizers.Adam(5e-5)
+        if box_loss == "auto":
+            box_loss = keras.losses.Huber(reduction="sum")
+        if classification_loss == "auto":
+            activation = getattr(self, "activation", None)
+            activation = keras.activations.get(activation)
+            from_logits = activation != keras.activations.sigmoid
+            classification_loss = keras.losses.BinaryFocalCrossentropy(
+                from_logits=from_logits, reduction="sum"
+            )
+        if metrics is not None:
+            raise ValueError("User metrics not yet supported")
+
+        losses = {
+            "bbox_regression": box_loss,
+            "cls_logits": classification_loss,
+        }
+
+        super().compile(
+            optimizer=optimizer,
+            loss=losses,
+            metrics=metrics,
+            **kwargs,
+        )
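The new `ImageObjectDetector` base task defaults `compile()` to `Adam(5e-5)`, a summed `Huber` box loss, and a summed `BinaryFocalCrossentropy` classification loss, mapped to the `"bbox_regression"` and `"cls_logits"` outputs. A hedged sketch of overriding those defaults on a concrete subclass; the preset name `"retinanet_resnet50"` is borrowed from the preprocessor docstring below and may differ from the final released preset names.

import keras
import keras_hub

# Assumed preset name; any ImageObjectDetector subclass preset would do.
detector = keras_hub.models.ImageObjectDetector.from_preset("retinanet_resnet50")
detector.compile(
    optimizer=keras.optimizers.SGD(learning_rate=1e-3, momentum=0.9),
    box_loss=keras.losses.Huber(reduction="sum"),
    classification_loss=keras.losses.BinaryFocalCrossentropy(
        from_logits=True, reduction="sum"
    ),
)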
keras_hub/src/models/image_object_detector_preprocessor.py
ADDED
@@ -0,0 +1,57 @@
+import keras
+
+from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.models.preprocessor import Preprocessor
+from keras_hub.src.utils.tensor_utils import preprocessing_function
+
+
+@keras_hub_export("keras_hub.models.ImageObjectDetectorPreprocessor")
+class ImageObjectDetectorPreprocessor(Preprocessor):
+    """Base class for object detector preprocessing layers.
+
+    `ImageObjectDetectorPreprocessor` tasks wraps a
+    `keras_hub.layers.Preprocessor` to create a preprocessing layer for
+    object detection tasks. It is intended to be paired with a
+    `keras_hub.models.ImageObjectDetector` task.
+
+    All `ImageObjectDetectorPreprocessor` take three inputs, `x`, `y`, and
+    `sample_weight`. `x`, the first input, should always be included. It can
+    be a image or batch of images. See examples below. `y` and `sample_weight`
+    are optional inputs that will be passed through unaltered. Usually, `y` will
+    be the a dict of `{"boxes": Tensor(batch_size, num_boxes, 4),
+    "classes": (batch_size, num_boxes)}.
+
+    The layer will returns either `x`, an `(x, y)` tuple if labels were provided,
+    or an `(x, y, sample_weight)` tuple if labels and sample weight were
+    provided. `x` will be the input images after all model preprocessing has
+    been applied.
+
+    All `ImageObjectDetectorPreprocessor` tasks include a `from_preset()`
+    constructor which can be used to load a pre-trained config and vocabularies.
+    You can call the `from_preset()` constructor directly on this base class, in
+    which case the correct class for your model will be automatically
+    instantiated.
+
+    Args:
+        image_converter: Preprocessing pipeline for images.
+
+    Examples.
+    ```python
+    preprocessor = keras_hub.models.ImageObjectDetectorPreprocessor.from_preset(
+        "retinanet_resnet50",
+    )
+    """
+
+    def __init__(
+        self,
+        image_converter=None,
+        **kwargs,
+    ):
+        super().__init__(**kwargs)
+        self.image_converter = image_converter
+
+    @preprocessing_function
+    def call(self, x, y=None, sample_weight=None):
+        if self.image_converter:
+            x = self.image_converter(x)
+        return keras.utils.pack_x_y_sample_weight(x, y, sample_weight)
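As its `call()` above shows, the preprocessor only runs the image converter on `x` and passes `y` and `sample_weight` through untouched. A small sketch of the `(x, y)` format described in its docstring; the shapes and the preset name are illustrative only.

import numpy as np
import keras_hub

# Assumed preset name, reused from the docstring example above.
preprocessor = keras_hub.models.ImageObjectDetectorPreprocessor.from_preset(
    "retinanet_resnet50"
)
images = np.random.uniform(0, 255, size=(2, 512, 512, 3)).astype("float32")
labels = {
    "boxes": np.zeros((2, 8, 4), dtype="float32"),  # (batch_size, num_boxes, 4)
    "classes": np.zeros((2, 8), dtype="int32"),     # (batch_size, num_boxes)
}
x, y = preprocessor(images, labels)  # y is returned unaltered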
keras_hub/src/models/image_to_image.py
CHANGED
@@ -234,7 +234,7 @@ class ImageToImage(Task):
             input_is_scalar = True
         x = ops.image.resize(
             x,
-            (self.backbone.
+            (self.backbone.image_shape[0], self.backbone.image_shape[1]),
             interpolation="nearest",
             data_format=data_format,
         )
@@ -284,8 +284,8 @@ class ImageToImage(Task):
         self,
         inputs,
         num_steps,
-        guidance_scale,
         strength,
+        guidance_scale=None,
         seed=None,
     ):
         """Generate image based on the provided `inputs`.
@@ -313,30 +313,36 @@ class ImageToImage(Task):
                 - A `tf.data.Dataset` with `"images"`, `"prompts"` and/or
                     `"negative_prompts"` keys.
             num_steps: int. The number of diffusion steps to take.
-            guidance_scale: float. The classifier free guidance scale defined in
-                [Classifier-Free Diffusion Guidance](
-                https://arxiv.org/abs/2207.12598). A higher scale encourages
-                generating images more closely related to the prompts, typically
-                at the cost of lower image quality.
             strength: float. Indicates the extent to which the reference
                 `images` are transformed. Must be between `0.0` and `1.0`. When
                 `strength=1.0`, `images` is essentially ignore and added noise
                 is maximum and the denoising process runs for the full number of
                 iterations specified in `num_steps`.
+            guidance_scale: Optional float. The classifier free guidance scale
+                defined in [Classifier-Free Diffusion Guidance](
+                https://arxiv.org/abs/2207.12598). A higher scale encourages
+                generating images more closely related to the prompts, typically
+                at the cost of lower image quality. Note that some models don't
+                utilize classifier-free guidance.
             seed: optional int. Used as a random seed.
         """
         num_steps = int(num_steps)
-        guidance_scale = float(guidance_scale)
         strength = float(strength)
+        guidance_scale = (
+            float(guidance_scale) if guidance_scale is not None else None
+        )
         if strength < 0.0 or strength > 1.0:
             raise ValueError(
                 "`strength` must be between `0.0` and `1.0`. "
                 f"Received strength={strength}."
             )
+        if guidance_scale is not None and guidance_scale > 1.0:
+            guidance_scale = ops.convert_to_tensor(float(guidance_scale))
+        else:
+            guidance_scale = None
         starting_step = int(num_steps * (1.0 - strength))
         starting_step = ops.convert_to_tensor(starting_step, "int32")
-        num_steps = ops.convert_to_tensor(num_steps, "int32")
-        guidance_scale = ops.convert_to_tensor(guidance_scale)
+        num_steps = ops.convert_to_tensor(int(num_steps), "int32")

         # Check `inputs` format.
         required_keys = ["images", "prompts"]
keras_hub/src/models/inpaint.py
CHANGED
@@ -202,7 +202,7 @@ class Inpaint(Task):
             input_is_scalar = True
         x = ops.image.resize(
             x,
-            (self.backbone.
+            (self.backbone.image_shape[0], self.backbone.image_shape[1]),
             interpolation="nearest",
             data_format=data_format,
         )
@@ -240,7 +240,7 @@ class Inpaint(Task):
         x = ops.cast(x, "float32")
         x = ops.image.resize(
             x,
-            (self.backbone.
+            (self.backbone.image_shape[0], self.backbone.image_shape[1]),
             interpolation="nearest",
             data_format=data_format,
         )
@@ -303,7 +303,7 @@ class Inpaint(Task):
             input_is_scalar = True
         x = ops.image.resize(
             x,
-            (self.backbone.
+            (self.backbone.image_shape[0], self.backbone.image_shape[1]),
             interpolation="nearest",
             data_format=data_format,
         )
@@ -323,7 +323,7 @@ class Inpaint(Task):
         x = ops.cast(x, "float32")
         x = ops.image.resize(
             x,
-            (self.backbone.
+            (self.backbone.image_shape[0], self.backbone.image_shape[1]),
             interpolation="nearest",
             data_format=data_format,
         )
@@ -376,16 +376,16 @@ class Inpaint(Task):
         self,
         inputs,
         num_steps,
-        guidance_scale,
         strength,
+        guidance_scale=None,
         seed=None,
     ):
         """Generate image based on the provided `inputs`.

         Typically, `inputs` is a dict with `"images"` `"masks"` and `"prompts"`
         keys. `"images"` are reference images within a value range of
-        `[-1.0, 1.0]`, which will be resized to
-        `self.backbone.
+        `[-1.0, 1.0]`, which will be resized to height and width from
+        `self.backbone.image_shape`, then encoded into latent space by the VAE
         encoder. `"masks"` are mask images with a boolean dtype, where white
         pixels are repainted while black pixels are preserved. `"prompts"` are
         strings that will be tokenized and encoded by the text encoder.
@@ -406,26 +406,33 @@ class Inpaint(Task):
                 - A `tf.data.Dataset` with `"images"`, `"masks"`, `"prompts"`
                     and/or `"negative_prompts"` keys.
             num_steps: int. The number of diffusion steps to take.
-            guidance_scale: float. The classifier free guidance scale defined in
-                [Classifier-Free Diffusion Guidance](
-                https://arxiv.org/abs/2207.12598). A higher scale encourages
-                generating images more closely related to the prompts, typically
-                at the cost of lower image quality.
             strength: float. Indicates the extent to which the reference
                 `images` are transformed. Must be between `0.0` and `1.0`. When
                 `strength=1.0`, `images` is essentially ignore and added noise
                 is maximum and the denoising process runs for the full number of
                 iterations specified in `num_steps`.
+            guidance_scale: Optional float. The classifier free guidance scale
+                defined in [Classifier-Free Diffusion Guidance](
+                https://arxiv.org/abs/2207.12598). A higher scale encourages
+                generating images more closely related to the prompts, typically
+                at the cost of lower image quality. Note that some models don't
+                utilize classifier-free guidance.
             seed: optional int. Used as a random seed.
         """
         num_steps = int(num_steps)
-        guidance_scale = float(guidance_scale)
         strength = float(strength)
+        guidance_scale = (
+            float(guidance_scale) if guidance_scale is not None else None
+        )
         if strength < 0.0 or strength > 1.0:
             raise ValueError(
                 "`strength` must be between `0.0` and `1.0`. "
                 f"Received strength={strength}."
             )
+        if guidance_scale is not None and guidance_scale > 1.0:
+            guidance_scale = ops.convert_to_tensor(guidance_scale)
+        else:
+            guidance_scale = None
         starting_step = int(num_steps * (1.0 - strength))
         starting_step = ops.convert_to_tensor(starting_step, "int32")
         num_steps = ops.convert_to_tensor(num_steps, "int32")
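`Inpaint.generate()` gets the same treatment: `guidance_scale` becomes optional, and reference images are now resized to the height and width from `self.backbone.image_shape`. A hedged sketch of the `"images"`/`"masks"`/`"prompts"` input format its docstring describes, with an assumed preset name and illustrative shapes.

import numpy as np
import keras_hub

# Assumed preset name; masks are boolean, with True/white pixels repainted.
task = keras_hub.models.Inpaint.from_preset("stable_diffusion_3_medium")
reference = np.random.uniform(-1.0, 1.0, size=(1024, 1024, 3)).astype("float32")
mask = np.zeros((1024, 1024), dtype="bool")
mask[256:768, 256:768] = True  # repaint only the center square
image = task.generate(
    {"images": reference, "masks": mask, "prompts": "a brick fireplace"},
    num_steps=30,
    strength=0.6,  # guidance_scale omitted: it now defaults to None
)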
keras_hub/src/models/llama/llama_backbone.py
CHANGED
@@ -59,7 +59,7 @@ class LlamaBackbone(Backbone):
     }

     # Pretrained Llama decoder.
-    model = keras_hub.models.LlamaBackbone.from_preset("
+    model = keras_hub.models.LlamaBackbone.from_preset("llama2_7b_en")
     model(input_data)

     # Randomly initialized Llama decoder with custom config.
keras_hub/src/models/llama/llama_presets.py
CHANGED
@@ -6,9 +6,7 @@ backbone_presets = {
         "metadata": {
             "description": "7 billion parameter, 32-layer, base LLaMA 2 model.",
             "params": 6738415616,
-            "
-            "path": "llama2",
-            "model_card": "https://github.com/meta-llama/llama",
+            "path": "llama",
         },
         "kaggle_handle": "kaggle://keras/llama2/keras/llama2_7b_en/1",
     },
@@ -19,9 +17,7 @@ backbone_presets = {
                 "activation and weights quantized to int8."
             ),
             "params": 6739839488,
-            "
-            "path": "llama2",
-            "model_card": "https://github.com/meta-llama/llama",
+            "path": "llama",
         },
         "kaggle_handle": "kaggle://keras/llama2/keras/llama2_7b_en_int8/1",
     },
@@ -32,9 +28,7 @@ backbone_presets = {
                 "model."
             ),
             "params": 6738415616,
-            "
-            "path": "llama2",
-            "model_card": "https://github.com/meta-llama/llama",
+            "path": "llama",
         },
         "kaggle_handle": "kaggle://keras/llama2/keras/llama2_instruct_7b_en/1",
     },
@@ -45,9 +39,7 @@ backbone_presets = {
                 "model with activation and weights quantized to int8."
            ),
             "params": 6739839488,
-            "
-            "path": "llama2",
-            "model_card": "https://github.com/meta-llama/llama",
+            "path": "llama",
         },
         "kaggle_handle": "kaggle://keras/llama2/keras/llama2_instruct_7b_en_int8/1",
     },
@@ -58,9 +50,7 @@ backbone_presets = {
                 "model."
             ),
             "params": 6738415616,
-            "
-            "path": "vicuna",
-            "model_card": "https://github.com/lm-sys/FastChat",
+            "path": "llama",
         },
         "kaggle_handle": "kaggle://keras/vicuna/keras/vicuna_1.5_7b_en/1",
     },
keras_hub/src/models/llama3/llama3_presets.py
CHANGED
@@ -6,9 +6,7 @@ backbone_presets = {
         "metadata": {
             "description": "8 billion parameter, 32-layer, base LLaMA 3 model.",
             "params": 8030261248,
-            "official_name": "LLaMA 3",
             "path": "llama3",
-            "model_card": "https://github.com/meta-llama/llama3",
         },
         "kaggle_handle": "kaggle://keras/llama3/keras/llama3_8b_en/3",
     },
@@ -19,9 +17,7 @@ backbone_presets = {
                 "activation and weights quantized to int8."
             ),
             "params": 8031894016,
-            "official_name": "LLaMA 3",
             "path": "llama3",
-            "model_card": "https://github.com/meta-llama/llama3",
         },
         "kaggle_handle": "kaggle://keras/llama3/keras/llama3_8b_en_int8/1",
     },
@@ -32,9 +28,7 @@ backbone_presets = {
                 "model."
             ),
             "params": 8030261248,
-            "official_name": "LLaMA 3",
             "path": "llama3",
-            "model_card": "https://github.com/meta-llama/llama3",
         },
         "kaggle_handle": "kaggle://keras/llama3/keras/llama3_instruct_8b_en/3",
     },
@@ -45,9 +39,7 @@ backbone_presets = {
                 "model with activation and weights quantized to int8."
             ),
             "params": 8031894016,
-            "official_name": "LLaMA 3",
             "path": "llama3",
-            "model_card": "https://github.com/meta-llama/llama3",
         },
         "kaggle_handle": (
             "kaggle://keras/llama3/keras/llama3_instruct_8b_en_int8/1"