keras-hub-nightly 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- keras_hub/api/layers/__init__.py +12 -0
- keras_hub/api/models/__init__.py +32 -0
- keras_hub/src/bounding_box/__init__.py +2 -0
- keras_hub/src/bounding_box/converters.py +102 -12
- keras_hub/src/layers/modeling/rms_normalization.py +34 -0
- keras_hub/src/layers/modeling/transformer_encoder.py +27 -7
- keras_hub/src/layers/preprocessing/image_converter.py +5 -0
- keras_hub/src/models/albert/albert_presets.py +0 -8
- keras_hub/src/models/bart/bart_presets.py +0 -6
- keras_hub/src/models/bert/bert_presets.py +0 -20
- keras_hub/src/models/bloom/bloom_presets.py +0 -16
- keras_hub/src/models/clip/__init__.py +5 -0
- keras_hub/src/models/clip/clip_backbone.py +286 -0
- keras_hub/src/models/clip/clip_encoder_block.py +19 -4
- keras_hub/src/models/clip/clip_image_converter.py +8 -0
- keras_hub/src/models/clip/clip_presets.py +93 -0
- keras_hub/src/models/clip/clip_text_encoder.py +4 -1
- keras_hub/src/models/clip/clip_tokenizer.py +18 -3
- keras_hub/src/models/clip/clip_vision_embedding.py +101 -0
- keras_hub/src/models/clip/clip_vision_encoder.py +159 -0
- keras_hub/src/models/deberta_v3/deberta_v3_presets.py +0 -10
- keras_hub/src/models/deeplab_v3/deeplab_v3_presets.py +0 -2
- keras_hub/src/models/deeplab_v3/deeplab_v3_segmenter.py +5 -3
- keras_hub/src/models/densenet/densenet_backbone.py +1 -1
- keras_hub/src/models/densenet/densenet_presets.py +0 -6
- keras_hub/src/models/distil_bert/distil_bert_presets.py +0 -6
- keras_hub/src/models/efficientnet/__init__.py +9 -0
- keras_hub/src/models/efficientnet/cba.py +141 -0
- keras_hub/src/models/efficientnet/efficientnet_backbone.py +139 -56
- keras_hub/src/models/efficientnet/efficientnet_image_classifier.py +14 -0
- keras_hub/src/models/efficientnet/efficientnet_image_classifier_preprocessor.py +16 -0
- keras_hub/src/models/efficientnet/efficientnet_image_converter.py +10 -0
- keras_hub/src/models/efficientnet/efficientnet_presets.py +192 -0
- keras_hub/src/models/efficientnet/fusedmbconv.py +81 -36
- keras_hub/src/models/efficientnet/mbconv.py +52 -21
- keras_hub/src/models/electra/electra_presets.py +0 -12
- keras_hub/src/models/f_net/f_net_presets.py +0 -4
- keras_hub/src/models/falcon/falcon_presets.py +0 -2
- keras_hub/src/models/flux/__init__.py +5 -0
- keras_hub/src/models/flux/flux_layers.py +494 -0
- keras_hub/src/models/flux/flux_maths.py +218 -0
- keras_hub/src/models/flux/flux_model.py +231 -0
- keras_hub/src/models/flux/flux_presets.py +14 -0
- keras_hub/src/models/flux/flux_text_to_image.py +142 -0
- keras_hub/src/models/flux/flux_text_to_image_preprocessor.py +73 -0
- keras_hub/src/models/gemma/gemma_presets.py +0 -40
- keras_hub/src/models/gpt2/gpt2_presets.py +0 -9
- keras_hub/src/models/image_object_detector.py +87 -0
- keras_hub/src/models/image_object_detector_preprocessor.py +57 -0
- keras_hub/src/models/image_to_image.py +16 -10
- keras_hub/src/models/inpaint.py +20 -13
- keras_hub/src/models/llama/llama_backbone.py +1 -1
- keras_hub/src/models/llama/llama_presets.py +5 -15
- keras_hub/src/models/llama3/llama3_presets.py +0 -8
- keras_hub/src/models/mistral/mistral_presets.py +0 -6
- keras_hub/src/models/mit/mit_backbone.py +41 -27
- keras_hub/src/models/mit/mit_layers.py +9 -7
- keras_hub/src/models/mit/mit_presets.py +12 -24
- keras_hub/src/models/opt/opt_presets.py +0 -8
- keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +61 -11
- keras_hub/src/models/pali_gemma/pali_gemma_decoder_block.py +21 -23
- keras_hub/src/models/pali_gemma/pali_gemma_presets.py +166 -10
- keras_hub/src/models/pali_gemma/pali_gemma_vit.py +12 -11
- keras_hub/src/models/phi3/phi3_presets.py +0 -4
- keras_hub/src/models/resnet/resnet_presets.py +10 -42
- keras_hub/src/models/retinanet/__init__.py +5 -0
- keras_hub/src/models/retinanet/anchor_generator.py +52 -53
- keras_hub/src/models/retinanet/feature_pyramid.py +99 -36
- keras_hub/src/models/retinanet/non_max_supression.py +1 -0
- keras_hub/src/models/retinanet/prediction_head.py +192 -0
- keras_hub/src/models/retinanet/retinanet_backbone.py +146 -0
- keras_hub/src/models/retinanet/retinanet_image_converter.py +53 -0
- keras_hub/src/models/retinanet/retinanet_label_encoder.py +49 -51
- keras_hub/src/models/retinanet/retinanet_object_detector.py +382 -0
- keras_hub/src/models/retinanet/retinanet_object_detector_preprocessor.py +14 -0
- keras_hub/src/models/retinanet/retinanet_presets.py +15 -0
- keras_hub/src/models/roberta/roberta_presets.py +0 -4
- keras_hub/src/models/sam/sam_backbone.py +0 -1
- keras_hub/src/models/sam/sam_image_segmenter.py +9 -10
- keras_hub/src/models/sam/sam_presets.py +0 -6
- keras_hub/src/models/segformer/__init__.py +8 -0
- keras_hub/src/models/segformer/segformer_backbone.py +163 -0
- keras_hub/src/models/segformer/segformer_image_converter.py +8 -0
- keras_hub/src/models/segformer/segformer_image_segmenter.py +171 -0
- keras_hub/src/models/segformer/segformer_image_segmenter_preprocessor.py +31 -0
- keras_hub/src/models/segformer/segformer_presets.py +124 -0
- keras_hub/src/models/stable_diffusion_3/mmdit.py +41 -0
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +38 -21
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_image_to_image.py +3 -3
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_inpaint.py +3 -3
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_presets.py +28 -4
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +1 -1
- keras_hub/src/models/t5/t5_backbone.py +5 -4
- keras_hub/src/models/t5/t5_presets.py +41 -13
- keras_hub/src/models/text_to_image.py +13 -5
- keras_hub/src/models/vgg/vgg_backbone.py +1 -1
- keras_hub/src/models/vgg/vgg_presets.py +0 -8
- keras_hub/src/models/whisper/whisper_audio_converter.py +1 -1
- keras_hub/src/models/whisper/whisper_presets.py +0 -20
- keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py +0 -4
- keras_hub/src/tests/test_case.py +25 -0
- keras_hub/src/utils/preset_utils.py +17 -4
- keras_hub/src/utils/timm/convert_efficientnet.py +449 -0
- keras_hub/src/utils/timm/preset_loader.py +3 -0
- keras_hub/src/version_utils.py +1 -1
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/METADATA +15 -26
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/RECORD +109 -76
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/WHEEL +1 -1
- {keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/top_level.txt +0 -0
--- keras_hub/src/models/retinanet/retinanet_label_encoder.py
+++ keras_hub/src/models/retinanet/retinanet_label_encoder.py
@@ -1,9 +1,12 @@
+import math
+
 import keras
 from keras import ops
 
-
+# TODO: https://github.com/keras-team/keras-hub/issues/1965
+from keras_hub.src.bounding_box.converters import convert_format
+from keras_hub.src.bounding_box.converters import encode_box_to_deltas
 from keras_hub.src.bounding_box.iou import compute_iou
-from keras_hub.src.models.retinanet.anchor_generator import AnchorGenerator
 from keras_hub.src.models.retinanet.box_matcher import BoxMatcher
 from keras_hub.src.utils import tensor_utils
 
@@ -24,17 +27,10 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
     consistency during training, regardless of the input format.
 
     Args:
-
-
-
-
-        num_scales: int. Number of intermediate scales added on each level.
-            For example, num_scales=2 adds one additional intermediate anchor
-            scale [2^0, 2^0.5] on each level.
-        aspect_ratios: List[float]. Aspect ratios of anchors added on
-            each level. Each number indicates the ratio of width to height.
-        anchor_size: float. Scale of size of the base anchor relative to the
-            feature stride 2^level.
+        anchor_generator: A `keras_hub.layers.AnchorGenerator`.
+        bounding_box_format: str. Ground truth format of bounding boxes.
+        encoding_format: str. The desired target encoding format for the boxes.
+            TODO: https://github.com/keras-team/keras-hub/issues/1907
         positive_threshold: float. the threshold to set an anchor to positive
             match to gt box. Values above it are positive matches.
             Defaults to `0.5`
@@ -43,7 +39,7 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
             Defaults to `0.4`
         box_variance: List[float]. The scaling factors used to scale the
             bounding box targets.
-            Defaults to `[0.1, 0.1, 0.2, 0.2]`.
+            Defaults to `[1.0, 1.0, 1.0, 1.0]`.
         background_class: int. The class ID used for the background class,
             Defaults to `-1`.
         ignore_class: int. The class ID used for the ignore class,
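The old scaled default matched the classic RetinaNet variance trick; the new unit default leaves deltas untouched, which is what the torch-ported weights introduced below expect. A numeric sketch, assuming the encoder divides each delta component by its variance term (as in the KerasCV implementation this code descends from):

```python
import numpy as np

# Assumed encoding behavior: delta / variance (decode multiplies it back).
deltas = np.array([0.05, -0.02, 0.10, 0.30])
old = deltas / np.array([0.1, 0.1, 0.2, 0.2])  # -> [0.5, -0.2, 0.5, 1.5]
new = deltas / np.array([1.0, 1.0, 1.0, 1.0])  # -> unchanged
```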
@@ -63,15 +59,12 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
 
     def __init__(
         self,
+        anchor_generator,
         bounding_box_format,
-        min_level,
-        max_level,
-        num_scales,
-        aspect_ratios,
-        anchor_size,
+        encoding_format="center_yxhw",
        positive_threshold=0.5,
         negative_threshold=0.4,
-        box_variance=[0.1, 0.1, 0.2, 0.2],
+        box_variance=[1.0, 1.0, 1.0, 1.0],
         background_class=-1.0,
         ignore_class=-2.0,
         box_matcher_match_values=[-1, -2, 1],
@@ -79,27 +72,15 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
         **kwargs,
     ):
         super().__init__(**kwargs)
+        self.anchor_generator = anchor_generator
         self.bounding_box_format = bounding_box_format
-        self.min_level = min_level
-        self.max_level = max_level
-        self.num_scales = num_scales
-        self.aspect_ratios = aspect_ratios
-        self.anchor_size = anchor_size
+        self.encoding_format = encoding_format
         self.positive_threshold = positive_threshold
         self.box_variance = box_variance
         self.negative_threshold = negative_threshold
         self.background_class = background_class
         self.ignore_class = ignore_class
 
-        self.anchor_generator = AnchorGenerator(
-            bounding_box_format=bounding_box_format,
-            min_level=min_level,
-            max_level=max_level,
-            num_scales=num_scales,
-            aspect_ratios=aspect_ratios,
-            anchor_size=anchor_size,
-        )
-
         self.box_matcher = BoxMatcher(
             thresholds=[negative_threshold, positive_threshold],
             match_values=box_matcher_match_values,
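With this change the anchor generator is built by the caller and injected, instead of being constructed inside the encoder. A minimal sketch of the new call pattern, using the same argument values the object detector below passes by default (levels 3-7 are the usual FPN range; the detector takes them from its backbone):

```python
from keras_hub.src.models.retinanet.anchor_generator import AnchorGenerator
from keras_hub.src.models.retinanet.retinanet_label_encoder import (
    RetinaNetLabelEncoder,
)

# Build the anchors once, then share the generator between the label
# encoder and any other component that needs it.
anchor_generator = AnchorGenerator(
    bounding_box_format="yxyx",
    min_level=3,
    max_level=7,
    num_scales=3,
    aspect_ratios=[0.5, 1.0, 2.0],
    anchor_size=4.0,
)
label_encoder = RetinaNetLabelEncoder(
    anchor_generator,
    bounding_box_format="yxyx",
    encoding_format="center_xywh",
)
```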
@@ -116,7 +97,7 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
             images: A Tensor. The input images argument should be
                 of shape `[B, H, W, C]` or `[B, C, H, W]`.
             gt_boxes: A Tensor with shape of `[B, num_boxes, 4]`.
-
+            gt_classes: A Tensor with shape of `[B, num_boxes, num_classes]`
 
         Returns:
             box_targets: A Tensor of shape `[batch_size, num_anchors, 4]`
@@ -171,10 +152,15 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
             image_shape: Tuple indicating the image shape `[H, W, C]`.
 
         Returns:
-            Encoded
+            Encoded bounding boxes in the format of `center_yxwh` and
                 corresponding labels for each encoded bounding box.
         """
-
+        anchor_boxes = convert_format(
+            anchor_boxes,
+            source=self.anchor_generator.bounding_box_format,
+            target=self.bounding_box_format,
+            image_shape=image_shape,
+        )
         iou_matrix = compute_iou(
             anchor_boxes,
             gt_boxes,
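The added conversion normalizes anchors into the encoder's own `bounding_box_format` before IoU is computed, so the generator and encoder no longer need to agree on a format up front. A toy `convert_format` call with the keyword signature used above:

```python
import numpy as np
from keras_hub.src.bounding_box.converters import convert_format

# One "xyxy" box (x1, y1, x2, y2) converted to "yxyx"; image_shape is
# needed for formats defined relative to the image size.
boxes = np.array([[[10.0, 20.0, 30.0, 40.0]]])
converted = convert_format(
    boxes, source="xyxy", target="yxyx", image_shape=(64, 64, 3)
)
print(converted)  # [[[20. 10. 40. 30.]]]
```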
@@ -193,11 +179,12 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
             matched_gt_boxes, (-1, ops.shape(matched_gt_boxes)[1], 4)
         )
 
-
+        box_targets = encode_box_to_deltas(
             anchors=anchor_boxes,
             boxes=matched_gt_boxes,
             anchor_format=self.bounding_box_format,
             box_format=self.bounding_box_format,
+            encoding_format=self.encoding_format,
             variance=self.box_variance,
             image_shape=image_shape,
         )
@@ -205,16 +192,16 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
         matched_gt_cls_ids = tensor_utils.target_gather(
             gt_classes, matched_gt_idx
         )
-
+        class_targets = ops.where(
             ops.not_equal(positive_mask, 1.0),
             self.background_class,
             matched_gt_cls_ids,
         )
-
-            ops.equal(ignore_mask, 1.0), self.ignore_class,
+        class_targets = ops.where(
+            ops.equal(ignore_mask, 1.0), self.ignore_class, class_targets
         )
         label = ops.concatenate(
-            [
+            [box_targets, ops.cast(class_targets, box_targets.dtype)], axis=-1
         )
 
         # In the case that a box in the corner of an image matches with an all
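The rewritten masking is easiest to read on a toy example: anchors that are not positive matches fall back to the background class, and ignored anchors are then overwritten with the ignore class.

```python
from keras import ops

matched = ops.convert_to_tensor([0.0, 3.0, 5.0])  # matched gt class ids
positive_mask = ops.convert_to_tensor([1.0, 0.0, 1.0])
ignore_mask = ops.convert_to_tensor([0.0, 1.0, 0.0])

# Same two-stage ops.where pattern as the hunk above, with the default
# background_class=-1.0 and ignore_class=-2.0.
targets = ops.where(ops.not_equal(positive_mask, 1.0), -1.0, matched)
targets = ops.where(ops.equal(ignore_mask, 1.0), -2.0, targets)
# targets == [0.0, -2.0, 5.0]: kept, ignored, kept
```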
@@ -234,12 +221,11 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
         config = super().get_config()
         config.update(
             {
+                "anchor_generator": keras.layers.serialize(
+                    self.anchor_generator
+                ),
                 "bounding_box_format": self.bounding_box_format,
-                "min_level": self.min_level,
-                "max_level": self.max_level,
-                "num_scales": self.num_scales,
-                "aspect_ratios": self.aspect_ratios,
-                "anchor_size": self.anchor_size,
+                "encoding_format": self.encoding_format,
                 "positive_threshold": self.positive_threshold,
                 "box_variance": self.box_variance,
                 "negative_threshold": self.negative_threshold,
@@ -249,6 +235,18 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
         )
         return config
 
+    @classmethod
+    def from_config(cls, config):
+        config.update(
+            {
+                "anchor_generator": keras.layers.deserialize(
+                    config["anchor_generator"]
+                ),
+            }
+        )
+
+        return super().from_config(config)
+
     def compute_output_shape(
         self, images_shape, gt_boxes_shape, gt_classes_shape
     ):
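The new `from_config` mirrors the `get_config` change above: the nested anchor generator comes back as a plain serialization dict and must be deserialized before the layer is rebuilt. A round-trip sketch, reusing the `label_encoder` and `AnchorGenerator` names from the constructor example earlier:

```python
config = label_encoder.get_config()
assert isinstance(config["anchor_generator"], dict)  # serialized form
restored = RetinaNetLabelEncoder.from_config(config)
assert isinstance(restored.anchor_generator, AnchorGenerator)
```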
@@ -258,10 +256,10 @@ class RetinaNetLabelEncoder(keras.layers.Layer):
 
         total_num_anchors = 0
         for i in range(min_level, max_level + 1):
-            total_num_anchors += (
-                (image_H
-                * (image_W
-                * self.anchor_generator.
+            total_num_anchors += int(
+                math.ceil(image_H / 2 ** (i))
+                * math.ceil(image_W / 2 ** (i))
+                * self.anchor_generator.num_base_anchors
             )
 
         return (batch_size, total_num_anchors, 4), (
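Rounding up with `math.ceil` matters for image sizes that are not multiples of the level stride, matching the number of anchor locations the generator actually produces. A quick sanity check of the arithmetic, assuming `num_base_anchors` is 9 (3 scales x 3 aspect ratios, the detector defaults below):

```python
import math

image_H, image_W = 640, 640
num_base_anchors = 9  # assumed: 3 scales * 3 aspect ratios
total = sum(
    math.ceil(image_H / 2**i) * math.ceil(image_W / 2**i) * num_base_anchors
    for i in range(3, 7 + 1)  # pyramid levels P3-P7
)
print(total)  # 76725 = (6400 + 1600 + 400 + 100 + 25) * 9
```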
--- /dev/null
+++ keras_hub/src/models/retinanet/retinanet_object_detector.py
@@ -0,0 +1,382 @@
+import keras
+from keras import ops
+
+from keras_hub.src.api_export import keras_hub_export
+
+# TODO: https://github.com/keras-team/keras-hub/issues/1965
+from keras_hub.src.bounding_box.converters import convert_format
+from keras_hub.src.bounding_box.converters import decode_deltas_to_boxes
+from keras_hub.src.models.image_object_detector import ImageObjectDetector
+from keras_hub.src.models.retinanet.anchor_generator import AnchorGenerator
+from keras_hub.src.models.retinanet.non_max_supression import NonMaxSuppression
+from keras_hub.src.models.retinanet.prediction_head import PredictionHead
+from keras_hub.src.models.retinanet.retinanet_backbone import RetinaNetBackbone
+from keras_hub.src.models.retinanet.retinanet_label_encoder import (
+    RetinaNetLabelEncoder,
+)
+from keras_hub.src.models.retinanet.retinanet_object_detector_preprocessor import (
+    RetinaNetObjectDetectorPreprocessor,
+)
+
+
+@keras_hub_export("keras_hub.models.RetinaNetObjectDetector")
+class RetinaNetObjectDetector(ImageObjectDetector):
+    """RetinaNet object detector model.
+
+    This class implements the RetinaNet object detection architecture.
+    It consists of a feature extractor backbone, a feature pyramid network(FPN),
+    and two prediction heads (for classification and bounding box regression).
+
+    Args:
+        backbone: `keras.Model`. A `keras.models.RetinaNetBackbone` class,
+            defining the backbone network architecture. Provides feature maps
+            for detection.
+        anchor_generator: A `keras_hub.layers.AnchorGenerator` instance.
+            Generates anchor boxes at different scales and aspect ratios
+            across the image. If None, a default `AnchorGenerator` is
+            created with the following parameters:
+                - `bounding_box_format`: Same as the model's
+                    `bounding_box_format`.
+                - `min_level`: The backbone's `min_level`.
+                - `max_level`: The backbone's `max_level`.
+                - `num_scales`: 3.
+                - `aspect_ratios`: [0.5, 1.0, 2.0].
+                - `anchor_size`: 4.0.
+            You can create a custom `AnchorGenerator` by instantiating the
+            `keras_hub.layers.AnchorGenerator` class and passing the desired
+            arguments.
+        num_classes: int. The number of object classes to be detected.
+        bounding_box_format: str. Dataset bounding box format (e.g., "xyxy",
+            "yxyx"). The supported formats are
+            refer TODO: https://github.com/keras-team/keras-hub/issues/1907.
+            Defaults to `yxyx`.
+        label_encoder: Optional. A `RetinaNetLabelEncoder` instance. Encodes
+            ground truth boxes and classes into training targets. It matches
+            ground truth boxes to anchors based on IoU and encodes box
+            coordinates as offsets. If `None`, a default encoder is created.
+            See the
+            `keras_hub.src.models.retinanet.retinanet_label_encoder.RetinaNetLabelEncoder`
+            class for details. If None, a default encoder is created with
+            standard parameters.
+                - `anchor_generator`: Same as the model's.
+                - `bounding_box_format`: Same as the model's
+                    `bounding_box_format`.
+                - `positive_threshold`: 0.5
+                - `negative_threshold`: 0.4
+                - `encoding_format`: "center_xywh"
+                - `box_variance`: [1.0, 1.0, 1.0, 1.0]
+                - `background_class`: -1
+                - `ignore_class`: -2
+        use_prediction_head_norm: bool. Whether to use Group Normalization after
+            the convolution layers in the prediction heads. Defaults to `False`.
+        classification_head_prior_probability: float. Prior probability for the
+            classification head (used for focal loss). Defaults to 0.01.
+        pre_logits_num_conv_layers: int. The number of convolutional layers in
+            the head before the logits layer. These convolutional layers are
+            applied before the final linear layer (logits) that produces the
+            output predictions (bounding box regressions, classification scores).
+        preprocessor: Optional. An instance of
+            `RetinaNetObjectDetectorPreprocessor`or a custom preprocessor.
+            Handles image preprocessing before feeding into the backbone.
+        activation: Optional. The activation function to be used in the
+            classification head. If None, sigmoid is used.
+        dtype: Optional. The data type for the prediction heads. Defaults to the
+            backbone's dtype policy.
+        prediction_decoder: Optional. A `keras.layers.Layer` instance
+            responsible for transforming RetinaNet predictions
+            (box regressions and classifications) into final bounding boxes and
+            classes with confidence scores. Defaults to a `NonMaxSuppression`
+            instance.
+    """
+
+    backbone_cls = RetinaNetBackbone
+    preprocessor_cls = RetinaNetObjectDetectorPreprocessor
+
+    def __init__(
+        self,
+        backbone,
+        num_classes,
+        bounding_box_format="yxyx",
+        anchor_generator=None,
+        label_encoder=None,
+        use_prediction_head_norm=False,
+        classification_head_prior_probability=0.01,
+        pre_logits_num_conv_layers=4,
+        preprocessor=None,
+        activation=None,
+        dtype=None,
+        prediction_decoder=None,
+        **kwargs,
+    ):
+        # === Layers ===
+        image_input = keras.layers.Input(backbone.image_shape, name="images")
+        head_dtype = dtype or backbone.dtype_policy
+
+        anchor_generator = anchor_generator or AnchorGenerator(
+            bounding_box_format,
+            min_level=backbone.min_level,
+            max_level=backbone.max_level,
+            num_scales=3,
+            aspect_ratios=[0.5, 1.0, 2.0],
+            anchor_size=4,
+        )
+        # As weights are ported from torch they use encoded format
+        # as "center_xywh"
+        label_encoder = label_encoder or RetinaNetLabelEncoder(
+            anchor_generator,
+            bounding_box_format=bounding_box_format,
+            encoding_format="center_xywh",
+        )
+
+        box_head = PredictionHead(
+            output_filters=anchor_generator.num_base_anchors * 4,
+            num_conv_layers=pre_logits_num_conv_layers,
+            num_filters=256,
+            use_group_norm=use_prediction_head_norm,
+            use_prior_probability=True,
+            prior_probability=classification_head_prior_probability,
+            dtype=head_dtype,
+            name="box_head",
+        )
+        classification_head = PredictionHead(
+            output_filters=anchor_generator.num_base_anchors * num_classes,
+            num_conv_layers=pre_logits_num_conv_layers,
+            num_filters=256,
+            use_group_norm=use_prediction_head_norm,
+            dtype=head_dtype,
+            name="classification_head",
+        )
+
+        # === Functional Model ===
+        feature_map = backbone(image_input)
+
+        class_predictions = []
+        box_predictions = []
+
+        # Iterate through the feature pyramid levels (e.g., P3, P4, P5, P6, P7).
+        for level in feature_map:
+            box_predictions.append(
+                keras.layers.Reshape((-1, 4), name=f"box_pred_{level}")(
+                    box_head(feature_map[level])
+                )
+            )
+            class_predictions.append(
+                keras.layers.Reshape(
+                    (-1, num_classes), name=f"cls_pred_{level}"
+                )(classification_head(feature_map[level]))
+            )
+
+        # Concatenate predictions from all FPN levels.
+        class_predictions = keras.layers.Concatenate(axis=1, name="cls_logits")(
+            class_predictions
+        )
+        # box_pred is always in "center_xywh" delta-encoded no matter what
+        # format you pass in.
+        box_predictions = keras.layers.Concatenate(
+            axis=1, name="bbox_regression"
+        )(box_predictions)
+
+        outputs = {
+            "bbox_regression": box_predictions,
+            "cls_logits": class_predictions,
+        }
+
+        super().__init__(
+            inputs=image_input,
+            outputs=outputs,
+            **kwargs,
+        )
+
+        # === Config ===
+        self.bounding_box_format = bounding_box_format
+        self.use_prediction_head_norm = use_prediction_head_norm
+        self.num_classes = num_classes
+        self.backbone = backbone
+        self.preprocessor = preprocessor
+        self.activation = activation
+        self.pre_logits_num_conv_layers = pre_logits_num_conv_layers
+        self.box_head = box_head
+        self.classification_head = classification_head
+        self.anchor_generator = anchor_generator
+        self.label_encoder = label_encoder
+        self._prediction_decoder = prediction_decoder or NonMaxSuppression(
+            from_logits=(activation != keras.activations.sigmoid),
+            bounding_box_format=bounding_box_format,
+        )
+
+    def compute_loss(self, x, y, y_pred, sample_weight, **kwargs):
+        y_for_label_encoder = convert_format(
+            y,
+            source=self.bounding_box_format,
+            target=self.label_encoder.bounding_box_format,
+            images=x,
+        )
+
+        boxes, classes = self.label_encoder(
+            images=x,
+            gt_boxes=y_for_label_encoder["boxes"],
+            gt_classes=y_for_label_encoder["classes"],
+        )
+
+        box_pred = y_pred["bbox_regression"]
+        cls_pred = y_pred["cls_logits"]
+
+        if boxes.shape[-1] != 4:
+            raise ValueError(
+                "boxes should have shape (None, None, 4). Got "
+                f"boxes.shape={tuple(boxes.shape)}"
+            )
+
+        if box_pred.shape[-1] != 4:
+            raise ValueError(
+                "box_pred should have shape (None, None, 4). Got "
+                f"box_pred.shape={tuple(box_pred.shape)}. Does your model's "
+                "`num_classes` parameter match your losses `num_classes` "
+                "parameter?"
+            )
+        if cls_pred.shape[-1] != self.num_classes:
+            raise ValueError(
+                "cls_pred should have shape (None, None, 4). Got "
+                f"cls_pred.shape={tuple(cls_pred.shape)}. Does your model's "
+                "`num_classes` parameter match your losses `num_classes` "
+                "parameter?"
+            )
+
+        cls_labels = ops.one_hot(
+            ops.cast(classes, "int32"), self.num_classes, dtype="float32"
+        )
+        positive_mask = ops.cast(ops.greater(classes, -1.0), dtype="float32")
+        normalizer = ops.sum(positive_mask)
+        cls_weights = ops.cast(ops.not_equal(classes, -2.0), dtype="float32")
+        cls_weights /= normalizer
+        box_weights = positive_mask / normalizer
+
+        y_true = {
+            "bbox_regression": boxes,
+            "cls_logits": cls_labels,
+        }
+        sample_weights = {
+            "bbox_regression": box_weights,
+            "cls_logits": cls_weights,
+        }
+        zero_weight = {
+            "bbox_regression": ops.zeros_like(box_weights),
+            "cls_logits": ops.zeros_like(cls_weights),
+        }
+
+        sample_weight = ops.cond(
+            normalizer == 0,
+            lambda: zero_weight,
+            lambda: sample_weights,
+        )
+        return super().compute_loss(
+            x=x, y=y_true, y_pred=y_pred, sample_weight=sample_weight, **kwargs
+        )
+
+    def predict_step(self, *args):
+        outputs = super().predict_step(*args)
+        if isinstance(outputs, tuple):
+            return self.decode_predictions(outputs[0], args[-1]), outputs[1]
+        return self.decode_predictions(outputs, *args)
+
+    @property
+    def prediction_decoder(self):
+        return self._prediction_decoder
+
+    @prediction_decoder.setter
+    def prediction_decoder(self, prediction_decoder):
+        if prediction_decoder.bounding_box_format != self.bounding_box_format:
+            raise ValueError(
+                "Expected `prediction_decoder` and `RetinaNet` to "
+                "use the same `bounding_box_format`, but got "
+                "`prediction_decoder.bounding_box_format="
+                f"{prediction_decoder.bounding_box_format}`, and "
+                "`self.bounding_box_format="
+                f"{self.bounding_box_format}`."
+            )
+        self._prediction_decoder = prediction_decoder
+        self.make_predict_function(force=True)
+        self.make_train_function(force=True)
+        self.make_test_function(force=True)
+
+    def decode_predictions(self, predictions, data):
+        box_pred = predictions["bbox_regression"]
+        cls_pred = predictions["cls_logits"]
+        # box_pred is on "center_yxhw" format, convert to target format.
+        if isinstance(data, list) or isinstance(data, tuple):
+            images, _ = data
+        else:
+            images = data
+        image_shape = ops.shape(images)[1:]
+        anchor_boxes = self.anchor_generator(images)
+        anchor_boxes = ops.concatenate(list(anchor_boxes.values()), axis=0)
+        box_pred = decode_deltas_to_boxes(
+            anchors=anchor_boxes,
+            boxes_delta=box_pred,
+            encoded_format="center_xywh",
+            anchor_format=self.anchor_generator.bounding_box_format,
+            box_format=self.bounding_box_format,
+            image_shape=image_shape,
+        )
+        # box_pred is now in "self.bounding_box_format" format
+        box_pred = convert_format(
+            box_pred,
+            source=self.bounding_box_format,
+            target=self.prediction_decoder.bounding_box_format,
+            image_shape=image_shape,
+        )
+        y_pred = self.prediction_decoder(
+            box_pred, cls_pred, image_shape=image_shape
+        )
+        y_pred["boxes"] = convert_format(
+            y_pred["boxes"],
+            source=self.prediction_decoder.bounding_box_format,
+            target=self.bounding_box_format,
+            image_shape=image_shape,
+        )
+        return y_pred
+
+    def get_config(self):
+        config = super().get_config()
+        config.update(
+            {
+                "num_classes": self.num_classes,
+                "use_prediction_head_norm": self.use_prediction_head_norm,
+                "pre_logits_num_conv_layers": self.pre_logits_num_conv_layers,
+                "bounding_box_format": self.bounding_box_format,
+                "anchor_generator": keras.layers.serialize(
+                    self.anchor_generator
+                ),
+                "label_encoder": keras.layers.serialize(self.label_encoder),
+                "prediction_decoder": keras.layers.serialize(
+                    self._prediction_decoder
+                ),
+            }
+        )
+
+        return config
+
+    @classmethod
+    def from_config(cls, config):
+        if "label_encoder" in config and isinstance(
+            config["label_encoder"], dict
+        ):
+            config["label_encoder"] = keras.layers.deserialize(
+                config["label_encoder"]
+            )
+
+        if "anchor_generator" in config and isinstance(
+            config["anchor_generator"], dict
+        ):
+            config["anchor_generator"] = keras.layers.deserialize(
+                config["anchor_generator"]
+            )
+
+        if "prediction_decoder" in config and isinstance(
+            config["prediction_decoder"], dict
+        ):
+            config["prediction_decoder"] = keras.layers.deserialize(
+                config["prediction_decoder"]
+            )
+
+        return super().from_config(config)
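One consequence of the `prediction_decoder` setter above: swapping decoders after construction is supported, but it forces Keras to rebuild its compiled predict/train/test functions. A sketch, where `detector` is a `RetinaNetObjectDetector` instance and only constructor arguments visible in this diff are used:

```python
from keras_hub.src.models.retinanet.non_max_supression import NonMaxSuppression

# The setter validates that the decoder's bounding_box_format matches the
# model's before accepting it.
detector.prediction_decoder = NonMaxSuppression(
    from_logits=True,
    bounding_box_format="yxyx",
)
```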
--- /dev/null
+++ keras_hub/src/models/retinanet/retinanet_object_detector_preprocessor.py
@@ -0,0 +1,14 @@
+from keras_hub.src.api_export import keras_hub_export
+from keras_hub.src.models.image_object_detector_preprocessor import (
+    ImageObjectDetectorPreprocessor,
+)
+from keras_hub.src.models.retinanet.retinanet_backbone import RetinaNetBackbone
+from keras_hub.src.models.retinanet.retinanet_image_converter import (
+    RetinaNetImageConverter,
+)
+
+
+@keras_hub_export("keras_hub.models.RetinaNetObjectDetectorPreprocessor")
+class RetinaNetObjectDetectorPreprocessor(ImageObjectDetectorPreprocessor):
+    backbone_cls = RetinaNetBackbone
+    image_converter_cls = RetinaNetImageConverter
--- /dev/null
+++ keras_hub/src/models/retinanet/retinanet_presets.py
@@ -0,0 +1,15 @@
+"""RetinaNet model preset configurations."""
+
+# Metadata for loading pretrained model weights.
+backbone_presets = {
+    "retinanet_resnet50_fpn_coco": {
+        "metadata": {
+            "description": (
+                "RetinaNet model with ResNet50 backbone fine-tuned on COCO in 800x800 resolution."
+            ),
+            "params": 34121239,
+            "path": "retinanet",
+        },
+        "kaggle_handle": "kaggle://keras/retinanet/keras/retinanet_resnet50_fpn_coco/1",
+    }
+}
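A hypothetical end-to-end sketch tying the new files together: load the preset registered above and run inference. The `from_preset` constructor is the standard keras-hub Task entry point; the input size mirrors the 800x800 resolution named in the preset description:

```python
import numpy as np
import keras_hub

detector = keras_hub.models.RetinaNetObjectDetector.from_preset(
    "retinanet_resnet50_fpn_coco"
)
images = np.random.uniform(0, 255, size=(1, 800, 800, 3)).astype("float32")
predictions = detector.predict(images)  # dict of decoded boxes and classes
```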
--- keras_hub/src/models/roberta/roberta_presets.py
+++ keras_hub/src/models/roberta/roberta_presets.py
@@ -8,9 +8,7 @@ backbone_presets = {
                 "Trained on English Wikipedia, BooksCorpus, CommonCraw, and OpenWebText."
             ),
             "params": 124052736,
-            "official_name": "RoBERTa",
             "path": "roberta",
-            "model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/roberta/README.md",
         },
         "kaggle_handle": "kaggle://keras/roberta/keras/roberta_base_en/2",
     },
@@ -21,9 +19,7 @@ backbone_presets = {
                 "Trained on English Wikipedia, BooksCorpus, CommonCraw, and OpenWebText."
             ),
             "params": 354307072,
-            "official_name": "RoBERTa",
             "path": "roberta",
-            "model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/roberta/README.md",
         },
         "kaggle_handle": "kaggle://keras/roberta/keras/roberta_large_en/2",
     },
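These removals are metadata-only; the `kaggle_handle`, which actually resolves the weights, is unchanged, so existing loading code should keep working:

```python
import keras_hub

# Loads the same checkpoint as before the metadata trim.
backbone = keras_hub.models.RobertaBackbone.from_preset("roberta_base_en")
```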