PyPI - keras-hub-nightly - Versions diffs - 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl - Mend

keras-hub-nightly 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (109) hide show

keras_hub/api/layers/__init__.py +12 -0
keras_hub/api/models/__init__.py +32 -0
keras_hub/src/bounding_box/__init__.py +2 -0
keras_hub/src/bounding_box/converters.py +102 -12
keras_hub/src/layers/modeling/rms_normalization.py +34 -0
keras_hub/src/layers/modeling/transformer_encoder.py +27 -7
keras_hub/src/layers/preprocessing/image_converter.py +5 -0
keras_hub/src/models/albert/albert_presets.py +0 -8
keras_hub/src/models/bart/bart_presets.py +0 -6
keras_hub/src/models/bert/bert_presets.py +0 -20
keras_hub/src/models/bloom/bloom_presets.py +0 -16
keras_hub/src/models/clip/__init__.py +5 -0
keras_hub/src/models/clip/clip_backbone.py +286 -0
keras_hub/src/models/clip/clip_encoder_block.py +19 -4
keras_hub/src/models/clip/clip_image_converter.py +8 -0
keras_hub/src/models/clip/clip_presets.py +93 -0
keras_hub/src/models/clip/clip_text_encoder.py +4 -1
keras_hub/src/models/clip/clip_tokenizer.py +18 -3
keras_hub/src/models/clip/clip_vision_embedding.py +101 -0
keras_hub/src/models/clip/clip_vision_encoder.py +159 -0
keras_hub/src/models/deberta_v3/deberta_v3_presets.py +0 -10
keras_hub/src/models/deeplab_v3/deeplab_v3_presets.py +0 -2
keras_hub/src/models/deeplab_v3/deeplab_v3_segmenter.py +5 -3
keras_hub/src/models/densenet/densenet_backbone.py +1 -1
keras_hub/src/models/densenet/densenet_presets.py +0 -6
keras_hub/src/models/distil_bert/distil_bert_presets.py +0 -6
keras_hub/src/models/efficientnet/__init__.py +9 -0
keras_hub/src/models/efficientnet/cba.py +141 -0
keras_hub/src/models/efficientnet/efficientnet_backbone.py +139 -56
keras_hub/src/models/efficientnet/efficientnet_image_classifier.py +14 -0
keras_hub/src/models/efficientnet/efficientnet_image_classifier_preprocessor.py +16 -0
keras_hub/src/models/efficientnet/efficientnet_image_converter.py +10 -0
keras_hub/src/models/efficientnet/efficientnet_presets.py +192 -0
keras_hub/src/models/efficientnet/fusedmbconv.py +81 -36
keras_hub/src/models/efficientnet/mbconv.py +52 -21
keras_hub/src/models/electra/electra_presets.py +0 -12
keras_hub/src/models/f_net/f_net_presets.py +0 -4
keras_hub/src/models/falcon/falcon_presets.py +0 -2
keras_hub/src/models/flux/__init__.py +5 -0
keras_hub/src/models/flux/flux_layers.py +494 -0
keras_hub/src/models/flux/flux_maths.py +218 -0
keras_hub/src/models/flux/flux_model.py +231 -0
keras_hub/src/models/flux/flux_presets.py +14 -0
keras_hub/src/models/flux/flux_text_to_image.py +142 -0
keras_hub/src/models/flux/flux_text_to_image_preprocessor.py +73 -0
keras_hub/src/models/gemma/gemma_presets.py +0 -40
keras_hub/src/models/gpt2/gpt2_presets.py +0 -9
keras_hub/src/models/image_object_detector.py +87 -0
keras_hub/src/models/image_object_detector_preprocessor.py +57 -0
keras_hub/src/models/image_to_image.py +16 -10
keras_hub/src/models/inpaint.py +20 -13
keras_hub/src/models/llama/llama_backbone.py +1 -1
keras_hub/src/models/llama/llama_presets.py +5 -15
keras_hub/src/models/llama3/llama3_presets.py +0 -8
keras_hub/src/models/mistral/mistral_presets.py +0 -6
keras_hub/src/models/mit/mit_backbone.py +41 -27
keras_hub/src/models/mit/mit_layers.py +9 -7
keras_hub/src/models/mit/mit_presets.py +12 -24
keras_hub/src/models/opt/opt_presets.py +0 -8
keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +61 -11
keras_hub/src/models/pali_gemma/pali_gemma_decoder_block.py +21 -23
keras_hub/src/models/pali_gemma/pali_gemma_presets.py +166 -10
keras_hub/src/models/pali_gemma/pali_gemma_vit.py +12 -11
keras_hub/src/models/phi3/phi3_presets.py +0 -4
keras_hub/src/models/resnet/resnet_presets.py +10 -42
keras_hub/src/models/retinanet/__init__.py +5 -0
keras_hub/src/models/retinanet/anchor_generator.py +52 -53
keras_hub/src/models/retinanet/feature_pyramid.py +99 -36
keras_hub/src/models/retinanet/non_max_supression.py +1 -0
keras_hub/src/models/retinanet/prediction_head.py +192 -0
keras_hub/src/models/retinanet/retinanet_backbone.py +146 -0
keras_hub/src/models/retinanet/retinanet_image_converter.py +53 -0
keras_hub/src/models/retinanet/retinanet_label_encoder.py +49 -51
keras_hub/src/models/retinanet/retinanet_object_detector.py +382 -0
keras_hub/src/models/retinanet/retinanet_object_detector_preprocessor.py +14 -0
keras_hub/src/models/retinanet/retinanet_presets.py +15 -0
keras_hub/src/models/roberta/roberta_presets.py +0 -4
keras_hub/src/models/sam/sam_backbone.py +0 -1
keras_hub/src/models/sam/sam_image_segmenter.py +9 -10
keras_hub/src/models/sam/sam_presets.py +0 -6
keras_hub/src/models/segformer/__init__.py +8 -0
keras_hub/src/models/segformer/segformer_backbone.py +163 -0
keras_hub/src/models/segformer/segformer_image_converter.py +8 -0
keras_hub/src/models/segformer/segformer_image_segmenter.py +171 -0
keras_hub/src/models/segformer/segformer_image_segmenter_preprocessor.py +31 -0
keras_hub/src/models/segformer/segformer_presets.py +124 -0
keras_hub/src/models/stable_diffusion_3/mmdit.py +41 -0
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +38 -21
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_image_to_image.py +3 -3
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_inpaint.py +3 -3
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_presets.py +28 -4
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +1 -1
keras_hub/src/models/t5/t5_backbone.py +5 -4
keras_hub/src/models/t5/t5_presets.py +41 -13
keras_hub/src/models/text_to_image.py +13 -5
keras_hub/src/models/vgg/vgg_backbone.py +1 -1
keras_hub/src/models/vgg/vgg_presets.py +0 -8
keras_hub/src/models/whisper/whisper_audio_converter.py +1 -1
keras_hub/src/models/whisper/whisper_presets.py +0 -20
keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py +0 -4
keras_hub/src/tests/test_case.py +25 -0
keras_hub/src/utils/preset_utils.py +17 -4
keras_hub/src/utils/timm/convert_efficientnet.py +449 -0
keras_hub/src/utils/timm/preset_loader.py +3 -0
keras_hub/src/version_utils.py +1 -1
{keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/METADATA +15 -26
{keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/RECORD +109 -76
{keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/WHEEL +1 -1
{keras_hub_nightly-0.16.1.dev202410200345.dist-info → keras_hub_nightly-0.19.0.dev202412070351.dist-info}/top_level.txt +0 -0

keras_hub/src/models/whisper/whisper_presets.py CHANGED Viewed

@@ -7,9 +7,7 @@ backbone_presets = {
                 "English speech data."
             ),
             "params": 37184256,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_en/3",
     },
@@ -20,9 +18,7 @@ backbone_presets = {
                 "English speech data."
             ),
             "params": 124439808,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_en/3",
     },
@@ -33,9 +29,7 @@ backbone_presets = {
                 "English speech data."
             ),
             "params": 241734144,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_en/3",
     },
@@ -46,9 +40,7 @@ backbone_presets = {
                 "English speech data."
             ),
             "params": 763856896,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_en/3",
     },
@@ -59,9 +51,7 @@ backbone_presets = {
                 "multilingual speech data."
             ),
             "params": 37760640,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_tiny_multi/3",
     },
@@ -72,9 +62,7 @@ backbone_presets = {
                 "multilingual speech data."
             ),
             "params": 72593920,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_base_multi/3",
     },
@@ -85,9 +73,7 @@ backbone_presets = {
                 "multilingual speech data."
             ),
             "params": 241734912,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_small_multi/3",
     },
@@ -98,9 +84,7 @@ backbone_presets = {
                 "multilingual speech data."
             ),
             "params": 763857920,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_medium_multi/3",
     },
@@ -111,9 +95,7 @@ backbone_presets = {
                 "multilingual speech data."
             ),
             "params": 1543304960,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi/3",
     },
@@ -125,9 +107,7 @@ backbone_presets = {
                 "of `whisper_large_multi`."
             ),
             "params": 1543304960,
-            "official_name": "Whisper",
             "path": "whisper",
-            "model_card": "https://github.com/openai/whisper/blob/main/model-card.md",
         },
         "kaggle_handle": "kaggle://keras/whisper/keras/whisper_large_multi_v2/3",
     },

keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py CHANGED Viewed

@@ -8,9 +8,7 @@ backbone_presets = {
                 "Trained on CommonCrawl in 100 languages."
             ),
             "params": 277450752,
-            "official_name": "XLM-RoBERTa",
             "path": "xlm_roberta",
-            "model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/xlmr/README.md",
         },
         "kaggle_handle": "kaggle://keras/xlm_roberta/keras/xlm_roberta_base_multi/2",
     },
@@ -21,9 +19,7 @@ backbone_presets = {
                 "Trained on CommonCrawl in 100 languages."
             ),
             "params": 558837760,
-            "official_name": "XLM-RoBERTa",
             "path": "xlm_roberta",
-            "model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/xlmr/README.md",
         },
         "kaggle_handle": "kaggle://keras/xlm_roberta/keras/xlm_roberta_large_multi/2",
     },

keras_hub/src/tests/test_case.py CHANGED Viewed

@@ -313,6 +313,14 @@ class TestCase(tf.test.TestCase, parameterized.TestCase):
         for policy in ["mixed_float16", "mixed_bfloat16", "bfloat16"]:
             policy = keras.mixed_precision.Policy(policy)
+            # Ensure the correct `dtype` is set for sublayers or submodels in
+            # `init_kwargs`.
+            original_init_kwargs = init_kwargs.copy()
+            for k, v in init_kwargs.items():
+                if isinstance(v, keras.Layer):
+                    config = v.get_config()
+                    config["dtype"] = policy
+                    init_kwargs[k] = v.__class__.from_config(config)
             layer = cls(**{**init_kwargs, "dtype": policy})
             if isinstance(layer, keras.Model):
                 output_data = layer(input_data)
@@ -343,8 +351,15 @@ class TestCase(tf.test.TestCase, parameterized.TestCase):
                     continue
                 self.assertEqual(policy.compute_dtype, sublayer.compute_dtype)
                 self.assertEqual(policy.variable_dtype, sublayer.variable_dtype)
+            # Restore `init_kwargs`.
+            init_kwargs = original_init_kwargs
     def run_quantization_test(self, instance, cls, init_kwargs, input_data):
+        # TODO: revert the following if. This works around a torch
+        # quantization failure in `MultiHeadAttention` with Keras 3.7.
+        if keras.config.backend() == "torch":
+            return
         def _get_supported_layers(mode):
             supported_layers = [keras.layers.Dense, keras.layers.EinsumDense]
             if mode == "int8":
@@ -361,6 +376,14 @@ class TestCase(tf.test.TestCase, parameterized.TestCase):
                     policy_map[layer.path] = keras.dtype_policies.get(
                         f"{mode}_from_float32"
                     )
+            # Ensure the correct `dtype` is set for sublayers or submodels in
+            # `init_kwargs`.
+            original_init_kwargs = init_kwargs.copy()
+            for k, v in init_kwargs.items():
+                if isinstance(v, keras.Layer):
+                    config = v.get_config()
+                    config["dtype"] = policy_map
+                    init_kwargs[k] = v.__class__.from_config(config)
             # Instantiate the layer.
             model = cls(**{**init_kwargs, "dtype": policy_map})
             # Call layer eagerly.
@@ -382,6 +405,8 @@ class TestCase(tf.test.TestCase, parameterized.TestCase):
             # Check weights loading.
             weights = model.get_weights()
             revived_model.set_weights(weights)
+            # Restore `init_kwargs`.
+            init_kwargs = original_init_kwargs
     def run_model_saving_test(
         self,

keras_hub/src/utils/preset_utils.py CHANGED Viewed

@@ -563,10 +563,8 @@ class PresetLoader:
         backbone_kwargs["dtype"] = kwargs.pop("dtype", None)
         # Forward `height` and `width` to backbone when using `TextToImage`.
-        if "height" in kwargs:
-            backbone_kwargs["height"] = kwargs.pop("height", None)
-        if "width" in kwargs:
-            backbone_kwargs["width"] = kwargs.pop("width", None)
+        if "image_shape" in kwargs:
+            backbone_kwargs["image_shape"] = kwargs.pop("image_shape", None)
         return backbone_kwargs, kwargs
@@ -660,6 +658,12 @@ class KerasPresetLoader(PresetLoader):
                 cls, load_weights, load_task_weights, **kwargs
             )
         # We found a `task.json` with a complete config for our class.
+        # Forward backbone args.
+        backbone_kwargs, kwargs = self.get_backbone_kwargs(**kwargs)
+        if "backbone" in task_config["config"]:
+            backbone_config = task_config["config"]["backbone"]["config"]
+            backbone_config = {**backbone_config, **backbone_kwargs}
+            task_config["config"]["backbone"]["config"] = backbone_config
         task = load_serialized_object(task_config, **kwargs)
         if task.preprocessor and hasattr(
             task.preprocessor, "load_preset_assets"
@@ -767,14 +771,23 @@ class KerasPresetSaver:
             config_file.write(json.dumps(config, indent=4))
     def _save_metadata(self, layer):
+        from keras_hub.src.models.task import Task
         from keras_hub.src.version_utils import __version__ as keras_hub_version
+        # Find all tasks that are compatible with the backbone.
+        # E.g. for `BertBackbone` we would have `TextClassifier` and `MaskedLM`.
+        # For `ResNetBackbone` we would have `ImageClassifier`.
+        tasks = list_subclasses(Task)
+        tasks = filter(lambda x: x.backbone_cls == type(layer), tasks)
+        tasks = [task.__base__.__name__ for task in tasks]
         keras_version = keras.version() if hasattr(keras, "version") else None
         metadata = {
             "keras_version": keras_version,
             "keras_hub_version": keras_hub_version,
             "parameter_count": layer.count_params(),
             "date_saved": datetime.datetime.now().strftime("%Y-%m-%d@%H:%M:%S"),
+            "tasks": tasks,
         }
         metadata_path = os.path.join(self.preset_dir, METADATA_FILE)
         with open(metadata_path, "w") as metadata_file:

keras_hub/src/utils/timm/convert_efficientnet.py ADDED Viewed

@@ -0,0 +1,449 @@
+import math
+import numpy as np
+from keras_hub.src.models.efficientnet.efficientnet_backbone import (
+    EfficientNetBackbone,
+)
+backbone_cls = EfficientNetBackbone
+VARIANT_MAP = {
+    "b0": {
+        "stackwise_width_coefficients": [1.0] * 7,
+        "stackwise_depth_coefficients": [1.0] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "b1": {
+        "stackwise_width_coefficients": [1.0] * 7,
+        "stackwise_depth_coefficients": [1.1] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "b2": {
+        "stackwise_width_coefficients": [1.1] * 7,
+        "stackwise_depth_coefficients": [1.2] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "b3": {
+        "stackwise_width_coefficients": [1.2] * 7,
+        "stackwise_depth_coefficients": [1.4] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "b4": {
+        "stackwise_width_coefficients": [1.4] * 7,
+        "stackwise_depth_coefficients": [1.8] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "b5": {
+        "stackwise_width_coefficients": [1.6] * 7,
+        "stackwise_depth_coefficients": [2.2] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0.25] * 7,
+    },
+    "lite0": {
+        "stackwise_width_coefficients": [1.0] * 7,
+        "stackwise_depth_coefficients": [1.0] * 7,
+        "stackwise_squeeze_and_excite_ratios": [0] * 7,
+        "activation": "relu6",
+    },
+    "el": {
+        "stackwise_width_coefficients": [1.2] * 6,
+        "stackwise_depth_coefficients": [1.4] * 6,
+        "stackwise_kernel_sizes": [3, 3, 3, 5, 5, 5],
+        "stackwise_num_repeats": [1, 2, 4, 5, 4, 2],
+        "stackwise_input_filters": [32, 24, 32, 48, 96, 144],
+        "stackwise_output_filters": [24, 32, 48, 96, 144, 192],
+        "stackwise_expansion_ratios": [4, 8, 8, 8, 8, 8],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0] * 6,
+        "stackwise_block_types": ["fused"] * 3 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [24, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [True] + [False] * 5,
+        "activation": "relu",
+    },
+    "em": {
+        "stackwise_width_coefficients": [1.0] * 6,
+        "stackwise_depth_coefficients": [1.1] * 6,
+        "stackwise_kernel_sizes": [3, 3, 3, 5, 5, 5],
+        "stackwise_num_repeats": [1, 2, 4, 5, 4, 2],
+        "stackwise_input_filters": [32, 24, 32, 48, 96, 144],
+        "stackwise_output_filters": [24, 32, 48, 96, 144, 192],
+        "stackwise_expansion_ratios": [4, 8, 8, 8, 8, 8],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0] * 6,
+        "stackwise_block_types": ["fused"] * 3 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [24, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [True] + [False] * 5,
+        "activation": "relu",
+    },
+    "es": {
+        "stackwise_width_coefficients": [1.0] * 6,
+        "stackwise_depth_coefficients": [1.0] * 6,
+        "stackwise_kernel_sizes": [3, 3, 3, 5, 5, 5],
+        "stackwise_num_repeats": [1, 2, 4, 5, 4, 2],
+        "stackwise_input_filters": [32, 24, 32, 48, 96, 144],
+        "stackwise_output_filters": [24, 32, 48, 96, 144, 192],
+        "stackwise_expansion_ratios": [4, 8, 8, 8, 8, 8],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0] * 6,
+        "stackwise_block_types": ["fused"] * 3 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [24, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [True] + [False] * 5,
+        "activation": "relu",
+    },
+    "rw_m": {
+        "stackwise_width_coefficients": [1.2] * 6,
+        "stackwise_depth_coefficients": [1.2] * 4 + [1.6] * 2,
+        "stackwise_kernel_sizes": [3, 3, 3, 3, 3, 3],
+        "stackwise_num_repeats": [2, 4, 4, 6, 9, 15],
+        "stackwise_input_filters": [24, 24, 48, 64, 128, 160],
+        "stackwise_output_filters": [24, 48, 64, 128, 160, 272],
+        "stackwise_expansion_ratios": [1, 4, 4, 4, 6, 6],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0, 0, 0, 0.25, 0.25, 0.25],
+        "stackwise_block_types": ["fused"] * 3 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [0, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [False] * 6,
+        "activation": "silu",
+        "num_features": 1792,
+    },
+    "rw_s": {
+        "stackwise_width_coefficients": [1.0] * 6,
+        "stackwise_depth_coefficients": [1.0] * 6,
+        "stackwise_kernel_sizes": [3, 3, 3, 3, 3, 3],
+        "stackwise_num_repeats": [2, 4, 4, 6, 9, 15],
+        "stackwise_input_filters": [24, 24, 48, 64, 128, 160],
+        "stackwise_output_filters": [24, 48, 64, 128, 160, 272],
+        "stackwise_expansion_ratios": [1, 4, 4, 4, 6, 6],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0, 0, 0, 0.25, 0.25, 0.25],
+        "stackwise_block_types": ["fused"] * 3 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [0, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [False] * 6,
+        "activation": "silu",
+        "num_features": 1792,
+    },
+    "rw_t": {
+        "stackwise_width_coefficients": [0.8] * 6,
+        "stackwise_depth_coefficients": [0.9] * 6,
+        "stackwise_kernel_sizes": [3, 3, 3, 3, 3, 3],
+        "stackwise_num_repeats": [2, 4, 4, 6, 9, 15],
+        "stackwise_input_filters": [24, 24, 48, 64, 128, 160],
+        "stackwise_output_filters": [24, 48, 64, 128, 160, 256],
+        "stackwise_expansion_ratios": [1, 4, 4, 4, 6, 6],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2],
+        "stackwise_squeeze_and_excite_ratios": [0, 0, 0, 0.25, 0.25, 0.25],
+        "stackwise_block_types": ["cba"] + ["fused"] * 2 + ["unfused"] * 3,
+        "stackwise_force_input_filters": [0, 0, 0, 0, 0, 0],
+        "stackwise_nores_option": [False] * 6,
+        "activation": "silu",
+    },
+}
+def convert_backbone_config(timm_config):
+    timm_architecture = timm_config["architecture"]
+    base_kwargs = {
+        "stackwise_kernel_sizes": [3, 3, 5, 3, 5, 5, 3],
+        "stackwise_num_repeats": [1, 2, 2, 3, 3, 4, 1],
+        "stackwise_input_filters": [32, 16, 24, 40, 80, 112, 192],
+        "stackwise_output_filters": [16, 24, 40, 80, 112, 192, 320],
+        "stackwise_expansion_ratios": [1, 6, 6, 6, 6, 6, 6],
+        "stackwise_strides": [1, 2, 2, 2, 1, 2, 1],
+        "stackwise_block_types": ["v1"] * 7,
+        "min_depth": None,
+        "include_stem_padding": True,
+        "use_depth_divisor_as_min_depth": True,
+        "cap_round_filter_decrease": True,
+        "stem_conv_padding": "valid",
+        "batch_norm_momentum": 0.9,
+        "batch_norm_epsilon": 1e-5,
+        "dropout": 0,
+        "projection_activation": None,
+    }
+    variant = "_".join(timm_architecture.split("_")[1:])
+    if variant not in VARIANT_MAP:
+        raise ValueError(
+            f"Currently, the architecture {timm_architecture} is not supported."
+        )
+    base_kwargs.update(VARIANT_MAP[variant])
+    return base_kwargs
+def convert_weights(backbone, loader, timm_config):
+    timm_architecture = timm_config["architecture"]
+    variant = "_".join(timm_architecture.split("_")[1:])
+    def port_conv2d(keras_layer, hf_weight_prefix, port_bias=True):
+        loader.port_weight(
+            keras_layer.kernel,
+            hf_weight_key=f"{hf_weight_prefix}.weight",
+            hook_fn=lambda x, _: np.transpose(x, (2, 3, 1, 0)),
+        )
+        if port_bias:
+            loader.port_weight(
+                keras_layer.bias,
+                hf_weight_key=f"{hf_weight_prefix}.bias",
+            )
+    def port_depthwise_conv2d(
+        keras_layer,
+        hf_weight_prefix,
+        port_bias=True,
+        depth_multiplier=1,
+    ):
+        def convert_pt_conv2d_kernel(pt_kernel):
+            out_channels, in_channels_per_group, height, width = pt_kernel.shape
+            # PT Convs are depthwise convs if and only if in_channels_per_group == 1
+            assert in_channels_per_group == 1
+            pt_kernel = np.transpose(pt_kernel, (2, 3, 0, 1))
+            in_channels = out_channels // depth_multiplier
+            return np.reshape(
+                pt_kernel, (height, width, in_channels, depth_multiplier)
+            )
+        loader.port_weight(
+            keras_layer.kernel,
+            hf_weight_key=f"{hf_weight_prefix}.weight",
+            hook_fn=lambda x, _: convert_pt_conv2d_kernel(x),
+        )
+        if port_bias:
+            loader.port_weight(
+                keras_layer.bias,
+                hf_weight_key=f"{hf_weight_prefix}.bias",
+            )
+    def port_batch_normalization(keras_layer, hf_weight_prefix):
+        loader.port_weight(
+            keras_layer.gamma,
+            hf_weight_key=f"{hf_weight_prefix}.weight",
+        )
+        loader.port_weight(
+            keras_layer.beta,
+            hf_weight_key=f"{hf_weight_prefix}.bias",
+        )
+        loader.port_weight(
+            keras_layer.moving_mean,
+            hf_weight_key=f"{hf_weight_prefix}.running_mean",
+        )
+        loader.port_weight(
+            keras_layer.moving_variance,
+            hf_weight_key=f"{hf_weight_prefix}.running_var",
+        )
+        # do we need num batches tracked?
+    # Stem
+    port_conv2d(backbone.get_layer("stem_conv"), "conv_stem", port_bias=False)
+    port_batch_normalization(backbone.get_layer("stem_bn"), "bn1")
+    # Stages
+    num_stacks = len(backbone.stackwise_kernel_sizes)
+    for stack_index in range(num_stacks):
+        block_type = backbone.stackwise_block_types[stack_index]
+        expansion_ratio = backbone.stackwise_expansion_ratios[stack_index]
+        repeats = backbone.stackwise_num_repeats[stack_index]
+        stack_depth_coefficient = backbone.stackwise_depth_coefficients[
+            stack_index
+        ]
+        repeats = int(math.ceil(stack_depth_coefficient * repeats))
+        se_ratio = VARIANT_MAP[variant]["stackwise_squeeze_and_excite_ratios"][
+            stack_index
+        ]
+        for block_idx in range(repeats):
+            conv_pw_count = 0
+            bn_count = 1
+            # 97 is the start of the lowercase alphabet.
+            letter_identifier = chr(block_idx + 97)
+            keras_block_prefix = f"block{stack_index+1}{letter_identifier}_"
+            hf_block_prefix = f"blocks.{stack_index}.{block_idx}."
+            if block_type == "v1":
+                conv_pw_name_map = ["conv_pw", "conv_pwl"]
+                # Initial Expansion Conv
+                if expansion_ratio != 1:
+                    port_conv2d(
+                        backbone.get_layer(keras_block_prefix + "expand_conv"),
+                        hf_block_prefix + conv_pw_name_map[conv_pw_count],
+                        port_bias=False,
+                    )
+                    conv_pw_count += 1
+                    port_batch_normalization(
+                        backbone.get_layer(keras_block_prefix + "expand_bn"),
+                        hf_block_prefix + f"bn{bn_count}",
+                    )
+                    bn_count += 1
+                # Depthwise Conv
+                port_depthwise_conv2d(
+                    backbone.get_layer(keras_block_prefix + "dwconv"),
+                    hf_block_prefix + "conv_dw",
+                    port_bias=False,
+                )
+                port_batch_normalization(
+                    backbone.get_layer(keras_block_prefix + "dwconv_bn"),
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+                if 0 < se_ratio <= 1:
+                    # Squeeze and Excite
+                    port_conv2d(
+                        backbone.get_layer(keras_block_prefix + "se_reduce"),
+                        hf_block_prefix + "se.conv_reduce",
+                    )
+                    port_conv2d(
+                        backbone.get_layer(keras_block_prefix + "se_expand"),
+                        hf_block_prefix + "se.conv_expand",
+                    )
+                # Output/Projection
+                port_conv2d(
+                    backbone.get_layer(keras_block_prefix + "project"),
+                    hf_block_prefix + conv_pw_name_map[conv_pw_count],
+                    port_bias=False,
+                )
+                conv_pw_count += 1
+                port_batch_normalization(
+                    backbone.get_layer(keras_block_prefix + "project_bn"),
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+            elif block_type == "fused":
+                fused_block_layer = backbone.get_layer(keras_block_prefix)
+                # Initial Expansion Conv
+                port_conv2d(
+                    fused_block_layer.conv1,
+                    hf_block_prefix + "conv_exp",
+                    port_bias=False,
+                )
+                conv_pw_count += 1
+                port_batch_normalization(
+                    fused_block_layer.bn1,
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+                if 0 < se_ratio <= 1:
+                    # Squeeze and Excite
+                    port_conv2d(
+                        fused_block_layer.se_conv1,
+                        hf_block_prefix + "se.conv_reduce",
+                    )
+                    port_conv2d(
+                        fused_block_layer.se_conv2,
+                        hf_block_prefix + "se.conv_expand",
+                    )
+                # Output/Projection
+                port_conv2d(
+                    fused_block_layer.output_conv,
+                    hf_block_prefix + "conv_pwl",
+                    port_bias=False,
+                )
+                conv_pw_count += 1
+                port_batch_normalization(
+                    fused_block_layer.bn2,
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+            elif block_type == "unfused":
+                unfused_block_layer = backbone.get_layer(keras_block_prefix)
+                # Initial Expansion Conv
+                if expansion_ratio != 1:
+                    port_conv2d(
+                        unfused_block_layer.conv1,
+                        hf_block_prefix + "conv_pw",
+                        port_bias=False,
+                    )
+                    conv_pw_count += 1
+                    port_batch_normalization(
+                        unfused_block_layer.bn1,
+                        hf_block_prefix + f"bn{bn_count}",
+                    )
+                    bn_count += 1
+                # Depthwise Conv
+                port_depthwise_conv2d(
+                    unfused_block_layer.depthwise,
+                    hf_block_prefix + "conv_dw",
+                    port_bias=False,
+                )
+                port_batch_normalization(
+                    unfused_block_layer.bn2,
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+                if 0 < se_ratio <= 1:
+                    # Squeeze and Excite
+                    port_conv2d(
+                        unfused_block_layer.se_conv1,
+                        hf_block_prefix + "se.conv_reduce",
+                    )
+                    port_conv2d(
+                        unfused_block_layer.se_conv2,
+                        hf_block_prefix + "se.conv_expand",
+                    )
+                # Output/Projection
+                port_conv2d(
+                    unfused_block_layer.output_conv,
+                    hf_block_prefix + "conv_pwl",
+                    port_bias=False,
+                )
+                conv_pw_count += 1
+                port_batch_normalization(
+                    unfused_block_layer.bn3,
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+            elif block_type == "cba":
+                cba_block_layer = backbone.get_layer(keras_block_prefix)
+                # Initial Expansion Conv
+                port_conv2d(
+                    cba_block_layer.conv1,
+                    hf_block_prefix + "conv",
+                    port_bias=False,
+                )
+                conv_pw_count += 1
+                port_batch_normalization(
+                    cba_block_layer.bn1,
+                    hf_block_prefix + f"bn{bn_count}",
+                )
+                bn_count += 1
+    # Head/Top
+    port_conv2d(backbone.get_layer("top_conv"), "conv_head", port_bias=False)
+    port_batch_normalization(backbone.get_layer("top_bn"), "bn2")
+def convert_head(task, loader, timm_config):
+    classifier_prefix = timm_config["pretrained_cfg"]["classifier"]
+    prefix = f"{classifier_prefix}."
+    loader.port_weight(
+        task.output_dense.kernel,
+        hf_weight_key=prefix + "weight",
+        hook_fn=lambda x, _: np.transpose(np.squeeze(x)),
+    )
+    loader.port_weight(
+        task.output_dense.bias,
+        hf_weight_key=prefix + "bias",
+    )

keras-hub-nightly 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl

keras-hub-nightly 0.16.1.dev202410200345__py3-none-any.whl → 0.19.0.dev202412070351__py3-none-any.whl