keras-hub-nightly 0.16.1.dev202410020340__py3-none-any.whl → 0.19.0.dev202501260345__py3-none-any.whl
This diff shows the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in their public registries.
- keras_hub/api/layers/__init__.py +21 -3
- keras_hub/api/models/__init__.py +71 -12
- keras_hub/api/tokenizers/__init__.py +1 -1
- keras_hub/src/bounding_box/__init__.py +2 -0
- keras_hub/src/bounding_box/converters.py +102 -12
- keras_hub/src/layers/modeling/f_net_encoder.py +1 -1
- keras_hub/src/layers/modeling/masked_lm_head.py +2 -1
- keras_hub/src/layers/modeling/reversible_embedding.py +3 -16
- keras_hub/src/layers/modeling/rms_normalization.py +36 -0
- keras_hub/src/layers/modeling/rotary_embedding.py +3 -2
- keras_hub/src/layers/modeling/token_and_position_embedding.py +1 -1
- keras_hub/src/layers/modeling/transformer_decoder.py +8 -6
- keras_hub/src/layers/modeling/transformer_encoder.py +29 -7
- keras_hub/src/layers/preprocessing/audio_converter.py +3 -7
- keras_hub/src/layers/preprocessing/image_converter.py +170 -34
- keras_hub/src/metrics/bleu.py +4 -3
- keras_hub/src/models/albert/albert_presets.py +4 -12
- keras_hub/src/models/albert/albert_text_classifier.py +7 -7
- keras_hub/src/models/backbone.py +3 -14
- keras_hub/src/models/bart/bart_backbone.py +4 -4
- keras_hub/src/models/bart/bart_presets.py +3 -9
- keras_hub/src/models/bart/bart_seq_2_seq_lm.py +9 -8
- keras_hub/src/models/basnet/__init__.py +5 -0
- keras_hub/src/models/basnet/basnet.py +122 -0
- keras_hub/src/models/basnet/basnet_backbone.py +366 -0
- keras_hub/src/models/basnet/basnet_image_converter.py +8 -0
- keras_hub/src/models/basnet/basnet_preprocessor.py +14 -0
- keras_hub/src/models/basnet/basnet_presets.py +17 -0
- keras_hub/src/models/bert/bert_presets.py +14 -32
- keras_hub/src/models/bert/bert_text_classifier.py +3 -3
- keras_hub/src/models/bloom/bloom_presets.py +8 -24
- keras_hub/src/models/causal_lm.py +56 -12
- keras_hub/src/models/clip/__init__.py +5 -0
- keras_hub/src/models/clip/clip_backbone.py +286 -0
- keras_hub/src/models/clip/clip_encoder_block.py +19 -4
- keras_hub/src/models/clip/clip_image_converter.py +8 -0
- keras_hub/src/models/clip/clip_presets.py +93 -0
- keras_hub/src/models/clip/clip_text_encoder.py +4 -1
- keras_hub/src/models/clip/clip_tokenizer.py +18 -3
- keras_hub/src/models/clip/clip_vision_embedding.py +101 -0
- keras_hub/src/models/clip/clip_vision_encoder.py +159 -0
- keras_hub/src/models/csp_darknet/csp_darknet_backbone.py +2 -1
- keras_hub/src/models/csp_darknet/csp_darknet_image_classifier.py +0 -109
- keras_hub/src/models/deberta_v3/deberta_v3_backbone.py +1 -1
- keras_hub/src/models/deberta_v3/deberta_v3_presets.py +5 -15
- keras_hub/src/models/deberta_v3/deberta_v3_text_classifier.py +4 -4
- keras_hub/src/models/deberta_v3/disentangled_attention_encoder.py +4 -4
- keras_hub/src/models/deberta_v3/disentangled_self_attention.py +3 -2
- keras_hub/src/models/deberta_v3/relative_embedding.py +1 -1
- keras_hub/src/models/deeplab_v3/__init__.py +7 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_backbone.py +200 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_image_converter.py +10 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_image_segmeter_preprocessor.py +16 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_layers.py +215 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_presets.py +17 -0
- keras_hub/src/models/deeplab_v3/deeplab_v3_segmenter.py +111 -0
- keras_hub/src/models/densenet/densenet_backbone.py +6 -4
- keras_hub/src/models/densenet/densenet_image_classifier.py +1 -129
- keras_hub/src/models/densenet/densenet_image_converter.py +2 -4
- keras_hub/src/models/densenet/densenet_presets.py +9 -15
- keras_hub/src/models/distil_bert/distil_bert_masked_lm.py +1 -1
- keras_hub/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +2 -2
- keras_hub/src/models/distil_bert/distil_bert_presets.py +5 -10
- keras_hub/src/models/distil_bert/distil_bert_text_classifier.py +5 -5
- keras_hub/src/models/distil_bert/distil_bert_tokenizer.py +3 -3
- keras_hub/src/models/efficientnet/__init__.py +9 -0
- keras_hub/src/models/efficientnet/cba.py +141 -0
- keras_hub/src/models/efficientnet/efficientnet_backbone.py +160 -61
- keras_hub/src/models/efficientnet/efficientnet_image_classifier.py +14 -0
- keras_hub/src/models/efficientnet/efficientnet_image_classifier_preprocessor.py +16 -0
- keras_hub/src/models/efficientnet/efficientnet_image_converter.py +10 -0
- keras_hub/src/models/efficientnet/efficientnet_presets.py +193 -0
- keras_hub/src/models/efficientnet/fusedmbconv.py +84 -41
- keras_hub/src/models/efficientnet/mbconv.py +53 -22
- keras_hub/src/models/electra/electra_backbone.py +2 -2
- keras_hub/src/models/electra/electra_presets.py +6 -18
- keras_hub/src/models/f_net/f_net_presets.py +2 -6
- keras_hub/src/models/f_net/f_net_text_classifier.py +3 -3
- keras_hub/src/models/f_net/f_net_text_classifier_preprocessor.py +3 -3
- keras_hub/src/models/falcon/falcon_backbone.py +5 -3
- keras_hub/src/models/falcon/falcon_causal_lm.py +18 -8
- keras_hub/src/models/falcon/falcon_presets.py +1 -3
- keras_hub/src/models/falcon/falcon_tokenizer.py +7 -2
- keras_hub/src/models/feature_pyramid_backbone.py +1 -1
- keras_hub/src/models/flux/__init__.py +5 -0
- keras_hub/src/models/flux/flux_layers.py +496 -0
- keras_hub/src/models/flux/flux_maths.py +225 -0
- keras_hub/src/models/flux/flux_model.py +236 -0
- keras_hub/src/models/flux/flux_presets.py +3 -0
- keras_hub/src/models/flux/flux_text_to_image.py +146 -0
- keras_hub/src/models/flux/flux_text_to_image_preprocessor.py +73 -0
- keras_hub/src/models/gemma/gemma_backbone.py +35 -20
- keras_hub/src/models/gemma/gemma_causal_lm.py +2 -2
- keras_hub/src/models/gemma/gemma_decoder_block.py +3 -1
- keras_hub/src/models/gemma/gemma_presets.py +29 -63
- keras_hub/src/models/gpt2/gpt2_causal_lm.py +2 -2
- keras_hub/src/models/gpt2/gpt2_presets.py +5 -14
- keras_hub/src/models/gpt_neo_x/gpt_neo_x_attention.py +2 -1
- keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm.py +3 -3
- keras_hub/src/models/gpt_neo_x/gpt_neo_x_decoder.py +2 -1
- keras_hub/src/models/image_classifier.py +147 -2
- keras_hub/src/models/image_classifier_preprocessor.py +6 -3
- keras_hub/src/models/image_object_detector.py +87 -0
- keras_hub/src/models/image_object_detector_preprocessor.py +57 -0
- keras_hub/src/models/image_segmenter.py +0 -5
- keras_hub/src/models/image_segmenter_preprocessor.py +29 -4
- keras_hub/src/models/image_to_image.py +417 -0
- keras_hub/src/models/inpaint.py +520 -0
- keras_hub/src/models/llama/llama_backbone.py +138 -12
- keras_hub/src/models/llama/llama_causal_lm.py +3 -1
- keras_hub/src/models/llama/llama_presets.py +10 -20
- keras_hub/src/models/llama3/llama3_backbone.py +12 -11
- keras_hub/src/models/llama3/llama3_causal_lm.py +1 -1
- keras_hub/src/models/llama3/llama3_presets.py +4 -12
- keras_hub/src/models/llama3/llama3_tokenizer.py +25 -2
- keras_hub/src/models/mistral/mistral_backbone.py +16 -15
- keras_hub/src/models/mistral/mistral_causal_lm.py +6 -4
- keras_hub/src/models/mistral/mistral_presets.py +3 -9
- keras_hub/src/models/mistral/mistral_transformer_decoder.py +2 -1
- keras_hub/src/models/mit/__init__.py +6 -0
- keras_hub/src/models/{mix_transformer/mix_transformer_backbone.py → mit/mit_backbone.py} +47 -36
- keras_hub/src/models/mit/mit_image_classifier.py +12 -0
- keras_hub/src/models/mit/mit_image_classifier_preprocessor.py +12 -0
- keras_hub/src/models/mit/mit_image_converter.py +8 -0
- keras_hub/src/models/{mix_transformer/mix_transformer_layers.py → mit/mit_layers.py} +20 -13
- keras_hub/src/models/mit/mit_presets.py +139 -0
- keras_hub/src/models/mobilenet/mobilenet_backbone.py +8 -8
- keras_hub/src/models/mobilenet/mobilenet_image_classifier.py +0 -92
- keras_hub/src/models/opt/opt_causal_lm.py +2 -2
- keras_hub/src/models/opt/opt_presets.py +4 -12
- keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +63 -17
- keras_hub/src/models/pali_gemma/pali_gemma_causal_lm.py +3 -1
- keras_hub/src/models/pali_gemma/pali_gemma_decoder_block.py +21 -23
- keras_hub/src/models/pali_gemma/pali_gemma_image_converter.py +2 -4
- keras_hub/src/models/pali_gemma/pali_gemma_presets.py +173 -17
- keras_hub/src/models/pali_gemma/pali_gemma_vit.py +14 -26
- keras_hub/src/models/phi3/phi3_causal_lm.py +3 -1
- keras_hub/src/models/phi3/phi3_decoder.py +0 -1
- keras_hub/src/models/phi3/phi3_presets.py +2 -6
- keras_hub/src/models/phi3/phi3_rotary_embedding.py +1 -1
- keras_hub/src/models/preprocessor.py +25 -11
- keras_hub/src/models/resnet/resnet_backbone.py +3 -14
- keras_hub/src/models/resnet/resnet_image_classifier.py +0 -137
- keras_hub/src/models/resnet/resnet_image_converter.py +2 -4
- keras_hub/src/models/resnet/resnet_presets.py +127 -18
- keras_hub/src/models/retinanet/__init__.py +5 -0
- keras_hub/src/models/retinanet/anchor_generator.py +52 -53
- keras_hub/src/models/retinanet/feature_pyramid.py +103 -39
- keras_hub/src/models/retinanet/non_max_supression.py +1 -0
- keras_hub/src/models/retinanet/prediction_head.py +192 -0
- keras_hub/src/models/retinanet/retinanet_backbone.py +146 -0
- keras_hub/src/models/retinanet/retinanet_image_converter.py +53 -0
- keras_hub/src/models/retinanet/retinanet_label_encoder.py +49 -51
- keras_hub/src/models/retinanet/retinanet_object_detector.py +381 -0
- keras_hub/src/models/retinanet/retinanet_object_detector_preprocessor.py +14 -0
- keras_hub/src/models/retinanet/retinanet_presets.py +16 -0
- keras_hub/src/models/roberta/roberta_backbone.py +2 -2
- keras_hub/src/models/roberta/roberta_presets.py +6 -8
- keras_hub/src/models/roberta/roberta_text_classifier.py +3 -3
- keras_hub/src/models/sam/__init__.py +5 -0
- keras_hub/src/models/sam/sam_backbone.py +2 -3
- keras_hub/src/models/sam/sam_image_converter.py +2 -4
- keras_hub/src/models/sam/sam_image_segmenter.py +16 -16
- keras_hub/src/models/sam/sam_image_segmenter_preprocessor.py +11 -1
- keras_hub/src/models/sam/sam_layers.py +5 -3
- keras_hub/src/models/sam/sam_presets.py +3 -9
- keras_hub/src/models/sam/sam_prompt_encoder.py +4 -2
- keras_hub/src/models/sam/sam_transformer.py +5 -4
- keras_hub/src/models/segformer/__init__.py +8 -0
- keras_hub/src/models/segformer/segformer_backbone.py +167 -0
- keras_hub/src/models/segformer/segformer_image_converter.py +8 -0
- keras_hub/src/models/segformer/segformer_image_segmenter.py +184 -0
- keras_hub/src/models/segformer/segformer_image_segmenter_preprocessor.py +31 -0
- keras_hub/src/models/segformer/segformer_presets.py +136 -0
- keras_hub/src/models/seq_2_seq_lm_preprocessor.py +1 -1
- keras_hub/src/models/stable_diffusion_3/flow_match_euler_discrete_scheduler.py +8 -1
- keras_hub/src/models/stable_diffusion_3/mmdit.py +577 -190
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +189 -163
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_image_to_image.py +178 -0
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_inpaint.py +193 -0
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_presets.py +43 -7
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +25 -14
- keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image_preprocessor.py +1 -1
- keras_hub/src/models/t5/t5_backbone.py +5 -4
- keras_hub/src/models/t5/t5_presets.py +47 -19
- keras_hub/src/models/task.py +47 -39
- keras_hub/src/models/text_classifier.py +2 -2
- keras_hub/src/models/text_to_image.py +106 -41
- keras_hub/src/models/vae/__init__.py +1 -0
- keras_hub/src/models/vae/vae_backbone.py +184 -0
- keras_hub/src/models/vae/vae_layers.py +739 -0
- keras_hub/src/models/vgg/__init__.py +5 -0
- keras_hub/src/models/vgg/vgg_backbone.py +4 -24
- keras_hub/src/models/vgg/vgg_image_classifier.py +139 -33
- keras_hub/src/models/vgg/vgg_image_classifier_preprocessor.py +12 -0
- keras_hub/src/models/vgg/vgg_image_converter.py +8 -0
- keras_hub/src/models/vgg/vgg_presets.py +48 -0
- keras_hub/src/models/vit/__init__.py +5 -0
- keras_hub/src/models/vit/vit_backbone.py +152 -0
- keras_hub/src/models/vit/vit_image_classifier.py +187 -0
- keras_hub/src/models/vit/vit_image_classifier_preprocessor.py +12 -0
- keras_hub/src/models/vit/vit_image_converter.py +73 -0
- keras_hub/src/models/vit/vit_layers.py +391 -0
- keras_hub/src/models/vit/vit_presets.py +126 -0
- keras_hub/src/models/vit_det/vit_det_backbone.py +6 -4
- keras_hub/src/models/vit_det/vit_layers.py +3 -3
- keras_hub/src/models/whisper/whisper_audio_converter.py +2 -4
- keras_hub/src/models/whisper/whisper_backbone.py +6 -5
- keras_hub/src/models/whisper/whisper_decoder.py +3 -5
- keras_hub/src/models/whisper/whisper_presets.py +10 -30
- keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm.py +1 -1
- keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +2 -2
- keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py +2 -6
- keras_hub/src/models/xlm_roberta/xlm_roberta_text_classifier.py +4 -4
- keras_hub/src/models/xlm_roberta/xlm_roberta_tokenizer.py +2 -1
- keras_hub/src/models/xlnet/relative_attention.py +20 -19
- keras_hub/src/models/xlnet/xlnet_backbone.py +2 -2
- keras_hub/src/models/xlnet/xlnet_content_and_query_embedding.py +3 -5
- keras_hub/src/models/xlnet/xlnet_encoder.py +7 -9
- keras_hub/src/samplers/contrastive_sampler.py +2 -3
- keras_hub/src/samplers/sampler.py +2 -1
- keras_hub/src/tests/test_case.py +41 -6
- keras_hub/src/tokenizers/byte_pair_tokenizer.py +7 -3
- keras_hub/src/tokenizers/byte_tokenizer.py +3 -10
- keras_hub/src/tokenizers/sentence_piece_tokenizer.py +2 -9
- keras_hub/src/tokenizers/sentence_piece_tokenizer_trainer.py +9 -11
- keras_hub/src/tokenizers/tokenizer.py +10 -13
- keras_hub/src/tokenizers/unicode_codepoint_tokenizer.py +9 -7
- keras_hub/src/tokenizers/word_piece_tokenizer_trainer.py +10 -3
- keras_hub/src/utils/keras_utils.py +2 -13
- keras_hub/src/utils/pipeline_model.py +3 -3
- keras_hub/src/utils/preset_utils.py +196 -144
- keras_hub/src/utils/tensor_utils.py +4 -4
- keras_hub/src/utils/timm/convert_densenet.py +6 -4
- keras_hub/src/utils/timm/convert_efficientnet.py +447 -0
- keras_hub/src/utils/timm/convert_resnet.py +1 -1
- keras_hub/src/utils/timm/convert_vgg.py +85 -0
- keras_hub/src/utils/timm/preset_loader.py +14 -9
- keras_hub/src/utils/transformers/convert_llama3.py +21 -5
- keras_hub/src/utils/transformers/convert_vit.py +150 -0
- keras_hub/src/utils/transformers/preset_loader.py +23 -0
- keras_hub/src/utils/transformers/safetensor_utils.py +4 -3
- keras_hub/src/version_utils.py +1 -1
- {keras_hub_nightly-0.16.1.dev202410020340.dist-info → keras_hub_nightly-0.19.0.dev202501260345.dist-info}/METADATA +86 -68
- keras_hub_nightly-0.19.0.dev202501260345.dist-info/RECORD +423 -0
- {keras_hub_nightly-0.16.1.dev202410020340.dist-info → keras_hub_nightly-0.19.0.dev202501260345.dist-info}/WHEEL +1 -1
- keras_hub/src/layers/preprocessing/resizing_image_converter.py +0 -138
- keras_hub/src/models/mix_transformer/__init__.py +0 -0
- keras_hub/src/models/mix_transformer/mix_transformer_classifier.py +0 -119
- keras_hub/src/models/stable_diffusion_3/vae_image_decoder.py +0 -320
- keras_hub_nightly-0.16.1.dev202410020340.dist-info/RECORD +0 -357
- {keras_hub_nightly-0.16.1.dev202410020340.dist-info → keras_hub_nightly-0.19.0.dev202501260345.dist-info}/top_level.txt +0 -0
keras_hub/src/models/vae/vae_layers.py
@@ -0,0 +1,739 @@
import math

import keras
from keras import ops

from keras_hub.src.utils.keras_utils import standardize_data_format


class Conv2DMultiHeadAttention(keras.layers.Layer):
    """A MultiHeadAttention layer utilizing `Conv2D` and `GroupNormalization`.

    Args:
        filters: int. The number of the filters for the convolutional layers.
        groups: int. The number of the groups for the group normalization
            layers. Defaults to `32`.
        data_format: `None` or str. If specified, either `"channels_last"` or
            `"channels_first"`. The ordering of the dimensions in the
            inputs. `"channels_last"` corresponds to inputs with shape
            `(batch_size, height, width, channels)`
            while `"channels_first"` corresponds to inputs with shape
            `(batch_size, channels, height, width)`. It defaults to the
            `image_data_format` value found in your Keras config file at
            `~/.keras/keras.json`. If you never set it, then it will be
            `"channels_last"`.
        **kwargs: other keyword arguments passed to `keras.layers.Layer`,
            including `name`, `dtype` etc.
    """

    def __init__(self, filters, groups=32, data_format=None, **kwargs):
        super().__init__(**kwargs)
        data_format = standardize_data_format(data_format)
        channel_axis = -1 if data_format == "channels_last" else 1
        self.filters = int(filters)
        self.groups = int(groups)
        self._inverse_sqrt_filters = 1.0 / math.sqrt(float(filters))
        self.data_format = data_format

        self.group_norm = keras.layers.GroupNormalization(
            groups=groups,
            axis=channel_axis,
            epsilon=1e-6,
            dtype=self.dtype_policy,
            name="group_norm",
        )
        self.query_conv2d = keras.layers.Conv2D(
            filters,
            1,
            1,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="query_conv2d",
        )
        self.key_conv2d = keras.layers.Conv2D(
            filters,
            1,
            1,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="key_conv2d",
        )
        self.value_conv2d = keras.layers.Conv2D(
            filters,
            1,
            1,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="value_conv2d",
        )
        self.softmax = keras.layers.Softmax(dtype="float32")
        self.output_conv2d = keras.layers.Conv2D(
            filters,
            1,
            1,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="output_conv2d",
        )

    def build(self, input_shape):
        self.group_norm.build(input_shape)
        self.query_conv2d.build(input_shape)
        self.key_conv2d.build(input_shape)
        self.value_conv2d.build(input_shape)
        self.output_conv2d.build(input_shape)

    def call(self, inputs, training=None):
        x = self.group_norm(inputs, training=training)
        query = self.query_conv2d(x, training=training)
        key = self.key_conv2d(x, training=training)
        value = self.value_conv2d(x, training=training)

        if self.data_format == "channels_first":
            query = ops.transpose(query, (0, 2, 3, 1))
            key = ops.transpose(key, (0, 2, 3, 1))
            value = ops.transpose(value, (0, 2, 3, 1))
        shape = ops.shape(inputs)
        b = shape[0]
        query = ops.reshape(query, (b, -1, self.filters))
        key = ops.reshape(key, (b, -1, self.filters))
        value = ops.reshape(value, (b, -1, self.filters))

        # Compute attention.
        query = ops.multiply(
            query, ops.cast(self._inverse_sqrt_filters, query.dtype)
        )
        # [B, H0 * W0, C], [B, H1 * W1, C] -> [B, H0 * W0, H1 * W1]
        attention_scores = ops.einsum("abc,adc->abd", query, key)
        attention_scores = ops.cast(
            self.softmax(attention_scores), self.compute_dtype
        )
        # [B, H2 * W2, C], [B, H0 * W0, H1 * W1] -> [B, H1 * W1, C]
        attention_output = ops.einsum("abc,adb->adc", value, attention_scores)
        x = ops.reshape(attention_output, shape)

        x = self.output_conv2d(x, training=training)
        if self.data_format == "channels_first":
            x = ops.transpose(x, (0, 3, 1, 2))
        x = ops.add(x, inputs)
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "filters": self.filters,
                "groups": self.groups,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        return input_shape


class ResNetBlock(keras.layers.Layer):
    """A ResNet block utilizing `GroupNormalization` and SiLU activation.

    Args:
        filters: The number of filters in the block.
        has_residual_projection: Whether to add a projection layer for the
            residual connection. Defaults to `False`.
        data_format: `None` or str. If specified, either `"channels_last"` or
            `"channels_first"`. The ordering of the dimensions in the
            inputs. `"channels_last"` corresponds to inputs with shape
            `(batch_size, height, width, channels)`
            while `"channels_first"` corresponds to inputs with shape
            `(batch_size, channels, height, width)`. It defaults to the
            `image_data_format` value found in your Keras config file at
            `~/.keras/keras.json`. If you never set it, then it will be
            `"channels_last"`.
        **kwargs: other keyword arguments passed to `keras.layers.Layer`,
            including `name`, `dtype` etc.
    """

    def __init__(
        self,
        filters,
        has_residual_projection=False,
        data_format=None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        data_format = standardize_data_format(data_format)
        channel_axis = -1 if data_format == "channels_last" else 1
        self.filters = int(filters)
        self.has_residual_projection = bool(has_residual_projection)

        # === Layers ===
        self.norm1 = keras.layers.GroupNormalization(
            groups=32,
            axis=channel_axis,
            epsilon=1e-6,
            dtype=self.dtype_policy,
            name="norm1",
        )
        self.act1 = keras.layers.Activation("silu", dtype=self.dtype_policy)
        self.conv1 = keras.layers.Conv2D(
            filters,
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="conv1",
        )
        self.norm2 = keras.layers.GroupNormalization(
            groups=32,
            axis=channel_axis,
            epsilon=1e-6,
            dtype=self.dtype_policy,
            name="norm2",
        )
        self.act2 = keras.layers.Activation("silu", dtype=self.dtype_policy)
        self.conv2 = keras.layers.Conv2D(
            filters,
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="conv2",
        )
        if self.has_residual_projection:
            self.residual_projection = keras.layers.Conv2D(
                filters,
                1,
                1,
                data_format=data_format,
                dtype=self.dtype_policy,
                name="residual_projection",
            )
        self.add = keras.layers.Add(dtype=self.dtype_policy)

    def build(self, input_shape):
        residual_shape = list(input_shape)
        self.norm1.build(input_shape)
        self.act1.build(input_shape)
        self.conv1.build(input_shape)
        input_shape = self.conv1.compute_output_shape(input_shape)
        self.norm2.build(input_shape)
        self.act2.build(input_shape)
        self.conv2.build(input_shape)
        input_shape = self.conv2.compute_output_shape(input_shape)
        if self.has_residual_projection:
            self.residual_projection.build(residual_shape)
        self.add.build([input_shape, input_shape])

    def call(self, inputs, training=None):
        x = inputs
        residual = x
        x = self.norm1(x, training=training)
        x = self.act1(x, training=training)
        x = self.conv1(x, training=training)
        x = self.norm2(x, training=training)
        x = self.act2(x, training=training)
        x = self.conv2(x, training=training)
        if self.has_residual_projection:
            residual = self.residual_projection(residual, training=training)
        x = self.add([residual, x])
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "filters": self.filters,
                "has_residual_projection": self.has_residual_projection,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        outputs_shape = list(input_shape)
        if self.has_residual_projection:
            outputs_shape = self.residual_projection.compute_output_shape(
                outputs_shape
            )
        return outputs_shape


class VAEEncoder(keras.layers.Layer):
    """The encoder layer of VAE.

    Args:
        stackwise_num_filters: list of ints. The number of filters for each
            stack.
        stackwise_num_blocks: list of ints. The number of blocks for each stack.
        output_channels: int. The number of channels in the output. Defaults to
            `32`.
        data_format: `None` or str. If specified, either `"channels_last"` or
            `"channels_first"`. The ordering of the dimensions in the
            inputs. `"channels_last"` corresponds to inputs with shape
            `(batch_size, height, width, channels)`
            while `"channels_first"` corresponds to inputs with shape
            `(batch_size, channels, height, width)`. It defaults to the
            `image_data_format` value found in your Keras config file at
            `~/.keras/keras.json`. If you never set it, then it will be
            `"channels_last"`.
        **kwargs: other keyword arguments passed to `keras.layers.Layer`,
            including `name`, `dtype` etc.
    """

    def __init__(
        self,
        stackwise_num_filters,
        stackwise_num_blocks,
        output_channels=32,
        data_format=None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        data_format = standardize_data_format(data_format)
        channel_axis = -1 if data_format == "channels_last" else 1
        self.stackwise_num_filters = stackwise_num_filters
        self.stackwise_num_blocks = stackwise_num_blocks
        self.output_channels = int(output_channels)
        self.data_format = data_format

        # === Layers ===
        self.input_projection = keras.layers.Conv2D(
            stackwise_num_filters[0],
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="input_projection",
        )

        # Blocks.
        input_filters = stackwise_num_filters[0]
        self.blocks = []
        self.downsamples = []
        for i, filters in enumerate(stackwise_num_filters):
            for j in range(stackwise_num_blocks[i]):
                self.blocks.append(
                    ResNetBlock(
                        filters,
                        has_residual_projection=input_filters != filters,
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"block_{i}_{j}",
                    )
                )
                input_filters = filters
            # No downsample in the last block.
            if i != len(stackwise_num_filters) - 1:
                self.downsamples.append(
                    keras.layers.ZeroPadding2D(
                        padding=((0, 1), (0, 1)),
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"downsample_{i}_pad",
                    )
                )
                self.downsamples.append(
                    keras.layers.Conv2D(
                        filters,
                        3,
                        2,
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"downsample_{i}_conv",
                    )
                )

        # Mid block.
        self.mid_block_0 = ResNetBlock(
            stackwise_num_filters[-1],
            has_residual_projection=False,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_block_0",
        )
        self.mid_attention = Conv2DMultiHeadAttention(
            stackwise_num_filters[-1],
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_attention",
        )
        self.mid_block_1 = ResNetBlock(
            stackwise_num_filters[-1],
            has_residual_projection=False,
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_block_1",
        )

        # Output layers.
        self.output_norm = keras.layers.GroupNormalization(
            groups=32,
            axis=channel_axis,
            epsilon=1e-6,
            dtype=self.dtype_policy,
            name="output_norm",
        )
        self.output_act = keras.layers.Activation(
            "swish", dtype=self.dtype_policy
        )
        self.output_projection = keras.layers.Conv2D(
            output_channels,
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="output_projection",
        )

    def build(self, input_shape):
        self.input_projection.build(input_shape)
        input_shape = self.input_projection.compute_output_shape(input_shape)
        blocks_idx = 0
        downsamples_idx = 0
        for i, _ in enumerate(self.stackwise_num_filters):
            for _ in range(self.stackwise_num_blocks[i]):
                self.blocks[blocks_idx].build(input_shape)
                input_shape = self.blocks[blocks_idx].compute_output_shape(
                    input_shape
                )
                blocks_idx += 1
            if i != len(self.stackwise_num_filters) - 1:
                self.downsamples[downsamples_idx].build(input_shape)
                input_shape = self.downsamples[
                    downsamples_idx
                ].compute_output_shape(input_shape)
                downsamples_idx += 1
                self.downsamples[downsamples_idx].build(input_shape)
                input_shape = self.downsamples[
                    downsamples_idx
                ].compute_output_shape(input_shape)
                downsamples_idx += 1
        self.mid_block_0.build(input_shape)
        input_shape = self.mid_block_0.compute_output_shape(input_shape)
        self.mid_attention.build(input_shape)
        input_shape = self.mid_attention.compute_output_shape(input_shape)
        self.mid_block_1.build(input_shape)
        input_shape = self.mid_block_1.compute_output_shape(input_shape)
        self.output_norm.build(input_shape)
        self.output_act.build(input_shape)
        self.output_projection.build(input_shape)

    def call(self, inputs, training=None):
        x = inputs
        x = self.input_projection(x, training=training)
        blocks_idx = 0
        upsamples_idx = 0
        for i, _ in enumerate(self.stackwise_num_filters):
            for _ in range(self.stackwise_num_blocks[i]):
                x = self.blocks[blocks_idx](x, training=training)
                blocks_idx += 1
            if i != len(self.stackwise_num_filters) - 1:
                x = self.downsamples[upsamples_idx](x, training=training)
                x = self.downsamples[upsamples_idx + 1](x, training=training)
                upsamples_idx += 2
        x = self.mid_block_0(x, training=training)
        x = self.mid_attention(x, training=training)
        x = self.mid_block_1(x, training=training)
        x = self.output_norm(x, training=training)
        x = self.output_act(x, training=training)
        x = self.output_projection(x, training=training)
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "stackwise_num_filters": self.stackwise_num_filters,
                "stackwise_num_blocks": self.stackwise_num_blocks,
                "output_channels": self.output_channels,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        if self.data_format == "channels_last":
            h_axis, w_axis, c_axis = 1, 2, 3
        else:
            c_axis, h_axis, w_axis = 1, 2, 3
        scale_factor = 2 ** (len(self.stackwise_num_filters) - 1)
        outputs_shape = list(input_shape)
        if (
            outputs_shape[h_axis] is not None
            and outputs_shape[w_axis] is not None
        ):
            outputs_shape[h_axis] = outputs_shape[h_axis] // scale_factor
            outputs_shape[w_axis] = outputs_shape[w_axis] // scale_factor
        outputs_shape[c_axis] = self.output_channels
        return outputs_shape


class VAEDecoder(keras.layers.Layer):
    """The decoder layer of VAE.

    Args:
        stackwise_num_filters: list of ints. The number of filters for each
            stack.
        stackwise_num_blocks: list of ints. The number of blocks for each stack.
        output_channels: int. The number of channels in the output. Defaults to
            `3`.
        data_format: `None` or str. If specified, either `"channels_last"` or
            `"channels_first"`. The ordering of the dimensions in the
            inputs. `"channels_last"` corresponds to inputs with shape
            `(batch_size, height, width, channels)`
            while `"channels_first"` corresponds to inputs with shape
            `(batch_size, channels, height, width)`. It defaults to the
            `image_data_format` value found in your Keras config file at
            `~/.keras/keras.json`. If you never set it, then it will be
            `"channels_last"`.
        **kwargs: other keyword arguments passed to `keras.layers.Layer`,
            including `name`, `dtype` etc.
    """

    def __init__(
        self,
        stackwise_num_filters,
        stackwise_num_blocks,
        output_channels=3,
        data_format=None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        data_format = standardize_data_format(data_format)
        channel_axis = -1 if data_format == "channels_last" else 1
        self.stackwise_num_filters = stackwise_num_filters
        self.stackwise_num_blocks = stackwise_num_blocks
        self.output_channels = int(output_channels)
        self.data_format = data_format

        # === Layers ===
        self.input_projection = keras.layers.Conv2D(
            stackwise_num_filters[0],
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="input_projection",
        )

        # Mid block.
        self.mid_block_0 = ResNetBlock(
            stackwise_num_filters[0],
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_block_0",
        )
        self.mid_attention = Conv2DMultiHeadAttention(
            stackwise_num_filters[0],
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_attention",
        )
        self.mid_block_1 = ResNetBlock(
            stackwise_num_filters[0],
            data_format=data_format,
            dtype=self.dtype_policy,
            name="mid_block_1",
        )

        # Blocks.
        input_filters = stackwise_num_filters[0]
        self.blocks = []
        self.upsamples = []
        for i, filters in enumerate(stackwise_num_filters):
            for j in range(stackwise_num_blocks[i]):
                self.blocks.append(
                    ResNetBlock(
                        filters,
                        has_residual_projection=input_filters != filters,
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"block_{i}_{j}",
                    )
                )
                input_filters = filters
            # No upsample in the last block.
            if i != len(stackwise_num_filters) - 1:
                self.upsamples.append(
                    keras.layers.UpSampling2D(
                        2,
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"upsample_{i}",
                    )
                )
                self.upsamples.append(
                    keras.layers.Conv2D(
                        filters,
                        3,
                        1,
                        padding="same",
                        data_format=data_format,
                        dtype=self.dtype_policy,
                        name=f"upsample_{i}_conv",
                    )
                )

        # Output layers.
        self.output_norm = keras.layers.GroupNormalization(
            groups=32,
            axis=channel_axis,
            epsilon=1e-6,
            dtype=self.dtype_policy,
            name="output_norm",
        )
        self.output_act = keras.layers.Activation(
            "swish", dtype=self.dtype_policy
        )
        self.output_projection = keras.layers.Conv2D(
            output_channels,
            3,
            1,
            padding="same",
            data_format=data_format,
            dtype=self.dtype_policy,
            name="output_projection",
        )

    def build(self, input_shape):
        self.input_projection.build(input_shape)
        input_shape = self.input_projection.compute_output_shape(input_shape)
        self.mid_block_0.build(input_shape)
        input_shape = self.mid_block_0.compute_output_shape(input_shape)
        self.mid_attention.build(input_shape)
        input_shape = self.mid_attention.compute_output_shape(input_shape)
        self.mid_block_1.build(input_shape)
        input_shape = self.mid_block_1.compute_output_shape(input_shape)
        blocks_idx = 0
        upsamples_idx = 0
        for i, _ in enumerate(self.stackwise_num_filters):
            for _ in range(self.stackwise_num_blocks[i]):
                self.blocks[blocks_idx].build(input_shape)
                input_shape = self.blocks[blocks_idx].compute_output_shape(
                    input_shape
                )
                blocks_idx += 1
            if i != len(self.stackwise_num_filters) - 1:
                self.upsamples[upsamples_idx].build(input_shape)
                input_shape = self.upsamples[
                    upsamples_idx
                ].compute_output_shape(input_shape)
                self.upsamples[upsamples_idx + 1].build(input_shape)
                input_shape = self.upsamples[
                    upsamples_idx + 1
                ].compute_output_shape(input_shape)
                upsamples_idx += 2
        self.output_norm.build(input_shape)
        self.output_act.build(input_shape)
        self.output_projection.build(input_shape)

    def call(self, inputs, training=None):
        x = inputs
        x = self.input_projection(x, training=training)
        x = self.mid_block_0(x, training=training)
        x = self.mid_attention(x, training=training)
        x = self.mid_block_1(x, training=training)
        blocks_idx = 0
        upsamples_idx = 0
        for i, _ in enumerate(self.stackwise_num_filters):
            for _ in range(self.stackwise_num_blocks[i]):
                x = self.blocks[blocks_idx](x, training=training)
                blocks_idx += 1
            if i != len(self.stackwise_num_filters) - 1:
                x = self.upsamples[upsamples_idx](x, training=training)
                x = self.upsamples[upsamples_idx + 1](x, training=training)
                upsamples_idx += 2
        x = self.output_norm(x, training=training)
        x = self.output_act(x, training=training)
        x = self.output_projection(x, training=training)
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "stackwise_num_filters": self.stackwise_num_filters,
                "stackwise_num_blocks": self.stackwise_num_blocks,
                "output_channels": self.output_channels,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        if self.data_format == "channels_last":
            h_axis, w_axis, c_axis = 1, 2, 3
        else:
            c_axis, h_axis, w_axis = 1, 2, 3
        scale_factor = 2 ** (len(self.stackwise_num_filters) - 1)
        outputs_shape = list(input_shape)
        if (
            outputs_shape[h_axis] is not None
            and outputs_shape[w_axis] is not None
        ):
            outputs_shape[h_axis] = outputs_shape[h_axis] * scale_factor
            outputs_shape[w_axis] = outputs_shape[w_axis] * scale_factor
        outputs_shape[c_axis] = self.output_channels
        return outputs_shape


class DiagonalGaussianDistributionSampler(keras.layers.Layer):
    """A sampler for a diagonal Gaussian distribution.

    This layer samples latent variables from a diagonal Gaussian distribution.

    Args:
        method: str. The method used to sample from the distribution. Available
            methods are `"sample"` and `"mode"`. `"sample"` draws from the
            distribution using both the mean and log variance. `"mode"` draws
            from the distribution using the mean only.
        axis: int. The axis along which to split the mean and log variance.
            Defaults to `-1`.
        seed: optional int. Used as a random seed.
        **kwargs: other keyword arguments passed to `keras.layers.Layer`,
            including `name`, `dtype` etc.
    """

    def __init__(self, method, axis=-1, seed=None, **kwargs):
        super().__init__(**kwargs)
        # TODO: Support `kl` and `nll` modes.
        valid_methods = ("sample", "mode")
        if method not in valid_methods:
            raise ValueError(
                f"Invalid method {method}. Valid methods are "
                f"{list(valid_methods)}."
            )
        self.method = method
        self.axis = axis
        self.seed = seed
        self.seed_generator = keras.random.SeedGenerator(seed)

    def call(self, inputs):
        x = inputs
        if self.method == "sample":
            x_mean, x_logvar = ops.split(x, 2, axis=self.axis)
            x_logvar = ops.clip(x_logvar, -30.0, 20.0)
            x_std = ops.exp(ops.multiply(0.5, x_logvar))
            sample = keras.random.normal(
                ops.shape(x_mean), dtype=x_mean.dtype, seed=self.seed_generator
            )
            x = ops.add(x_mean, ops.multiply(x_std, sample))
        else:
            x, _ = ops.split(x, 2, axis=self.axis)
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "axis": self.axis,
                "seed": self.seed,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        output_shape = list(input_shape)
        output_shape[self.axis] = output_shape[self.axis] // 2
        return output_shape