keras-hub 0.21.1__py3-none-any.whl → 0.22.0.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94)
  1. keras_hub/layers/__init__.py +9 -0
  2. keras_hub/models/__init__.py +47 -0
  3. keras_hub/src/layers/modeling/transformer_encoder.py +6 -3
  4. keras_hub/src/layers/preprocessing/multi_segment_packer.py +17 -3
  5. keras_hub/src/layers/preprocessing/start_end_packer.py +24 -6
  6. keras_hub/src/models/backbone.py +13 -10
  7. keras_hub/src/models/clip/clip_backbone.py +3 -102
  8. keras_hub/src/models/clip/clip_layers.py +295 -0
  9. keras_hub/src/models/clip/clip_preprocessor.py +57 -48
  10. keras_hub/src/models/clip/clip_text_encoder.py +2 -2
  11. keras_hub/src/models/clip/clip_vision_encoder.py +3 -3
  12. keras_hub/src/models/deit/__init__.py +5 -0
  13. keras_hub/src/models/deit/deit_backbone.py +154 -0
  14. keras_hub/src/models/deit/deit_image_classifier.py +171 -0
  15. keras_hub/src/models/deit/deit_image_classifier_preprocessor.py +12 -0
  16. keras_hub/src/models/deit/deit_image_converter.py +8 -0
  17. keras_hub/src/models/deit/deit_layers.py +519 -0
  18. keras_hub/src/models/deit/deit_presets.py +49 -0
  19. keras_hub/src/models/dinov2/__init__.py +5 -0
  20. keras_hub/src/models/dinov2/dinov2_backbone.py +228 -0
  21. keras_hub/src/models/dinov2/dinov2_image_converter.py +8 -0
  22. keras_hub/src/models/dinov2/dinov2_layers.py +886 -0
  23. keras_hub/src/models/dinov2/dinov2_presets.py +89 -0
  24. keras_hub/src/models/esm/__init__.py +5 -0
  25. keras_hub/src/models/esm/esm_attention.py +95 -0
  26. keras_hub/src/models/esm/esm_backbone.py +229 -0
  27. keras_hub/src/models/esm/esm_classifier.py +184 -0
  28. keras_hub/src/models/esm/esm_classifier_preprocessor.py +135 -0
  29. keras_hub/src/models/esm/esm_encoder.py +134 -0
  30. keras_hub/src/models/esm/esm_masked_plm.py +117 -0
  31. keras_hub/src/models/esm/esm_masked_plm_preprocessor.py +143 -0
  32. keras_hub/src/models/esm/esm_presets.py +53 -0
  33. keras_hub/src/models/esm/esm_tokenizer.py +82 -0
  34. keras_hub/src/models/flux/flux_text_to_image_preprocessor.py +6 -2
  35. keras_hub/src/models/gemma/gemma_attention.py +1 -1
  36. keras_hub/src/models/gemma3/gemma3_backbone.py +2 -2
  37. keras_hub/src/models/gemma3/gemma3_interleave_embeddings.py +1 -1
  38. keras_hub/src/models/hgnetv2/__init__.py +5 -0
  39. keras_hub/src/models/hgnetv2/hgnetv2_backbone.py +193 -0
  40. keras_hub/src/models/hgnetv2/hgnetv2_encoder.py +148 -0
  41. keras_hub/src/models/hgnetv2/hgnetv2_image_classifier.py +216 -0
  42. keras_hub/src/models/hgnetv2/hgnetv2_image_classifier_preprocessor.py +14 -0
  43. keras_hub/src/models/hgnetv2/hgnetv2_image_converter.py +8 -0
  44. keras_hub/src/models/hgnetv2/hgnetv2_layers.py +918 -0
  45. keras_hub/src/models/hgnetv2/hgnetv2_presets.py +58 -0
  46. keras_hub/src/models/llama3/llama3_presets.py +3 -3
  47. keras_hub/src/models/mistral/mistral_presets.py +17 -1
  48. keras_hub/src/models/mixtral/mixtral_presets.py +2 -2
  49. keras_hub/src/models/mobilenet/mobilenet_presets.py +4 -4
  50. keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +2 -2
  51. keras_hub/src/models/pali_gemma/pali_gemma_causal_lm.py +2 -2
  52. keras_hub/src/models/pali_gemma/pali_gemma_presets.py +17 -17
  53. keras_hub/src/models/qwen3/__init__.py +5 -0
  54. keras_hub/src/models/qwen3/qwen3_attention.py +369 -0
  55. keras_hub/src/models/qwen3/qwen3_backbone.py +191 -0
  56. keras_hub/src/models/qwen3/qwen3_causal_lm.py +390 -0
  57. keras_hub/src/models/qwen3/qwen3_causal_lm_preprocessor.py +10 -0
  58. keras_hub/src/models/qwen3/qwen3_decoder.py +309 -0
  59. keras_hub/src/models/qwen3/qwen3_layernorm.py +38 -0
  60. keras_hub/src/models/qwen3/qwen3_presets.py +73 -0
  61. keras_hub/src/models/qwen3/qwen3_tokenizer.py +48 -0
  62. keras_hub/src/models/qwen_moe/qwen_moe_attention.py +1 -0
  63. keras_hub/src/models/qwen_moe/qwen_moe_presets.py +2 -2
  64. keras_hub/src/models/roformer_v2/roformer_v2_attention.py +0 -2
  65. keras_hub/src/models/stable_diffusion_3/flow_match_euler_discrete_scheduler.py +16 -7
  66. keras_hub/src/models/stable_diffusion_3/mmdit.py +61 -4
  67. keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +31 -32
  68. keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_image_to_image.py +1 -0
  69. keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_inpaint.py +1 -0
  70. keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +1 -0
  71. keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image_preprocessor.py +6 -2
  72. keras_hub/src/models/vit/vit_backbone.py +31 -11
  73. keras_hub/src/models/vit/vit_image_converter.py +0 -70
  74. keras_hub/src/models/vit/vit_layers.py +33 -18
  75. keras_hub/src/models/vit/vit_presets.py +11 -11
  76. keras_hub/src/utils/keras_utils.py +17 -0
  77. keras_hub/src/utils/preset_utils.py +19 -4
  78. keras_hub/src/utils/tensor_utils.py +14 -0
  79. keras_hub/src/utils/transformers/convert_deit.py +155 -0
  80. keras_hub/src/utils/transformers/convert_dinov2.py +180 -0
  81. keras_hub/src/utils/transformers/convert_esm.py +159 -0
  82. keras_hub/src/utils/transformers/convert_llama3.py +6 -0
  83. keras_hub/src/utils/transformers/convert_qwen3.py +145 -0
  84. keras_hub/src/utils/transformers/export/gemma.py +89 -0
  85. keras_hub/src/utils/transformers/export/hf_exporter.py +98 -0
  86. keras_hub/src/utils/transformers/preset_loader.py +14 -2
  87. keras_hub/src/version.py +1 -1
  88. keras_hub/tokenizers/__init__.py +1 -0
  89. {keras_hub-0.21.1.dist-info → keras_hub-0.22.0.dev0.dist-info}/METADATA +4 -4
  90. {keras_hub-0.21.1.dist-info → keras_hub-0.22.0.dev0.dist-info}/RECORD +92 -48
  91. keras_hub/src/models/clip/clip_encoder_block.py +0 -111
  92. keras_hub/src/models/clip/clip_vision_embedding.py +0 -101
  93. {keras_hub-0.21.1.dist-info → keras_hub-0.22.0.dev0.dist-info}/WHEEL +0 -0
  94. {keras_hub-0.21.1.dist-info → keras_hub-0.22.0.dev0.dist-info}/top_level.txt +0 -0
@@ -1,111 +0,0 @@
1
- from keras import dtype_policies
2
- from keras import layers
3
- from keras import ops
4
-
5
-
6
def quick_gelu(x):
    """Apply the "quick GELU" approximation used by CLIP.

    Computes `x * sigmoid(1.702 * x)`, a cheap approximation of GELU.
    """
    gate = ops.sigmoid(1.702 * x)
    return x * gate
8
-
9
-
10
- # TODO: Deprecate this in favor of `keras.layers.MultiHeadAttention` once the
11
- # dtype compatibility issue is resolved.
12
class CLIPMultiHeadAttention(layers.MultiHeadAttention):
    """`MultiHeadAttention` that restores the value dtype after softmax.

    The parent class may run the masked softmax in a different (higher
    precision) dtype; this subclass casts the resulting attention
    probabilities back to the compute dtype of the value projection so the
    subsequent matmul sees a consistent dtype.
    """

    def _masked_softmax(self, attention_scores, attention_mask=None):
        probs = super()._masked_softmax(attention_scores, attention_mask)
        target_dtype = self._value_dense.compute_dtype
        return ops.cast(probs, target_dtype)
18
-
19
-
20
class CLIPEncoderBlock(layers.Layer):
    """A single CLIP transformer encoder block.

    Pre-layer-norm architecture: layer norm -> multi-head self-attention ->
    residual add, then layer norm -> dense -> activation -> dense ->
    residual add.

    Args:
        hidden_dim: int. Width of the residual stream; must be divisible by
            `num_heads`.
        num_heads: int. Number of attention heads.
        intermediate_dim: int. Width of the MLP's hidden layer.
        intermediate_activation: str or callable. Activation for the MLP.
            The string `"quick_gelu"` selects the CLIP-specific
            `x * sigmoid(1.702 * x)` approximation.
        use_causal_mask: bool. Whether self-attention applies a causal mask
            (`True` for the text encoder).
    """

    def __init__(
        self,
        hidden_dim,
        num_heads,
        intermediate_dim,
        intermediate_activation="quick_gelu",
        use_causal_mask=True,
        **kwargs,
    ):
        super().__init__(**kwargs)
        if hidden_dim % num_heads != 0:
            raise ValueError(
                "`hidden_dim` must be divisible by `num_heads`. "
                f"Received: hidden_dim={hidden_dim}, num_heads={num_heads}"
            )
        self.hidden_dim = hidden_dim
        self.num_heads = num_heads
        self.intermediate_dim = intermediate_dim
        # Keep the raw (possibly string) value for `get_config()`; the
        # resolved callable below is only used to build the sublayer.
        self.intermediate_activation = intermediate_activation
        self.use_causal_mask = use_causal_mask

        if intermediate_activation == "quick_gelu":
            intermediate_activation = quick_gelu

        self.layer_norm_1 = layers.LayerNormalization(
            epsilon=1e-5, dtype=self.dtype_policy, name="layer_norm_1"
        )
        self.attention = CLIPMultiHeadAttention(
            num_heads,
            hidden_dim // num_heads,
            dtype=self.dtype_policy,
            name="attention",
        )
        self.layer_norm_2 = layers.LayerNormalization(
            epsilon=1e-5, dtype=self.dtype_policy, name="layer_norm_2"
        )
        self.dense_1 = layers.Dense(
            self.intermediate_dim, dtype=self.dtype_policy, name="dense_1"
        )
        self.activation = layers.Activation(
            intermediate_activation, dtype=self.dtype_policy, name="activation"
        )
        self.dense_2 = layers.Dense(
            self.hidden_dim, dtype=self.dtype_policy, name="dense_2"
        )

    def build(self, input_shape):
        """Build all sublayers and pin the attention softmax to float32."""
        self.layer_norm_1.build(input_shape)
        self.attention.build(input_shape, input_shape, input_shape)
        # Before Keras 3.2, there was no setter for `dtype_policy`. Directly
        # assign a `DTypePolicy` instead.
        self.attention._softmax.dtype_policy = dtype_policies.DTypePolicy(
            "float32"
        )
        self.layer_norm_2.build(input_shape)
        self.dense_1.build(input_shape)
        # `dense_2` consumes the MLP hidden width, not the block input width.
        input_shape = self.dense_1.compute_output_shape(input_shape)
        self.dense_2.build(input_shape)

    def compute_output_shape(self, inputs_shape):
        # Same shape as the input except the channel axis is `hidden_dim`.
        outputs_shape = list(inputs_shape)
        outputs_shape[-1] = self.hidden_dim
        return outputs_shape

    def call(self, x, training=None):
        # Attention sub-block with residual connection.
        residual = x
        x = self.layer_norm_1(x)
        x = self.attention(
            x, x, x, training=training, use_causal_mask=self.use_causal_mask
        )
        x = ops.add(residual, x)

        # MLP sub-block with residual connection.
        residual = x
        x = self.dense_1(self.layer_norm_2(residual))
        x = self.activation(x)
        x = self.dense_2(x)
        x = ops.add(residual, x)
        return x

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "hidden_dim": self.hidden_dim,
                "num_heads": self.num_heads,
                "intermediate_dim": self.intermediate_dim,
                "intermediate_activation": self.intermediate_activation,
                "use_causal_mask": self.use_causal_mask,
            }
        )
        return config
@@ -1,101 +0,0 @@
1
- from keras import layers
2
- from keras import ops
3
-
4
- from keras_hub.src.utils.keras_utils import standardize_data_format
5
-
6
-
7
class CLIPVisionEmbedding(layers.Layer):
    """Patch + class + position embedding for the CLIP vision encoder.

    Splits an image into non-overlapping `patch_size` patches via a strided
    convolution, prepends a learned class token, and adds learned position
    embeddings.

    Args:
        hidden_dim: int. Embedding width of each patch token.
        patch_size: int. Side length of each square patch.
        image_size: int. Side length of the (square) input image; only used
            to size the position-embedding table.
        data_format: str. `"channels_last"` or `"channels_first"`; `None`
            resolves to the Keras global default.
        dtype: Dtype or dtype policy forwarded to sublayers.
    """

    def __init__(
        self,
        hidden_dim,
        patch_size,
        image_size,
        data_format=None,
        dtype=None,
        **kwargs,
    ):
        super().__init__(dtype=dtype, **kwargs)
        self.hidden_dim = int(hidden_dim)
        self.patch_size = int(patch_size)
        self.image_size = int(image_size)
        data_format = standardize_data_format(data_format)
        self.data_format = data_format
        num_patches = (image_size // patch_size) ** 2
        # +1 for the prepended class token.
        self.num_positions = num_patches + 1

        self.patch_embedding = layers.Conv2D(
            hidden_dim,
            kernel_size=patch_size,
            strides=patch_size,
            data_format=data_format,
            use_bias=False,
            dtype=dtype,
            name="patch_embedding",
        )
        self.position_embedding = layers.Embedding(
            num_patches + 1, hidden_dim, dtype=dtype, name="position_embedding"
        )

    def build(self, input_shape):
        """Create the class token and position-id weights, build sublayers."""
        self.class_embedding = self.add_weight(
            shape=(self.hidden_dim,),
            initializer="random_normal",
            dtype=self.variable_dtype,
            name="class_embedding",
        )
        self.position_ids = self.add_weight(
            shape=(1, self.num_positions),
            initializer="zeros",
            # Let the backend determine the int dtype. For example, tf
            # requires int64 for correct device placement, whereas jax and torch
            # don't.
            dtype=int,
            trainable=False,
            name="position_ids",
        )
        self.patch_embedding.build(input_shape)
        self.position_embedding.build(self.position_ids.shape)

    def call(self, inputs, training=None):
        x = inputs
        batch_size = ops.shape(x)[0]
        patch_embeddings = self.patch_embedding(x, training=training)
        # Flatten the spatial grid to a token axis: (batch, tokens, hidden).
        if self.data_format == "channels_last":
            patch_embeddings = ops.reshape(
                patch_embeddings, (batch_size, -1, self.hidden_dim)
            )
        else:
            # channels_first: flatten then move channels to the last axis.
            patch_embeddings = ops.reshape(
                patch_embeddings, (batch_size, self.hidden_dim, -1)
            )
            patch_embeddings = ops.transpose(patch_embeddings, (0, 2, 1))
        # Broadcast the single class token across the batch and prepend it.
        class_embeddings = ops.expand_dims(self.class_embedding, axis=(0, 1))
        class_embeddings = ops.tile(class_embeddings, (batch_size, 1, 1))
        position_embeddings = self.position_embedding(self.position_ids)
        embeddings = ops.concatenate(
            [class_embeddings, patch_embeddings], axis=1
        )
        return ops.add(embeddings, position_embeddings)

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "hidden_dim": self.hidden_dim,
                "patch_size": self.patch_size,
                "image_size": self.image_size,
            }
        )
        return config

    def compute_output_shape(self, input_shape):
        # Token count is statically known only when the spatial dims are.
        output_shape = [input_shape[0], None, self.hidden_dim]
        if self.data_format == "channels_last":
            if input_shape[1] is not None and input_shape[2] is not None:
                patch_num = input_shape[1] // self.patch_size
                output_shape[1] = patch_num**2 + 1
        else:
            if input_shape[2] is not None and input_shape[3] is not None:
                patch_num = input_shape[2] // self.patch_size
                output_shape[1] = patch_num**2 + 1
        return output_shape