PyPI - keras-hub-nightly - Versions diffs - 0.16.1.dev202409250340__py3-none-any.whl → 0.16.1.dev202409270338__py3-none-any.whl - Mend

keras-hub-nightly 0.16.1.dev202409250340__py3-none-any.whl → 0.16.1.dev202409270338__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (357)

keras_hub/__init__.py +0 -13
keras_hub/api/__init__.py +0 -13
keras_hub/api/bounding_box/__init__.py +0 -13
keras_hub/api/layers/__init__.py +3 -13
keras_hub/api/metrics/__init__.py +0 -13
keras_hub/api/models/__init__.py +16 -13
keras_hub/api/samplers/__init__.py +0 -13
keras_hub/api/tokenizers/__init__.py +1 -13
keras_hub/api/utils/__init__.py +0 -13
keras_hub/src/__init__.py +0 -13
keras_hub/src/api_export.py +0 -14
keras_hub/src/bounding_box/__init__.py +0 -13
keras_hub/src/bounding_box/converters.py +0 -13
keras_hub/src/bounding_box/formats.py +0 -13
keras_hub/src/bounding_box/iou.py +1 -13
keras_hub/src/bounding_box/to_dense.py +0 -14
keras_hub/src/bounding_box/to_ragged.py +0 -13
keras_hub/src/bounding_box/utils.py +0 -13
keras_hub/src/bounding_box/validate_format.py +0 -14
keras_hub/src/layers/__init__.py +0 -13
keras_hub/src/layers/modeling/__init__.py +0 -13
keras_hub/src/layers/modeling/alibi_bias.py +0 -13
keras_hub/src/layers/modeling/cached_multi_head_attention.py +0 -14
keras_hub/src/layers/modeling/f_net_encoder.py +0 -14
keras_hub/src/layers/modeling/masked_lm_head.py +0 -14
keras_hub/src/layers/modeling/position_embedding.py +0 -14
keras_hub/src/layers/modeling/reversible_embedding.py +0 -14
keras_hub/src/layers/modeling/rotary_embedding.py +0 -14
keras_hub/src/layers/modeling/sine_position_encoding.py +0 -14
keras_hub/src/layers/modeling/token_and_position_embedding.py +0 -14
keras_hub/src/layers/modeling/transformer_decoder.py +0 -14
keras_hub/src/layers/modeling/transformer_encoder.py +0 -14
keras_hub/src/layers/modeling/transformer_layer_utils.py +0 -14
keras_hub/src/layers/preprocessing/__init__.py +0 -13
keras_hub/src/layers/preprocessing/audio_converter.py +0 -13
keras_hub/src/layers/preprocessing/image_converter.py +0 -13
keras_hub/src/layers/preprocessing/masked_lm_mask_generator.py +0 -15
keras_hub/src/layers/preprocessing/multi_segment_packer.py +0 -14
keras_hub/src/layers/preprocessing/preprocessing_layer.py +0 -14
keras_hub/src/layers/preprocessing/random_deletion.py +0 -14
keras_hub/src/layers/preprocessing/random_swap.py +0 -14
keras_hub/src/layers/preprocessing/resizing_image_converter.py +0 -13
keras_hub/src/layers/preprocessing/start_end_packer.py +0 -15
keras_hub/src/metrics/__init__.py +0 -13
keras_hub/src/metrics/bleu.py +0 -14
keras_hub/src/metrics/edit_distance.py +0 -14
keras_hub/src/metrics/perplexity.py +0 -14
keras_hub/src/metrics/rouge_base.py +0 -14
keras_hub/src/metrics/rouge_l.py +0 -14
keras_hub/src/metrics/rouge_n.py +0 -14
keras_hub/src/models/__init__.py +0 -13
keras_hub/src/models/albert/__init__.py +0 -14
keras_hub/src/models/albert/albert_backbone.py +0 -14
keras_hub/src/models/albert/albert_masked_lm.py +0 -14
keras_hub/src/models/albert/albert_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/albert/albert_presets.py +0 -14
keras_hub/src/models/albert/albert_text_classifier.py +0 -14
keras_hub/src/models/albert/albert_text_classifier_preprocessor.py +0 -14
keras_hub/src/models/albert/albert_tokenizer.py +0 -14
keras_hub/src/models/backbone.py +0 -14
keras_hub/src/models/bart/__init__.py +0 -14
keras_hub/src/models/bart/bart_backbone.py +0 -14
keras_hub/src/models/bart/bart_presets.py +0 -13
keras_hub/src/models/bart/bart_seq_2_seq_lm.py +0 -15
keras_hub/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +0 -15
keras_hub/src/models/bart/bart_tokenizer.py +0 -15
keras_hub/src/models/bert/__init__.py +0 -14
keras_hub/src/models/bert/bert_backbone.py +0 -14
keras_hub/src/models/bert/bert_masked_lm.py +0 -14
keras_hub/src/models/bert/bert_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/bert/bert_presets.py +0 -13
keras_hub/src/models/bert/bert_text_classifier.py +0 -14
keras_hub/src/models/bert/bert_text_classifier_preprocessor.py +0 -14
keras_hub/src/models/bert/bert_tokenizer.py +0 -14
keras_hub/src/models/bloom/__init__.py +0 -14
keras_hub/src/models/bloom/bloom_attention.py +0 -13
keras_hub/src/models/bloom/bloom_backbone.py +0 -14
keras_hub/src/models/bloom/bloom_causal_lm.py +0 -15
keras_hub/src/models/bloom/bloom_causal_lm_preprocessor.py +0 -15
keras_hub/src/models/bloom/bloom_decoder.py +0 -13
keras_hub/src/models/bloom/bloom_presets.py +0 -13
keras_hub/src/models/bloom/bloom_tokenizer.py +0 -15
keras_hub/src/models/causal_lm.py +0 -14
keras_hub/src/models/causal_lm_preprocessor.py +0 -13
keras_hub/src/models/clip/__init__.py +0 -0
keras_hub/src/models/{stable_diffusion_v3 → clip}/clip_encoder_block.py +8 -15
keras_hub/src/models/clip/clip_preprocessor.py +134 -0
keras_hub/src/models/clip/clip_text_encoder.py +139 -0
keras_hub/src/models/{stable_diffusion_v3 → clip}/clip_tokenizer.py +65 -41
keras_hub/src/models/csp_darknet/__init__.py +0 -13
keras_hub/src/models/csp_darknet/csp_darknet_backbone.py +0 -13
keras_hub/src/models/csp_darknet/csp_darknet_image_classifier.py +0 -13
keras_hub/src/models/deberta_v3/__init__.py +0 -14
keras_hub/src/models/deberta_v3/deberta_v3_backbone.py +0 -15
keras_hub/src/models/deberta_v3/deberta_v3_masked_lm.py +0 -15
keras_hub/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/deberta_v3/deberta_v3_presets.py +0 -13
keras_hub/src/models/deberta_v3/deberta_v3_text_classifier.py +0 -15
keras_hub/src/models/deberta_v3/deberta_v3_text_classifier_preprocessor.py +0 -14
keras_hub/src/models/deberta_v3/deberta_v3_tokenizer.py +0 -15
keras_hub/src/models/deberta_v3/disentangled_attention_encoder.py +0 -14
keras_hub/src/models/deberta_v3/disentangled_self_attention.py +0 -14
keras_hub/src/models/deberta_v3/relative_embedding.py +0 -14
keras_hub/src/models/densenet/__init__.py +5 -13
keras_hub/src/models/densenet/densenet_backbone.py +11 -21
keras_hub/src/models/densenet/densenet_image_classifier.py +27 -17
keras_hub/src/models/densenet/densenet_image_classifier_preprocessor.py +27 -0
keras_hub/src/models/{stable_diffusion_v3/__init__.py → densenet/densenet_image_converter.py} +10 -0
keras_hub/src/models/densenet/densenet_presets.py +56 -0
keras_hub/src/models/distil_bert/__init__.py +0 -14
keras_hub/src/models/distil_bert/distil_bert_backbone.py +0 -15
keras_hub/src/models/distil_bert/distil_bert_masked_lm.py +0 -15
keras_hub/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/distil_bert/distil_bert_presets.py +0 -13
keras_hub/src/models/distil_bert/distil_bert_text_classifier.py +0 -15
keras_hub/src/models/distil_bert/distil_bert_text_classifier_preprocessor.py +0 -15
keras_hub/src/models/distil_bert/distil_bert_tokenizer.py +0 -15
keras_hub/src/models/efficientnet/__init__.py +0 -13
keras_hub/src/models/efficientnet/efficientnet_backbone.py +0 -13
keras_hub/src/models/efficientnet/fusedmbconv.py +0 -14
keras_hub/src/models/efficientnet/mbconv.py +0 -14
keras_hub/src/models/electra/__init__.py +0 -14
keras_hub/src/models/electra/electra_backbone.py +0 -14
keras_hub/src/models/electra/electra_presets.py +0 -13
keras_hub/src/models/electra/electra_tokenizer.py +0 -14
keras_hub/src/models/f_net/__init__.py +0 -14
keras_hub/src/models/f_net/f_net_backbone.py +0 -15
keras_hub/src/models/f_net/f_net_masked_lm.py +0 -15
keras_hub/src/models/f_net/f_net_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/f_net/f_net_presets.py +0 -13
keras_hub/src/models/f_net/f_net_text_classifier.py +0 -15
keras_hub/src/models/f_net/f_net_text_classifier_preprocessor.py +0 -15
keras_hub/src/models/f_net/f_net_tokenizer.py +0 -15
keras_hub/src/models/falcon/__init__.py +0 -14
keras_hub/src/models/falcon/falcon_attention.py +0 -13
keras_hub/src/models/falcon/falcon_backbone.py +0 -13
keras_hub/src/models/falcon/falcon_causal_lm.py +0 -14
keras_hub/src/models/falcon/falcon_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/falcon/falcon_presets.py +0 -13
keras_hub/src/models/falcon/falcon_tokenizer.py +0 -15
keras_hub/src/models/falcon/falcon_transformer_decoder.py +0 -13
keras_hub/src/models/feature_pyramid_backbone.py +0 -13
keras_hub/src/models/gemma/__init__.py +0 -14
keras_hub/src/models/gemma/gemma_attention.py +0 -13
keras_hub/src/models/gemma/gemma_backbone.py +0 -15
keras_hub/src/models/gemma/gemma_causal_lm.py +0 -15
keras_hub/src/models/gemma/gemma_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/gemma/gemma_decoder_block.py +0 -13
keras_hub/src/models/gemma/gemma_presets.py +0 -13
keras_hub/src/models/gemma/gemma_tokenizer.py +0 -14
keras_hub/src/models/gemma/rms_normalization.py +0 -14
keras_hub/src/models/gpt2/__init__.py +0 -14
keras_hub/src/models/gpt2/gpt2_backbone.py +0 -15
keras_hub/src/models/gpt2/gpt2_causal_lm.py +0 -15
keras_hub/src/models/gpt2/gpt2_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/gpt2/gpt2_preprocessor.py +0 -15
keras_hub/src/models/gpt2/gpt2_presets.py +0 -13
keras_hub/src/models/gpt2/gpt2_tokenizer.py +0 -15
keras_hub/src/models/gpt_neo_x/__init__.py +0 -13
keras_hub/src/models/gpt_neo_x/gpt_neo_x_attention.py +0 -14
keras_hub/src/models/gpt_neo_x/gpt_neo_x_backbone.py +0 -14
keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm.py +0 -14
keras_hub/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/gpt_neo_x/gpt_neo_x_decoder.py +0 -14
keras_hub/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +0 -14
keras_hub/src/models/image_classifier.py +0 -13
keras_hub/src/models/image_classifier_preprocessor.py +0 -13
keras_hub/src/models/image_segmenter.py +0 -13
keras_hub/src/models/llama/__init__.py +0 -14
keras_hub/src/models/llama/llama_attention.py +0 -13
keras_hub/src/models/llama/llama_backbone.py +0 -13
keras_hub/src/models/llama/llama_causal_lm.py +0 -13
keras_hub/src/models/llama/llama_causal_lm_preprocessor.py +0 -15
keras_hub/src/models/llama/llama_decoder.py +0 -13
keras_hub/src/models/llama/llama_layernorm.py +0 -13
keras_hub/src/models/llama/llama_presets.py +0 -13
keras_hub/src/models/llama/llama_tokenizer.py +0 -14
keras_hub/src/models/llama3/__init__.py +0 -14
keras_hub/src/models/llama3/llama3_backbone.py +0 -14
keras_hub/src/models/llama3/llama3_causal_lm.py +0 -13
keras_hub/src/models/llama3/llama3_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/llama3/llama3_presets.py +0 -13
keras_hub/src/models/llama3/llama3_tokenizer.py +0 -14
keras_hub/src/models/masked_lm.py +0 -13
keras_hub/src/models/masked_lm_preprocessor.py +0 -13
keras_hub/src/models/mistral/__init__.py +0 -14
keras_hub/src/models/mistral/mistral_attention.py +0 -13
keras_hub/src/models/mistral/mistral_backbone.py +0 -14
keras_hub/src/models/mistral/mistral_causal_lm.py +0 -14
keras_hub/src/models/mistral/mistral_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/mistral/mistral_layer_norm.py +0 -13
keras_hub/src/models/mistral/mistral_presets.py +0 -13
keras_hub/src/models/mistral/mistral_tokenizer.py +0 -14
keras_hub/src/models/mistral/mistral_transformer_decoder.py +0 -13
keras_hub/src/models/mix_transformer/__init__.py +0 -13
keras_hub/src/models/mix_transformer/mix_transformer_backbone.py +0 -13
keras_hub/src/models/mix_transformer/mix_transformer_classifier.py +0 -13
keras_hub/src/models/mix_transformer/mix_transformer_layers.py +0 -13
keras_hub/src/models/mobilenet/__init__.py +0 -13
keras_hub/src/models/mobilenet/mobilenet_backbone.py +0 -13
keras_hub/src/models/mobilenet/mobilenet_image_classifier.py +0 -13
keras_hub/src/models/opt/__init__.py +0 -14
keras_hub/src/models/opt/opt_backbone.py +0 -15
keras_hub/src/models/opt/opt_causal_lm.py +0 -15
keras_hub/src/models/opt/opt_causal_lm_preprocessor.py +0 -13
keras_hub/src/models/opt/opt_presets.py +0 -13
keras_hub/src/models/opt/opt_tokenizer.py +0 -15
keras_hub/src/models/pali_gemma/__init__.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_backbone.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_causal_lm.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_causal_lm_preprocessor.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_decoder_block.py +0 -14
keras_hub/src/models/pali_gemma/pali_gemma_image_converter.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_presets.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_tokenizer.py +0 -13
keras_hub/src/models/pali_gemma/pali_gemma_vit.py +0 -13
keras_hub/src/models/phi3/__init__.py +0 -14
keras_hub/src/models/phi3/phi3_attention.py +0 -13
keras_hub/src/models/phi3/phi3_backbone.py +0 -13
keras_hub/src/models/phi3/phi3_causal_lm.py +0 -13
keras_hub/src/models/phi3/phi3_causal_lm_preprocessor.py +0 -14
keras_hub/src/models/phi3/phi3_decoder.py +0 -13
keras_hub/src/models/phi3/phi3_layernorm.py +0 -13
keras_hub/src/models/phi3/phi3_presets.py +0 -13
keras_hub/src/models/phi3/phi3_rotary_embedding.py +0 -13
keras_hub/src/models/phi3/phi3_tokenizer.py +0 -13
keras_hub/src/models/preprocessor.py +51 -32
keras_hub/src/models/resnet/__init__.py +0 -14
keras_hub/src/models/resnet/resnet_backbone.py +0 -13
keras_hub/src/models/resnet/resnet_image_classifier.py +0 -13
keras_hub/src/models/resnet/resnet_image_classifier_preprocessor.py +0 -14
keras_hub/src/models/resnet/resnet_image_converter.py +0 -13
keras_hub/src/models/resnet/resnet_presets.py +0 -13
keras_hub/src/models/retinanet/__init__.py +0 -13
keras_hub/src/models/retinanet/anchor_generator.py +0 -14
keras_hub/src/models/retinanet/box_matcher.py +0 -14
keras_hub/src/models/retinanet/non_max_supression.py +0 -14
keras_hub/src/models/roberta/__init__.py +0 -14
keras_hub/src/models/roberta/roberta_backbone.py +0 -15
keras_hub/src/models/roberta/roberta_masked_lm.py +0 -15
keras_hub/src/models/roberta/roberta_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/roberta/roberta_presets.py +0 -13
keras_hub/src/models/roberta/roberta_text_classifier.py +0 -15
keras_hub/src/models/roberta/roberta_text_classifier_preprocessor.py +0 -14
keras_hub/src/models/roberta/roberta_tokenizer.py +0 -15
keras_hub/src/models/sam/__init__.py +0 -13
keras_hub/src/models/sam/sam_backbone.py +0 -14
keras_hub/src/models/sam/sam_image_segmenter.py +0 -14
keras_hub/src/models/sam/sam_layers.py +0 -14
keras_hub/src/models/sam/sam_mask_decoder.py +0 -14
keras_hub/src/models/sam/sam_prompt_encoder.py +0 -14
keras_hub/src/models/sam/sam_transformer.py +0 -14
keras_hub/src/models/seq_2_seq_lm.py +0 -13
keras_hub/src/models/seq_2_seq_lm_preprocessor.py +0 -13
keras_hub/src/models/stable_diffusion_3/__init__.py +9 -0
keras_hub/src/models/stable_diffusion_3/flow_match_euler_discrete_scheduler.py +80 -0
keras_hub/src/models/{stable_diffusion_v3 → stable_diffusion_3}/mmdit.py +351 -39
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_backbone.py +631 -0
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_presets.py +31 -0
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image.py +138 -0
keras_hub/src/models/stable_diffusion_3/stable_diffusion_3_text_to_image_preprocessor.py +83 -0
keras_hub/src/models/{stable_diffusion_v3/t5_xxl_text_encoder.py → stable_diffusion_3/t5_encoder.py} +7 -20
keras_hub/src/models/stable_diffusion_3/vae_image_decoder.py +320 -0
keras_hub/src/models/t5/__init__.py +0 -14
keras_hub/src/models/t5/t5_backbone.py +0 -14
keras_hub/src/models/t5/t5_layer_norm.py +0 -14
keras_hub/src/models/t5/t5_multi_head_attention.py +0 -14
keras_hub/src/models/{stable_diffusion_v3/t5_xxl_preprocessor.py → t5/t5_preprocessor.py} +12 -16
keras_hub/src/models/t5/t5_presets.py +0 -13
keras_hub/src/models/t5/t5_tokenizer.py +0 -14
keras_hub/src/models/t5/t5_transformer_layer.py +0 -14
keras_hub/src/models/task.py +0 -14
keras_hub/src/models/text_classifier.py +0 -13
keras_hub/src/models/text_classifier_preprocessor.py +0 -13
keras_hub/src/models/text_to_image.py +282 -0
keras_hub/src/models/vgg/__init__.py +0 -13
keras_hub/src/models/vgg/vgg_backbone.py +0 -13
keras_hub/src/models/vgg/vgg_image_classifier.py +0 -13
keras_hub/src/models/vit_det/__init__.py +0 -13
keras_hub/src/models/vit_det/vit_det_backbone.py +0 -14
keras_hub/src/models/vit_det/vit_layers.py +0 -15
keras_hub/src/models/whisper/__init__.py +0 -14
keras_hub/src/models/whisper/whisper_audio_converter.py +0 -15
keras_hub/src/models/whisper/whisper_backbone.py +0 -15
keras_hub/src/models/whisper/whisper_cached_multi_head_attention.py +0 -13
keras_hub/src/models/whisper/whisper_decoder.py +0 -14
keras_hub/src/models/whisper/whisper_encoder.py +0 -14
keras_hub/src/models/whisper/whisper_presets.py +0 -14
keras_hub/src/models/whisper/whisper_tokenizer.py +0 -14
keras_hub/src/models/xlm_roberta/__init__.py +0 -14
keras_hub/src/models/xlm_roberta/xlm_roberta_backbone.py +0 -15
keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm.py +0 -15
keras_hub/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +0 -14
keras_hub/src/models/xlm_roberta/xlm_roberta_presets.py +0 -13
keras_hub/src/models/xlm_roberta/xlm_roberta_text_classifier.py +0 -15
keras_hub/src/models/xlm_roberta/xlm_roberta_text_classifier_preprocessor.py +0 -15
keras_hub/src/models/xlm_roberta/xlm_roberta_tokenizer.py +0 -15
keras_hub/src/models/xlnet/__init__.py +0 -13
keras_hub/src/models/xlnet/relative_attention.py +0 -14
keras_hub/src/models/xlnet/xlnet_backbone.py +0 -14
keras_hub/src/models/xlnet/xlnet_content_and_query_embedding.py +0 -14
keras_hub/src/models/xlnet/xlnet_encoder.py +0 -14
keras_hub/src/samplers/__init__.py +0 -13
keras_hub/src/samplers/beam_sampler.py +0 -14
keras_hub/src/samplers/contrastive_sampler.py +0 -14
keras_hub/src/samplers/greedy_sampler.py +0 -14
keras_hub/src/samplers/random_sampler.py +0 -14
keras_hub/src/samplers/sampler.py +0 -14
keras_hub/src/samplers/serialization.py +0 -14
keras_hub/src/samplers/top_k_sampler.py +0 -14
keras_hub/src/samplers/top_p_sampler.py +0 -14
keras_hub/src/tests/__init__.py +0 -13
keras_hub/src/tests/test_case.py +0 -14
keras_hub/src/tokenizers/__init__.py +0 -13
keras_hub/src/tokenizers/byte_pair_tokenizer.py +0 -14
keras_hub/src/tokenizers/byte_tokenizer.py +0 -14
keras_hub/src/tokenizers/sentence_piece_tokenizer.py +0 -14
keras_hub/src/tokenizers/sentence_piece_tokenizer_trainer.py +0 -14
keras_hub/src/tokenizers/tokenizer.py +23 -27
keras_hub/src/tokenizers/unicode_codepoint_tokenizer.py +0 -15
keras_hub/src/tokenizers/word_piece_tokenizer.py +0 -14
keras_hub/src/tokenizers/word_piece_tokenizer_trainer.py +0 -15
keras_hub/src/utils/__init__.py +0 -13
keras_hub/src/utils/imagenet/__init__.py +0 -13
keras_hub/src/utils/imagenet/imagenet_utils.py +0 -13
keras_hub/src/utils/keras_utils.py +0 -14
keras_hub/src/utils/pipeline_model.py +0 -14
keras_hub/src/utils/preset_utils.py +32 -76
keras_hub/src/utils/python_utils.py +0 -13
keras_hub/src/utils/tensor_utils.py +0 -14
keras_hub/src/utils/timm/__init__.py +0 -13
keras_hub/src/utils/timm/convert_densenet.py +107 -0
keras_hub/src/utils/timm/convert_resnet.py +0 -13
keras_hub/src/utils/timm/preset_loader.py +3 -13
keras_hub/src/utils/transformers/__init__.py +0 -13
keras_hub/src/utils/transformers/convert_albert.py +0 -13
keras_hub/src/utils/transformers/convert_bart.py +0 -13
keras_hub/src/utils/transformers/convert_bert.py +0 -13
keras_hub/src/utils/transformers/convert_distilbert.py +0 -13
keras_hub/src/utils/transformers/convert_gemma.py +0 -13
keras_hub/src/utils/transformers/convert_gpt2.py +0 -13
keras_hub/src/utils/transformers/convert_llama3.py +0 -13
keras_hub/src/utils/transformers/convert_mistral.py +0 -13
keras_hub/src/utils/transformers/convert_pali_gemma.py +0 -13
keras_hub/src/utils/transformers/preset_loader.py +1 -15
keras_hub/src/utils/transformers/safetensor_utils.py +9 -15
keras_hub/src/version_utils.py +1 -15
{keras_hub_nightly-0.16.1.dev202409250340.dist-info → keras_hub_nightly-0.16.1.dev202409270338.dist-info}/METADATA +30 -27
keras_hub_nightly-0.16.1.dev202409270338.dist-info/RECORD +351 -0
keras_hub/src/models/stable_diffusion_v3/clip_preprocessor.py +0 -93
keras_hub/src/models/stable_diffusion_v3/clip_text_encoder.py +0 -149
keras_hub/src/models/stable_diffusion_v3/mmdit_block.py +0 -317
keras_hub/src/models/stable_diffusion_v3/vae_attention.py +0 -126
keras_hub/src/models/stable_diffusion_v3/vae_image_decoder.py +0 -186
keras_hub_nightly-0.16.1.dev202409250340.dist-info/RECORD +0 -342
{keras_hub_nightly-0.16.1.dev202409250340.dist-info → keras_hub_nightly-0.16.1.dev202409270338.dist-info}/WHEEL +0 -0
{keras_hub_nightly-0.16.1.dev202409250340.dist-info → keras_hub_nightly-0.16.1.dev202409270338.dist-info}/top_level.txt +0 -0

keras_hub/src/models/stable_diffusion_v3/mmdit_block.py DELETED Viewed

@@ -1,317 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import math
-from keras import layers
-from keras import models
-from keras import ops
-from keras_hub.src.utils.keras_utils import gelu_approximate
-class DismantledBlock(layers.Layer):
-    def __init__(
-        self,
-        num_heads,
-        hidden_dim,
-        mlp_ratio=4.0,
-        use_projection=True,
-        **kwargs,
-    ):
-        super().__init__(**kwargs)
-        self.num_heads = num_heads
-        self.hidden_dim = hidden_dim
-        self.mlp_ratio = mlp_ratio
-        self.use_projection = use_projection
-        head_dim = hidden_dim // num_heads
-        self.head_dim = head_dim
-        mlp_hidden_dim = int(hidden_dim * mlp_ratio)
-        self.mlp_hidden_dim = mlp_hidden_dim
-        num_modulations = 6 if use_projection else 2
-        self.num_modulations = num_modulations
-        self.adaptive_norm_modulation = models.Sequential(
-            [
-                layers.Activation("silu", dtype=self.dtype_policy),
-                layers.Dense(
-                    num_modulations * hidden_dim, dtype=self.dtype_policy
-                ),
-            ],
-            name="adaptive_norm_modulation",
-        )
-        self.norm1 = layers.LayerNormalization(
-            epsilon=1e-6,
-            center=False,
-            scale=False,
-            dtype=self.dtype_policy,
-            name="norm1",
-        )
-        self.attention_qkv = layers.Dense(
-            hidden_dim * 3, dtype=self.dtype_policy, name="attention_qkv"
-        )
-        if use_projection:
-            self.attention_proj = layers.Dense(
-                hidden_dim, dtype=self.dtype_policy, name="attention_proj"
-            )
-            self.norm2 = layers.LayerNormalization(
-                epsilon=1e-6,
-                center=False,
-                scale=False,
-                dtype=self.dtype_policy,
-                name="norm2",
-            )
-            self.mlp = models.Sequential(
-                [
-                    layers.Dense(
-                        mlp_hidden_dim,
-                        activation=gelu_approximate,
-                        dtype=self.dtype_policy,
-                    ),
-                    layers.Dense(
-                        hidden_dim,
-                        dtype=self.dtype_policy,
-                    ),
-                ],
-                name="mlp",
-            )
-    def build(self, inputs_shape, timestep_embedding):
-        self.adaptive_norm_modulation.build(timestep_embedding)
-        self.attention_qkv.build(inputs_shape)
-        self.norm1.build(inputs_shape)
-        if self.use_projection:
-            self.attention_proj.build(inputs_shape)
-            self.norm2.build(inputs_shape)
-            self.mlp.build(inputs_shape)
-    def _modulate(self, inputs, shift, scale):
-        shift = ops.expand_dims(shift, axis=1)
-        scale = ops.expand_dims(scale, axis=1)
-        return ops.add(ops.multiply(inputs, ops.add(scale, 1.0)), shift)
-    def _compute_pre_attention(self, inputs, timestep_embedding, training=None):
-        batch_size = ops.shape(inputs)[0]
-        if self.use_projection:
-            modulation = self.adaptive_norm_modulation(
-                timestep_embedding, training=training
-            )
-            modulation = ops.reshape(
-                modulation, (batch_size, 6, self.hidden_dim)
-            )
-            (
-                shift_msa,
-                scale_msa,
-                gate_msa,
-                shift_mlp,
-                scale_mlp,
-                gate_mlp,
-            ) = ops.unstack(modulation, 6, axis=1)
-            qkv = self.attention_qkv(
-                self._modulate(self.norm1(inputs), shift_msa, scale_msa),
-                training=training,
-            )
-            qkv = ops.reshape(
-                qkv, (batch_size, -1, 3, self.num_heads, self.head_dim)
-            )
-            q, k, v = ops.unstack(qkv, 3, axis=2)
-            return (q, k, v), (inputs, gate_msa, shift_mlp, scale_mlp, gate_mlp)
-        else:
-            modulation = self.adaptive_norm_modulation(
-                timestep_embedding, training=training
-            )
-            modulation = ops.reshape(
-                modulation, (batch_size, 2, self.hidden_dim)
-            )
-            shift_msa, scale_msa = ops.unstack(modulation, 2, axis=1)
-            qkv = self.attention_qkv(
-                self._modulate(self.norm1(inputs), shift_msa, scale_msa),
-                training=training,
-            )
-            qkv = ops.reshape(
-                qkv, (batch_size, -1, 3, self.num_heads, self.head_dim)
-            )
-            q, k, v = ops.unstack(qkv, 3, axis=2)
-            return (q, k, v)
-    def _compute_post_attention(
-        self, inputs, inputs_intermediates, training=None
-    ):
-        x, gate_msa, shift_mlp, scale_mlp, gate_mlp = inputs_intermediates
-        attn = self.attention_proj(inputs, training=training)
-        x = ops.add(x, ops.multiply(ops.expand_dims(gate_msa, axis=1), attn))
-        x = ops.add(
-            x,
-            ops.multiply(
-                ops.expand_dims(gate_mlp, axis=1),
-                self.mlp(
-                    self._modulate(self.norm2(x), shift_mlp, scale_mlp),
-                    training=training,
-                ),
-            ),
-        )
-        return x
-    def call(
-        self,
-        inputs,
-        timestep_embedding=None,
-        inputs_intermediates=None,
-        pre_attention=True,
-        training=None,
-    ):
-        if pre_attention:
-            return self._compute_pre_attention(
-                inputs, timestep_embedding, training=training
-            )
-        else:
-            return self._compute_post_attention(
-                inputs, inputs_intermediates, training=training
-            )
-    def get_config(self):
-        config = super().get_config()
-        config.update(
-            {
-                "num_heads": self.num_heads,
-                "hidden_dim": self.hidden_dim,
-                "mlp_ratio": self.mlp_ratio,
-                "use_projection": self.use_projection,
-            }
-        )
-        return config
-class MMDiTBlock(layers.Layer):
-    def __init__(
-        self,
-        num_heads,
-        hidden_dim,
-        mlp_ratio=4.0,
-        use_context_projection=True,
-        **kwargs,
-    ):
-        super().__init__(**kwargs)
-        self.num_heads = num_heads
-        self.hidden_dim = hidden_dim
-        self.mlp_ratio = mlp_ratio
-        self.use_context_projection = use_context_projection
-        head_dim = hidden_dim // num_heads
-        self.head_dim = head_dim
-        self._inverse_sqrt_key_dim = 1.0 / math.sqrt(head_dim)
-        self._dot_product_equation = "aecd,abcd->acbe"
-        self._combine_equation = "acbe,aecd->abcd"
-        self.x_block = DismantledBlock(
-            num_heads=num_heads,
-            hidden_dim=hidden_dim,
-            mlp_ratio=mlp_ratio,
-            use_projection=True,
-            dtype=self.dtype_policy,
-            name="x_block",
-        )
-        self.context_block = DismantledBlock(
-            num_heads=num_heads,
-            hidden_dim=hidden_dim,
-            mlp_ratio=mlp_ratio,
-            use_projection=use_context_projection,
-            dtype=self.dtype_policy,
-            name="context_block",
-        )
-    def build(self, inputs_shape, context_shape, timestep_embedding_shape):
-        self.x_block.build(inputs_shape, timestep_embedding_shape)
-        self.context_block.build(context_shape, timestep_embedding_shape)
-    def _compute_attention(self, query, key, value):
-        query = ops.multiply(
-            query, ops.cast(self._inverse_sqrt_key_dim, query.dtype)
-        )
-        attention_scores = ops.einsum(self._dot_product_equation, key, query)
-        attention_scores = ops.nn.softmax(attention_scores, axis=-1)
-        attention_output = ops.einsum(
-            self._combine_equation, attention_scores, value
-        )
-        batch_size = ops.shape(attention_output)[0]
-        attention_output = ops.reshape(
-            attention_output, (batch_size, -1, self.num_heads * self.head_dim)
-        )
-        return attention_output
-    def call(self, inputs, context, timestep_embedding, training=None):
-        # Compute pre-attention.
-        x = inputs
-        if self.use_context_projection:
-            context_qkv, context_intermediates = self.context_block(
-                context,
-                timestep_embedding=timestep_embedding,
-                training=training,
-            )
-        else:
-            context_qkv = self.context_block(
-                context,
-                timestep_embedding=timestep_embedding,
-                training=training,
-            )
-        context_len = ops.shape(context_qkv[0])[1]
-        x_qkv, x_intermediates = self.x_block(
-            x, timestep_embedding=timestep_embedding, training=training
-        )
-        q = ops.concatenate([context_qkv[0], x_qkv[0]], axis=1)
-        k = ops.concatenate([context_qkv[1], x_qkv[1]], axis=1)
-        v = ops.concatenate([context_qkv[2], x_qkv[2]], axis=1)
-        # Compute attention.
-        attention = self._compute_attention(q, k, v)
-        context_attention = attention[:, :context_len]
-        x_attention = attention[:, context_len:]
-        # Compute post-attention.
-        x = self.x_block(
-            x_attention,
-            inputs_intermediates=x_intermediates,
-            pre_attention=False,
-            training=training,
-        )
-        if self.use_context_projection:
-            context = self.context_block(
-                context_attention,
-                inputs_intermediates=context_intermediates,
-                pre_attention=False,
-                training=training,
-            )
-            return x, context
-        else:
-            return x
-    def get_config(self):
-        config = super().get_config()
-        config.update(
-            {
-                "num_heads": self.num_heads,
-                "hidden_dim": self.hidden_dim,
-                "mlp_ratio": self.mlp_ratio,
-                "use_context_projection": self.use_context_projection,
-            }
-        )
-        return config
-    def compute_output_shape(
-        self, inputs_shape, context_shape, timestep_embedding_shape
-    ):
-        if self.use_context_projection:
-            return inputs_shape, context_shape
-        else:
-            return inputs_shape

keras_hub/src/models/stable_diffusion_v3/vae_attention.py DELETED Viewed

@@ -1,126 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import math
-from keras import layers
-from keras import ops
-from keras_hub.src.utils.keras_utils import standardize_data_format
-class VAEAttention(layers.Layer):
-    """Single-head self-attention over the spatial positions of a feature map.
-
-    The input is group-normalized, projected to query/key/value with 1x1
-    convolutions, attended over all flattened spatial positions, projected
-    with a final 1x1 convolution and added back to the input.
-
-    Args:
-        filters: Number of output channels of every 1x1 projection. Expected
-            to equal the input channel count, because the result is added to
-            the input.
-        groups: Number of groups used by the group normalization.
-        data_format: Passed through `standardize_data_format`; the layer
-            branches on `"channels_last"` versus `"channels_first"`.
-        **kwargs: Forwarded to the base `Layer` constructor.
-    """
-    def __init__(self, filters, groups=32, data_format=None, **kwargs):
-        super().__init__(**kwargs)
-        self.filters = filters
-        self.groups = groups
-        self.data_format = standardize_data_format(data_format)
-        gn_axis = -1 if self.data_format == "channels_last" else 1
-        self.group_norm = layers.GroupNormalization(
-            groups=groups,
-            axis=gn_axis,
-            epsilon=1e-6,
-            dtype=self.dtype_policy,
-            name="group_norm",
-        )
-        # Sub-layers are created in the original order so that weight
-        # ordering is unchanged.
-        self.query_conv2d = self._make_projection("query_conv2d")
-        self.key_conv2d = self._make_projection("key_conv2d")
-        self.value_conv2d = self._make_projection("value_conv2d")
-        # The softmax is pinned to float32 regardless of the layer's policy;
-        # its output is cast back to the compute dtype in `call`.
-        self.softmax = layers.Softmax(dtype="float32")
-        self.output_conv2d = self._make_projection("output_conv2d")
-        self._inverse_sqrt_filters = 1.0 / math.sqrt(float(filters))
-    def _make_projection(self, name):
-        """Build one 1x1, stride-1 convolution with `self.filters` outputs."""
-        return layers.Conv2D(
-            self.filters,
-            1,
-            1,
-            data_format=self.data_format,
-            dtype=self.dtype_policy,
-            name=name,
-        )
-    def build(self, input_shape):
-        """Build every weighted sub-layer against `input_shape`."""
-        self.group_norm.build(input_shape)
-        self.query_conv2d.build(input_shape)
-        self.key_conv2d.build(input_shape)
-        self.value_conv2d.build(input_shape)
-        self.output_conv2d.build(input_shape)
-    def call(self, inputs, training=None):
-        """Apply self-attention to `inputs` and add the result to `inputs`.
-
-        `training` is accepted for API compatibility and is not used.
-        """
-        x = self.group_norm(inputs)
-        query = self.query_conv2d(x)
-        key = self.key_conv2d(x)
-        value = self.value_conv2d(x)
-        if self.data_format == "channels_first":
-            # The attention math below operates on channels-last tensors.
-            query = ops.transpose(query, (0, 2, 3, 1))
-            key = ops.transpose(key, (0, 2, 3, 1))
-            value = ops.transpose(value, (0, 2, 3, 1))
-        # Channels-last [B, H, W, C] shape used to restore the spatial grid.
-        # It must come from the (transposed) projection rather than `inputs`:
-        # for channels_first, `inputs` is [B, C, H, W] and reshaping the
-        # [B, H * W, C] attention output with it would scramble the data.
-        spatial_shape = ops.shape(query)
-        b = spatial_shape[0]
-        query = ops.reshape(query, (b, -1, self.filters))
-        key = ops.reshape(key, (b, -1, self.filters))
-        value = ops.reshape(value, (b, -1, self.filters))
-        # Compute attention; the query is pre-scaled by 1 / sqrt(filters).
-        query = ops.multiply(
-            query, ops.cast(self._inverse_sqrt_filters, query.dtype)
-        )
-        # [B, H0 * W0, C], [B, H1 * W1, C] -> [B, H0 * W0, H1 * W1]
-        attention_scores = ops.einsum("abc,adc->abd", query, key)
-        attention_scores = ops.cast(
-            self.softmax(attention_scores), self.compute_dtype
-        )
-        # [B, H1 * W1, C], [B, H0 * W0, H1 * W1] -> [B, H0 * W0, C]
-        attention_output = ops.einsum("abc,adb->adc", value, attention_scores)
-        x = ops.reshape(attention_output, spatial_shape)
-        if self.data_format == "channels_first":
-            # Return to [B, C, H, W] *before* the output convolution, which
-            # was constructed with `data_format="channels_first"`.
-            x = ops.transpose(x, (0, 3, 1, 2))
-        x = self.output_conv2d(x)
-        x = ops.add(x, inputs)
-        return x
-    def get_config(self):
-        """Return the constructor arguments needed to recreate the layer."""
-        config = super().get_config()
-        config.update(
-            {
-                "filters": self.filters,
-                "groups": self.groups,
-                # Serialized so a reloaded layer keeps its layout even if the
-                # global image data format differs.
-                "data_format": self.data_format,
-            }
-        )
-        return config
-    def compute_output_shape(self, input_shape):
-        """The output has the same shape as the input."""
-        return input_shape

keras_hub/src/models/stable_diffusion_v3/vae_image_decoder.py DELETED Viewed

@@ -1,186 +0,0 @@
-# Copyright 2024 The KerasHub Authors
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     https://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import keras
-from keras import layers
-from keras_hub.src.models.stable_diffusion_v3.vae_attention import VAEAttention
-from keras_hub.src.utils.keras_utils import standardize_data_format
-class VAEImageDecoder(keras.Model):
-    """Functional decoder model mapping latents to images.
-
-    The network is: a 3x3 input projection, a resnet block, a `VAEAttention`
-    layer and another resnet block (all with `stackwise_num_filters[0]`
-    filters), then one stack of resnet blocks per entry of
-    `stackwise_num_filters`. Every stack except the last is followed by 2x
-    upsampling and a 3x3 convolution. The output head is group norm, swish
-    and a 3x3 convolution to `output_channels`.
-
-    Args:
-        stackwise_num_filters: Sequence with the filter count of each stack.
-        stackwise_num_blocks: Sequence with the number of resnet blocks of
-            each stack; indexed in parallel with `stackwise_num_filters`.
-        output_channels: Channel count of the final convolution.
-        latent_shape: Shape (without batch axis) given to `layers.Input`.
-        data_format: Passed through `standardize_data_format` and forwarded
-            to every convolution, upsampling and attention layer.
-        dtype: Dtype or dtype policy forwarded to the layers and, when not
-            `None`, installed as the model's own dtype policy.
-        **kwargs: Forwarded to `keras.Model.__init__`.
-    """
-    def __init__(
-        self,
-        stackwise_num_filters,
-        stackwise_num_blocks,
-        output_channels=3,
-        latent_shape=(None, None, 16),
-        data_format=None,
-        dtype=None,
-        **kwargs,
-    ):
-        data_format = standardize_data_format(data_format)
-        gn_axis = -1 if data_format == "channels_last" else 1
-        # === Functional Model ===
-        latent_inputs = layers.Input(shape=latent_shape)
-        x = layers.Conv2D(
-            stackwise_num_filters[0],
-            3,
-            1,
-            padding="same",
-            data_format=data_format,
-            dtype=dtype,
-            name="input_projection",
-        )(latent_inputs)
-        x = apply_resnet_block(
-            x,
-            stackwise_num_filters[0],
-            data_format=data_format,
-            dtype=dtype,
-            name="input_block0",
-        )
-        x = VAEAttention(
-            stackwise_num_filters[0],
-            data_format=data_format,
-            dtype=dtype,
-            name="input_attention",
-        )(x)
-        x = apply_resnet_block(
-            x,
-            stackwise_num_filters[0],
-            data_format=data_format,
-            dtype=dtype,
-            name="input_block1",
-        )
-        # Stacks.
-        for i, filters in enumerate(stackwise_num_filters):
-            for j in range(stackwise_num_blocks[i]):
-                x = apply_resnet_block(
-                    x,
-                    filters,
-                    data_format=data_format,
-                    dtype=dtype,
-                    name=f"block{i}_{j}",
-                )
-            if i != len(stackwise_num_filters) - 1:
-                # No upsampling in the last block.
-                x = layers.UpSampling2D(
-                    2,
-                    data_format=data_format,
-                    dtype=dtype,
-                    name=f"upsample_{i}",
-                )(x)
-                x = layers.Conv2D(
-                    filters,
-                    3,
-                    1,
-                    padding="same",
-                    data_format=data_format,
-                    dtype=dtype,
-                    name=f"upsample_{i}_conv",
-                )(x)
-        # Output block.
-        x = layers.GroupNormalization(
-            groups=32,
-            axis=gn_axis,
-            epsilon=1e-6,
-            dtype=dtype,
-            name="output_norm",
-        )(x)
-        x = layers.Activation("swish", dtype=dtype, name="output_activation")(x)
-        image_outputs = layers.Conv2D(
-            output_channels,
-            3,
-            1,
-            padding="same",
-            data_format=data_format,
-            dtype=dtype,
-            name="output_projection",
-        )(x)
-        super().__init__(inputs=latent_inputs, outputs=image_outputs, **kwargs)
-        # === Config ===
-        self.stackwise_num_filters = stackwise_num_filters
-        self.stackwise_num_blocks = stackwise_num_blocks
-        self.output_channels = output_channels
-        self.latent_shape = latent_shape
-        # Kept so `get_config` can reproduce the layout the graph was built
-        # with, independent of the global image data format at reload time.
-        self.data_format = data_format
-        if dtype is not None:
-            try:
-                self.dtype_policy = keras.dtype_policies.get(dtype)
-            # Before Keras 3.2, there is no `keras.dtype_policies.get`.
-            except AttributeError:
-                if isinstance(dtype, keras.DTypePolicy):
-                    dtype = dtype.name
-                self.dtype_policy = keras.DTypePolicy(dtype)
-    def get_config(self):
-        """Return the constructor arguments needed to rebuild the model."""
-        config = super().get_config()
-        config.update(
-            {
-                "stackwise_num_filters": self.stackwise_num_filters,
-                "stackwise_num_blocks": self.stackwise_num_blocks,
-                "output_channels": self.output_channels,
-                # The key must match the `__init__` parameter name; it was
-                # previously written as "image_shape", which `__init__` does
-                # not accept.
-                "latent_shape": self.latent_shape,
-                "data_format": self.data_format,
-            }
-        )
-        return config
-def apply_resnet_block(x, filters, data_format=None, dtype=None, name=None):
-    """Apply a residual block: two rounds of group norm, swish and 3x3 conv.
-
-    The block input is added to the result. When the input channel count
-    differs from `filters`, the input first goes through a 1x1 convolution
-    so both operands of the addition have `filters` channels.
-
-    Args:
-        x: Input tensor; its channel axis is the last one for
-            `"channels_last"` and axis 1 otherwise.
-        filters: Output channel count of the convolutions.
-        data_format: Passed through `standardize_data_format`.
-        dtype: Dtype or dtype policy forwarded to every layer.
-        name: Optional prefix for the layer names. When `None`, the layers
-            get Keras' automatic names.
-
-    Returns:
-        The output tensor of the block.
-    """
-    data_format = standardize_data_format(data_format)
-    gn_axis = -1 if data_format == "channels_last" else 1
-    input_filters = x.shape[gn_axis]
-    def sub_name(suffix):
-        # Without this guard a missing prefix would produce the literal name
-        # "None_<suffix>", which collides on the second un-named call.
-        return None if name is None else f"{name}_{suffix}"
-    residual = x
-    x = layers.GroupNormalization(
-        groups=32,
-        axis=gn_axis,
-        epsilon=1e-6,
-        dtype=dtype,
-        name=sub_name("norm1"),
-    )(x)
-    x = layers.Activation("swish", dtype=dtype)(x)
-    x = layers.Conv2D(
-        filters,
-        3,
-        1,
-        padding="same",
-        data_format=data_format,
-        dtype=dtype,
-        name=sub_name("conv1"),
-    )(x)
-    x = layers.GroupNormalization(
-        groups=32,
-        axis=gn_axis,
-        epsilon=1e-6,
-        dtype=dtype,
-        name=sub_name("norm2"),
-    )(x)
-    # `dtype` is forwarded here as well (it was previously omitted), so this
-    # activation follows the same dtype policy as the rest of the block.
-    x = layers.Activation("swish", dtype=dtype)(x)
-    x = layers.Conv2D(
-        filters,
-        3,
-        1,
-        padding="same",
-        data_format=data_format,
-        dtype=dtype,
-        name=sub_name("conv2"),
-    )(x)
-    if input_filters != filters:
-        # Project the shortcut so it can be added to the `filters`-channel
-        # output.
-        residual = layers.Conv2D(
-            filters,
-            1,
-            1,
-            data_format=data_format,
-            dtype=dtype,
-            name=sub_name("residual_projection"),
-        )(residual)
-    x = layers.Add(dtype=dtype)([residual, x])
-    return x

keras-hub-nightly 0.16.1.dev202409250340__py3-none-any.whl → 0.16.1.dev202409270338__py3-none-any.whl

keras-hub-nightly 0.16.1.dev202409250340py3-none-any.whl → 0.16.1.dev202409270338py3-none-any.whl