tf-models-nightly 2.17.0.dev20240528__py2.py3-none-any.whl → 2.20.0.dev20251205__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- official/__init__.py +1 -1
- official/common/__init__.py +1 -1
- official/common/dataset_fn.py +1 -1
- official/common/distribute_utils.py +27 -3
- official/common/distribute_utils_test.py +13 -12
- official/common/flags.py +28 -1
- official/common/registry_imports.py +1 -1
- official/common/streamz_counters.py +1 -1
- official/core/__init__.py +1 -1
- official/core/actions.py +1 -1
- official/core/actions_test.py +1 -1
- official/core/base_task.py +1 -1
- official/core/base_trainer.py +1 -1
- official/core/base_trainer_test.py +1 -1
- official/core/config_definitions.py +1 -1
- official/core/exp_factory.py +1 -1
- official/core/export_base.py +1 -1
- official/core/export_base_test.py +1 -1
- official/core/file_writers.py +1 -1
- official/core/file_writers_test.py +1 -1
- official/core/input_reader.py +1 -1
- official/core/registry.py +1 -1
- official/core/registry_test.py +1 -1
- official/core/savedmodel_checkpoint_manager.py +1 -1
- official/core/savedmodel_checkpoint_manager_test.py +1 -1
- official/core/task_factory.py +1 -1
- official/core/test_utils.py +1 -1
- official/core/tf_example_builder.py +1 -1
- official/core/tf_example_builder_test.py +1 -1
- official/core/tf_example_feature_key.py +1 -1
- official/core/tf_example_feature_key_test.py +1 -1
- official/core/train_lib.py +1 -3
- official/core/train_lib_test.py +1 -1
- official/core/train_utils.py +1 -1
- official/core/train_utils_test.py +1 -1
- official/legacy/__init__.py +1 -1
- official/legacy/albert/__init__.py +1 -1
- official/legacy/albert/configs.py +1 -1
- official/legacy/bert/__init__.py +1 -1
- official/legacy/bert/bert_models.py +1 -1
- official/legacy/bert/bert_models_test.py +1 -1
- official/legacy/bert/common_flags.py +1 -1
- official/legacy/bert/configs.py +1 -1
- official/legacy/bert/export_tfhub.py +1 -2
- official/legacy/bert/export_tfhub_test.py +1 -1
- official/legacy/bert/input_pipeline.py +1 -1
- official/legacy/bert/model_saving_utils.py +1 -1
- official/legacy/bert/model_training_utils.py +1 -1
- official/legacy/bert/model_training_utils_test.py +1 -1
- official/legacy/bert/run_classifier.py +1 -2
- official/legacy/bert/run_pretraining.py +1 -2
- official/legacy/bert/run_squad.py +1 -2
- official/legacy/bert/run_squad_helper.py +1 -1
- official/legacy/bert/serving.py +1 -1
- official/legacy/detection/__init__.py +1 -1
- official/legacy/detection/configs/__init__.py +1 -1
- official/legacy/detection/configs/base_config.py +1 -1
- official/legacy/detection/configs/factory.py +1 -1
- official/legacy/detection/configs/maskrcnn_config.py +1 -1
- official/legacy/detection/configs/olnmask_config.py +1 -1
- official/legacy/detection/configs/retinanet_config.py +1 -1
- official/legacy/detection/configs/shapemask_config.py +1 -1
- official/legacy/detection/dataloader/__init__.py +1 -1
- official/legacy/detection/dataloader/anchor.py +1 -1
- official/legacy/detection/dataloader/factory.py +1 -1
- official/legacy/detection/dataloader/input_reader.py +1 -1
- official/legacy/detection/dataloader/maskrcnn_parser.py +1 -1
- official/legacy/detection/dataloader/mode_keys.py +1 -1
- official/legacy/detection/dataloader/olnmask_parser.py +1 -1
- official/legacy/detection/dataloader/retinanet_parser.py +1 -1
- official/legacy/detection/dataloader/shapemask_parser.py +1 -1
- official/legacy/detection/dataloader/tf_example_decoder.py +1 -1
- official/legacy/detection/evaluation/__init__.py +1 -1
- official/legacy/detection/evaluation/coco_evaluator.py +1 -1
- official/legacy/detection/evaluation/coco_utils.py +1 -1
- official/legacy/detection/evaluation/factory.py +1 -1
- official/legacy/detection/executor/__init__.py +1 -1
- official/legacy/detection/executor/detection_executor.py +1 -1
- official/legacy/detection/executor/distributed_executor.py +1 -1
- official/legacy/detection/main.py +1 -1
- official/legacy/detection/modeling/__init__.py +1 -1
- official/legacy/detection/modeling/architecture/__init__.py +1 -1
- official/legacy/detection/modeling/architecture/factory.py +1 -1
- official/legacy/detection/modeling/architecture/fpn.py +1 -1
- official/legacy/detection/modeling/architecture/heads.py +1 -1
- official/legacy/detection/modeling/architecture/identity.py +1 -1
- official/legacy/detection/modeling/architecture/nn_blocks.py +1 -1
- official/legacy/detection/modeling/architecture/nn_ops.py +1 -1
- official/legacy/detection/modeling/architecture/resnet.py +1 -1
- official/legacy/detection/modeling/architecture/spinenet.py +1 -1
- official/legacy/detection/modeling/base_model.py +1 -1
- official/legacy/detection/modeling/checkpoint_utils.py +1 -1
- official/legacy/detection/modeling/factory.py +1 -1
- official/legacy/detection/modeling/learning_rates.py +1 -1
- official/legacy/detection/modeling/losses.py +1 -1
- official/legacy/detection/modeling/maskrcnn_model.py +1 -1
- official/legacy/detection/modeling/olnmask_model.py +1 -1
- official/legacy/detection/modeling/optimizers.py +1 -1
- official/legacy/detection/modeling/retinanet_model.py +1 -1
- official/legacy/detection/modeling/shapemask_model.py +1 -1
- official/legacy/detection/ops/__init__.py +1 -1
- official/legacy/detection/ops/nms.py +1 -1
- official/legacy/detection/ops/postprocess_ops.py +1 -1
- official/legacy/detection/ops/roi_ops.py +1 -1
- official/legacy/detection/ops/spatial_transform_ops.py +1 -1
- official/legacy/detection/ops/target_ops.py +1 -1
- official/legacy/detection/utils/__init__.py +1 -1
- official/legacy/detection/utils/box_utils.py +1 -1
- official/legacy/detection/utils/class_utils.py +1 -1
- official/legacy/detection/utils/dataloader_utils.py +1 -1
- official/legacy/detection/utils/input_utils.py +1 -1
- official/legacy/detection/utils/mask_utils.py +1 -1
- official/legacy/image_classification/__init__.py +1 -1
- official/legacy/image_classification/augment.py +1 -1
- official/legacy/image_classification/augment_test.py +1 -1
- official/legacy/image_classification/callbacks.py +1 -1
- official/legacy/image_classification/classifier_trainer.py +1 -1
- official/legacy/image_classification/classifier_trainer_test.py +1 -1
- official/legacy/image_classification/classifier_trainer_util_test.py +1 -1
- official/legacy/image_classification/configs/__init__.py +1 -1
- official/legacy/image_classification/configs/base_configs.py +1 -1
- official/legacy/image_classification/configs/configs.py +1 -1
- official/legacy/image_classification/dataset_factory.py +1 -1
- official/legacy/image_classification/efficientnet/__init__.py +1 -1
- official/legacy/image_classification/efficientnet/common_modules.py +1 -1
- official/legacy/image_classification/efficientnet/efficientnet_config.py +1 -1
- official/legacy/image_classification/efficientnet/efficientnet_model.py +1 -1
- official/legacy/image_classification/efficientnet/tfhub_export.py +1 -1
- official/legacy/image_classification/learning_rate.py +1 -1
- official/legacy/image_classification/learning_rate_test.py +1 -1
- official/legacy/image_classification/mnist_main.py +1 -2
- official/legacy/image_classification/mnist_test.py +1 -1
- official/legacy/image_classification/optimizer_factory.py +1 -1
- official/legacy/image_classification/optimizer_factory_test.py +1 -1
- official/legacy/image_classification/preprocessing.py +1 -1
- official/legacy/image_classification/resnet/__init__.py +1 -1
- official/legacy/image_classification/resnet/common.py +1 -1
- official/legacy/image_classification/resnet/imagenet_preprocessing.py +1 -1
- official/legacy/image_classification/resnet/resnet_config.py +1 -1
- official/legacy/image_classification/resnet/resnet_ctl_imagenet_main.py +1 -2
- official/legacy/image_classification/resnet/resnet_model.py +1 -1
- official/legacy/image_classification/resnet/resnet_runnable.py +1 -1
- official/legacy/image_classification/resnet/tfhub_export.py +1 -2
- official/legacy/image_classification/test_utils.py +1 -1
- official/legacy/image_classification/vgg/__init__.py +1 -1
- official/legacy/image_classification/vgg/vgg_config.py +1 -1
- official/legacy/image_classification/vgg/vgg_model.py +1 -1
- official/legacy/transformer/__init__.py +1 -1
- official/legacy/transformer/attention_layer.py +1 -1
- official/legacy/transformer/beam_search_v1.py +1 -1
- official/legacy/transformer/compute_bleu.py +1 -1
- official/legacy/transformer/compute_bleu_test.py +1 -1
- official/legacy/transformer/data_download.py +1 -1
- official/legacy/transformer/data_pipeline.py +1 -1
- official/legacy/transformer/embedding_layer.py +1 -1
- official/legacy/transformer/ffn_layer.py +1 -1
- official/legacy/transformer/metrics.py +1 -1
- official/legacy/transformer/misc.py +1 -1
- official/legacy/transformer/model_params.py +1 -1
- official/legacy/transformer/model_utils.py +1 -1
- official/legacy/transformer/model_utils_test.py +1 -1
- official/legacy/transformer/optimizer.py +1 -1
- official/legacy/transformer/transformer.py +1 -1
- official/legacy/transformer/transformer_forward_test.py +1 -1
- official/legacy/transformer/transformer_layers_test.py +1 -1
- official/legacy/transformer/transformer_main.py +1 -5
- official/legacy/transformer/transformer_main_test.py +1 -1
- official/legacy/transformer/transformer_test.py +1 -1
- official/legacy/transformer/translate.py +1 -2
- official/legacy/transformer/utils/__init__.py +1 -1
- official/legacy/transformer/utils/metrics.py +1 -1
- official/legacy/transformer/utils/tokenizer.py +1 -1
- official/legacy/transformer/utils/tokenizer_test.py +1 -1
- official/legacy/xlnet/__init__.py +1 -1
- official/legacy/xlnet/classifier_utils.py +1 -1
- official/legacy/xlnet/common_flags.py +1 -1
- official/legacy/xlnet/data_utils.py +1 -1
- official/legacy/xlnet/optimization.py +1 -1
- official/legacy/xlnet/preprocess_classification_data.py +1 -2
- official/legacy/xlnet/preprocess_pretrain_data.py +1 -2
- official/legacy/xlnet/preprocess_squad_data.py +1 -2
- official/legacy/xlnet/preprocess_utils.py +1 -1
- official/legacy/xlnet/run_classifier.py +1 -2
- official/legacy/xlnet/run_pretrain.py +1 -2
- official/legacy/xlnet/run_squad.py +1 -2
- official/legacy/xlnet/squad_utils.py +1 -1
- official/legacy/xlnet/training_utils.py +1 -1
- official/legacy/xlnet/xlnet_config.py +1 -1
- official/legacy/xlnet/xlnet_modeling.py +1 -1
- official/modeling/__init__.py +1 -1
- official/modeling/activations/__init__.py +1 -1
- official/modeling/activations/gelu.py +1 -1
- official/modeling/activations/gelu_test.py +1 -1
- official/modeling/activations/mish.py +1 -1
- official/modeling/activations/mish_test.py +1 -1
- official/modeling/activations/relu.py +1 -1
- official/modeling/activations/relu_test.py +1 -1
- official/modeling/activations/sigmoid.py +1 -1
- official/modeling/activations/sigmoid_test.py +1 -1
- official/modeling/activations/swish.py +1 -1
- official/modeling/activations/swish_test.py +1 -1
- official/modeling/grad_utils.py +1 -1
- official/modeling/grad_utils_test.py +1 -1
- official/modeling/hyperparams/__init__.py +1 -1
- official/modeling/hyperparams/base_config.py +27 -19
- official/modeling/hyperparams/base_config_test.py +32 -1
- official/modeling/hyperparams/oneof.py +1 -1
- official/modeling/hyperparams/oneof_test.py +1 -1
- official/modeling/hyperparams/params_dict.py +1 -1
- official/modeling/hyperparams/params_dict_test.py +1 -1
- official/modeling/multitask/__init__.py +1 -1
- official/modeling/multitask/base_model.py +1 -1
- official/modeling/multitask/base_trainer.py +1 -1
- official/modeling/multitask/base_trainer_test.py +1 -1
- official/modeling/multitask/configs.py +3 -3
- official/modeling/multitask/evaluator.py +1 -1
- official/modeling/multitask/evaluator_test.py +1 -1
- official/modeling/multitask/interleaving_trainer.py +1 -1
- official/modeling/multitask/interleaving_trainer_test.py +1 -1
- official/modeling/multitask/multitask.py +1 -1
- official/modeling/multitask/task_sampler.py +1 -1
- official/modeling/multitask/task_sampler_test.py +1 -1
- official/modeling/multitask/test_utils.py +1 -1
- official/modeling/multitask/train_lib.py +81 -14
- official/modeling/multitask/train_lib_test.py +1 -1
- official/modeling/optimization/__init__.py +1 -1
- official/modeling/optimization/adafactor_optimizer.py +1 -1
- official/modeling/optimization/configs/__init__.py +1 -1
- official/modeling/optimization/configs/learning_rate_config.py +1 -1
- official/modeling/optimization/configs/optimization_config.py +1 -1
- official/modeling/optimization/configs/optimization_config_test.py +1 -1
- official/modeling/optimization/configs/optimizer_config.py +1 -1
- official/modeling/optimization/ema_optimizer.py +1 -1
- official/modeling/optimization/lamb.py +1 -1
- official/modeling/optimization/lamb_test.py +1 -1
- official/modeling/optimization/lars.py +1 -1
- official/modeling/optimization/legacy_adamw.py +1 -1
- official/modeling/optimization/lr_schedule.py +1 -1
- official/modeling/optimization/lr_schedule_test.py +1 -1
- official/modeling/optimization/optimizer_factory.py +1 -1
- official/modeling/optimization/optimizer_factory_test.py +1 -1
- official/modeling/optimization/slide_optimizer.py +1 -1
- official/modeling/performance.py +1 -1
- official/modeling/privacy/__init__.py +1 -1
- official/modeling/privacy/configs.py +1 -1
- official/modeling/privacy/configs_test.py +1 -1
- official/modeling/privacy/ops.py +1 -1
- official/modeling/privacy/ops_test.py +1 -1
- official/modeling/tf_utils.py +1 -1
- official/modeling/tf_utils_test.py +1 -1
- official/nlp/__init__.py +1 -1
- official/nlp/configs/__init__.py +1 -1
- official/nlp/configs/bert.py +1 -1
- official/nlp/configs/electra.py +1 -1
- official/nlp/configs/encoders.py +1 -1
- official/nlp/configs/encoders_test.py +1 -1
- official/nlp/configs/experiment_configs.py +1 -1
- official/nlp/configs/finetuning_experiments.py +1 -1
- official/nlp/configs/pretraining_experiments.py +1 -1
- official/nlp/configs/wmt_transformer_experiments.py +1 -1
- official/nlp/continuous_finetune_lib.py +1 -1
- official/nlp/continuous_finetune_lib_test.py +1 -1
- official/nlp/data/__init__.py +1 -1
- official/nlp/data/classifier_data_lib.py +1 -1
- official/nlp/data/classifier_data_lib_test.py +1 -1
- official/nlp/data/create_finetuning_data.py +1 -2
- official/nlp/data/create_pretraining_data.py +1 -3
- official/nlp/data/create_pretraining_data_test.py +1 -1
- official/nlp/data/create_xlnet_pretraining_data.py +1 -3
- official/nlp/data/create_xlnet_pretraining_data_test.py +1 -1
- official/nlp/data/data_loader.py +1 -1
- official/nlp/data/data_loader_factory.py +1 -1
- official/nlp/data/data_loader_factory_test.py +1 -1
- official/nlp/data/dual_encoder_dataloader.py +1 -1
- official/nlp/data/dual_encoder_dataloader_test.py +1 -1
- official/nlp/data/pretrain_dataloader.py +1 -1
- official/nlp/data/pretrain_dataloader_test.py +1 -1
- official/nlp/data/pretrain_dynamic_dataloader.py +1 -1
- official/nlp/data/pretrain_dynamic_dataloader_test.py +1 -1
- official/nlp/data/pretrain_text_dataloader.py +1 -1
- official/nlp/data/question_answering_dataloader.py +1 -1
- official/nlp/data/question_answering_dataloader_test.py +1 -1
- official/nlp/data/sentence_prediction_dataloader.py +1 -1
- official/nlp/data/sentence_prediction_dataloader_test.py +1 -1
- official/nlp/data/sentence_retrieval_lib.py +1 -1
- official/nlp/data/squad_lib.py +1 -1
- official/nlp/data/squad_lib_sp.py +1 -1
- official/nlp/data/tagging_data_lib.py +1 -1
- official/nlp/data/tagging_data_lib_test.py +1 -1
- official/nlp/data/tagging_dataloader.py +1 -1
- official/nlp/data/tagging_dataloader_test.py +1 -1
- official/nlp/data/train_sentencepiece.py +1 -1
- official/nlp/data/wmt_dataloader.py +1 -1
- official/nlp/data/wmt_dataloader_test.py +1 -1
- official/nlp/metrics/__init__.py +1 -1
- official/nlp/metrics/bleu.py +1 -1
- official/nlp/metrics/bleu_test.py +1 -1
- official/nlp/modeling/__init__.py +1 -1
- official/nlp/modeling/layers/__init__.py +3 -1
- official/nlp/modeling/layers/attention.py +1 -1
- official/nlp/modeling/layers/attention_test.py +1 -1
- official/nlp/modeling/layers/bigbird_attention.py +1 -1
- official/nlp/modeling/layers/bigbird_attention_test.py +1 -1
- official/nlp/modeling/layers/block_diag_feedforward.py +1 -1
- official/nlp/modeling/layers/block_diag_feedforward_test.py +1 -1
- official/nlp/modeling/layers/block_sparse_attention.py +359 -0
- official/nlp/modeling/layers/block_sparse_attention_test.py +433 -0
- official/nlp/modeling/layers/cls_head.py +1 -1
- official/nlp/modeling/layers/cls_head_test.py +1 -1
- official/nlp/modeling/layers/factorized_embedding.py +1 -1
- official/nlp/modeling/layers/factorized_embedding_test.py +1 -1
- official/nlp/modeling/layers/gated_feedforward.py +2 -2
- official/nlp/modeling/layers/gated_feedforward_test.py +1 -1
- official/nlp/modeling/layers/gaussian_process.py +1 -1
- official/nlp/modeling/layers/gaussian_process_test.py +1 -1
- official/nlp/modeling/layers/kernel_attention.py +1 -1
- official/nlp/modeling/layers/kernel_attention_test.py +1 -1
- official/nlp/modeling/layers/masked_lm.py +1 -1
- official/nlp/modeling/layers/masked_lm_test.py +1 -1
- official/nlp/modeling/layers/masked_softmax.py +1 -1
- official/nlp/modeling/layers/masked_softmax_test.py +1 -1
- official/nlp/modeling/layers/mat_mul_with_margin.py +1 -2
- official/nlp/modeling/layers/mat_mul_with_margin_test.py +1 -1
- official/nlp/modeling/layers/mixing.py +1 -1
- official/nlp/modeling/layers/mixing_test.py +1 -1
- official/nlp/modeling/layers/mobile_bert_layers.py +1 -1
- official/nlp/modeling/layers/mobile_bert_layers_test.py +1 -1
- official/nlp/modeling/layers/moe.py +1 -1
- official/nlp/modeling/layers/moe_test.py +1 -1
- official/nlp/modeling/layers/multi_channel_attention.py +1 -1
- official/nlp/modeling/layers/multi_channel_attention_test.py +1 -1
- official/nlp/modeling/layers/multi_query_attention.py +426 -0
- official/nlp/modeling/layers/multi_query_attention_test.py +415 -0
- official/nlp/modeling/layers/on_device_embedding.py +1 -1
- official/nlp/modeling/layers/on_device_embedding_test.py +1 -1
- official/nlp/modeling/layers/pack_optimization.py +9 -1
- official/nlp/modeling/layers/pack_optimization_test.py +1 -1
- official/nlp/modeling/layers/per_dim_scale_attention.py +1 -1
- official/nlp/modeling/layers/per_dim_scale_attention_test.py +1 -1
- official/nlp/modeling/layers/position_embedding.py +1 -1
- official/nlp/modeling/layers/position_embedding_test.py +1 -1
- official/nlp/modeling/layers/relative_attention.py +1 -1
- official/nlp/modeling/layers/relative_attention_test.py +1 -1
- official/nlp/modeling/layers/reuse_attention.py +1 -1
- official/nlp/modeling/layers/reuse_attention_test.py +1 -1
- official/nlp/modeling/layers/reuse_transformer.py +1 -1
- official/nlp/modeling/layers/reuse_transformer_test.py +1 -1
- official/nlp/modeling/layers/rezero_transformer.py +89 -21
- official/nlp/modeling/layers/rezero_transformer_test.py +64 -1
- official/nlp/modeling/layers/routing.py +1 -1
- official/nlp/modeling/layers/routing_test.py +1 -1
- official/nlp/modeling/layers/self_attention_mask.py +1 -1
- official/nlp/modeling/layers/spectral_normalization.py +1 -1
- official/nlp/modeling/layers/spectral_normalization_test.py +1 -1
- official/nlp/modeling/layers/talking_heads_attention.py +1 -1
- official/nlp/modeling/layers/talking_heads_attention_test.py +1 -1
- official/nlp/modeling/layers/text_layers.py +1 -1
- official/nlp/modeling/layers/text_layers_test.py +1 -1
- official/nlp/modeling/layers/tn_expand_condense.py +1 -1
- official/nlp/modeling/layers/tn_expand_condense_test.py +1 -1
- official/nlp/modeling/layers/tn_transformer_expand_condense.py +1 -3
- official/nlp/modeling/layers/tn_transformer_test.py +1 -1
- official/nlp/modeling/layers/transformer.py +1 -1
- official/nlp/modeling/layers/transformer_encoder_block.py +313 -52
- official/nlp/modeling/layers/transformer_encoder_block_test.py +291 -9
- official/nlp/modeling/layers/transformer_scaffold.py +1 -1
- official/nlp/modeling/layers/transformer_scaffold_test.py +1 -1
- official/nlp/modeling/layers/transformer_test.py +1 -1
- official/nlp/modeling/layers/transformer_xl.py +1 -1
- official/nlp/modeling/layers/transformer_xl_test.py +1 -1
- official/nlp/modeling/layers/util.py +1 -1
- official/nlp/modeling/losses/__init__.py +1 -1
- official/nlp/modeling/losses/weighted_sparse_categorical_crossentropy.py +1 -1
- official/nlp/modeling/losses/weighted_sparse_categorical_crossentropy_test.py +1 -1
- official/nlp/modeling/models/__init__.py +1 -1
- official/nlp/modeling/models/bert_classifier.py +1 -1
- official/nlp/modeling/models/bert_classifier_test.py +1 -1
- official/nlp/modeling/models/bert_pretrainer.py +1 -1
- official/nlp/modeling/models/bert_pretrainer_test.py +1 -1
- official/nlp/modeling/models/bert_span_labeler.py +1 -1
- official/nlp/modeling/models/bert_span_labeler_test.py +1 -1
- official/nlp/modeling/models/bert_token_classifier.py +1 -1
- official/nlp/modeling/models/bert_token_classifier_test.py +1 -1
- official/nlp/modeling/models/dual_encoder.py +1 -1
- official/nlp/modeling/models/dual_encoder_test.py +1 -1
- official/nlp/modeling/models/electra_pretrainer.py +1 -1
- official/nlp/modeling/models/electra_pretrainer_test.py +1 -1
- official/nlp/modeling/models/seq2seq_transformer.py +1 -1
- official/nlp/modeling/models/seq2seq_transformer_test.py +1 -1
- official/nlp/modeling/models/t5.py +1 -1
- official/nlp/modeling/models/t5_test.py +1 -1
- official/nlp/modeling/models/xlnet.py +1 -1
- official/nlp/modeling/models/xlnet_test.py +1 -1
- official/nlp/modeling/networks/__init__.py +1 -1
- official/nlp/modeling/networks/albert_encoder.py +1 -1
- official/nlp/modeling/networks/albert_encoder_test.py +1 -1
- official/nlp/modeling/networks/bert_dense_encoder_test.py +1 -2
- official/nlp/modeling/networks/bert_encoder.py +1 -1
- official/nlp/modeling/networks/bert_encoder_test.py +1 -2
- official/nlp/modeling/networks/classification.py +1 -1
- official/nlp/modeling/networks/classification_test.py +1 -1
- official/nlp/modeling/networks/encoder_scaffold.py +1 -1
- official/nlp/modeling/networks/encoder_scaffold_test.py +1 -1
- official/nlp/modeling/networks/fnet.py +1 -1
- official/nlp/modeling/networks/fnet_test.py +1 -1
- official/nlp/modeling/networks/funnel_transformer.py +1 -1
- official/nlp/modeling/networks/funnel_transformer_test.py +1 -1
- official/nlp/modeling/networks/mobile_bert_encoder.py +6 -4
- official/nlp/modeling/networks/mobile_bert_encoder_test.py +1 -1
- official/nlp/modeling/networks/packed_sequence_embedding.py +1 -1
- official/nlp/modeling/networks/packed_sequence_embedding_test.py +1 -3
- official/nlp/modeling/networks/span_labeling.py +1 -1
- official/nlp/modeling/networks/span_labeling_test.py +1 -1
- official/nlp/modeling/networks/sparse_mixer.py +1 -1
- official/nlp/modeling/networks/sparse_mixer_test.py +1 -1
- official/nlp/modeling/networks/xlnet_base.py +1 -1
- official/nlp/modeling/networks/xlnet_base_test.py +1 -1
- official/nlp/modeling/ops/__init__.py +1 -1
- official/nlp/modeling/ops/beam_search.py +1 -1
- official/nlp/modeling/ops/beam_search_test.py +1 -1
- official/nlp/modeling/ops/decoding_module.py +1 -1
- official/nlp/modeling/ops/decoding_module_test.py +1 -1
- official/nlp/modeling/ops/sampling_module.py +3 -3
- official/nlp/modeling/ops/segment_extractor.py +1 -1
- official/nlp/modeling/ops/segment_extractor_test.py +1 -1
- official/nlp/optimization.py +1 -1
- official/nlp/serving/__init__.py +1 -1
- official/nlp/serving/export_savedmodel.py +1 -1
- official/nlp/serving/export_savedmodel_test.py +1 -1
- official/nlp/serving/export_savedmodel_util.py +1 -1
- official/nlp/serving/serving_modules.py +1 -1
- official/nlp/serving/serving_modules_test.py +1 -1
- official/nlp/tasks/__init__.py +1 -1
- official/nlp/tasks/dual_encoder.py +1 -2
- official/nlp/tasks/dual_encoder_test.py +1 -1
- official/nlp/tasks/electra_task.py +1 -1
- official/nlp/tasks/electra_task_test.py +1 -1
- official/nlp/tasks/masked_lm.py +1 -1
- official/nlp/tasks/masked_lm_determinism_test.py +1 -1
- official/nlp/tasks/masked_lm_test.py +1 -1
- official/nlp/tasks/question_answering.py +1 -1
- official/nlp/tasks/question_answering_test.py +1 -1
- official/nlp/tasks/sentence_prediction.py +1 -1
- official/nlp/tasks/sentence_prediction_test.py +1 -1
- official/nlp/tasks/tagging.py +1 -1
- official/nlp/tasks/tagging_test.py +1 -1
- official/nlp/tasks/translation.py +1 -1
- official/nlp/tasks/translation_test.py +1 -1
- official/nlp/tasks/utils.py +1 -1
- official/nlp/tools/__init__.py +1 -1
- official/nlp/tools/export_tfhub.py +1 -1
- official/nlp/tools/export_tfhub_lib.py +1 -2
- official/nlp/tools/export_tfhub_lib_test.py +1 -1
- official/nlp/tools/squad_evaluate_v1_1.py +1 -1
- official/nlp/tools/squad_evaluate_v2_0.py +1 -1
- official/nlp/tools/tf1_bert_checkpoint_converter_lib.py +1 -1
- official/nlp/tools/tf2_albert_encoder_checkpoint_converter.py +1 -1
- official/nlp/tools/tf2_bert_encoder_checkpoint_converter.py +1 -1
- official/nlp/tools/tokenization.py +1 -1
- official/nlp/tools/tokenization_test.py +1 -1
- official/nlp/train.py +1 -1
- official/projects/__init__.py +1 -1
- official/projects/bigbird/__init__.py +1 -1
- official/projects/bigbird/encoder.py +1 -1
- official/projects/bigbird/encoder_test.py +1 -1
- official/projects/bigbird/experiment_configs.py +1 -1
- official/projects/bigbird/recompute_grad.py +1 -1
- official/projects/bigbird/recomputing_dropout.py +1 -1
- official/projects/bigbird/stateless_dropout.py +1 -1
- official/projects/centernet/__init__.py +1 -1
- official/projects/centernet/common/__init__.py +1 -1
- official/projects/centernet/common/registry_imports.py +1 -1
- official/projects/centernet/configs/__init__.py +1 -1
- official/projects/centernet/configs/backbones.py +1 -1
- official/projects/centernet/configs/centernet.py +1 -1
- official/projects/centernet/configs/centernet_test.py +1 -1
- official/projects/centernet/dataloaders/__init__.py +1 -1
- official/projects/centernet/dataloaders/centernet_input.py +1 -1
- official/projects/centernet/losses/__init__.py +1 -1
- official/projects/centernet/losses/centernet_losses.py +1 -1
- official/projects/centernet/losses/centernet_losses_test.py +1 -1
- official/projects/centernet/modeling/__init__.py +1 -1
- official/projects/centernet/modeling/backbones/__init__.py +1 -1
- official/projects/centernet/modeling/backbones/hourglass.py +1 -1
- official/projects/centernet/modeling/backbones/hourglass_test.py +1 -1
- official/projects/centernet/modeling/centernet_model.py +2 -2
- official/projects/centernet/modeling/centernet_model_test.py +1 -1
- official/projects/centernet/modeling/heads/__init__.py +1 -1
- official/projects/centernet/modeling/heads/centernet_head.py +2 -2
- official/projects/centernet/modeling/heads/centernet_head_test.py +1 -1
- official/projects/centernet/modeling/layers/__init__.py +1 -1
- official/projects/centernet/modeling/layers/cn_nn_blocks.py +1 -1
- official/projects/centernet/modeling/layers/cn_nn_blocks_test.py +1 -1
- official/projects/centernet/modeling/layers/detection_generator.py +1 -1
- official/projects/centernet/modeling/layers/detection_generator_test.py +1 -1
- official/projects/centernet/ops/__init__.py +1 -1
- official/projects/centernet/ops/box_list.py +1 -1
- official/projects/centernet/ops/box_list_ops.py +1 -1
- official/projects/centernet/ops/loss_ops.py +1 -1
- official/projects/centernet/ops/nms_ops.py +1 -1
- official/projects/centernet/ops/preprocess_ops.py +1 -1
- official/projects/centernet/ops/target_assigner.py +1 -1
- official/projects/centernet/ops/target_assigner_test.py +1 -1
- official/projects/centernet/tasks/__init__.py +1 -1
- official/projects/centernet/tasks/centernet.py +1 -1
- official/projects/centernet/train.py +1 -1
- official/projects/centernet/utils/__init__.py +1 -1
- official/projects/centernet/utils/checkpoints/__init__.py +1 -1
- official/projects/centernet/utils/checkpoints/config_classes.py +1 -1
- official/projects/centernet/utils/checkpoints/config_data.py +1 -1
- official/projects/centernet/utils/checkpoints/load_weights.py +1 -1
- official/projects/centernet/utils/checkpoints/read_checkpoints.py +1 -1
- official/projects/centernet/utils/tf2_centernet_checkpoint_converter.py +1 -1
- official/projects/deepmac_maskrcnn/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/common/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/common/registry_imports.py +1 -1
- official/projects/deepmac_maskrcnn/configs/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/configs/deep_mask_head_rcnn.py +1 -1
- official/projects/deepmac_maskrcnn/configs/deep_mask_head_rcnn_config_test.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/hourglass_network.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/instance_heads.py +1 -3
- official/projects/deepmac_maskrcnn/modeling/heads/instance_heads_test.py +1 -2
- official/projects/deepmac_maskrcnn/modeling/maskrcnn_model.py +1 -3
- official/projects/deepmac_maskrcnn/modeling/maskrcnn_model_test.py +1 -3
- official/projects/deepmac_maskrcnn/serving/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/serving/detection.py +1 -1
- official/projects/deepmac_maskrcnn/serving/detection_test.py +1 -1
- official/projects/deepmac_maskrcnn/serving/export_saved_model.py +1 -1
- official/projects/deepmac_maskrcnn/tasks/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/tasks/deep_mask_head_rcnn.py +1 -1
- official/projects/deepmac_maskrcnn/train.py +1 -1
- official/projects/detr/__init__.py +14 -0
- official/projects/detr/configs/__init__.py +14 -0
- official/projects/detr/configs/detr.py +277 -0
- official/projects/detr/configs/detr_test.py +51 -0
- official/projects/detr/dataloaders/__init__.py +14 -0
- official/projects/detr/dataloaders/coco.py +157 -0
- official/projects/detr/dataloaders/coco_test.py +111 -0
- official/projects/detr/dataloaders/detr_input.py +175 -0
- official/projects/detr/experiments/__init__.py +14 -0
- official/projects/detr/modeling/__init__.py +14 -0
- official/projects/detr/modeling/detr.py +345 -0
- official/projects/detr/modeling/detr_test.py +70 -0
- official/projects/detr/modeling/transformer.py +849 -0
- official/projects/detr/modeling/transformer_test.py +263 -0
- official/projects/detr/ops/__init__.py +14 -0
- official/projects/detr/ops/matchers.py +489 -0
- official/projects/detr/ops/matchers_test.py +95 -0
- official/projects/detr/optimization.py +151 -0
- official/projects/detr/serving/__init__.py +14 -0
- official/projects/detr/serving/export_module.py +103 -0
- official/projects/detr/serving/export_module_test.py +98 -0
- official/projects/detr/serving/export_saved_model.py +109 -0
- official/projects/detr/tasks/__init__.py +14 -0
- official/projects/detr/tasks/detection.py +433 -0
- official/projects/detr/tasks/detection_test.py +203 -0
- official/projects/detr/train.py +70 -0
- official/projects/maskconver/__init__.py +14 -0
- official/projects/maskconver/configs/__init__.py +14 -0
- official/projects/maskconver/configs/backbones.py +43 -0
- official/projects/maskconver/configs/decoders.py +36 -0
- official/projects/maskconver/configs/maskconver.py +523 -0
- official/projects/maskconver/configs/multiscale_maskconver.py +215 -0
- official/projects/maskconver/tasks/__init__.py +14 -0
- official/projects/maskconver/tasks/maskconver.py +641 -0
- official/projects/maskconver/tasks/multiscale_maskconver.py +278 -0
- official/projects/maskconver/train.py +30 -0
- official/projects/maxvit/__init__.py +1 -1
- official/projects/maxvit/configs/__init__.py +1 -1
- official/projects/maxvit/configs/backbones.py +1 -1
- official/projects/maxvit/configs/image_classification.py +1 -1
- official/projects/maxvit/configs/image_classification_test.py +1 -1
- official/projects/maxvit/configs/rcnn.py +1 -1
- official/projects/maxvit/configs/rcnn_test.py +1 -1
- official/projects/maxvit/configs/retinanet.py +1 -1
- official/projects/maxvit/configs/retinanet_test.py +1 -1
- official/projects/maxvit/configs/semantic_segmentation.py +1 -1
- official/projects/maxvit/configs/semantic_segmentation_test.py +1 -1
- official/projects/maxvit/modeling/__init__.py +1 -1
- official/projects/maxvit/modeling/common_ops.py +14 -1
- official/projects/maxvit/modeling/layers.py +1 -1
- official/projects/maxvit/modeling/maxvit.py +2 -2
- official/projects/maxvit/modeling/maxvit_test.py +1 -1
- official/projects/maxvit/registry_imports.py +1 -1
- official/projects/maxvit/train.py +1 -1
- official/projects/maxvit/train_test.py +1 -1
- official/projects/mobilebert/__init__.py +1 -1
- official/projects/mobilebert/distillation.py +1 -1
- official/projects/mobilebert/distillation_test.py +1 -1
- official/projects/mobilebert/export_tfhub.py +1 -1
- official/projects/mobilebert/model_utils.py +1 -1
- official/projects/mobilebert/run_distillation.py +1 -1
- official/projects/mobilebert/tf2_model_checkpoint_converter.py +1 -1
- official/projects/mobilebert/utils.py +1 -1
- official/projects/movinet/__init__.py +1 -1
- official/projects/movinet/configs/__init__.py +1 -1
- official/projects/movinet/configs/movinet.py +1 -1
- official/projects/movinet/configs/movinet_test.py +1 -1
- official/projects/movinet/modeling/__init__.py +1 -1
- official/projects/movinet/modeling/movinet.py +1 -1
- official/projects/movinet/modeling/movinet_layers.py +1 -1
- official/projects/movinet/modeling/movinet_layers_test.py +1 -1
- official/projects/movinet/modeling/movinet_model.py +1 -1
- official/projects/movinet/modeling/movinet_model_test.py +1 -1
- official/projects/movinet/modeling/movinet_test.py +1 -1
- official/projects/movinet/tools/__init__.py +1 -1
- official/projects/movinet/tools/convert_3d_2plus1d.py +1 -1
- official/projects/movinet/tools/convert_3d_2plus1d_test.py +1 -1
- official/projects/movinet/tools/export_saved_model.py +1 -1
- official/projects/movinet/tools/export_saved_model_test.py +6 -3
- official/projects/movinet/tools/quantize_movinet.py +1 -1
- official/projects/movinet/train.py +1 -1
- official/projects/movinet/train_test.py +1 -1
- official/projects/nhnet/__init__.py +1 -1
- official/projects/nhnet/configs.py +1 -1
- official/projects/nhnet/configs_test.py +1 -1
- official/projects/nhnet/decoder.py +1 -1
- official/projects/nhnet/decoder_test.py +1 -1
- official/projects/nhnet/evaluation.py +1 -3
- official/projects/nhnet/input_pipeline.py +1 -1
- official/projects/nhnet/models.py +1 -1
- official/projects/nhnet/models_test.py +1 -1
- official/projects/nhnet/optimizer.py +1 -1
- official/projects/nhnet/raw_data_process.py +1 -1
- official/projects/nhnet/raw_data_processor.py +1 -1
- official/projects/nhnet/trainer.py +1 -6
- official/projects/nhnet/trainer_test.py +1 -1
- official/projects/nhnet/utils.py +1 -1
- official/projects/panoptic/__init__.py +1 -1
- official/projects/panoptic/configs/__init__.py +1 -1
- official/projects/panoptic/configs/panoptic_deeplab.py +5 -6
- official/projects/panoptic/configs/panoptic_maskrcnn.py +1 -1
- official/projects/panoptic/tasks/__init__.py +1 -1
- official/projects/panoptic/tasks/panoptic_deeplab.py +1 -1
- official/projects/panoptic/tasks/panoptic_maskrcnn.py +3 -1
- official/projects/panoptic/train.py +1 -1
- official/projects/qat/__init__.py +1 -1
- official/projects/qat/nlp/__init__.py +1 -1
- official/projects/qat/nlp/configs/__init__.py +1 -1
- official/projects/qat/nlp/configs/finetuning_experiments.py +1 -1
- official/projects/qat/nlp/modeling/__init__.py +1 -1
- official/projects/qat/nlp/modeling/layers/__init__.py +1 -1
- official/projects/qat/nlp/modeling/layers/mobile_bert_layers.py +1 -1
- official/projects/qat/nlp/modeling/layers/multi_head_attention.py +1 -1
- official/projects/qat/nlp/modeling/layers/transformer_encoder_block.py +1 -1
- official/projects/qat/nlp/modeling/layers/transformer_encoder_block_test.py +1 -1
- official/projects/qat/nlp/modeling/models/__init__.py +1 -1
- official/projects/qat/nlp/modeling/models/bert_span_labeler.py +1 -1
- official/projects/qat/nlp/modeling/networks/__init__.py +1 -1
- official/projects/qat/nlp/modeling/networks/span_labeling.py +1 -1
- official/projects/qat/nlp/pretrained_checkpoint_converter.py +1 -3
- official/projects/qat/nlp/quantization/__init__.py +1 -1
- official/projects/qat/nlp/quantization/configs.py +1 -1
- official/projects/qat/nlp/quantization/configs_test.py +1 -2
- official/projects/qat/nlp/quantization/helper.py +1 -1
- official/projects/qat/nlp/quantization/schemes.py +1 -3
- official/projects/qat/nlp/quantization/wrappers.py +1 -1
- official/projects/qat/nlp/registry_imports.py +1 -1
- official/projects/qat/nlp/tasks/__init__.py +1 -1
- official/projects/qat/nlp/tasks/question_answering.py +1 -1
- official/projects/qat/nlp/tasks/question_answering_test.py +1 -1
- official/projects/qat/nlp/train.py +1 -1
- official/projects/qat/vision/__init__.py +1 -1
- official/projects/qat/vision/configs/__init__.py +1 -1
- official/projects/qat/vision/configs/common.py +1 -1
- official/projects/qat/vision/configs/image_classification.py +1 -1
- official/projects/qat/vision/configs/image_classification_test.py +1 -1
- official/projects/qat/vision/configs/retinanet.py +1 -1
- official/projects/qat/vision/configs/retinanet_test.py +1 -1
- official/projects/qat/vision/configs/semantic_segmentation.py +1 -1
- official/projects/qat/vision/configs/semantic_segmentation_test.py +1 -1
- official/projects/qat/vision/modeling/__init__.py +1 -1
- official/projects/qat/vision/modeling/factory.py +1 -3
- official/projects/qat/vision/modeling/factory_test.py +1 -3
- official/projects/qat/vision/modeling/heads/__init__.py +1 -1
- official/projects/qat/vision/modeling/heads/dense_prediction_heads.py +1 -3
- official/projects/qat/vision/modeling/heads/dense_prediction_heads_test.py +1 -2
- official/projects/qat/vision/modeling/layers/__init__.py +1 -1
- official/projects/qat/vision/modeling/layers/nn_blocks.py +1 -3
- official/projects/qat/vision/modeling/layers/nn_blocks_test.py +1 -2
- official/projects/qat/vision/modeling/layers/nn_layers.py +2 -2
- official/projects/qat/vision/modeling/layers/nn_layers_test.py +1 -2
- official/projects/qat/vision/modeling/segmentation_model.py +1 -2
- official/projects/qat/vision/n_bit/__init__.py +1 -1
- official/projects/qat/vision/n_bit/configs.py +1 -1
- official/projects/qat/vision/n_bit/configs_test.py +1 -3
- official/projects/qat/vision/n_bit/nn_blocks.py +1 -3
- official/projects/qat/vision/n_bit/nn_blocks_test.py +1 -2
- official/projects/qat/vision/n_bit/nn_layers.py +1 -1
- official/projects/qat/vision/n_bit/schemes.py +1 -3
- official/projects/qat/vision/quantization/__init__.py +1 -1
- official/projects/qat/vision/quantization/configs.py +1 -1
- official/projects/qat/vision/quantization/configs_test.py +1 -3
- official/projects/qat/vision/quantization/helper.py +1 -1
- official/projects/qat/vision/quantization/helper_test.py +1 -1
- official/projects/qat/vision/quantization/layer_transforms.py +1 -1
- official/projects/qat/vision/quantization/schemes.py +1 -3
- official/projects/qat/vision/registry_imports.py +1 -1
- official/projects/qat/vision/serving/__init__.py +1 -1
- official/projects/qat/vision/serving/export_module.py +1 -1
- official/projects/qat/vision/serving/export_saved_model.py +1 -1
- official/projects/qat/vision/serving/export_tflite.py +1 -1
- official/projects/qat/vision/tasks/__init__.py +1 -1
- official/projects/qat/vision/tasks/image_classification.py +1 -1
- official/projects/qat/vision/tasks/image_classification_test.py +1 -1
- official/projects/qat/vision/tasks/retinanet.py +1 -1
- official/projects/qat/vision/tasks/retinanet_test.py +1 -1
- official/projects/qat/vision/tasks/semantic_segmentation.py +1 -1
- official/projects/qat/vision/train.py +1 -1
- official/projects/roformer/__init__.py +1 -1
- official/projects/roformer/roformer.py +1 -1
- official/projects/roformer/roformer_attention.py +1 -1
- official/projects/roformer/roformer_attention_test.py +1 -1
- official/projects/roformer/roformer_encoder.py +1 -1
- official/projects/roformer/roformer_encoder_block.py +1 -1
- official/projects/roformer/roformer_encoder_block_test.py +1 -1
- official/projects/roformer/roformer_encoder_test.py +1 -1
- official/projects/roformer/roformer_experiments.py +1 -1
- official/projects/roformer/train.py +1 -1
- official/projects/teams/__init__.py +1 -1
- official/projects/teams/teams.py +1 -1
- official/projects/teams/teams_experiments.py +1 -1
- official/projects/teams/teams_pretrainer.py +1 -1
- official/projects/teams/teams_pretrainer_test.py +1 -1
- official/projects/teams/teams_task.py +1 -1
- official/projects/teams/teams_task_test.py +1 -1
- official/projects/teams/train.py +1 -1
- official/projects/triviaqa/__init__.py +1 -1
- official/projects/triviaqa/dataset.py +1 -1
- official/projects/triviaqa/download_and_prepare.py +1 -1
- official/projects/triviaqa/evaluate.py +1 -1
- official/projects/triviaqa/evaluation.py +1 -1
- official/projects/triviaqa/inputs.py +1 -1
- official/projects/triviaqa/modeling.py +1 -1
- official/projects/triviaqa/predict.py +1 -1
- official/projects/triviaqa/prediction.py +1 -1
- official/projects/triviaqa/preprocess.py +1 -1
- official/projects/triviaqa/sentencepiece_pb2.py +1 -1
- official/projects/triviaqa/train.py +1 -1
- official/projects/video_ssl/__init__.py +1 -1
- official/projects/video_ssl/configs/__init__.py +1 -1
- official/projects/video_ssl/configs/video_ssl.py +1 -1
- official/projects/video_ssl/configs/video_ssl_test.py +1 -1
- official/projects/video_ssl/dataloaders/__init__.py +1 -1
- official/projects/video_ssl/dataloaders/video_ssl_input.py +1 -1
- official/projects/video_ssl/dataloaders/video_ssl_input_test.py +1 -2
- official/projects/video_ssl/losses/__init__.py +1 -1
- official/projects/video_ssl/losses/losses.py +1 -2
- official/projects/video_ssl/modeling/__init__.py +1 -1
- official/projects/video_ssl/modeling/video_ssl_model.py +1 -3
- official/projects/video_ssl/ops/__init__.py +1 -1
- official/projects/video_ssl/ops/video_ssl_preprocess_ops.py +1 -1
- official/projects/video_ssl/ops/video_ssl_preprocess_ops_test.py +1 -1
- official/projects/video_ssl/tasks/__init__.py +1 -1
- official/projects/video_ssl/tasks/linear_eval.py +1 -1
- official/projects/video_ssl/tasks/pretrain.py +1 -1
- official/projects/video_ssl/tasks/pretrain_test.py +1 -1
- official/projects/video_ssl/train.py +1 -1
- official/projects/volumetric_models/__init__.py +1 -1
- official/projects/volumetric_models/configs/__init__.py +1 -1
- official/projects/volumetric_models/configs/backbones.py +1 -1
- official/projects/volumetric_models/configs/decoders.py +1 -1
- official/projects/volumetric_models/configs/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/configs/semantic_segmentation_3d_test.py +1 -1
- official/projects/volumetric_models/dataloaders/__init__.py +1 -1
- official/projects/volumetric_models/dataloaders/segmentation_input_3d.py +1 -1
- official/projects/volumetric_models/dataloaders/segmentation_input_3d_test.py +1 -1
- official/projects/volumetric_models/evaluation/__init__.py +1 -1
- official/projects/volumetric_models/evaluation/segmentation_metrics.py +1 -1
- official/projects/volumetric_models/evaluation/segmentation_metrics_test.py +1 -1
- official/projects/volumetric_models/losses/__init__.py +1 -1
- official/projects/volumetric_models/losses/segmentation_losses.py +1 -1
- official/projects/volumetric_models/losses/segmentation_losses_test.py +1 -1
- official/projects/volumetric_models/modeling/__init__.py +1 -1
- official/projects/volumetric_models/modeling/backbones/__init__.py +1 -1
- official/projects/volumetric_models/modeling/backbones/unet_3d.py +1 -2
- official/projects/volumetric_models/modeling/backbones/unet_3d_test.py +1 -2
- official/projects/volumetric_models/modeling/decoders/__init__.py +1 -1
- official/projects/volumetric_models/modeling/decoders/factory.py +1 -3
- official/projects/volumetric_models/modeling/decoders/factory_test.py +1 -1
- official/projects/volumetric_models/modeling/decoders/unet_3d_decoder.py +1 -1
- official/projects/volumetric_models/modeling/decoders/unet_3d_decoder_test.py +1 -2
- official/projects/volumetric_models/modeling/factory.py +1 -3
- official/projects/volumetric_models/modeling/factory_test.py +1 -1
- official/projects/volumetric_models/modeling/heads/__init__.py +1 -1
- official/projects/volumetric_models/modeling/heads/segmentation_heads_3d.py +1 -1
- official/projects/volumetric_models/modeling/heads/segmentation_heads_3d_test.py +1 -1
- official/projects/volumetric_models/modeling/nn_blocks_3d.py +2 -3
- official/projects/volumetric_models/modeling/nn_blocks_3d_test.py +1 -2
- official/projects/volumetric_models/modeling/segmentation_model_test.py +1 -1
- official/projects/volumetric_models/registry_imports.py +1 -1
- official/projects/volumetric_models/serving/__init__.py +1 -1
- official/projects/volumetric_models/serving/export_saved_model.py +1 -1
- official/projects/volumetric_models/serving/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/serving/semantic_segmentation_3d_test.py +3 -3
- official/projects/volumetric_models/tasks/__init__.py +1 -1
- official/projects/volumetric_models/tasks/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/tasks/semantic_segmentation_3d_test.py +1 -1
- official/projects/volumetric_models/train.py +1 -1
- official/projects/volumetric_models/train_test.py +1 -1
- official/projects/waste_identification_ml/__init__.py +1 -1
- official/projects/waste_identification_ml/data_generation/__init__.py +1 -1
- official/projects/waste_identification_ml/data_generation/utils.py +1 -1
- official/projects/waste_identification_ml/data_generation/utils_test.py +1 -1
- official/projects/yolo/__init__.py +1 -1
- official/projects/yolo/common/__init__.py +1 -1
- official/projects/yolo/common/registry_imports.py +1 -1
- official/projects/yolo/configs/__init__.py +1 -1
- official/projects/yolo/configs/backbones.py +1 -1
- official/projects/yolo/configs/darknet_classification.py +1 -1
- official/projects/yolo/configs/decoders.py +1 -1
- official/projects/yolo/configs/yolo.py +1 -1
- official/projects/yolo/configs/yolov7.py +17 -1
- official/projects/yolo/dataloaders/__init__.py +1 -1
- official/projects/yolo/dataloaders/classification_input.py +1 -1
- official/projects/yolo/dataloaders/tf_example_decoder.py +1 -1
- official/projects/yolo/dataloaders/yolo_input.py +1 -1
- official/projects/yolo/losses/__init__.py +1 -1
- official/projects/yolo/losses/yolo_loss.py +1 -1
- official/projects/yolo/losses/yolo_loss_test.py +1 -1
- official/projects/yolo/losses/yolov7_loss.py +1 -1
- official/projects/yolo/losses/yolov7_loss_test.py +1 -1
- official/projects/yolo/modeling/__init__.py +1 -1
- official/projects/yolo/modeling/backbones/__init__.py +1 -1
- official/projects/yolo/modeling/backbones/darknet.py +1 -1
- official/projects/yolo/modeling/backbones/darknet_test.py +1 -1
- official/projects/yolo/modeling/backbones/yolov7.py +69 -1
- official/projects/yolo/modeling/backbones/yolov7_test.py +1 -1
- official/projects/yolo/modeling/decoders/__init__.py +1 -1
- official/projects/yolo/modeling/decoders/yolo_decoder.py +1 -1
- official/projects/yolo/modeling/decoders/yolo_decoder_test.py +1 -2
- official/projects/yolo/modeling/decoders/yolov7.py +90 -1
- official/projects/yolo/modeling/decoders/yolov7_test.py +1 -1
- official/projects/yolo/modeling/factory.py +1 -1
- official/projects/yolo/modeling/factory_test.py +1 -1
- official/projects/yolo/modeling/heads/__init__.py +1 -1
- official/projects/yolo/modeling/heads/yolo_head.py +1 -1
- official/projects/yolo/modeling/heads/yolo_head_test.py +1 -2
- official/projects/yolo/modeling/heads/yolov7_head.py +1 -1
- official/projects/yolo/modeling/heads/yolov7_head_test.py +1 -1
- official/projects/yolo/modeling/layers/__init__.py +1 -1
- official/projects/yolo/modeling/layers/detection_generator.py +1 -1
- official/projects/yolo/modeling/layers/detection_generator_test.py +1 -1
- official/projects/yolo/modeling/layers/nn_blocks.py +1 -1
- official/projects/yolo/modeling/layers/nn_blocks_test.py +1 -1
- official/projects/yolo/modeling/yolo_model.py +2 -2
- official/projects/yolo/modeling/yolov7_model.py +2 -2
- official/projects/yolo/ops/__init__.py +1 -1
- official/projects/yolo/ops/anchor.py +1 -1
- official/projects/yolo/ops/box_ops.py +1 -1
- official/projects/yolo/ops/box_ops_test.py +1 -1
- official/projects/yolo/ops/initializer_ops.py +1 -1
- official/projects/yolo/ops/kmeans_anchors.py +1 -1
- official/projects/yolo/ops/kmeans_anchors_test.py +1 -1
- official/projects/yolo/ops/loss_utils.py +1 -1
- official/projects/yolo/ops/math_ops.py +1 -1
- official/projects/yolo/ops/mosaic.py +1 -1
- official/projects/yolo/ops/preprocessing_ops.py +1 -1
- official/projects/yolo/ops/preprocessing_ops_test.py +1 -1
- official/projects/yolo/optimization/__init__.py +1 -1
- official/projects/yolo/optimization/configs/__init__.py +1 -1
- official/projects/yolo/optimization/configs/optimization_config.py +1 -1
- official/projects/yolo/optimization/configs/optimizer_config.py +1 -1
- official/projects/yolo/optimization/optimizer_factory.py +1 -1
- official/projects/yolo/optimization/sgd_torch.py +1 -1
- official/projects/yolo/serving/__init__.py +1 -1
- official/projects/yolo/serving/export_module_factory.py +1 -1
- official/projects/yolo/serving/export_saved_model.py +1 -1
- official/projects/yolo/serving/export_tflite.py +1 -1
- official/projects/yolo/serving/model_fn.py +1 -1
- official/projects/yolo/tasks/__init__.py +1 -1
- official/projects/yolo/tasks/image_classification.py +1 -1
- official/projects/yolo/tasks/task_utils.py +1 -1
- official/projects/yolo/tasks/yolo.py +1 -1
- official/projects/yolo/tasks/yolov7.py +1 -1
- official/projects/yolo/train.py +1 -1
- official/projects/yt8m/__init__.py +1 -1
- official/projects/yt8m/configs/__init__.py +1 -1
- official/projects/yt8m/configs/yt8m.py +1 -1
- official/projects/yt8m/configs/yt8m_test.py +1 -1
- official/projects/yt8m/modeling/__init__.py +1 -1
- official/projects/yt8m/modeling/backbones/__init__.py +1 -1
- official/projects/yt8m/modeling/backbones/dbof.py +1 -1
- official/projects/yt8m/modeling/backbones/dbof_test.py +1 -1
- official/projects/yt8m/modeling/heads/__init__.py +1 -1
- official/projects/yt8m/modeling/heads/logistic.py +1 -1
- official/projects/yt8m/modeling/heads/moe.py +1 -1
- official/projects/yt8m/modeling/nn_layers.py +1 -1
- official/projects/yt8m/modeling/nn_layers_test.py +1 -1
- official/projects/yt8m/modeling/yt8m_model.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_test.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_utils.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_utils_test.py +1 -1
- official/projects/yt8m/tasks/__init__.py +1 -1
- official/projects/yt8m/tasks/yt8m_task.py +1 -1
- official/projects/yt8m/train.py +1 -1
- official/projects/yt8m/train_test.py +1 -1
- official/recommendation/__init__.py +1 -1
- official/recommendation/constants.py +1 -1
- official/recommendation/create_ncf_data.py +1 -2
- official/recommendation/data_pipeline.py +1 -1
- official/recommendation/data_preprocessing.py +1 -1
- official/recommendation/data_test.py +4 -4
- official/recommendation/movielens.py +1 -2
- official/recommendation/ncf_common.py +1 -1
- official/recommendation/ncf_input_pipeline.py +1 -1
- official/recommendation/ncf_keras_main.py +1 -1
- official/recommendation/ncf_test.py +1 -1
- official/recommendation/neumf_model.py +1 -1
- official/recommendation/popen_helper.py +1 -1
- official/recommendation/ranking/__init__.py +1 -1
- official/recommendation/ranking/common.py +1 -1
- official/recommendation/ranking/configs/__init__.py +1 -1
- official/recommendation/ranking/configs/config.py +14 -1
- official/recommendation/ranking/configs/config_test.py +1 -1
- official/recommendation/ranking/data/__init__.py +1 -1
- official/recommendation/ranking/data/data_pipeline.py +9 -2
- official/recommendation/ranking/data/data_pipeline_multi_hot.py +8 -2
- official/recommendation/ranking/data/data_pipeline_multi_hot_test.py +12 -6
- official/recommendation/ranking/data/data_pipeline_test.py +18 -8
- official/recommendation/ranking/task.py +102 -19
- official/recommendation/ranking/task_test.py +1 -1
- official/recommendation/ranking/train.py +1 -1
- official/recommendation/ranking/train_test.py +76 -31
- official/recommendation/stat_utils.py +1 -1
- official/recommendation/uplift/__init__.py +1 -1
- official/recommendation/uplift/keras_test_case.py +1 -1
- official/recommendation/uplift/keys.py +1 -1
- official/recommendation/uplift/layers/__init__.py +1 -1
- official/recommendation/uplift/layers/encoders/__init__.py +1 -1
- official/recommendation/uplift/layers/encoders/concat_features.py +1 -1
- official/recommendation/uplift/layers/encoders/concat_features_test.py +1 -1
- official/recommendation/uplift/layers/heads/__init__.py +1 -1
- official/recommendation/uplift/layers/heads/two_tower_logits_head.py +1 -1
- official/recommendation/uplift/layers/heads/two_tower_logits_head_test.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/__init__.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/base_uplift_networks.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_output_head.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_output_head_test.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_uplift_network.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_uplift_network_test.py +1 -1
- official/recommendation/uplift/losses/__init__.py +1 -1
- official/recommendation/uplift/losses/true_logits_loss.py +1 -1
- official/recommendation/uplift/losses/true_logits_loss_test.py +1 -1
- official/recommendation/uplift/metrics/__init__.py +1 -1
- official/recommendation/uplift/metrics/label_mean.py +1 -1
- official/recommendation/uplift/metrics/label_mean_test.py +1 -1
- official/recommendation/uplift/metrics/label_variance.py +1 -1
- official/recommendation/uplift/metrics/label_variance_test.py +1 -1
- official/recommendation/uplift/metrics/loss_metric.py +1 -1
- official/recommendation/uplift/metrics/loss_metric_test.py +1 -1
- official/recommendation/uplift/metrics/metric_configs.py +1 -1
- official/recommendation/uplift/metrics/poisson_metrics.py +1 -1
- official/recommendation/uplift/metrics/poisson_metrics_test.py +1 -1
- official/recommendation/uplift/metrics/sliced_metric.py +1 -1
- official/recommendation/uplift/metrics/sliced_metric_test.py +1 -1
- official/recommendation/uplift/metrics/treatment_fraction.py +1 -1
- official/recommendation/uplift/metrics/treatment_fraction_test.py +1 -1
- official/recommendation/uplift/metrics/treatment_sliced_metric.py +1 -1
- official/recommendation/uplift/metrics/treatment_sliced_metric_test.py +1 -1
- official/recommendation/uplift/metrics/uplift_mean.py +1 -1
- official/recommendation/uplift/metrics/uplift_mean_test.py +1 -1
- official/recommendation/uplift/metrics/variance.py +1 -1
- official/recommendation/uplift/metrics/variance_test.py +12 -10
- official/recommendation/uplift/models/__init__.py +1 -1
- official/recommendation/uplift/models/two_tower_uplift_model.py +1 -1
- official/recommendation/uplift/models/two_tower_uplift_model_test.py +1 -1
- official/recommendation/uplift/types.py +1 -1
- official/recommendation/uplift/utils.py +3 -3
- official/recommendation/uplift/utils_test.py +1 -1
- official/utils/__init__.py +1 -1
- official/utils/docs/__init__.py +1 -1
- official/utils/docs/build_orbit_api_docs.py +1 -1
- official/utils/docs/build_tfm_api_docs.py +1 -1
- official/utils/flags/__init__.py +1 -1
- official/utils/flags/_base.py +1 -1
- official/utils/flags/_benchmark.py +1 -1
- official/utils/flags/_conventions.py +1 -1
- official/utils/flags/_device.py +1 -1
- official/utils/flags/_distribution.py +1 -1
- official/utils/flags/_misc.py +1 -1
- official/utils/flags/_performance.py +1 -1
- official/utils/flags/core.py +1 -1
- official/utils/flags/flags_test.py +1 -1
- official/utils/hyperparams_flags.py +1 -1
- official/utils/misc/__init__.py +1 -1
- official/utils/misc/keras_utils.py +1 -1
- official/utils/misc/model_helpers.py +1 -1
- official/utils/misc/model_helpers_test.py +3 -3
- official/utils/testing/__init__.py +1 -1
- official/utils/testing/integration.py +1 -1
- official/utils/testing/mock_task.py +1 -1
- official/vision/__init__.py +1 -1
- official/vision/configs/__init__.py +1 -1
- official/vision/configs/backbones.py +3 -1
- official/vision/configs/backbones_3d.py +1 -2
- official/vision/configs/common.py +1 -3
- official/vision/configs/decoders.py +1 -3
- official/vision/configs/image_classification.py +1 -1
- official/vision/configs/image_classification_test.py +1 -1
- official/vision/configs/maskrcnn.py +1 -1
- official/vision/configs/maskrcnn_test.py +1 -1
- official/vision/configs/retinanet.py +2 -1
- official/vision/configs/retinanet_test.py +1 -1
- official/vision/configs/semantic_segmentation.py +7 -8
- official/vision/configs/semantic_segmentation_test.py +1 -1
- official/vision/configs/video_classification.py +1 -1
- official/vision/configs/video_classification_test.py +1 -1
- official/vision/data/__init__.py +1 -1
- official/vision/data/create_coco_tf_record.py +1 -1
- official/vision/data/fake_feature_generator.py +5 -2
- official/vision/data/image_utils.py +1 -1
- official/vision/data/image_utils_test.py +1 -1
- official/vision/data/process_coco_few_shot_json_files.py +1 -1
- official/vision/data/tf_example_builder.py +1 -1
- official/vision/data/tf_example_builder_test.py +1 -1
- official/vision/data/tf_example_feature_key.py +1 -1
- official/vision/data/tfrecord_lib.py +1 -1
- official/vision/data/tfrecord_lib_test.py +1 -1
- official/vision/dataloaders/__init__.py +1 -1
- official/vision/dataloaders/classification_input.py +1 -2
- official/vision/dataloaders/decoder.py +1 -1
- official/vision/dataloaders/input_reader.py +1 -1
- official/vision/dataloaders/input_reader_factory.py +1 -1
- official/vision/dataloaders/maskrcnn_input.py +1 -2
- official/vision/dataloaders/parser.py +1 -1
- official/vision/dataloaders/retinanet_input.py +1 -3
- official/vision/dataloaders/segmentation_input.py +9 -4
- official/vision/dataloaders/tf_example_decoder.py +1 -1
- official/vision/dataloaders/tf_example_decoder_test.py +1 -2
- official/vision/dataloaders/tf_example_label_map_decoder.py +1 -2
- official/vision/dataloaders/tf_example_label_map_decoder_test.py +1 -2
- official/vision/dataloaders/tfds_classification_decoders.py +1 -1
- official/vision/dataloaders/tfds_detection_decoders.py +1 -1
- official/vision/dataloaders/tfds_factory.py +1 -1
- official/vision/dataloaders/tfds_factory_test.py +1 -1
- official/vision/dataloaders/tfds_segmentation_decoders.py +1 -1
- official/vision/dataloaders/tfexample_utils.py +1 -1
- official/vision/dataloaders/utils.py +1 -2
- official/vision/dataloaders/utils_test.py +1 -3
- official/vision/dataloaders/video_input.py +1 -1
- official/vision/dataloaders/video_input_test.py +1 -2
- official/vision/evaluation/__init__.py +1 -1
- official/vision/evaluation/coco_evaluator.py +1 -2
- official/vision/evaluation/coco_utils.py +1 -3
- official/vision/evaluation/coco_utils_test.py +1 -1
- official/vision/evaluation/instance_metrics.py +1 -1
- official/vision/evaluation/instance_metrics_test.py +1 -1
- official/vision/evaluation/iou.py +1 -1
- official/vision/evaluation/iou_test.py +1 -1
- official/vision/evaluation/panoptic_quality.py +1 -1
- official/vision/evaluation/panoptic_quality_evaluator.py +1 -1
- official/vision/evaluation/panoptic_quality_evaluator_test.py +1 -1
- official/vision/evaluation/panoptic_quality_test.py +1 -1
- official/vision/evaluation/segmentation_metrics.py +1 -1
- official/vision/evaluation/segmentation_metrics_test.py +1 -1
- official/vision/evaluation/wod_detection_evaluator.py +1 -1
- official/vision/losses/__init__.py +1 -1
- official/vision/losses/focal_loss.py +1 -1
- official/vision/losses/loss_utils.py +1 -1
- official/vision/losses/maskrcnn_losses.py +1 -2
- official/vision/losses/maskrcnn_losses_test.py +1 -1
- official/vision/losses/retinanet_losses.py +1 -2
- official/vision/losses/segmentation_losses.py +1 -1
- official/vision/losses/segmentation_losses_test.py +1 -1
- official/vision/modeling/__init__.py +1 -1
- official/vision/modeling/backbones/__init__.py +1 -1
- official/vision/modeling/backbones/efficientnet.py +1 -3
- official/vision/modeling/backbones/efficientnet_test.py +1 -2
- official/vision/modeling/backbones/factory.py +1 -3
- official/vision/modeling/backbones/factory_test.py +1 -2
- official/vision/modeling/backbones/mobiledet.py +1 -1
- official/vision/modeling/backbones/mobiledet_test.py +1 -1
- official/vision/modeling/backbones/mobilenet.py +73 -3
- official/vision/modeling/backbones/mobilenet_test.py +12 -3
- official/vision/modeling/backbones/resnet.py +1 -2
- official/vision/modeling/backbones/resnet_3d.py +1 -2
- official/vision/modeling/backbones/resnet_3d_test.py +1 -2
- official/vision/modeling/backbones/resnet_deeplab.py +5 -4
- official/vision/modeling/backbones/resnet_deeplab_test.py +21 -10
- official/vision/modeling/backbones/resnet_test.py +1 -2
- official/vision/modeling/backbones/resnet_unet.py +1 -2
- official/vision/modeling/backbones/resnet_unet_test.py +1 -3
- official/vision/modeling/backbones/revnet.py +1 -2
- official/vision/modeling/backbones/revnet_test.py +1 -2
- official/vision/modeling/backbones/spinenet.py +1 -3
- official/vision/modeling/backbones/spinenet_mobile.py +1 -3
- official/vision/modeling/backbones/spinenet_mobile_test.py +1 -2
- official/vision/modeling/backbones/spinenet_test.py +1 -2
- official/vision/modeling/backbones/vit.py +53 -27
- official/vision/modeling/backbones/vit_specs.py +1 -1
- official/vision/modeling/backbones/vit_test.py +12 -1
- official/vision/modeling/classification_model.py +1 -2
- official/vision/modeling/classification_model_test.py +1 -2
- official/vision/modeling/decoders/__init__.py +1 -1
- official/vision/modeling/decoders/aspp.py +1 -3
- official/vision/modeling/decoders/aspp_test.py +1 -2
- official/vision/modeling/decoders/factory.py +1 -3
- official/vision/modeling/decoders/factory_test.py +1 -1
- official/vision/modeling/decoders/fpn.py +1 -2
- official/vision/modeling/decoders/fpn_test.py +1 -2
- official/vision/modeling/decoders/nasfpn.py +1 -3
- official/vision/modeling/decoders/nasfpn_test.py +1 -2
- official/vision/modeling/factory.py +1 -1
- official/vision/modeling/factory_3d.py +1 -2
- official/vision/modeling/factory_test.py +1 -2
- official/vision/modeling/heads/__init__.py +1 -1
- official/vision/modeling/heads/dense_prediction_heads.py +1 -3
- official/vision/modeling/heads/dense_prediction_heads_test.py +1 -3
- official/vision/modeling/heads/instance_heads.py +3 -4
- official/vision/modeling/heads/instance_heads_test.py +1 -2
- official/vision/modeling/heads/segmentation_heads.py +2 -2
- official/vision/modeling/heads/segmentation_heads_test.py +1 -2
- official/vision/modeling/layers/__init__.py +1 -1
- official/vision/modeling/layers/box_sampler.py +1 -2
- official/vision/modeling/layers/deeplab.py +1 -1
- official/vision/modeling/layers/deeplab_test.py +1 -1
- official/vision/modeling/layers/detection_generator.py +1 -3
- official/vision/modeling/layers/detection_generator_test.py +1 -3
- official/vision/modeling/layers/edgetpu.py +1 -1
- official/vision/modeling/layers/edgetpu_test.py +1 -1
- official/vision/modeling/layers/mask_sampler.py +1 -2
- official/vision/modeling/layers/nn_blocks.py +1 -2
- official/vision/modeling/layers/nn_blocks_3d.py +1 -2
- official/vision/modeling/layers/nn_blocks_3d_test.py +1 -2
- official/vision/modeling/layers/nn_blocks_test.py +1 -3
- official/vision/modeling/layers/nn_layers.py +1 -1
- official/vision/modeling/layers/nn_layers_test.py +1 -2
- official/vision/modeling/layers/roi_aligner.py +7 -5
- official/vision/modeling/layers/roi_aligner_test.py +1 -2
- official/vision/modeling/layers/roi_generator.py +1 -2
- official/vision/modeling/layers/roi_sampler.py +1 -2
- official/vision/modeling/maskrcnn_model.py +1 -1
- official/vision/modeling/maskrcnn_model_test.py +1 -2
- official/vision/modeling/models/__init__.py +1 -1
- official/vision/modeling/retinanet_model.py +9 -8
- official/vision/modeling/retinanet_model_test.py +1 -2
- official/vision/modeling/segmentation_model.py +4 -4
- official/vision/modeling/segmentation_model_test.py +1 -1
- official/vision/modeling/video_classification_model.py +1 -1
- official/vision/modeling/video_classification_model_test.py +1 -2
- official/vision/ops/__init__.py +1 -1
- official/vision/ops/anchor.py +1 -3
- official/vision/ops/anchor_generator.py +1 -1
- official/vision/ops/anchor_generator_test.py +1 -1
- official/vision/ops/anchor_test.py +1 -2
- official/vision/ops/augment.py +4 -16
- official/vision/ops/augment_test.py +1 -1
- official/vision/ops/box_matcher.py +1 -1
- official/vision/ops/box_matcher_test.py +1 -1
- official/vision/ops/box_ops.py +1 -2
- official/vision/ops/iou_similarity.py +1 -1
- official/vision/ops/iou_similarity_test.py +1 -1
- official/vision/ops/mask_ops.py +1 -3
- official/vision/ops/mask_ops_test.py +1 -2
- official/vision/ops/nms.py +1 -2
- official/vision/ops/preprocess_ops.py +40 -11
- official/vision/ops/preprocess_ops_3d.py +6 -3
- official/vision/ops/preprocess_ops_3d_test.py +1 -1
- official/vision/ops/preprocess_ops_test.py +13 -7
- official/vision/ops/sampling_ops.py +1 -2
- official/vision/ops/spatial_transform_ops.py +1 -1
- official/vision/ops/target_gather.py +1 -1
- official/vision/ops/target_gather_test.py +1 -1
- official/vision/registry_imports.py +1 -1
- official/vision/serving/__init__.py +1 -1
- official/vision/serving/detection.py +84 -33
- official/vision/serving/detection_test.py +39 -1
- official/vision/serving/export_base.py +1 -1
- official/vision/serving/export_base_v2.py +1 -1
- official/vision/serving/export_base_v2_test.py +1 -1
- official/vision/serving/export_module_factory.py +1 -1
- official/vision/serving/export_module_factory_test.py +1 -1
- official/vision/serving/export_saved_model.py +1 -1
- official/vision/serving/export_saved_model_lib.py +47 -30
- official/vision/serving/export_saved_model_lib_test.py +1 -1
- official/vision/serving/export_saved_model_lib_v2.py +1 -1
- official/vision/serving/export_tfhub.py +1 -2
- official/vision/serving/export_tfhub_lib.py +1 -3
- official/vision/serving/export_tflite.py +1 -1
- official/vision/serving/export_tflite_lib.py +1 -1
- official/vision/serving/export_utils.py +1 -1
- official/vision/serving/image_classification.py +1 -1
- official/vision/serving/image_classification_test.py +1 -1
- official/vision/serving/semantic_segmentation.py +6 -3
- official/vision/serving/semantic_segmentation_test.py +71 -7
- official/vision/serving/video_classification.py +1 -1
- official/vision/serving/video_classification_test.py +1 -1
- official/vision/tasks/__init__.py +1 -1
- official/vision/tasks/image_classification.py +1 -1
- official/vision/tasks/maskrcnn.py +1 -1
- official/vision/tasks/retinanet.py +1 -1
- official/vision/tasks/semantic_segmentation.py +1 -1
- official/vision/tasks/video_classification.py +1 -1
- official/vision/train.py +1 -1
- official/vision/train_spatial_partitioning.py +1 -1
- official/vision/utils/__init__.py +1 -1
- official/vision/utils/object_detection/__init__.py +1 -1
- official/vision/utils/object_detection/argmax_matcher.py +1 -1
- official/vision/utils/object_detection/balanced_positive_negative_sampler.py +1 -1
- official/vision/utils/object_detection/box_coder.py +1 -1
- official/vision/utils/object_detection/box_list.py +1 -1
- official/vision/utils/object_detection/box_list_ops.py +1 -1
- official/vision/utils/object_detection/faster_rcnn_box_coder.py +1 -1
- official/vision/utils/object_detection/matcher.py +1 -1
- official/vision/utils/object_detection/minibatch_sampler.py +1 -1
- official/vision/utils/object_detection/ops.py +1 -1
- official/vision/utils/object_detection/preprocessor.py +1 -1
- official/vision/utils/object_detection/region_similarity_calculator.py +1 -1
- official/vision/utils/object_detection/shape_utils.py +1 -1
- official/vision/utils/object_detection/target_assigner.py +1 -1
- official/vision/utils/object_detection/visualization_utils.py +6 -1
- official/vision/utils/ops_test.py +1 -1
- official/vision/utils/summary_manager.py +1 -1
- orbit/__init__.py +1 -1
- orbit/actions/__init__.py +1 -1
- orbit/actions/conditional_action.py +3 -2
- orbit/actions/conditional_action_test.py +1 -1
- orbit/actions/export_saved_model.py +1 -1
- orbit/actions/export_saved_model_test.py +1 -1
- orbit/actions/new_best_metric.py +2 -2
- orbit/actions/new_best_metric_test.py +2 -2
- orbit/actions/save_checkpoint_if_preempted.py +1 -1
- orbit/controller.py +1 -1
- orbit/controller_test.py +1 -1
- orbit/examples/__init__.py +1 -1
- orbit/examples/single_task/__init__.py +1 -1
- orbit/examples/single_task/single_task_evaluator.py +1 -1
- orbit/examples/single_task/single_task_evaluator_test.py +1 -1
- orbit/examples/single_task/single_task_trainer.py +1 -1
- orbit/examples/single_task/single_task_trainer_test.py +1 -1
- orbit/runner.py +1 -1
- orbit/standard_runner.py +1 -1
- orbit/standard_runner_test.py +1 -1
- orbit/utils/__init__.py +1 -1
- orbit/utils/common.py +1 -1
- orbit/utils/common_test.py +1 -1
- orbit/utils/epoch_helper.py +1 -1
- orbit/utils/loop_fns.py +7 -2
- orbit/utils/summary_manager.py +1 -1
- orbit/utils/summary_manager_interface.py +1 -1
- orbit/utils/tpu_summaries.py +1 -1
- orbit/utils/tpu_summaries_test.py +1 -1
- tensorflow_models/__init__.py +1 -1
- tensorflow_models/nlp/__init__.py +1 -1
- tensorflow_models/tensorflow_models_test.py +1 -1
- tensorflow_models/uplift/__init__.py +1 -1
- tensorflow_models/vision/__init__.py +1 -1
- {tf_models_nightly-2.17.0.dev20240528.dist-info → tf_models_nightly-2.20.0.dev20251205.dist-info}/METADATA +1 -1
- tf_models_nightly-2.20.0.dev20251205.dist-info/RECORD +1256 -0
- tf_models_nightly-2.17.0.dev20240528.dist-info/RECORD +0 -1216
- {tf_models_nightly-2.17.0.dev20240528.dist-info → tf_models_nightly-2.20.0.dev20251205.dist-info}/AUTHORS +0 -0
- {tf_models_nightly-2.17.0.dev20240528.dist-info → tf_models_nightly-2.20.0.dev20251205.dist-info}/LICENSE +0 -0
- {tf_models_nightly-2.17.0.dev20240528.dist-info → tf_models_nightly-2.20.0.dev20251205.dist-info}/WHEEL +0 -0
- {tf_models_nightly-2.17.0.dev20240528.dist-info → tf_models_nightly-2.20.0.dev20251205.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,433 @@
|
|
|
1
|
+
# Copyright 2025 The TensorFlow Authors. All Rights Reserved.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
|
|
15
|
+
"""Tests for block sparse attention layer."""
|
|
16
|
+
|
|
17
|
+
import math
|
|
18
|
+
|
|
19
|
+
from absl.testing import parameterized
|
|
20
|
+
import numpy as np
|
|
21
|
+
import tensorflow as tf, tf_keras
|
|
22
|
+
|
|
23
|
+
from official.nlp.modeling.layers import block_sparse_attention
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
class BlockSparseAttentionTest(tf.test.TestCase, parameterized.TestCase):
|
|
27
|
+
|
|
28
|
+
@parameterized.named_parameters(
|
|
29
|
+
("key_value_same_proj", None, None, [40, 80]),
|
|
30
|
+
("key_value_same_proj_mqa", None, None, [40, 80], False, 1),
|
|
31
|
+
("key_value_same_proj_multi_query_blocks", None, None, [40, 80], True),
|
|
32
|
+
(
|
|
33
|
+
"key_value_same_proj_multi_query_blocks_mqa",
|
|
34
|
+
None,
|
|
35
|
+
None,
|
|
36
|
+
[40, 80],
|
|
37
|
+
True,
|
|
38
|
+
1,
|
|
39
|
+
),
|
|
40
|
+
("key_value_different_proj", 32, 60, [40, 60]),
|
|
41
|
+
("key_value_different_proj_mqa", 32, 60, [40, 60], False, 1),
|
|
42
|
+
("key_value_different_proj_multi_query_blocks", 32, 60, [40, 60], True),
|
|
43
|
+
(
|
|
44
|
+
"key_value_different_proj_multi_query_blocks_mqa",
|
|
45
|
+
32,
|
|
46
|
+
60,
|
|
47
|
+
[40, 60],
|
|
48
|
+
True,
|
|
49
|
+
1,
|
|
50
|
+
),
|
|
51
|
+
)
|
|
52
|
+
def test_non_masked_attention(
|
|
53
|
+
self,
|
|
54
|
+
value_dim,
|
|
55
|
+
output_shape,
|
|
56
|
+
output_dims,
|
|
57
|
+
multi_query_blocks=False,
|
|
58
|
+
num_kv_heads=None,
|
|
59
|
+
):
|
|
60
|
+
"""Test that the attention layer can be created without a mask tensor."""
|
|
61
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
62
|
+
num_heads=12,
|
|
63
|
+
key_dim=64,
|
|
64
|
+
value_dim=value_dim,
|
|
65
|
+
output_shape=output_shape,
|
|
66
|
+
src_block_size=10,
|
|
67
|
+
tgt_block_size=20 if multi_query_blocks else 5,
|
|
68
|
+
num_kv_heads=num_kv_heads,
|
|
69
|
+
)
|
|
70
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
71
|
+
query = tf_keras.Input(shape=(40, 80))
|
|
72
|
+
value = tf_keras.Input(shape=(20, 80))
|
|
73
|
+
output = test_layer(query=query, value=value)
|
|
74
|
+
self.assertEqual(output.shape.as_list(), [None] + output_dims)
|
|
75
|
+
|
|
76
|
+
def test_non_masked_self_attention(self):
|
|
77
|
+
"""Test with one input (self-attention) and no mask tensor."""
|
|
78
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
79
|
+
num_heads=12, key_dim=64, src_block_size=10, tgt_block_size=10
|
|
80
|
+
)
|
|
81
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
82
|
+
query = tf_keras.Input(shape=(40, 80))
|
|
83
|
+
output = test_layer(query, query)
|
|
84
|
+
self.assertEqual(output.shape.as_list(), [None, 40, 80])
|
|
85
|
+
|
|
86
|
+
@parameterized.named_parameters(
|
|
87
|
+
("with_bias", True),
|
|
88
|
+
("with_bias_mqa", True, False, False, 1),
|
|
89
|
+
("with_bias_multi_query_blocks", True, False, True),
|
|
90
|
+
("with_bias_multi_query_blocks_mqa", True, False, True, 1),
|
|
91
|
+
("no_bias", False),
|
|
92
|
+
("no_bias_mqa", False, False, False, 1),
|
|
93
|
+
("no_bias_multi_query_blocks", False, False, True),
|
|
94
|
+
("no_bias_multi_query_blocks_mqa", False, False, True, 1),
|
|
95
|
+
("with_sigmoid_attn", True, True),
|
|
96
|
+
("with_sigmoid_attn_mqa", True, True, False, 1),
|
|
97
|
+
("with_sigmoid_attn_multi_query_blocks", True, True, True),
|
|
98
|
+
("with_sigmoid_attn_multi_query_blocks_mqa", True, True, True, 1),
|
|
99
|
+
)
|
|
100
|
+
def test_masked_attention(
|
|
101
|
+
self,
|
|
102
|
+
use_bias,
|
|
103
|
+
use_sigmoid_attn=False,
|
|
104
|
+
multi_query_blocks=False,
|
|
105
|
+
num_kv_heads=None,
|
|
106
|
+
):
|
|
107
|
+
"""Test with a mask tensor."""
|
|
108
|
+
if use_sigmoid_attn:
|
|
109
|
+
sigmoid_attn_bias = -math.log(2)
|
|
110
|
+
else:
|
|
111
|
+
sigmoid_attn_bias = None
|
|
112
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
113
|
+
num_heads=4,
|
|
114
|
+
key_dim=2,
|
|
115
|
+
use_bias=use_bias,
|
|
116
|
+
src_block_size=2,
|
|
117
|
+
tgt_block_size=2 if multi_query_blocks else 1,
|
|
118
|
+
use_sigmoid_attn=use_sigmoid_attn,
|
|
119
|
+
sigmoid_attn_bias=sigmoid_attn_bias,
|
|
120
|
+
num_kv_heads=num_kv_heads,
|
|
121
|
+
)
|
|
122
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
123
|
+
batch_size = 3
|
|
124
|
+
query = tf_keras.Input(shape=(4, 8))
|
|
125
|
+
value = tf_keras.Input(shape=(2, 8))
|
|
126
|
+
mask_tensor = tf_keras.Input(shape=(4, 2))
|
|
127
|
+
output = test_layer(query=query, value=value, attention_mask=mask_tensor)
|
|
128
|
+
|
|
129
|
+
# Create a model containing the test layer.
|
|
130
|
+
model = tf_keras.Model([query, value, mask_tensor], output)
|
|
131
|
+
|
|
132
|
+
# Generate data for the input (non-mask) tensors.
|
|
133
|
+
from_data = 10 * np.random.random_sample((batch_size, 4, 8))
|
|
134
|
+
to_data = 10 * np.random.random_sample((batch_size, 2, 8))
|
|
135
|
+
|
|
136
|
+
# Invoke the model with a random set of mask data. This should mask at
|
|
137
|
+
# least one element.
|
|
138
|
+
mask_data = np.random.randint(2, size=(batch_size, 4, 2))
|
|
139
|
+
masked_output_data = model.predict([from_data, to_data, mask_data])
|
|
140
|
+
|
|
141
|
+
# Invoke the same data, but with a null mask (where no elements are
|
|
142
|
+
# masked).
|
|
143
|
+
null_mask_data = np.ones((batch_size, 4, 2))
|
|
144
|
+
unmasked_output_data = model.predict([from_data, to_data, null_mask_data])
|
|
145
|
+
|
|
146
|
+
# Because one data is masked and one is not, the outputs should not be
|
|
147
|
+
# the same.
|
|
148
|
+
self.assertNotAllClose(masked_output_data, unmasked_output_data)
|
|
149
|
+
|
|
150
|
+
# Tests the layer with three inputs: Q, K, V.
|
|
151
|
+
key = tf_keras.Input(shape=(2, 8))
|
|
152
|
+
output = test_layer(
|
|
153
|
+
query, value=value, key=key, attention_mask=mask_tensor
|
|
154
|
+
)
|
|
155
|
+
model = tf_keras.Model([query, value, key, mask_tensor], output)
|
|
156
|
+
|
|
157
|
+
masked_output_data = model.predict(
|
|
158
|
+
[from_data, to_data, to_data, mask_data]
|
|
159
|
+
)
|
|
160
|
+
unmasked_output_data = model.predict(
|
|
161
|
+
[from_data, to_data, to_data, null_mask_data]
|
|
162
|
+
)
|
|
163
|
+
# Because one data is masked and one is not, the outputs should not be
|
|
164
|
+
# the same.
|
|
165
|
+
self.assertNotAllClose(masked_output_data, unmasked_output_data)
|
|
166
|
+
|
|
167
|
+
if use_bias:
|
|
168
|
+
self.assertLen(test_layer._query_dense.trainable_variables, 2)
|
|
169
|
+
self.assertLen(test_layer._output_dense.trainable_variables, 2)
|
|
170
|
+
else:
|
|
171
|
+
self.assertLen(test_layer._query_dense.trainable_variables, 1)
|
|
172
|
+
self.assertLen(test_layer._output_dense.trainable_variables, 1)
|
|
173
|
+
|
|
174
|
+
@parameterized.named_parameters(
|
|
175
|
+
("default_with_softmax", False),
|
|
176
|
+
("default_with_sigmoid", True),
|
|
177
|
+
)
|
|
178
|
+
def test_default_masked_attention(
|
|
179
|
+
self,
|
|
180
|
+
use_sigmoid_attn=False,
|
|
181
|
+
):
|
|
182
|
+
"""Test with a mask tensor and block sizes equal to the sequence length."""
|
|
183
|
+
seq_len = 8
|
|
184
|
+
if use_sigmoid_attn:
|
|
185
|
+
sigmoid_attn_bias = -math.log(seq_len)
|
|
186
|
+
else:
|
|
187
|
+
sigmoid_attn_bias = None
|
|
188
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
189
|
+
num_heads=4,
|
|
190
|
+
key_dim=2,
|
|
191
|
+
use_bias=True,
|
|
192
|
+
src_block_size=seq_len,
|
|
193
|
+
tgt_block_size=seq_len,
|
|
194
|
+
use_sigmoid_attn=use_sigmoid_attn,
|
|
195
|
+
sigmoid_attn_bias=sigmoid_attn_bias,
|
|
196
|
+
)
|
|
197
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
198
|
+
batch_size = 3
|
|
199
|
+
query = tf_keras.Input(shape=(seq_len, 8))
|
|
200
|
+
value = tf_keras.Input(shape=(seq_len, 8))
|
|
201
|
+
mask_tensor = tf_keras.Input(shape=(seq_len, seq_len))
|
|
202
|
+
output = test_layer(query=query, value=value, attention_mask=mask_tensor)
|
|
203
|
+
|
|
204
|
+
# Create a model containing the test layer.
|
|
205
|
+
model = tf_keras.Model([query, value, mask_tensor], output)
|
|
206
|
+
|
|
207
|
+
# Generate data for the input (non-mask) tensors.
|
|
208
|
+
from_data = 10 * np.random.random_sample((batch_size, seq_len, 8))
|
|
209
|
+
to_data = 10 * np.random.random_sample((batch_size, seq_len, 8))
|
|
210
|
+
|
|
211
|
+
# Invoke the model with a random set of mask data. This should mask at
|
|
212
|
+
# least one element.
|
|
213
|
+
mask_data = np.random.randint(2, size=(batch_size, seq_len, seq_len))
|
|
214
|
+
masked_output_data = model.predict([from_data, to_data, mask_data])
|
|
215
|
+
|
|
216
|
+
# Invoke the same data, but with a null mask (where no elements are
|
|
217
|
+
# masked).
|
|
218
|
+
null_mask_data = np.ones((batch_size, seq_len, seq_len))
|
|
219
|
+
unmasked_output_data = model.predict([from_data, to_data, null_mask_data])
|
|
220
|
+
|
|
221
|
+
# Because one data is masked and one is not, the outputs should not be
|
|
222
|
+
# the same.
|
|
223
|
+
self.assertNotAllClose(masked_output_data, unmasked_output_data)
|
|
224
|
+
|
|
225
|
+
# Tests the layer with three inputs: Q, K, V.
|
|
226
|
+
key = tf_keras.Input(shape=(seq_len, 8))
|
|
227
|
+
output = test_layer(
|
|
228
|
+
query, value=value, key=key, attention_mask=mask_tensor
|
|
229
|
+
)
|
|
230
|
+
model = tf_keras.Model([query, value, key, mask_tensor], output)
|
|
231
|
+
|
|
232
|
+
masked_output_data = model.predict(
|
|
233
|
+
[from_data, to_data, to_data, mask_data]
|
|
234
|
+
)
|
|
235
|
+
unmasked_output_data = model.predict(
|
|
236
|
+
[from_data, to_data, to_data, null_mask_data]
|
|
237
|
+
)
|
|
238
|
+
# Because one data is masked and one is not, the outputs should not be
|
|
239
|
+
# the same.
|
|
240
|
+
self.assertNotAllClose(masked_output_data, unmasked_output_data)
|
|
241
|
+
|
|
242
|
+
self.assertLen(test_layer._query_dense.trainable_variables, 2)
|
|
243
|
+
self.assertLen(test_layer._output_dense.trainable_variables, 2)
|
|
244
|
+
|
|
245
|
+
def test_masked_attention_with_scores(self):
|
|
246
|
+
"""Test with a mask tensor and returned attention scores."""
|
|
247
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
248
|
+
num_heads=4, key_dim=2, src_block_size=2, tgt_block_size=1,
|
|
249
|
+
)
|
|
250
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
251
|
+
batch_size = 3
|
|
252
|
+
query = tf_keras.Input(shape=(4, 8))
|
|
253
|
+
value = tf_keras.Input(shape=(2, 8))
|
|
254
|
+
mask_tensor = tf_keras.Input(shape=(4, 2))
|
|
255
|
+
output = test_layer(query=query, value=value, attention_mask=mask_tensor)
|
|
256
|
+
|
|
257
|
+
# Create a model containing the test layer.
|
|
258
|
+
model = tf_keras.Model([query, value, mask_tensor], output)
|
|
259
|
+
|
|
260
|
+
# Generate data for the input (non-mask) tensors.
|
|
261
|
+
from_data = 10 * np.random.random_sample((batch_size, 4, 8))
|
|
262
|
+
to_data = 10 * np.random.random_sample((batch_size, 2, 8))
|
|
263
|
+
|
|
264
|
+
# Invoke the model with a random set of mask data. This should mask at
|
|
265
|
+
# least one element.
|
|
266
|
+
mask_data = np.random.randint(2, size=(batch_size, 4, 2))
|
|
267
|
+
masked_output_data = model.predict([from_data, to_data, mask_data])
|
|
268
|
+
|
|
269
|
+
# Invoke the same data, but with a null mask (where no elements are
|
|
270
|
+
# masked).
|
|
271
|
+
null_mask_data = np.ones((batch_size, 4, 2))
|
|
272
|
+
unmasked_output_data = model.predict([from_data, to_data, null_mask_data])
|
|
273
|
+
|
|
274
|
+
# Because one data is masked and one is not, the outputs should not be
|
|
275
|
+
# the same.
|
|
276
|
+
self.assertNotAllClose(masked_output_data, unmasked_output_data)
|
|
277
|
+
|
|
278
|
+
# Create a model containing attention scores.
|
|
279
|
+
output, scores = test_layer(
|
|
280
|
+
query=query,
|
|
281
|
+
value=value,
|
|
282
|
+
attention_mask=mask_tensor,
|
|
283
|
+
return_attention_scores=True,
|
|
284
|
+
)
|
|
285
|
+
model = tf_keras.Model([query, value, mask_tensor], [output, scores])
|
|
286
|
+
masked_output_data_score, masked_score = model.predict(
|
|
287
|
+
[from_data, to_data, mask_data]
|
|
288
|
+
)
|
|
289
|
+
unmasked_output_data_score, unmasked_score = model.predict(
|
|
290
|
+
[from_data, to_data, null_mask_data]
|
|
291
|
+
)
|
|
292
|
+
self.assertNotAllClose(masked_output_data_score, unmasked_output_data_score)
|
|
293
|
+
self.assertAllClose(masked_output_data, masked_output_data_score)
|
|
294
|
+
self.assertAllClose(unmasked_output_data, unmasked_output_data_score)
|
|
295
|
+
self.assertNotAllClose(masked_score, unmasked_score)
|
|
296
|
+
|
|
297
|
+
def test_initializer(self):
|
|
298
|
+
"""Test with a specified initializer."""
|
|
299
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
300
|
+
num_heads=12,
|
|
301
|
+
key_dim=64,
|
|
302
|
+
src_block_size=10,
|
|
303
|
+
kernel_initializer=tf_keras.initializers.TruncatedNormal(stddev=0.02),
|
|
304
|
+
)
|
|
305
|
+
# Create a 3-dimensional input (the first dimension is implicit).
|
|
306
|
+
query = tf_keras.Input(shape=(40, 80))
|
|
307
|
+
output = test_layer(query, query)
|
|
308
|
+
self.assertEqual(output.shape.as_list(), [None, 40, 80])
|
|
309
|
+
|
|
310
|
+
# Make sure the sub layers have different kernel init value, and not
|
|
311
|
+
# reusing the initializers.
|
|
312
|
+
self.assertNotAllClose(
|
|
313
|
+
tf_keras.backend.eval(test_layer._query_dense.kernel),
|
|
314
|
+
tf_keras.backend.eval(test_layer._key_dense.kernel),
|
|
315
|
+
)
|
|
316
|
+
self.assertNotAllClose(
|
|
317
|
+
tf_keras.backend.eval(test_layer._query_dense.kernel),
|
|
318
|
+
tf_keras.backend.eval(test_layer._value_dense.kernel),
|
|
319
|
+
)
|
|
320
|
+
self.assertNotAllClose(
|
|
321
|
+
tf_keras.backend.eval(test_layer._query_dense.kernel),
|
|
322
|
+
tf_keras.backend.eval(test_layer._output_dense.kernel),
|
|
323
|
+
)
|
|
324
|
+
|
|
325
|
+
@parameterized.named_parameters(
|
|
326
|
+
("bfloat16", tf.bfloat16),
|
|
327
|
+
("float16", tf.float16),
|
|
328
|
+
("float32", tf.float32),
|
|
329
|
+
("float64", tf.float64),
|
|
330
|
+
)
|
|
331
|
+
def test_sublayer_dtypes(self, dtype):
|
|
332
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
333
|
+
num_heads=12, key_dim=64, src_block_size=10, dtype=dtype
|
|
334
|
+
)
|
|
335
|
+
|
|
336
|
+
query = tf_keras.Input(shape=(40, 80), dtype=dtype)
|
|
337
|
+
# Build the layer
|
|
338
|
+
test_layer(query=query, value=query)
|
|
339
|
+
|
|
340
|
+
self.assertEqual(test_layer._query_dense.dtype, dtype)
|
|
341
|
+
self.assertEqual(test_layer._key_dense.dtype, dtype)
|
|
342
|
+
self.assertEqual(test_layer._value_dense.dtype, dtype)
|
|
343
|
+
self.assertEqual(test_layer._output_dense.dtype, dtype)
|
|
344
|
+
|
|
345
|
+
def test_dropout(self):
|
|
346
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
347
|
+
num_heads=2, key_dim=2, dropout=0.5, src_block_size=2, tgt_block_size=1,
|
|
348
|
+
)
|
|
349
|
+
|
|
350
|
+
# Generate data for the input (non-mask) tensors.
|
|
351
|
+
from_data = tf_keras.backend.ones(shape=(32, 4, 8))
|
|
352
|
+
to_data = tf_keras.backend.ones(shape=(32, 2, 8))
|
|
353
|
+
train_out = test_layer(from_data, to_data, None, None, None, True)
|
|
354
|
+
test_out = test_layer(from_data, to_data, None, None, None, False)
|
|
355
|
+
|
|
356
|
+
# Output should be close when not in training mode,
|
|
357
|
+
# and should not be close when enabling dropout in training mode.
|
|
358
|
+
self.assertNotAllClose(
|
|
359
|
+
tf_keras.backend.eval(train_out), tf_keras.backend.eval(test_out)
|
|
360
|
+
)
|
|
361
|
+
|
|
362
|
+
def test_query_mask_progagation(self):
|
|
363
|
+
"""Test automatic propagation of the query's mask."""
|
|
364
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
365
|
+
num_heads=2,
|
|
366
|
+
key_dim=2,
|
|
367
|
+
src_block_size=2,
|
|
368
|
+
tgt_block_size=1,
|
|
369
|
+
)
|
|
370
|
+
self.assertTrue(test_layer.supports_masking)
|
|
371
|
+
query = tf.constant(
|
|
372
|
+
[[1, 2, 3, 0, 0, 0], [3, 3, 1, 1, 2, 0], [1, 1, 0, 0, 0, 0]]
|
|
373
|
+
)
|
|
374
|
+
masked_query = tf_keras.layers.Embedding(4, 8, mask_zero=True)(query)
|
|
375
|
+
value = tf.random.normal((3, 3, 8))
|
|
376
|
+
output = test_layer(query=masked_query, value=value)
|
|
377
|
+
self.assertTrue(hasattr(output, "_keras_mask"))
|
|
378
|
+
self.assertAllEqual(masked_query._keras_mask, output._keras_mask)
|
|
379
|
+
|
|
380
|
+
def test_value_mask(self):
|
|
381
|
+
"""Test that the value mask is taken into account."""
|
|
382
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
383
|
+
num_heads=2,
|
|
384
|
+
key_dim=2,
|
|
385
|
+
src_block_size=2,
|
|
386
|
+
tgt_block_size=1,
|
|
387
|
+
)
|
|
388
|
+
query = tf.constant(
|
|
389
|
+
[[1, 2, 3, 0, 0, 0], [3, 3, 1, 1, 2, 0], [1, 1, 0, 0, 0, 0]]
|
|
390
|
+
)
|
|
391
|
+
masked_query = tf_keras.layers.Embedding(4, 8, mask_zero=True)(query)
|
|
392
|
+
value = tf.constant([[5, 4, 0], [3, 0, 0], [2, 1, 1]])
|
|
393
|
+
masked_value = tf_keras.layers.Embedding(6, 8, mask_zero=True)(value)
|
|
394
|
+
output = test_layer(
|
|
395
|
+
query=masked_query,
|
|
396
|
+
value=masked_value,
|
|
397
|
+
)
|
|
398
|
+
mask = tf.constant(
|
|
399
|
+
[[[True, True, False]] * 3 + [[False, False, False]] * 2]
|
|
400
|
+
+ [[[True, False, False]] * 5]
|
|
401
|
+
+ [[[True, True, True]] + [[False, False, False]] * 4]
|
|
402
|
+
)
|
|
403
|
+
del masked_query._keras_mask
|
|
404
|
+
del masked_value._keras_mask
|
|
405
|
+
output_with_manual_mask = test_layer(
|
|
406
|
+
query=masked_query, value=masked_value, attention_mask=mask
|
|
407
|
+
)
|
|
408
|
+
self.assertAllClose(output, output_with_manual_mask)
|
|
409
|
+
|
|
410
|
+
def test_masks_are_cast_to_bool(self):
|
|
411
|
+
"""Test that the implicit and explicit masks are cast to bool."""
|
|
412
|
+
test_layer = block_sparse_attention.MultiHeadAttention(
|
|
413
|
+
num_heads=2, key_dim=2, src_block_size=2, tgt_block_size=1,
|
|
414
|
+
)
|
|
415
|
+
query = np.array(
|
|
416
|
+
[[1, 2, 3, 0, 0, 0], [3, 3, 1, 1, 2, 0], [1, 1, 0, 0, 0, 0]]
|
|
417
|
+
)
|
|
418
|
+
masked_query = tf_keras.layers.Embedding(4, 8, mask_zero=True)(query)
|
|
419
|
+
masked_query._keras_mask = tf.cast(masked_query._keras_mask, tf.float32)
|
|
420
|
+
value = np.array([[5, 4, 0], [3, 0, 0], [2, 1, 1]])
|
|
421
|
+
masked_value = tf_keras.layers.Embedding(6, 8, mask_zero=True)(value)
|
|
422
|
+
masked_value._keras_mask = tf.cast(masked_value._keras_mask, tf.float32)
|
|
423
|
+
float_mask = tf.constant([[[1.0]]])
|
|
424
|
+
# if all works well, the following should not raise any exception:
|
|
425
|
+
_ = test_layer(
|
|
426
|
+
query=masked_query,
|
|
427
|
+
value=masked_value,
|
|
428
|
+
attention_mask=float_mask,
|
|
429
|
+
)
|
|
430
|
+
|
|
431
|
+
|
|
432
|
+
if __name__ == "__main__":
|
|
433
|
+
tf.test.main()
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# Copyright
|
|
1
|
+
# Copyright 2025 The TensorFlow Authors. All Rights Reserved.
|
|
2
2
|
#
|
|
3
3
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
4
|
# you may not use this file except in compliance with the License.
|
|
@@ -37,7 +37,7 @@ class GatedFeedforward(tf_keras.layers.Layer):
|
|
|
37
37
|
dropout: Dropout probability for the output dropout.
|
|
38
38
|
use_gate: Whether to use gated linear units. If True, assuming `GELU` as the
|
|
39
39
|
activation and omitting bias, will apply
|
|
40
|
-
`GEGLU(x, W, V, W_2) = (
|
|
40
|
+
`GEGLU(x, W, V, W_2) = (GELU(xW) * xV)W_2`; if False, will follow
|
|
41
41
|
"Attention Is All You Need" (https://arxiv.org/abs/1706.03762) paper and
|
|
42
42
|
apply `FFN(x, W_1, W_2) = GELU(xW_1)W_2`.
|
|
43
43
|
num_blocks: The number of feedforward blocks to stack. Each block contains a
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# Copyright
|
|
1
|
+
# Copyright 2025 The TensorFlow Authors. All Rights Reserved.
|
|
2
2
|
#
|
|
3
3
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
4
|
# you may not use this file except in compliance with the License.
|
|
@@ -16,7 +16,6 @@
|
|
|
16
16
|
# pylint: disable=g-classes-have-attributes
|
|
17
17
|
|
|
18
18
|
from typing import Tuple
|
|
19
|
-
# Import libraries
|
|
20
19
|
import tensorflow as tf, tf_keras
|
|
21
20
|
|
|
22
21
|
from official.modeling import tf_utils
|