tf-models-nightly 2.17.0.dev20240617__py2.py3-none-any.whl → 2.20.0.dev20251220__py2.py3-none-any.whl
This diff shows the changes between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between the package versions as they appear in their respective public registries.
- official/__init__.py +1 -1
- official/common/__init__.py +1 -1
- official/common/dataset_fn.py +1 -1
- official/common/distribute_utils.py +27 -3
- official/common/distribute_utils_test.py +13 -12
- official/common/flags.py +24 -6
- official/common/registry_imports.py +1 -1
- official/common/streamz_counters.py +1 -1
- official/core/__init__.py +1 -1
- official/core/actions.py +1 -1
- official/core/actions_test.py +1 -1
- official/core/base_task.py +1 -1
- official/core/base_trainer.py +1 -1
- official/core/base_trainer_test.py +1 -1
- official/core/config_definitions.py +1 -1
- official/core/exp_factory.py +1 -1
- official/core/export_base.py +1 -1
- official/core/export_base_test.py +1 -1
- official/core/file_writers.py +1 -1
- official/core/file_writers_test.py +1 -1
- official/core/input_reader.py +1 -1
- official/core/registry.py +1 -1
- official/core/registry_test.py +1 -1
- official/core/savedmodel_checkpoint_manager.py +1 -1
- official/core/savedmodel_checkpoint_manager_test.py +1 -1
- official/core/task_factory.py +1 -1
- official/core/test_utils.py +1 -1
- official/core/tf_example_builder.py +1 -1
- official/core/tf_example_builder_test.py +1 -1
- official/core/tf_example_feature_key.py +1 -1
- official/core/tf_example_feature_key_test.py +1 -1
- official/core/train_lib.py +1 -3
- official/core/train_lib_test.py +1 -1
- official/core/train_utils.py +1 -1
- official/core/train_utils_test.py +1 -1
- official/legacy/__init__.py +1 -1
- official/legacy/albert/__init__.py +1 -1
- official/legacy/albert/configs.py +1 -1
- official/legacy/bert/__init__.py +1 -1
- official/legacy/bert/bert_models.py +1 -1
- official/legacy/bert/bert_models_test.py +1 -1
- official/legacy/bert/common_flags.py +1 -1
- official/legacy/bert/configs.py +1 -1
- official/legacy/bert/export_tfhub.py +1 -2
- official/legacy/bert/export_tfhub_test.py +1 -1
- official/legacy/bert/input_pipeline.py +1 -1
- official/legacy/bert/model_saving_utils.py +1 -1
- official/legacy/bert/model_training_utils.py +1 -1
- official/legacy/bert/model_training_utils_test.py +1 -1
- official/legacy/bert/run_classifier.py +1 -2
- official/legacy/bert/run_pretraining.py +1 -2
- official/legacy/bert/run_squad.py +1 -2
- official/legacy/bert/run_squad_helper.py +1 -1
- official/legacy/bert/serving.py +1 -1
- official/legacy/detection/__init__.py +1 -1
- official/legacy/detection/configs/__init__.py +1 -1
- official/legacy/detection/configs/base_config.py +1 -1
- official/legacy/detection/configs/factory.py +1 -1
- official/legacy/detection/configs/maskrcnn_config.py +1 -1
- official/legacy/detection/configs/olnmask_config.py +1 -1
- official/legacy/detection/configs/retinanet_config.py +1 -1
- official/legacy/detection/configs/shapemask_config.py +1 -1
- official/legacy/detection/dataloader/__init__.py +1 -1
- official/legacy/detection/dataloader/anchor.py +1 -1
- official/legacy/detection/dataloader/factory.py +1 -1
- official/legacy/detection/dataloader/input_reader.py +1 -1
- official/legacy/detection/dataloader/maskrcnn_parser.py +1 -1
- official/legacy/detection/dataloader/mode_keys.py +1 -1
- official/legacy/detection/dataloader/olnmask_parser.py +1 -1
- official/legacy/detection/dataloader/retinanet_parser.py +1 -1
- official/legacy/detection/dataloader/shapemask_parser.py +1 -1
- official/legacy/detection/dataloader/tf_example_decoder.py +1 -1
- official/legacy/detection/evaluation/__init__.py +1 -1
- official/legacy/detection/evaluation/coco_evaluator.py +1 -1
- official/legacy/detection/evaluation/coco_utils.py +1 -1
- official/legacy/detection/evaluation/factory.py +1 -1
- official/legacy/detection/executor/__init__.py +1 -1
- official/legacy/detection/executor/detection_executor.py +1 -1
- official/legacy/detection/executor/distributed_executor.py +1 -1
- official/legacy/detection/main.py +1 -1
- official/legacy/detection/modeling/__init__.py +1 -1
- official/legacy/detection/modeling/architecture/__init__.py +1 -1
- official/legacy/detection/modeling/architecture/factory.py +1 -1
- official/legacy/detection/modeling/architecture/fpn.py +1 -1
- official/legacy/detection/modeling/architecture/heads.py +1 -1
- official/legacy/detection/modeling/architecture/identity.py +1 -1
- official/legacy/detection/modeling/architecture/nn_blocks.py +1 -1
- official/legacy/detection/modeling/architecture/nn_ops.py +1 -1
- official/legacy/detection/modeling/architecture/resnet.py +1 -1
- official/legacy/detection/modeling/architecture/spinenet.py +1 -1
- official/legacy/detection/modeling/base_model.py +1 -1
- official/legacy/detection/modeling/checkpoint_utils.py +1 -1
- official/legacy/detection/modeling/factory.py +1 -1
- official/legacy/detection/modeling/learning_rates.py +1 -1
- official/legacy/detection/modeling/losses.py +1 -1
- official/legacy/detection/modeling/maskrcnn_model.py +1 -1
- official/legacy/detection/modeling/olnmask_model.py +1 -1
- official/legacy/detection/modeling/optimizers.py +1 -1
- official/legacy/detection/modeling/retinanet_model.py +1 -1
- official/legacy/detection/modeling/shapemask_model.py +1 -1
- official/legacy/detection/ops/__init__.py +1 -1
- official/legacy/detection/ops/nms.py +1 -1
- official/legacy/detection/ops/postprocess_ops.py +1 -1
- official/legacy/detection/ops/roi_ops.py +1 -1
- official/legacy/detection/ops/spatial_transform_ops.py +1 -1
- official/legacy/detection/ops/target_ops.py +1 -1
- official/legacy/detection/utils/__init__.py +1 -1
- official/legacy/detection/utils/box_utils.py +1 -1
- official/legacy/detection/utils/class_utils.py +1 -1
- official/legacy/detection/utils/dataloader_utils.py +1 -1
- official/legacy/detection/utils/input_utils.py +1 -1
- official/legacy/detection/utils/mask_utils.py +1 -1
- official/legacy/image_classification/__init__.py +1 -1
- official/legacy/image_classification/augment.py +1 -1
- official/legacy/image_classification/augment_test.py +1 -1
- official/legacy/image_classification/callbacks.py +1 -1
- official/legacy/image_classification/classifier_trainer.py +1 -1
- official/legacy/image_classification/classifier_trainer_test.py +1 -1
- official/legacy/image_classification/classifier_trainer_util_test.py +1 -1
- official/legacy/image_classification/configs/__init__.py +1 -1
- official/legacy/image_classification/configs/base_configs.py +1 -1
- official/legacy/image_classification/configs/configs.py +1 -1
- official/legacy/image_classification/dataset_factory.py +1 -1
- official/legacy/image_classification/efficientnet/__init__.py +1 -1
- official/legacy/image_classification/efficientnet/common_modules.py +1 -1
- official/legacy/image_classification/efficientnet/efficientnet_config.py +1 -1
- official/legacy/image_classification/efficientnet/efficientnet_model.py +1 -1
- official/legacy/image_classification/efficientnet/tfhub_export.py +1 -1
- official/legacy/image_classification/learning_rate.py +1 -1
- official/legacy/image_classification/learning_rate_test.py +1 -1
- official/legacy/image_classification/mnist_main.py +1 -2
- official/legacy/image_classification/mnist_test.py +1 -1
- official/legacy/image_classification/optimizer_factory.py +1 -1
- official/legacy/image_classification/optimizer_factory_test.py +1 -1
- official/legacy/image_classification/preprocessing.py +1 -1
- official/legacy/image_classification/resnet/__init__.py +1 -1
- official/legacy/image_classification/resnet/common.py +1 -1
- official/legacy/image_classification/resnet/imagenet_preprocessing.py +1 -1
- official/legacy/image_classification/resnet/resnet_config.py +1 -1
- official/legacy/image_classification/resnet/resnet_ctl_imagenet_main.py +1 -2
- official/legacy/image_classification/resnet/resnet_model.py +1 -1
- official/legacy/image_classification/resnet/resnet_runnable.py +1 -1
- official/legacy/image_classification/resnet/tfhub_export.py +1 -2
- official/legacy/image_classification/test_utils.py +1 -1
- official/legacy/image_classification/vgg/__init__.py +1 -1
- official/legacy/image_classification/vgg/vgg_config.py +1 -1
- official/legacy/image_classification/vgg/vgg_model.py +1 -1
- official/legacy/transformer/__init__.py +1 -1
- official/legacy/transformer/attention_layer.py +1 -1
- official/legacy/transformer/beam_search_v1.py +1 -1
- official/legacy/transformer/compute_bleu.py +1 -1
- official/legacy/transformer/compute_bleu_test.py +1 -1
- official/legacy/transformer/data_download.py +1 -1
- official/legacy/transformer/data_pipeline.py +1 -1
- official/legacy/transformer/embedding_layer.py +1 -1
- official/legacy/transformer/ffn_layer.py +1 -1
- official/legacy/transformer/metrics.py +1 -1
- official/legacy/transformer/misc.py +1 -1
- official/legacy/transformer/model_params.py +1 -1
- official/legacy/transformer/model_utils.py +1 -1
- official/legacy/transformer/model_utils_test.py +1 -1
- official/legacy/transformer/optimizer.py +1 -1
- official/legacy/transformer/transformer.py +1 -1
- official/legacy/transformer/transformer_forward_test.py +1 -1
- official/legacy/transformer/transformer_layers_test.py +1 -1
- official/legacy/transformer/transformer_main.py +1 -5
- official/legacy/transformer/transformer_main_test.py +1 -1
- official/legacy/transformer/transformer_test.py +1 -1
- official/legacy/transformer/translate.py +1 -2
- official/legacy/transformer/utils/__init__.py +1 -1
- official/legacy/transformer/utils/metrics.py +1 -1
- official/legacy/transformer/utils/tokenizer.py +1 -1
- official/legacy/transformer/utils/tokenizer_test.py +1 -1
- official/legacy/xlnet/__init__.py +1 -1
- official/legacy/xlnet/classifier_utils.py +1 -1
- official/legacy/xlnet/common_flags.py +1 -1
- official/legacy/xlnet/data_utils.py +1 -1
- official/legacy/xlnet/optimization.py +1 -1
- official/legacy/xlnet/preprocess_classification_data.py +1 -2
- official/legacy/xlnet/preprocess_pretrain_data.py +1 -2
- official/legacy/xlnet/preprocess_squad_data.py +1 -2
- official/legacy/xlnet/preprocess_utils.py +1 -1
- official/legacy/xlnet/run_classifier.py +1 -2
- official/legacy/xlnet/run_pretrain.py +1 -2
- official/legacy/xlnet/run_squad.py +1 -2
- official/legacy/xlnet/squad_utils.py +1 -1
- official/legacy/xlnet/training_utils.py +1 -1
- official/legacy/xlnet/xlnet_config.py +1 -1
- official/legacy/xlnet/xlnet_modeling.py +1 -1
- official/modeling/__init__.py +1 -1
- official/modeling/activations/__init__.py +1 -1
- official/modeling/activations/gelu.py +1 -1
- official/modeling/activations/gelu_test.py +1 -1
- official/modeling/activations/mish.py +1 -1
- official/modeling/activations/mish_test.py +1 -1
- official/modeling/activations/relu.py +1 -1
- official/modeling/activations/relu_test.py +1 -1
- official/modeling/activations/sigmoid.py +1 -1
- official/modeling/activations/sigmoid_test.py +1 -1
- official/modeling/activations/swish.py +1 -1
- official/modeling/activations/swish_test.py +1 -1
- official/modeling/grad_utils.py +1 -1
- official/modeling/grad_utils_test.py +1 -1
- official/modeling/hyperparams/__init__.py +1 -1
- official/modeling/hyperparams/base_config.py +27 -19
- official/modeling/hyperparams/base_config_test.py +32 -1
- official/modeling/hyperparams/oneof.py +1 -1
- official/modeling/hyperparams/oneof_test.py +1 -1
- official/modeling/hyperparams/params_dict.py +1 -1
- official/modeling/hyperparams/params_dict_test.py +1 -1
- official/modeling/multitask/__init__.py +1 -1
- official/modeling/multitask/base_model.py +1 -1
- official/modeling/multitask/base_trainer.py +1 -1
- official/modeling/multitask/base_trainer_test.py +1 -1
- official/modeling/multitask/configs.py +3 -3
- official/modeling/multitask/evaluator.py +1 -1
- official/modeling/multitask/evaluator_test.py +1 -1
- official/modeling/multitask/interleaving_trainer.py +1 -1
- official/modeling/multitask/interleaving_trainer_test.py +1 -1
- official/modeling/multitask/multitask.py +1 -1
- official/modeling/multitask/task_sampler.py +1 -1
- official/modeling/multitask/task_sampler_test.py +1 -1
- official/modeling/multitask/test_utils.py +1 -1
- official/modeling/multitask/train_lib.py +81 -14
- official/modeling/multitask/train_lib_test.py +1 -1
- official/modeling/optimization/__init__.py +1 -1
- official/modeling/optimization/adafactor_optimizer.py +1 -1
- official/modeling/optimization/configs/__init__.py +1 -1
- official/modeling/optimization/configs/learning_rate_config.py +1 -1
- official/modeling/optimization/configs/optimization_config.py +1 -1
- official/modeling/optimization/configs/optimization_config_test.py +1 -1
- official/modeling/optimization/configs/optimizer_config.py +1 -1
- official/modeling/optimization/ema_optimizer.py +1 -1
- official/modeling/optimization/lamb.py +1 -1
- official/modeling/optimization/lamb_test.py +1 -1
- official/modeling/optimization/lars.py +1 -1
- official/modeling/optimization/legacy_adamw.py +1 -1
- official/modeling/optimization/lr_schedule.py +1 -1
- official/modeling/optimization/lr_schedule_test.py +1 -1
- official/modeling/optimization/optimizer_factory.py +1 -1
- official/modeling/optimization/optimizer_factory_test.py +1 -1
- official/modeling/optimization/slide_optimizer.py +1 -1
- official/modeling/performance.py +1 -1
- official/modeling/privacy/__init__.py +1 -1
- official/modeling/privacy/configs.py +1 -1
- official/modeling/privacy/configs_test.py +1 -1
- official/modeling/privacy/ops.py +1 -1
- official/modeling/privacy/ops_test.py +1 -1
- official/modeling/tf_utils.py +1 -1
- official/modeling/tf_utils_test.py +1 -1
- official/nlp/__init__.py +1 -1
- official/nlp/configs/__init__.py +1 -1
- official/nlp/configs/bert.py +1 -1
- official/nlp/configs/electra.py +1 -1
- official/nlp/configs/encoders.py +1 -1
- official/nlp/configs/encoders_test.py +1 -1
- official/nlp/configs/experiment_configs.py +1 -1
- official/nlp/configs/finetuning_experiments.py +1 -1
- official/nlp/configs/pretraining_experiments.py +1 -1
- official/nlp/configs/wmt_transformer_experiments.py +1 -1
- official/nlp/continuous_finetune_lib.py +1 -1
- official/nlp/continuous_finetune_lib_test.py +1 -1
- official/nlp/data/__init__.py +1 -1
- official/nlp/data/classifier_data_lib.py +1 -1
- official/nlp/data/classifier_data_lib_test.py +1 -1
- official/nlp/data/create_finetuning_data.py +1 -2
- official/nlp/data/create_pretraining_data.py +1 -3
- official/nlp/data/create_pretraining_data_test.py +1 -1
- official/nlp/data/create_xlnet_pretraining_data.py +1 -3
- official/nlp/data/create_xlnet_pretraining_data_test.py +1 -1
- official/nlp/data/data_loader.py +1 -1
- official/nlp/data/data_loader_factory.py +1 -1
- official/nlp/data/data_loader_factory_test.py +1 -1
- official/nlp/data/dual_encoder_dataloader.py +1 -1
- official/nlp/data/dual_encoder_dataloader_test.py +1 -1
- official/nlp/data/pretrain_dataloader.py +1 -1
- official/nlp/data/pretrain_dataloader_test.py +1 -1
- official/nlp/data/pretrain_dynamic_dataloader.py +1 -1
- official/nlp/data/pretrain_dynamic_dataloader_test.py +1 -1
- official/nlp/data/pretrain_text_dataloader.py +1 -1
- official/nlp/data/question_answering_dataloader.py +1 -1
- official/nlp/data/question_answering_dataloader_test.py +1 -1
- official/nlp/data/sentence_prediction_dataloader.py +1 -1
- official/nlp/data/sentence_prediction_dataloader_test.py +1 -1
- official/nlp/data/sentence_retrieval_lib.py +1 -1
- official/nlp/data/squad_lib.py +1 -1
- official/nlp/data/squad_lib_sp.py +1 -1
- official/nlp/data/tagging_data_lib.py +1 -1
- official/nlp/data/tagging_data_lib_test.py +1 -1
- official/nlp/data/tagging_dataloader.py +1 -1
- official/nlp/data/tagging_dataloader_test.py +1 -1
- official/nlp/data/train_sentencepiece.py +1 -1
- official/nlp/data/wmt_dataloader.py +1 -1
- official/nlp/data/wmt_dataloader_test.py +1 -1
- official/nlp/metrics/__init__.py +1 -1
- official/nlp/metrics/bleu.py +1 -1
- official/nlp/metrics/bleu_test.py +1 -1
- official/nlp/modeling/__init__.py +1 -1
- official/nlp/modeling/layers/__init__.py +1 -1
- official/nlp/modeling/layers/attention.py +1 -1
- official/nlp/modeling/layers/attention_test.py +1 -1
- official/nlp/modeling/layers/bigbird_attention.py +1 -1
- official/nlp/modeling/layers/bigbird_attention_test.py +1 -1
- official/nlp/modeling/layers/block_diag_feedforward.py +1 -1
- official/nlp/modeling/layers/block_diag_feedforward_test.py +1 -1
- official/nlp/modeling/layers/block_sparse_attention.py +187 -44
- official/nlp/modeling/layers/block_sparse_attention_test.py +137 -7
- official/nlp/modeling/layers/cls_head.py +1 -1
- official/nlp/modeling/layers/cls_head_test.py +1 -1
- official/nlp/modeling/layers/factorized_embedding.py +1 -1
- official/nlp/modeling/layers/factorized_embedding_test.py +1 -1
- official/nlp/modeling/layers/gated_feedforward.py +2 -2
- official/nlp/modeling/layers/gated_feedforward_test.py +1 -1
- official/nlp/modeling/layers/gaussian_process.py +1 -1
- official/nlp/modeling/layers/gaussian_process_test.py +1 -1
- official/nlp/modeling/layers/kernel_attention.py +1 -1
- official/nlp/modeling/layers/kernel_attention_test.py +1 -1
- official/nlp/modeling/layers/masked_lm.py +1 -1
- official/nlp/modeling/layers/masked_lm_test.py +1 -1
- official/nlp/modeling/layers/masked_softmax.py +1 -1
- official/nlp/modeling/layers/masked_softmax_test.py +1 -1
- official/nlp/modeling/layers/mat_mul_with_margin.py +1 -2
- official/nlp/modeling/layers/mat_mul_with_margin_test.py +1 -1
- official/nlp/modeling/layers/mixing.py +1 -1
- official/nlp/modeling/layers/mixing_test.py +1 -1
- official/nlp/modeling/layers/mobile_bert_layers.py +1 -1
- official/nlp/modeling/layers/mobile_bert_layers_test.py +1 -1
- official/nlp/modeling/layers/moe.py +1 -1
- official/nlp/modeling/layers/moe_test.py +1 -1
- official/nlp/modeling/layers/multi_channel_attention.py +1 -1
- official/nlp/modeling/layers/multi_channel_attention_test.py +1 -1
- official/nlp/modeling/layers/multi_query_attention.py +222 -4
- official/nlp/modeling/layers/multi_query_attention_test.py +201 -1
- official/nlp/modeling/layers/on_device_embedding.py +1 -1
- official/nlp/modeling/layers/on_device_embedding_test.py +1 -1
- official/nlp/modeling/layers/pack_optimization.py +1 -1
- official/nlp/modeling/layers/pack_optimization_test.py +1 -1
- official/nlp/modeling/layers/per_dim_scale_attention.py +1 -1
- official/nlp/modeling/layers/per_dim_scale_attention_test.py +1 -1
- official/nlp/modeling/layers/position_embedding.py +1 -1
- official/nlp/modeling/layers/position_embedding_test.py +1 -1
- official/nlp/modeling/layers/relative_attention.py +1 -1
- official/nlp/modeling/layers/relative_attention_test.py +1 -1
- official/nlp/modeling/layers/reuse_attention.py +1 -1
- official/nlp/modeling/layers/reuse_attention_test.py +1 -1
- official/nlp/modeling/layers/reuse_transformer.py +1 -1
- official/nlp/modeling/layers/reuse_transformer_test.py +1 -1
- official/nlp/modeling/layers/rezero_transformer.py +20 -1
- official/nlp/modeling/layers/rezero_transformer_test.py +1 -1
- official/nlp/modeling/layers/routing.py +1 -1
- official/nlp/modeling/layers/routing_test.py +1 -1
- official/nlp/modeling/layers/self_attention_mask.py +1 -1
- official/nlp/modeling/layers/spectral_normalization.py +1 -1
- official/nlp/modeling/layers/spectral_normalization_test.py +1 -1
- official/nlp/modeling/layers/talking_heads_attention.py +1 -1
- official/nlp/modeling/layers/talking_heads_attention_test.py +1 -1
- official/nlp/modeling/layers/text_layers.py +1 -1
- official/nlp/modeling/layers/text_layers_test.py +1 -1
- official/nlp/modeling/layers/tn_expand_condense.py +1 -1
- official/nlp/modeling/layers/tn_expand_condense_test.py +1 -1
- official/nlp/modeling/layers/tn_transformer_expand_condense.py +1 -3
- official/nlp/modeling/layers/tn_transformer_test.py +1 -1
- official/nlp/modeling/layers/transformer.py +1 -1
- official/nlp/modeling/layers/transformer_encoder_block.py +273 -52
- official/nlp/modeling/layers/transformer_encoder_block_test.py +215 -11
- official/nlp/modeling/layers/transformer_scaffold.py +1 -1
- official/nlp/modeling/layers/transformer_scaffold_test.py +1 -1
- official/nlp/modeling/layers/transformer_test.py +1 -1
- official/nlp/modeling/layers/transformer_xl.py +1 -1
- official/nlp/modeling/layers/transformer_xl_test.py +1 -1
- official/nlp/modeling/layers/util.py +1 -1
- official/nlp/modeling/losses/__init__.py +1 -1
- official/nlp/modeling/losses/weighted_sparse_categorical_crossentropy.py +1 -1
- official/nlp/modeling/losses/weighted_sparse_categorical_crossentropy_test.py +1 -1
- official/nlp/modeling/models/__init__.py +1 -1
- official/nlp/modeling/models/bert_classifier.py +1 -1
- official/nlp/modeling/models/bert_classifier_test.py +1 -1
- official/nlp/modeling/models/bert_pretrainer.py +1 -1
- official/nlp/modeling/models/bert_pretrainer_test.py +1 -1
- official/nlp/modeling/models/bert_span_labeler.py +1 -1
- official/nlp/modeling/models/bert_span_labeler_test.py +1 -1
- official/nlp/modeling/models/bert_token_classifier.py +1 -1
- official/nlp/modeling/models/bert_token_classifier_test.py +1 -1
- official/nlp/modeling/models/dual_encoder.py +1 -1
- official/nlp/modeling/models/dual_encoder_test.py +1 -1
- official/nlp/modeling/models/electra_pretrainer.py +1 -1
- official/nlp/modeling/models/electra_pretrainer_test.py +1 -1
- official/nlp/modeling/models/seq2seq_transformer.py +1 -1
- official/nlp/modeling/models/seq2seq_transformer_test.py +1 -1
- official/nlp/modeling/models/t5.py +1 -1
- official/nlp/modeling/models/t5_test.py +1 -1
- official/nlp/modeling/models/xlnet.py +1 -1
- official/nlp/modeling/models/xlnet_test.py +1 -1
- official/nlp/modeling/networks/__init__.py +1 -1
- official/nlp/modeling/networks/albert_encoder.py +1 -1
- official/nlp/modeling/networks/albert_encoder_test.py +1 -1
- official/nlp/modeling/networks/bert_dense_encoder_test.py +1 -2
- official/nlp/modeling/networks/bert_encoder.py +1 -1
- official/nlp/modeling/networks/bert_encoder_test.py +1 -2
- official/nlp/modeling/networks/classification.py +1 -1
- official/nlp/modeling/networks/classification_test.py +1 -1
- official/nlp/modeling/networks/encoder_scaffold.py +1 -1
- official/nlp/modeling/networks/encoder_scaffold_test.py +1 -1
- official/nlp/modeling/networks/fnet.py +1 -1
- official/nlp/modeling/networks/fnet_test.py +1 -1
- official/nlp/modeling/networks/funnel_transformer.py +1 -1
- official/nlp/modeling/networks/funnel_transformer_test.py +1 -1
- official/nlp/modeling/networks/mobile_bert_encoder.py +6 -4
- official/nlp/modeling/networks/mobile_bert_encoder_test.py +1 -1
- official/nlp/modeling/networks/packed_sequence_embedding.py +1 -1
- official/nlp/modeling/networks/packed_sequence_embedding_test.py +1 -3
- official/nlp/modeling/networks/span_labeling.py +1 -1
- official/nlp/modeling/networks/span_labeling_test.py +1 -1
- official/nlp/modeling/networks/sparse_mixer.py +1 -1
- official/nlp/modeling/networks/sparse_mixer_test.py +1 -1
- official/nlp/modeling/networks/xlnet_base.py +1 -1
- official/nlp/modeling/networks/xlnet_base_test.py +1 -1
- official/nlp/modeling/ops/__init__.py +1 -1
- official/nlp/modeling/ops/beam_search.py +1 -1
- official/nlp/modeling/ops/beam_search_test.py +1 -1
- official/nlp/modeling/ops/decoding_module.py +1 -1
- official/nlp/modeling/ops/decoding_module_test.py +1 -1
- official/nlp/modeling/ops/sampling_module.py +3 -3
- official/nlp/modeling/ops/segment_extractor.py +1 -1
- official/nlp/modeling/ops/segment_extractor_test.py +1 -1
- official/nlp/optimization.py +1 -1
- official/nlp/serving/__init__.py +1 -1
- official/nlp/serving/export_savedmodel.py +1 -1
- official/nlp/serving/export_savedmodel_test.py +1 -1
- official/nlp/serving/export_savedmodel_util.py +1 -1
- official/nlp/serving/serving_modules.py +1 -1
- official/nlp/serving/serving_modules_test.py +1 -1
- official/nlp/tasks/__init__.py +1 -1
- official/nlp/tasks/dual_encoder.py +1 -2
- official/nlp/tasks/dual_encoder_test.py +1 -1
- official/nlp/tasks/electra_task.py +1 -1
- official/nlp/tasks/electra_task_test.py +1 -1
- official/nlp/tasks/masked_lm.py +1 -1
- official/nlp/tasks/masked_lm_determinism_test.py +1 -1
- official/nlp/tasks/masked_lm_test.py +1 -1
- official/nlp/tasks/question_answering.py +1 -1
- official/nlp/tasks/question_answering_test.py +1 -1
- official/nlp/tasks/sentence_prediction.py +1 -1
- official/nlp/tasks/sentence_prediction_test.py +1 -1
- official/nlp/tasks/tagging.py +1 -1
- official/nlp/tasks/tagging_test.py +1 -1
- official/nlp/tasks/translation.py +1 -1
- official/nlp/tasks/translation_test.py +1 -1
- official/nlp/tasks/utils.py +1 -1
- official/nlp/tools/__init__.py +1 -1
- official/nlp/tools/export_tfhub.py +1 -1
- official/nlp/tools/export_tfhub_lib.py +1 -2
- official/nlp/tools/export_tfhub_lib_test.py +1 -1
- official/nlp/tools/squad_evaluate_v1_1.py +1 -1
- official/nlp/tools/squad_evaluate_v2_0.py +1 -1
- official/nlp/tools/tf1_bert_checkpoint_converter_lib.py +1 -1
- official/nlp/tools/tf2_albert_encoder_checkpoint_converter.py +1 -1
- official/nlp/tools/tf2_bert_encoder_checkpoint_converter.py +1 -1
- official/nlp/tools/tokenization.py +1 -1
- official/nlp/tools/tokenization_test.py +1 -1
- official/nlp/train.py +1 -1
- official/projects/__init__.py +1 -1
- official/projects/bigbird/__init__.py +1 -1
- official/projects/bigbird/encoder.py +1 -1
- official/projects/bigbird/encoder_test.py +1 -1
- official/projects/bigbird/experiment_configs.py +1 -1
- official/projects/bigbird/recompute_grad.py +1 -1
- official/projects/bigbird/recomputing_dropout.py +1 -1
- official/projects/bigbird/stateless_dropout.py +1 -1
- official/projects/centernet/__init__.py +1 -1
- official/projects/centernet/common/__init__.py +1 -1
- official/projects/centernet/common/registry_imports.py +1 -1
- official/projects/centernet/configs/__init__.py +1 -1
- official/projects/centernet/configs/backbones.py +1 -1
- official/projects/centernet/configs/centernet.py +1 -1
- official/projects/centernet/configs/centernet_test.py +1 -1
- official/projects/centernet/dataloaders/__init__.py +1 -1
- official/projects/centernet/dataloaders/centernet_input.py +1 -1
- official/projects/centernet/losses/__init__.py +1 -1
- official/projects/centernet/losses/centernet_losses.py +1 -1
- official/projects/centernet/losses/centernet_losses_test.py +1 -1
- official/projects/centernet/modeling/__init__.py +1 -1
- official/projects/centernet/modeling/backbones/__init__.py +1 -1
- official/projects/centernet/modeling/backbones/hourglass.py +1 -1
- official/projects/centernet/modeling/backbones/hourglass_test.py +1 -1
- official/projects/centernet/modeling/centernet_model.py +2 -2
- official/projects/centernet/modeling/centernet_model_test.py +1 -1
- official/projects/centernet/modeling/heads/__init__.py +1 -1
- official/projects/centernet/modeling/heads/centernet_head.py +2 -2
- official/projects/centernet/modeling/heads/centernet_head_test.py +1 -1
- official/projects/centernet/modeling/layers/__init__.py +1 -1
- official/projects/centernet/modeling/layers/cn_nn_blocks.py +1 -1
- official/projects/centernet/modeling/layers/cn_nn_blocks_test.py +1 -1
- official/projects/centernet/modeling/layers/detection_generator.py +1 -1
- official/projects/centernet/modeling/layers/detection_generator_test.py +1 -1
- official/projects/centernet/ops/__init__.py +1 -1
- official/projects/centernet/ops/box_list.py +1 -1
- official/projects/centernet/ops/box_list_ops.py +1 -1
- official/projects/centernet/ops/loss_ops.py +1 -1
- official/projects/centernet/ops/nms_ops.py +1 -1
- official/projects/centernet/ops/preprocess_ops.py +1 -1
- official/projects/centernet/ops/target_assigner.py +1 -1
- official/projects/centernet/ops/target_assigner_test.py +1 -1
- official/projects/centernet/tasks/__init__.py +1 -1
- official/projects/centernet/tasks/centernet.py +1 -1
- official/projects/centernet/train.py +1 -1
- official/projects/centernet/utils/__init__.py +1 -1
- official/projects/centernet/utils/checkpoints/__init__.py +1 -1
- official/projects/centernet/utils/checkpoints/config_classes.py +1 -1
- official/projects/centernet/utils/checkpoints/config_data.py +1 -1
- official/projects/centernet/utils/checkpoints/load_weights.py +1 -1
- official/projects/centernet/utils/checkpoints/read_checkpoints.py +1 -1
- official/projects/centernet/utils/tf2_centernet_checkpoint_converter.py +1 -1
- official/projects/deepmac_maskrcnn/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/common/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/common/registry_imports.py +1 -1
- official/projects/deepmac_maskrcnn/configs/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/configs/deep_mask_head_rcnn.py +1 -1
- official/projects/deepmac_maskrcnn/configs/deep_mask_head_rcnn_config_test.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/hourglass_network.py +1 -1
- official/projects/deepmac_maskrcnn/modeling/heads/instance_heads.py +1 -3
- official/projects/deepmac_maskrcnn/modeling/heads/instance_heads_test.py +1 -2
- official/projects/deepmac_maskrcnn/modeling/maskrcnn_model.py +1 -3
- official/projects/deepmac_maskrcnn/modeling/maskrcnn_model_test.py +1 -3
- official/projects/deepmac_maskrcnn/serving/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/serving/detection.py +1 -1
- official/projects/deepmac_maskrcnn/serving/detection_test.py +1 -1
- official/projects/deepmac_maskrcnn/serving/export_saved_model.py +1 -1
- official/projects/deepmac_maskrcnn/tasks/__init__.py +1 -1
- official/projects/deepmac_maskrcnn/tasks/deep_mask_head_rcnn.py +1 -1
- official/projects/deepmac_maskrcnn/train.py +1 -1
- official/projects/detr/__init__.py +14 -0
- official/projects/detr/configs/__init__.py +14 -0
- official/projects/detr/configs/detr.py +277 -0
- official/projects/detr/configs/detr_test.py +51 -0
- official/projects/detr/dataloaders/__init__.py +14 -0
- official/projects/detr/dataloaders/coco.py +157 -0
- official/projects/detr/dataloaders/coco_test.py +111 -0
- official/projects/detr/dataloaders/detr_input.py +175 -0
- official/projects/detr/experiments/__init__.py +14 -0
- official/projects/detr/modeling/__init__.py +14 -0
- official/projects/detr/modeling/detr.py +345 -0
- official/projects/detr/modeling/detr_test.py +70 -0
- official/projects/detr/modeling/transformer.py +849 -0
- official/projects/detr/modeling/transformer_test.py +263 -0
- official/projects/detr/ops/__init__.py +14 -0
- official/projects/detr/ops/matchers.py +489 -0
- official/projects/detr/ops/matchers_test.py +95 -0
- official/projects/detr/optimization.py +151 -0
- official/projects/detr/serving/__init__.py +14 -0
- official/projects/detr/serving/export_module.py +103 -0
- official/projects/detr/serving/export_module_test.py +98 -0
- official/projects/detr/serving/export_saved_model.py +109 -0
- official/projects/detr/tasks/__init__.py +14 -0
- official/projects/detr/tasks/detection.py +433 -0
- official/projects/detr/tasks/detection_test.py +203 -0
- official/projects/detr/train.py +70 -0
- official/projects/maskconver/__init__.py +14 -0
- official/projects/maskconver/configs/__init__.py +14 -0
- official/projects/maskconver/configs/backbones.py +43 -0
- official/projects/maskconver/configs/decoders.py +36 -0
- official/projects/maskconver/configs/maskconver.py +523 -0
- official/projects/maskconver/configs/multiscale_maskconver.py +215 -0
- official/projects/maskconver/tasks/__init__.py +14 -0
- official/projects/maskconver/tasks/maskconver.py +641 -0
- official/projects/maskconver/tasks/multiscale_maskconver.py +278 -0
- official/projects/maskconver/train.py +30 -0
- official/projects/maxvit/__init__.py +1 -1
- official/projects/maxvit/configs/__init__.py +1 -1
- official/projects/maxvit/configs/backbones.py +1 -1
- official/projects/maxvit/configs/image_classification.py +1 -1
- official/projects/maxvit/configs/image_classification_test.py +1 -1
- official/projects/maxvit/configs/rcnn.py +1 -1
- official/projects/maxvit/configs/rcnn_test.py +1 -1
- official/projects/maxvit/configs/retinanet.py +1 -1
- official/projects/maxvit/configs/retinanet_test.py +1 -1
- official/projects/maxvit/configs/semantic_segmentation.py +1 -1
- official/projects/maxvit/configs/semantic_segmentation_test.py +1 -1
- official/projects/maxvit/modeling/__init__.py +1 -1
- official/projects/maxvit/modeling/common_ops.py +14 -1
- official/projects/maxvit/modeling/layers.py +1 -1
- official/projects/maxvit/modeling/maxvit.py +2 -2
- official/projects/maxvit/modeling/maxvit_test.py +1 -1
- official/projects/maxvit/registry_imports.py +1 -1
- official/projects/maxvit/train.py +1 -1
- official/projects/maxvit/train_test.py +1 -1
- official/projects/mobilebert/__init__.py +1 -1
- official/projects/mobilebert/distillation.py +1 -1
- official/projects/mobilebert/distillation_test.py +1 -1
- official/projects/mobilebert/export_tfhub.py +1 -1
- official/projects/mobilebert/model_utils.py +1 -1
- official/projects/mobilebert/run_distillation.py +1 -1
- official/projects/mobilebert/tf2_model_checkpoint_converter.py +1 -1
- official/projects/mobilebert/utils.py +1 -1
- official/projects/movinet/__init__.py +1 -1
- official/projects/movinet/configs/__init__.py +1 -1
- official/projects/movinet/configs/movinet.py +1 -1
- official/projects/movinet/configs/movinet_test.py +1 -1
- official/projects/movinet/modeling/__init__.py +1 -1
- official/projects/movinet/modeling/movinet.py +1 -1
- official/projects/movinet/modeling/movinet_layers.py +1 -1
- official/projects/movinet/modeling/movinet_layers_test.py +1 -1
- official/projects/movinet/modeling/movinet_model.py +1 -1
- official/projects/movinet/modeling/movinet_model_test.py +1 -1
- official/projects/movinet/modeling/movinet_test.py +1 -1
- official/projects/movinet/tools/__init__.py +1 -1
- official/projects/movinet/tools/convert_3d_2plus1d.py +1 -1
- official/projects/movinet/tools/convert_3d_2plus1d_test.py +1 -1
- official/projects/movinet/tools/export_saved_model.py +1 -1
- official/projects/movinet/tools/export_saved_model_test.py +6 -3
- official/projects/movinet/tools/quantize_movinet.py +1 -1
- official/projects/movinet/train.py +1 -1
- official/projects/movinet/train_test.py +1 -1
- official/projects/nhnet/__init__.py +1 -1
- official/projects/nhnet/configs.py +1 -1
- official/projects/nhnet/configs_test.py +1 -1
- official/projects/nhnet/decoder.py +1 -1
- official/projects/nhnet/decoder_test.py +1 -1
- official/projects/nhnet/evaluation.py +1 -3
- official/projects/nhnet/input_pipeline.py +1 -1
- official/projects/nhnet/models.py +1 -1
- official/projects/nhnet/models_test.py +1 -1
- official/projects/nhnet/optimizer.py +1 -1
- official/projects/nhnet/raw_data_process.py +1 -1
- official/projects/nhnet/raw_data_processor.py +1 -1
- official/projects/nhnet/trainer.py +1 -6
- official/projects/nhnet/trainer_test.py +1 -1
- official/projects/nhnet/utils.py +1 -1
- official/projects/panoptic/__init__.py +1 -1
- official/projects/panoptic/configs/__init__.py +1 -1
- official/projects/panoptic/configs/panoptic_deeplab.py +5 -6
- official/projects/panoptic/configs/panoptic_maskrcnn.py +1 -1
- official/projects/panoptic/tasks/__init__.py +1 -1
- official/projects/panoptic/tasks/panoptic_deeplab.py +1 -1
- official/projects/panoptic/tasks/panoptic_maskrcnn.py +3 -1
- official/projects/panoptic/train.py +1 -1
- official/projects/qat/__init__.py +1 -1
- official/projects/qat/nlp/__init__.py +1 -1
- official/projects/qat/nlp/configs/__init__.py +1 -1
- official/projects/qat/nlp/configs/finetuning_experiments.py +1 -1
- official/projects/qat/nlp/modeling/__init__.py +1 -1
- official/projects/qat/nlp/modeling/layers/__init__.py +1 -1
- official/projects/qat/nlp/modeling/layers/mobile_bert_layers.py +1 -1
- official/projects/qat/nlp/modeling/layers/multi_head_attention.py +1 -1
- official/projects/qat/nlp/modeling/layers/transformer_encoder_block.py +1 -1
- official/projects/qat/nlp/modeling/layers/transformer_encoder_block_test.py +1 -1
- official/projects/qat/nlp/modeling/models/__init__.py +1 -1
- official/projects/qat/nlp/modeling/models/bert_span_labeler.py +1 -1
- official/projects/qat/nlp/modeling/networks/__init__.py +1 -1
- official/projects/qat/nlp/modeling/networks/span_labeling.py +1 -1
- official/projects/qat/nlp/pretrained_checkpoint_converter.py +1 -3
- official/projects/qat/nlp/quantization/__init__.py +1 -1
- official/projects/qat/nlp/quantization/configs.py +1 -1
- official/projects/qat/nlp/quantization/configs_test.py +1 -2
- official/projects/qat/nlp/quantization/helper.py +1 -1
- official/projects/qat/nlp/quantization/schemes.py +1 -3
- official/projects/qat/nlp/quantization/wrappers.py +1 -1
- official/projects/qat/nlp/registry_imports.py +1 -1
- official/projects/qat/nlp/tasks/__init__.py +1 -1
- official/projects/qat/nlp/tasks/question_answering.py +1 -1
- official/projects/qat/nlp/tasks/question_answering_test.py +1 -1
- official/projects/qat/nlp/train.py +1 -1
- official/projects/qat/vision/__init__.py +1 -1
- official/projects/qat/vision/configs/__init__.py +1 -1
- official/projects/qat/vision/configs/common.py +1 -1
- official/projects/qat/vision/configs/image_classification.py +1 -1
- official/projects/qat/vision/configs/image_classification_test.py +1 -1
- official/projects/qat/vision/configs/retinanet.py +1 -1
- official/projects/qat/vision/configs/retinanet_test.py +1 -1
- official/projects/qat/vision/configs/semantic_segmentation.py +1 -1
- official/projects/qat/vision/configs/semantic_segmentation_test.py +1 -1
- official/projects/qat/vision/modeling/__init__.py +1 -1
- official/projects/qat/vision/modeling/factory.py +1 -3
- official/projects/qat/vision/modeling/factory_test.py +1 -3
- official/projects/qat/vision/modeling/heads/__init__.py +1 -1
- official/projects/qat/vision/modeling/heads/dense_prediction_heads.py +1 -3
- official/projects/qat/vision/modeling/heads/dense_prediction_heads_test.py +1 -2
- official/projects/qat/vision/modeling/layers/__init__.py +1 -1
- official/projects/qat/vision/modeling/layers/nn_blocks.py +1 -3
- official/projects/qat/vision/modeling/layers/nn_blocks_test.py +1 -2
- official/projects/qat/vision/modeling/layers/nn_layers.py +2 -2
- official/projects/qat/vision/modeling/layers/nn_layers_test.py +1 -2
- official/projects/qat/vision/modeling/segmentation_model.py +1 -2
- official/projects/qat/vision/n_bit/__init__.py +1 -1
- official/projects/qat/vision/n_bit/configs.py +1 -1
- official/projects/qat/vision/n_bit/configs_test.py +1 -3
- official/projects/qat/vision/n_bit/nn_blocks.py +1 -3
- official/projects/qat/vision/n_bit/nn_blocks_test.py +1 -2
- official/projects/qat/vision/n_bit/nn_layers.py +1 -1
- official/projects/qat/vision/n_bit/schemes.py +1 -3
- official/projects/qat/vision/quantization/__init__.py +1 -1
- official/projects/qat/vision/quantization/configs.py +1 -1
- official/projects/qat/vision/quantization/configs_test.py +1 -3
- official/projects/qat/vision/quantization/helper.py +1 -1
- official/projects/qat/vision/quantization/helper_test.py +1 -1
- official/projects/qat/vision/quantization/layer_transforms.py +1 -1
- official/projects/qat/vision/quantization/schemes.py +1 -3
- official/projects/qat/vision/registry_imports.py +1 -1
- official/projects/qat/vision/serving/__init__.py +1 -1
- official/projects/qat/vision/serving/export_module.py +1 -1
- official/projects/qat/vision/serving/export_saved_model.py +1 -1
- official/projects/qat/vision/serving/export_tflite.py +1 -1
- official/projects/qat/vision/tasks/__init__.py +1 -1
- official/projects/qat/vision/tasks/image_classification.py +1 -1
- official/projects/qat/vision/tasks/image_classification_test.py +1 -1
- official/projects/qat/vision/tasks/retinanet.py +1 -1
- official/projects/qat/vision/tasks/retinanet_test.py +1 -1
- official/projects/qat/vision/tasks/semantic_segmentation.py +1 -1
- official/projects/qat/vision/train.py +1 -1
- official/projects/roformer/__init__.py +1 -1
- official/projects/roformer/roformer.py +1 -1
- official/projects/roformer/roformer_attention.py +1 -1
- official/projects/roformer/roformer_attention_test.py +1 -1
- official/projects/roformer/roformer_encoder.py +1 -1
- official/projects/roformer/roformer_encoder_block.py +1 -1
- official/projects/roformer/roformer_encoder_block_test.py +1 -1
- official/projects/roformer/roformer_encoder_test.py +1 -1
- official/projects/roformer/roformer_experiments.py +1 -1
- official/projects/roformer/train.py +1 -1
- official/projects/teams/__init__.py +1 -1
- official/projects/teams/teams.py +1 -1
- official/projects/teams/teams_experiments.py +1 -1
- official/projects/teams/teams_pretrainer.py +1 -1
- official/projects/teams/teams_pretrainer_test.py +1 -1
- official/projects/teams/teams_task.py +1 -1
- official/projects/teams/teams_task_test.py +1 -1
- official/projects/teams/train.py +1 -1
- official/projects/triviaqa/__init__.py +1 -1
- official/projects/triviaqa/dataset.py +1 -1
- official/projects/triviaqa/download_and_prepare.py +1 -1
- official/projects/triviaqa/evaluate.py +1 -1
- official/projects/triviaqa/evaluation.py +1 -1
- official/projects/triviaqa/inputs.py +1 -1
- official/projects/triviaqa/modeling.py +1 -1
- official/projects/triviaqa/predict.py +1 -1
- official/projects/triviaqa/prediction.py +1 -1
- official/projects/triviaqa/preprocess.py +1 -1
- official/projects/triviaqa/sentencepiece_pb2.py +1 -1
- official/projects/triviaqa/train.py +1 -1
- official/projects/video_ssl/__init__.py +1 -1
- official/projects/video_ssl/configs/__init__.py +1 -1
- official/projects/video_ssl/configs/video_ssl.py +1 -1
- official/projects/video_ssl/configs/video_ssl_test.py +1 -1
- official/projects/video_ssl/dataloaders/__init__.py +1 -1
- official/projects/video_ssl/dataloaders/video_ssl_input.py +1 -1
- official/projects/video_ssl/dataloaders/video_ssl_input_test.py +1 -2
- official/projects/video_ssl/losses/__init__.py +1 -1
- official/projects/video_ssl/losses/losses.py +1 -2
- official/projects/video_ssl/modeling/__init__.py +1 -1
- official/projects/video_ssl/modeling/video_ssl_model.py +1 -3
- official/projects/video_ssl/ops/__init__.py +1 -1
- official/projects/video_ssl/ops/video_ssl_preprocess_ops.py +1 -1
- official/projects/video_ssl/ops/video_ssl_preprocess_ops_test.py +1 -1
- official/projects/video_ssl/tasks/__init__.py +1 -1
- official/projects/video_ssl/tasks/linear_eval.py +1 -1
- official/projects/video_ssl/tasks/pretrain.py +1 -1
- official/projects/video_ssl/tasks/pretrain_test.py +1 -1
- official/projects/video_ssl/train.py +1 -1
- official/projects/volumetric_models/__init__.py +1 -1
- official/projects/volumetric_models/configs/__init__.py +1 -1
- official/projects/volumetric_models/configs/backbones.py +1 -1
- official/projects/volumetric_models/configs/decoders.py +1 -1
- official/projects/volumetric_models/configs/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/configs/semantic_segmentation_3d_test.py +1 -1
- official/projects/volumetric_models/dataloaders/__init__.py +1 -1
- official/projects/volumetric_models/dataloaders/segmentation_input_3d.py +1 -1
- official/projects/volumetric_models/dataloaders/segmentation_input_3d_test.py +1 -1
- official/projects/volumetric_models/evaluation/__init__.py +1 -1
- official/projects/volumetric_models/evaluation/segmentation_metrics.py +1 -1
- official/projects/volumetric_models/evaluation/segmentation_metrics_test.py +1 -1
- official/projects/volumetric_models/losses/__init__.py +1 -1
- official/projects/volumetric_models/losses/segmentation_losses.py +1 -1
- official/projects/volumetric_models/losses/segmentation_losses_test.py +1 -1
- official/projects/volumetric_models/modeling/__init__.py +1 -1
- official/projects/volumetric_models/modeling/backbones/__init__.py +1 -1
- official/projects/volumetric_models/modeling/backbones/unet_3d.py +1 -2
- official/projects/volumetric_models/modeling/backbones/unet_3d_test.py +1 -2
- official/projects/volumetric_models/modeling/decoders/__init__.py +1 -1
- official/projects/volumetric_models/modeling/decoders/factory.py +1 -3
- official/projects/volumetric_models/modeling/decoders/factory_test.py +1 -1
- official/projects/volumetric_models/modeling/decoders/unet_3d_decoder.py +1 -1
- official/projects/volumetric_models/modeling/decoders/unet_3d_decoder_test.py +1 -2
- official/projects/volumetric_models/modeling/factory.py +1 -3
- official/projects/volumetric_models/modeling/factory_test.py +1 -1
- official/projects/volumetric_models/modeling/heads/__init__.py +1 -1
- official/projects/volumetric_models/modeling/heads/segmentation_heads_3d.py +1 -1
- official/projects/volumetric_models/modeling/heads/segmentation_heads_3d_test.py +1 -1
- official/projects/volumetric_models/modeling/nn_blocks_3d.py +2 -3
- official/projects/volumetric_models/modeling/nn_blocks_3d_test.py +1 -2
- official/projects/volumetric_models/modeling/segmentation_model_test.py +1 -1
- official/projects/volumetric_models/registry_imports.py +1 -1
- official/projects/volumetric_models/serving/__init__.py +1 -1
- official/projects/volumetric_models/serving/export_saved_model.py +1 -1
- official/projects/volumetric_models/serving/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/serving/semantic_segmentation_3d_test.py +3 -3
- official/projects/volumetric_models/tasks/__init__.py +1 -1
- official/projects/volumetric_models/tasks/semantic_segmentation_3d.py +1 -1
- official/projects/volumetric_models/tasks/semantic_segmentation_3d_test.py +1 -1
- official/projects/volumetric_models/train.py +1 -1
- official/projects/volumetric_models/train_test.py +1 -1
- official/projects/waste_identification_ml/__init__.py +1 -1
- official/projects/waste_identification_ml/data_generation/__init__.py +1 -1
- official/projects/waste_identification_ml/data_generation/utils.py +1 -1
- official/projects/waste_identification_ml/data_generation/utils_test.py +1 -1
- official/projects/yolo/__init__.py +1 -1
- official/projects/yolo/common/__init__.py +1 -1
- official/projects/yolo/common/registry_imports.py +1 -1
- official/projects/yolo/configs/__init__.py +1 -1
- official/projects/yolo/configs/backbones.py +1 -1
- official/projects/yolo/configs/darknet_classification.py +1 -1
- official/projects/yolo/configs/decoders.py +1 -1
- official/projects/yolo/configs/yolo.py +1 -1
- official/projects/yolo/configs/yolov7.py +17 -1
- official/projects/yolo/dataloaders/__init__.py +1 -1
- official/projects/yolo/dataloaders/classification_input.py +1 -1
- official/projects/yolo/dataloaders/tf_example_decoder.py +1 -1
- official/projects/yolo/dataloaders/yolo_input.py +1 -1
- official/projects/yolo/losses/__init__.py +1 -1
- official/projects/yolo/losses/yolo_loss.py +1 -1
- official/projects/yolo/losses/yolo_loss_test.py +1 -1
- official/projects/yolo/losses/yolov7_loss.py +1 -1
- official/projects/yolo/losses/yolov7_loss_test.py +1 -1
- official/projects/yolo/modeling/__init__.py +1 -1
- official/projects/yolo/modeling/backbones/__init__.py +1 -1
- official/projects/yolo/modeling/backbones/darknet.py +1 -1
- official/projects/yolo/modeling/backbones/darknet_test.py +1 -1
- official/projects/yolo/modeling/backbones/yolov7.py +69 -1
- official/projects/yolo/modeling/backbones/yolov7_test.py +1 -1
- official/projects/yolo/modeling/decoders/__init__.py +1 -1
- official/projects/yolo/modeling/decoders/yolo_decoder.py +1 -1
- official/projects/yolo/modeling/decoders/yolo_decoder_test.py +1 -2
- official/projects/yolo/modeling/decoders/yolov7.py +90 -1
- official/projects/yolo/modeling/decoders/yolov7_test.py +1 -1
- official/projects/yolo/modeling/factory.py +1 -1
- official/projects/yolo/modeling/factory_test.py +1 -1
- official/projects/yolo/modeling/heads/__init__.py +1 -1
- official/projects/yolo/modeling/heads/yolo_head.py +1 -1
- official/projects/yolo/modeling/heads/yolo_head_test.py +1 -2
- official/projects/yolo/modeling/heads/yolov7_head.py +1 -1
- official/projects/yolo/modeling/heads/yolov7_head_test.py +1 -1
- official/projects/yolo/modeling/layers/__init__.py +1 -1
- official/projects/yolo/modeling/layers/detection_generator.py +1 -1
- official/projects/yolo/modeling/layers/detection_generator_test.py +1 -1
- official/projects/yolo/modeling/layers/nn_blocks.py +1 -1
- official/projects/yolo/modeling/layers/nn_blocks_test.py +1 -1
- official/projects/yolo/modeling/yolo_model.py +2 -2
- official/projects/yolo/modeling/yolov7_model.py +2 -2
- official/projects/yolo/ops/__init__.py +1 -1
- official/projects/yolo/ops/anchor.py +1 -1
- official/projects/yolo/ops/box_ops.py +1 -1
- official/projects/yolo/ops/box_ops_test.py +1 -1
- official/projects/yolo/ops/initializer_ops.py +1 -1
- official/projects/yolo/ops/kmeans_anchors.py +1 -1
- official/projects/yolo/ops/kmeans_anchors_test.py +1 -1
- official/projects/yolo/ops/loss_utils.py +1 -1
- official/projects/yolo/ops/math_ops.py +1 -1
- official/projects/yolo/ops/mosaic.py +1 -1
- official/projects/yolo/ops/preprocessing_ops.py +1 -1
- official/projects/yolo/ops/preprocessing_ops_test.py +1 -1
- official/projects/yolo/optimization/__init__.py +1 -1
- official/projects/yolo/optimization/configs/__init__.py +1 -1
- official/projects/yolo/optimization/configs/optimization_config.py +1 -1
- official/projects/yolo/optimization/configs/optimizer_config.py +1 -1
- official/projects/yolo/optimization/optimizer_factory.py +1 -1
- official/projects/yolo/optimization/sgd_torch.py +1 -1
- official/projects/yolo/serving/__init__.py +1 -1
- official/projects/yolo/serving/export_module_factory.py +1 -1
- official/projects/yolo/serving/export_saved_model.py +1 -1
- official/projects/yolo/serving/export_tflite.py +1 -1
- official/projects/yolo/serving/model_fn.py +1 -1
- official/projects/yolo/tasks/__init__.py +1 -1
- official/projects/yolo/tasks/image_classification.py +1 -1
- official/projects/yolo/tasks/task_utils.py +1 -1
- official/projects/yolo/tasks/yolo.py +1 -1
- official/projects/yolo/tasks/yolov7.py +1 -1
- official/projects/yolo/train.py +1 -1
- official/projects/yt8m/__init__.py +1 -1
- official/projects/yt8m/configs/__init__.py +1 -1
- official/projects/yt8m/configs/yt8m.py +1 -1
- official/projects/yt8m/configs/yt8m_test.py +1 -1
- official/projects/yt8m/modeling/__init__.py +1 -1
- official/projects/yt8m/modeling/backbones/__init__.py +1 -1
- official/projects/yt8m/modeling/backbones/dbof.py +1 -1
- official/projects/yt8m/modeling/backbones/dbof_test.py +1 -1
- official/projects/yt8m/modeling/heads/__init__.py +1 -1
- official/projects/yt8m/modeling/heads/logistic.py +1 -1
- official/projects/yt8m/modeling/heads/moe.py +1 -1
- official/projects/yt8m/modeling/nn_layers.py +1 -1
- official/projects/yt8m/modeling/nn_layers_test.py +1 -1
- official/projects/yt8m/modeling/yt8m_model.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_test.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_utils.py +1 -1
- official/projects/yt8m/modeling/yt8m_model_utils_test.py +1 -1
- official/projects/yt8m/tasks/__init__.py +1 -1
- official/projects/yt8m/tasks/yt8m_task.py +1 -1
- official/projects/yt8m/train.py +1 -1
- official/projects/yt8m/train_test.py +1 -1
- official/recommendation/__init__.py +1 -1
- official/recommendation/constants.py +1 -1
- official/recommendation/create_ncf_data.py +1 -2
- official/recommendation/data_pipeline.py +1 -1
- official/recommendation/data_preprocessing.py +1 -1
- official/recommendation/data_test.py +4 -4
- official/recommendation/movielens.py +1 -2
- official/recommendation/ncf_common.py +1 -1
- official/recommendation/ncf_input_pipeline.py +1 -1
- official/recommendation/ncf_keras_main.py +1 -1
- official/recommendation/ncf_test.py +1 -1
- official/recommendation/neumf_model.py +1 -1
- official/recommendation/popen_helper.py +1 -1
- official/recommendation/ranking/__init__.py +1 -1
- official/recommendation/ranking/common.py +1 -1
- official/recommendation/ranking/configs/__init__.py +1 -1
- official/recommendation/ranking/configs/config.py +14 -1
- official/recommendation/ranking/configs/config_test.py +1 -1
- official/recommendation/ranking/data/__init__.py +1 -1
- official/recommendation/ranking/data/data_pipeline.py +9 -2
- official/recommendation/ranking/data/data_pipeline_multi_hot.py +8 -2
- official/recommendation/ranking/data/data_pipeline_multi_hot_test.py +12 -6
- official/recommendation/ranking/data/data_pipeline_test.py +18 -8
- official/recommendation/ranking/task.py +102 -19
- official/recommendation/ranking/task_test.py +1 -1
- official/recommendation/ranking/train.py +1 -1
- official/recommendation/ranking/train_test.py +76 -31
- official/recommendation/stat_utils.py +1 -1
- official/recommendation/uplift/__init__.py +1 -1
- official/recommendation/uplift/keras_test_case.py +1 -1
- official/recommendation/uplift/keys.py +1 -1
- official/recommendation/uplift/layers/__init__.py +1 -1
- official/recommendation/uplift/layers/encoders/__init__.py +1 -1
- official/recommendation/uplift/layers/encoders/concat_features.py +1 -1
- official/recommendation/uplift/layers/encoders/concat_features_test.py +1 -1
- official/recommendation/uplift/layers/heads/__init__.py +1 -1
- official/recommendation/uplift/layers/heads/two_tower_logits_head.py +1 -1
- official/recommendation/uplift/layers/heads/two_tower_logits_head_test.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/__init__.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/base_uplift_networks.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_output_head.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_output_head_test.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_uplift_network.py +1 -1
- official/recommendation/uplift/layers/uplift_networks/two_tower_uplift_network_test.py +1 -1
- official/recommendation/uplift/losses/__init__.py +1 -1
- official/recommendation/uplift/losses/true_logits_loss.py +1 -1
- official/recommendation/uplift/losses/true_logits_loss_test.py +1 -1
- official/recommendation/uplift/metrics/__init__.py +1 -1
- official/recommendation/uplift/metrics/label_mean.py +1 -1
- official/recommendation/uplift/metrics/label_mean_test.py +1 -1
- official/recommendation/uplift/metrics/label_variance.py +1 -1
- official/recommendation/uplift/metrics/label_variance_test.py +1 -1
- official/recommendation/uplift/metrics/loss_metric.py +1 -1
- official/recommendation/uplift/metrics/loss_metric_test.py +1 -1
- official/recommendation/uplift/metrics/metric_configs.py +1 -1
- official/recommendation/uplift/metrics/poisson_metrics.py +1 -1
- official/recommendation/uplift/metrics/poisson_metrics_test.py +1 -1
- official/recommendation/uplift/metrics/sliced_metric.py +1 -1
- official/recommendation/uplift/metrics/sliced_metric_test.py +1 -1
- official/recommendation/uplift/metrics/treatment_fraction.py +1 -1
- official/recommendation/uplift/metrics/treatment_fraction_test.py +1 -1
- official/recommendation/uplift/metrics/treatment_sliced_metric.py +1 -1
- official/recommendation/uplift/metrics/treatment_sliced_metric_test.py +1 -1
- official/recommendation/uplift/metrics/uplift_mean.py +1 -1
- official/recommendation/uplift/metrics/uplift_mean_test.py +1 -1
- official/recommendation/uplift/metrics/variance.py +1 -1
- official/recommendation/uplift/metrics/variance_test.py +12 -10
- official/recommendation/uplift/models/__init__.py +1 -1
- official/recommendation/uplift/models/two_tower_uplift_model.py +1 -1
- official/recommendation/uplift/models/two_tower_uplift_model_test.py +1 -1
- official/recommendation/uplift/types.py +1 -1
- official/recommendation/uplift/utils.py +3 -3
- official/recommendation/uplift/utils_test.py +1 -1
- official/utils/__init__.py +1 -1
- official/utils/docs/__init__.py +1 -1
- official/utils/docs/build_orbit_api_docs.py +1 -1
- official/utils/docs/build_tfm_api_docs.py +1 -1
- official/utils/flags/__init__.py +1 -1
- official/utils/flags/_base.py +1 -1
- official/utils/flags/_benchmark.py +1 -1
- official/utils/flags/_conventions.py +1 -1
- official/utils/flags/_device.py +1 -1
- official/utils/flags/_distribution.py +1 -1
- official/utils/flags/_misc.py +1 -1
- official/utils/flags/_performance.py +1 -1
- official/utils/flags/core.py +1 -1
- official/utils/flags/flags_test.py +1 -1
- official/utils/hyperparams_flags.py +1 -1
- official/utils/misc/__init__.py +1 -1
- official/utils/misc/keras_utils.py +1 -1
- official/utils/misc/model_helpers.py +1 -1
- official/utils/misc/model_helpers_test.py +3 -3
- official/utils/testing/__init__.py +1 -1
- official/utils/testing/integration.py +1 -1
- official/utils/testing/mock_task.py +1 -1
- official/vision/__init__.py +1 -1
- official/vision/configs/__init__.py +1 -1
- official/vision/configs/backbones.py +3 -1
- official/vision/configs/backbones_3d.py +1 -2
- official/vision/configs/common.py +1 -3
- official/vision/configs/decoders.py +1 -3
- official/vision/configs/image_classification.py +1 -1
- official/vision/configs/image_classification_test.py +1 -1
- official/vision/configs/maskrcnn.py +1 -1
- official/vision/configs/maskrcnn_test.py +1 -1
- official/vision/configs/retinanet.py +2 -1
- official/vision/configs/retinanet_test.py +1 -1
- official/vision/configs/semantic_segmentation.py +7 -8
- official/vision/configs/semantic_segmentation_test.py +1 -1
- official/vision/configs/video_classification.py +1 -1
- official/vision/configs/video_classification_test.py +1 -1
- official/vision/data/__init__.py +1 -1
- official/vision/data/create_coco_tf_record.py +1 -1
- official/vision/data/fake_feature_generator.py +8 -5
- official/vision/data/image_utils.py +1 -1
- official/vision/data/image_utils_test.py +1 -1
- official/vision/data/process_coco_few_shot_json_files.py +1 -1
- official/vision/data/tf_example_builder.py +1 -1
- official/vision/data/tf_example_builder_test.py +1 -1
- official/vision/data/tf_example_feature_key.py +1 -1
- official/vision/data/tfrecord_lib.py +1 -1
- official/vision/data/tfrecord_lib_test.py +1 -1
- official/vision/dataloaders/__init__.py +1 -1
- official/vision/dataloaders/classification_input.py +1 -2
- official/vision/dataloaders/decoder.py +1 -1
- official/vision/dataloaders/input_reader.py +1 -1
- official/vision/dataloaders/input_reader_factory.py +1 -1
- official/vision/dataloaders/maskrcnn_input.py +1 -2
- official/vision/dataloaders/parser.py +1 -1
- official/vision/dataloaders/retinanet_input.py +1 -3
- official/vision/dataloaders/segmentation_input.py +9 -4
- official/vision/dataloaders/tf_example_decoder.py +1 -1
- official/vision/dataloaders/tf_example_decoder_test.py +1 -2
- official/vision/dataloaders/tf_example_label_map_decoder.py +1 -2
- official/vision/dataloaders/tf_example_label_map_decoder_test.py +1 -2
- official/vision/dataloaders/tfds_classification_decoders.py +1 -1
- official/vision/dataloaders/tfds_detection_decoders.py +1 -1
- official/vision/dataloaders/tfds_factory.py +1 -1
- official/vision/dataloaders/tfds_factory_test.py +1 -1
- official/vision/dataloaders/tfds_segmentation_decoders.py +1 -1
- official/vision/dataloaders/tfexample_utils.py +1 -1
- official/vision/dataloaders/utils.py +1 -2
- official/vision/dataloaders/utils_test.py +1 -3
- official/vision/dataloaders/video_input.py +1 -1
- official/vision/dataloaders/video_input_test.py +1 -2
- official/vision/evaluation/__init__.py +1 -1
- official/vision/evaluation/coco_evaluator.py +1 -2
- official/vision/evaluation/coco_utils.py +1 -3
- official/vision/evaluation/coco_utils_test.py +1 -1
- official/vision/evaluation/instance_metrics.py +1 -1
- official/vision/evaluation/instance_metrics_test.py +1 -1
- official/vision/evaluation/iou.py +1 -1
- official/vision/evaluation/iou_test.py +1 -1
- official/vision/evaluation/panoptic_quality.py +1 -1
- official/vision/evaluation/panoptic_quality_evaluator.py +1 -1
- official/vision/evaluation/panoptic_quality_evaluator_test.py +1 -1
- official/vision/evaluation/panoptic_quality_test.py +1 -1
- official/vision/evaluation/segmentation_metrics.py +1 -1
- official/vision/evaluation/segmentation_metrics_test.py +1 -1
- official/vision/evaluation/wod_detection_evaluator.py +1 -1
- official/vision/losses/__init__.py +1 -1
- official/vision/losses/focal_loss.py +1 -1
- official/vision/losses/loss_utils.py +1 -1
- official/vision/losses/maskrcnn_losses.py +1 -2
- official/vision/losses/maskrcnn_losses_test.py +1 -1
- official/vision/losses/retinanet_losses.py +1 -2
- official/vision/losses/segmentation_losses.py +1 -1
- official/vision/losses/segmentation_losses_test.py +1 -1
- official/vision/modeling/__init__.py +1 -1
- official/vision/modeling/backbones/__init__.py +1 -1
- official/vision/modeling/backbones/efficientnet.py +1 -3
- official/vision/modeling/backbones/efficientnet_test.py +1 -2
- official/vision/modeling/backbones/factory.py +1 -3
- official/vision/modeling/backbones/factory_test.py +1 -2
- official/vision/modeling/backbones/mobiledet.py +1 -1
- official/vision/modeling/backbones/mobiledet_test.py +1 -1
- official/vision/modeling/backbones/mobilenet.py +73 -3
- official/vision/modeling/backbones/mobilenet_test.py +12 -3
- official/vision/modeling/backbones/resnet.py +1 -2
- official/vision/modeling/backbones/resnet_3d.py +1 -2
- official/vision/modeling/backbones/resnet_3d_test.py +1 -2
- official/vision/modeling/backbones/resnet_deeplab.py +5 -4
- official/vision/modeling/backbones/resnet_deeplab_test.py +21 -10
- official/vision/modeling/backbones/resnet_test.py +1 -2
- official/vision/modeling/backbones/resnet_unet.py +1 -2
- official/vision/modeling/backbones/resnet_unet_test.py +1 -3
- official/vision/modeling/backbones/revnet.py +1 -2
- official/vision/modeling/backbones/revnet_test.py +1 -2
- official/vision/modeling/backbones/spinenet.py +1 -3
- official/vision/modeling/backbones/spinenet_mobile.py +1 -3
- official/vision/modeling/backbones/spinenet_mobile_test.py +1 -2
- official/vision/modeling/backbones/spinenet_test.py +1 -2
- official/vision/modeling/backbones/vit.py +53 -27
- official/vision/modeling/backbones/vit_specs.py +1 -1
- official/vision/modeling/backbones/vit_test.py +12 -1
- official/vision/modeling/classification_model.py +1 -2
- official/vision/modeling/classification_model_test.py +1 -2
- official/vision/modeling/decoders/__init__.py +1 -1
- official/vision/modeling/decoders/aspp.py +1 -3
- official/vision/modeling/decoders/aspp_test.py +1 -2
- official/vision/modeling/decoders/factory.py +1 -3
- official/vision/modeling/decoders/factory_test.py +1 -1
- official/vision/modeling/decoders/fpn.py +1 -2
- official/vision/modeling/decoders/fpn_test.py +1 -2
- official/vision/modeling/decoders/nasfpn.py +1 -3
- official/vision/modeling/decoders/nasfpn_test.py +1 -2
- official/vision/modeling/factory.py +1 -1
- official/vision/modeling/factory_3d.py +1 -2
- official/vision/modeling/factory_test.py +1 -2
- official/vision/modeling/heads/__init__.py +1 -1
- official/vision/modeling/heads/dense_prediction_heads.py +1 -3
- official/vision/modeling/heads/dense_prediction_heads_test.py +1 -3
- official/vision/modeling/heads/instance_heads.py +3 -4
- official/vision/modeling/heads/instance_heads_test.py +1 -2
- official/vision/modeling/heads/segmentation_heads.py +2 -2
- official/vision/modeling/heads/segmentation_heads_test.py +1 -2
- official/vision/modeling/layers/__init__.py +1 -1
- official/vision/modeling/layers/box_sampler.py +1 -2
- official/vision/modeling/layers/deeplab.py +1 -1
- official/vision/modeling/layers/deeplab_test.py +1 -1
- official/vision/modeling/layers/detection_generator.py +1 -3
- official/vision/modeling/layers/detection_generator_test.py +1 -3
- official/vision/modeling/layers/edgetpu.py +1 -1
- official/vision/modeling/layers/edgetpu_test.py +1 -1
- official/vision/modeling/layers/mask_sampler.py +1 -2
- official/vision/modeling/layers/nn_blocks.py +1 -2
- official/vision/modeling/layers/nn_blocks_3d.py +1 -2
- official/vision/modeling/layers/nn_blocks_3d_test.py +1 -2
- official/vision/modeling/layers/nn_blocks_test.py +1 -3
- official/vision/modeling/layers/nn_layers.py +1 -1
- official/vision/modeling/layers/nn_layers_test.py +1 -2
- official/vision/modeling/layers/roi_aligner.py +7 -5
- official/vision/modeling/layers/roi_aligner_test.py +1 -2
- official/vision/modeling/layers/roi_generator.py +1 -2
- official/vision/modeling/layers/roi_sampler.py +1 -2
- official/vision/modeling/maskrcnn_model.py +1 -1
- official/vision/modeling/maskrcnn_model_test.py +1 -2
- official/vision/modeling/models/__init__.py +1 -1
- official/vision/modeling/retinanet_model.py +9 -8
- official/vision/modeling/retinanet_model_test.py +1 -2
- official/vision/modeling/segmentation_model.py +4 -4
- official/vision/modeling/segmentation_model_test.py +1 -1
- official/vision/modeling/video_classification_model.py +1 -1
- official/vision/modeling/video_classification_model_test.py +1 -2
- official/vision/ops/__init__.py +1 -1
- official/vision/ops/anchor.py +1 -3
- official/vision/ops/anchor_generator.py +1 -1
- official/vision/ops/anchor_generator_test.py +1 -1
- official/vision/ops/anchor_test.py +1 -2
- official/vision/ops/augment.py +4 -16
- official/vision/ops/augment_test.py +1 -1
- official/vision/ops/box_matcher.py +1 -1
- official/vision/ops/box_matcher_test.py +1 -1
- official/vision/ops/box_ops.py +1 -2
- official/vision/ops/iou_similarity.py +1 -1
- official/vision/ops/iou_similarity_test.py +1 -1
- official/vision/ops/mask_ops.py +1 -3
- official/vision/ops/mask_ops_test.py +1 -2
- official/vision/ops/nms.py +1 -2
- official/vision/ops/preprocess_ops.py +40 -11
- official/vision/ops/preprocess_ops_3d.py +6 -3
- official/vision/ops/preprocess_ops_3d_test.py +1 -1
- official/vision/ops/preprocess_ops_test.py +13 -7
- official/vision/ops/sampling_ops.py +1 -2
- official/vision/ops/spatial_transform_ops.py +1 -1
- official/vision/ops/target_gather.py +1 -1
- official/vision/ops/target_gather_test.py +1 -1
- official/vision/registry_imports.py +1 -1
- official/vision/serving/__init__.py +1 -1
- official/vision/serving/detection.py +21 -1
- official/vision/serving/detection_test.py +39 -1
- official/vision/serving/export_base.py +1 -1
- official/vision/serving/export_base_v2.py +1 -1
- official/vision/serving/export_base_v2_test.py +1 -1
- official/vision/serving/export_module_factory.py +1 -1
- official/vision/serving/export_module_factory_test.py +1 -1
- official/vision/serving/export_saved_model.py +1 -1
- official/vision/serving/export_saved_model_lib.py +1 -1
- official/vision/serving/export_saved_model_lib_test.py +1 -1
- official/vision/serving/export_saved_model_lib_v2.py +1 -1
- official/vision/serving/export_tfhub.py +1 -2
- official/vision/serving/export_tfhub_lib.py +1 -3
- official/vision/serving/export_tflite.py +1 -1
- official/vision/serving/export_tflite_lib.py +1 -1
- official/vision/serving/export_utils.py +1 -1
- official/vision/serving/image_classification.py +1 -1
- official/vision/serving/image_classification_test.py +1 -1
- official/vision/serving/semantic_segmentation.py +6 -3
- official/vision/serving/semantic_segmentation_test.py +71 -7
- official/vision/serving/video_classification.py +1 -1
- official/vision/serving/video_classification_test.py +1 -1
- official/vision/tasks/__init__.py +1 -1
- official/vision/tasks/image_classification.py +1 -1
- official/vision/tasks/maskrcnn.py +1 -1
- official/vision/tasks/retinanet.py +1 -1
- official/vision/tasks/semantic_segmentation.py +1 -1
- official/vision/tasks/video_classification.py +1 -1
- official/vision/train.py +1 -1
- official/vision/train_spatial_partitioning.py +1 -1
- official/vision/utils/__init__.py +1 -1
- official/vision/utils/object_detection/__init__.py +1 -1
- official/vision/utils/object_detection/argmax_matcher.py +1 -1
- official/vision/utils/object_detection/balanced_positive_negative_sampler.py +1 -1
- official/vision/utils/object_detection/box_coder.py +1 -1
- official/vision/utils/object_detection/box_list.py +1 -1
- official/vision/utils/object_detection/box_list_ops.py +1 -1
- official/vision/utils/object_detection/faster_rcnn_box_coder.py +1 -1
- official/vision/utils/object_detection/matcher.py +1 -1
- official/vision/utils/object_detection/minibatch_sampler.py +1 -1
- official/vision/utils/object_detection/ops.py +1 -1
- official/vision/utils/object_detection/preprocessor.py +1 -1
- official/vision/utils/object_detection/region_similarity_calculator.py +1 -1
- official/vision/utils/object_detection/shape_utils.py +1 -1
- official/vision/utils/object_detection/target_assigner.py +1 -1
- official/vision/utils/object_detection/visualization_utils.py +6 -1
- official/vision/utils/ops_test.py +1 -1
- official/vision/utils/summary_manager.py +1 -1
- orbit/__init__.py +1 -1
- orbit/actions/__init__.py +1 -1
- orbit/actions/conditional_action.py +3 -2
- orbit/actions/conditional_action_test.py +1 -1
- orbit/actions/export_saved_model.py +1 -1
- orbit/actions/export_saved_model_test.py +1 -1
- orbit/actions/new_best_metric.py +2 -2
- orbit/actions/new_best_metric_test.py +2 -2
- orbit/actions/save_checkpoint_if_preempted.py +1 -1
- orbit/controller.py +1 -1
- orbit/controller_test.py +1 -1
- orbit/examples/__init__.py +1 -1
- orbit/examples/single_task/__init__.py +1 -1
- orbit/examples/single_task/single_task_evaluator.py +1 -1
- orbit/examples/single_task/single_task_evaluator_test.py +1 -1
- orbit/examples/single_task/single_task_trainer.py +1 -1
- orbit/examples/single_task/single_task_trainer_test.py +1 -1
- orbit/runner.py +1 -1
- orbit/standard_runner.py +1 -1
- orbit/standard_runner_test.py +1 -1
- orbit/utils/__init__.py +1 -1
- orbit/utils/common.py +1 -1
- orbit/utils/common_test.py +1 -1
- orbit/utils/epoch_helper.py +1 -1
- orbit/utils/loop_fns.py +7 -2
- orbit/utils/summary_manager.py +1 -1
- orbit/utils/summary_manager_interface.py +1 -1
- orbit/utils/tpu_summaries.py +1 -1
- orbit/utils/tpu_summaries_test.py +1 -1
- tensorflow_models/__init__.py +1 -1
- tensorflow_models/nlp/__init__.py +1 -1
- tensorflow_models/tensorflow_models_test.py +1 -1
- tensorflow_models/uplift/__init__.py +1 -1
- tensorflow_models/vision/__init__.py +1 -1
- {tf_models_nightly-2.17.0.dev20240617.dist-info → tf_models_nightly-2.20.0.dev20251220.dist-info}/METADATA +1 -1
- tf_models_nightly-2.20.0.dev20251220.dist-info/RECORD +1256 -0
- tf_models_nightly-2.17.0.dev20240617.dist-info/RECORD +0 -1220
- {tf_models_nightly-2.17.0.dev20240617.dist-info → tf_models_nightly-2.20.0.dev20251220.dist-info}/AUTHORS +0 -0
- {tf_models_nightly-2.17.0.dev20240617.dist-info → tf_models_nightly-2.20.0.dev20251220.dist-info}/LICENSE +0 -0
- {tf_models_nightly-2.17.0.dev20240617.dist-info → tf_models_nightly-2.20.0.dev20251220.dist-info}/WHEEL +0 -0
- {tf_models_nightly-2.17.0.dev20240617.dist-info → tf_models_nightly-2.20.0.dev20251220.dist-info}/top_level.txt +0 -0
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# Copyright
|
|
1
|
+
# Copyright 2025 The TensorFlow Authors. All Rights Reserved.
|
|
2
2
|
#
|
|
3
3
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
4
|
# you may not use this file except in compliance with the License.
|
|
@@ -20,6 +20,7 @@ import tensorflow as tf, tf_keras
|
|
|
20
20
|
from official.modeling import tf_utils
|
|
21
21
|
from official.nlp.modeling.layers import block_sparse_attention
|
|
22
22
|
from official.nlp.modeling.layers import multi_query_attention
|
|
23
|
+
from official.nlp.modeling.layers import talking_heads_attention
|
|
23
24
|
from official.nlp.modeling.layers import util
|
|
24
25
|
|
|
25
26
|
|
|
@@ -82,37 +83,47 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
82
83
|
Understanding](https://arxiv.org/abs/1810.04805)
|
|
83
84
|
"""
|
|
84
85
|
|
|
85
|
-
def __init__(
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
86
|
+
def __init__(
|
|
87
|
+
self,
|
|
88
|
+
num_attention_heads,
|
|
89
|
+
inner_dim,
|
|
90
|
+
inner_activation,
|
|
91
|
+
output_range=None,
|
|
92
|
+
kernel_initializer="glorot_uniform",
|
|
93
|
+
bias_initializer="zeros",
|
|
94
|
+
kernel_regularizer=None,
|
|
95
|
+
bias_regularizer=None,
|
|
96
|
+
activity_regularizer=None,
|
|
97
|
+
kernel_constraint=None,
|
|
98
|
+
bias_constraint=None,
|
|
99
|
+
use_bias=True,
|
|
100
|
+
norm_first=False,
|
|
101
|
+
norm_epsilon=1e-12,
|
|
102
|
+
use_rms_norm=False,
|
|
103
|
+
output_dropout=0.0,
|
|
104
|
+
attention_dropout=0.0,
|
|
105
|
+
inner_dropout=0.0,
|
|
106
|
+
attention_initializer=None,
|
|
107
|
+
attention_axes=None,
|
|
108
|
+
use_query_residual=True,
|
|
109
|
+
key_dim=None,
|
|
110
|
+
value_dim=None,
|
|
111
|
+
output_last_dim=None,
|
|
112
|
+
diff_q_kv_att_layer_norm=False,
|
|
113
|
+
return_attention_scores=False,
|
|
114
|
+
num_kv_heads=None,
|
|
115
|
+
src_block_size=None,
|
|
116
|
+
tgt_block_size=None,
|
|
117
|
+
use_sigmoid_attn=False,
|
|
118
|
+
sigmoid_attn_bias=None,
|
|
119
|
+
linformer_dim=None,
|
|
120
|
+
linformer_shared_kv_projection=True,
|
|
121
|
+
lowrank_query_seq_proj_dim=None,
|
|
122
|
+
enable_talking_heads=False,
|
|
123
|
+
enable_gqa_optimization=False,
|
|
124
|
+
softmax_robust_masking=False,
|
|
125
|
+
**kwargs,
|
|
126
|
+
):
|
|
116
127
|
"""Initializes `TransformerEncoderBlock`.
|
|
117
128
|
|
|
118
129
|
Note: If `output_last_dim` is used and `use_query_residual` is `True`, the
|
|
@@ -185,6 +196,22 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
185
196
|
`block_sparse_attention.MultiHeadAttention` for more details.
|
|
186
197
|
tgt_block_size: Target block size. Refer to
|
|
187
198
|
`block_sparse_attention.MultiHeadAttention` for more details.
|
|
199
|
+
use_sigmoid_attn: This param is only used in
|
|
200
|
+
`block_sparse_attention.MultiHeadAttention`
|
|
201
|
+
sigmoid_attn_bias: This param is only used in
|
|
202
|
+
`block_sparse_attention.MultiHeadAttention`
|
|
203
|
+
linformer_dim: Applies low-rank factorization on keys/values as in
|
|
204
|
+
https://arxiv.org/pdf/2006.04768.
|
|
205
|
+
linformer_shared_kv_projection: If set, projection layer is shared for
|
|
206
|
+
keys and values.
|
|
207
|
+
lowrank_query_seq_proj_dim: If set, applies a projection layer on query
|
|
208
|
+
sequence to the given dimension. go/constformer-doc
|
|
209
|
+
enable_talking_heads: Enable talking heads as in
|
|
210
|
+
https://arxiv.org/pdf/2003.02436.
|
|
211
|
+
enable_gqa_optimization: Enable GQA optimization in multi-query attention.
|
|
212
|
+
This flag is valid only when num_kv_heads is set for GQA.
|
|
213
|
+
softmax_robust_masking: If true, will use a more numerically robust
|
|
214
|
+
masking impl for softmax.
|
|
188
215
|
**kwargs: keyword arguments.
|
|
189
216
|
"""
|
|
190
217
|
util.filter_kwargs(kwargs)
|
|
@@ -222,28 +249,46 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
222
249
|
self._num_kv_heads = num_kv_heads
|
|
223
250
|
self._src_block_size = src_block_size
|
|
224
251
|
self._tgt_block_size = tgt_block_size
|
|
225
|
-
|
|
252
|
+
self._use_sigmoid_attn = use_sigmoid_attn
|
|
253
|
+
self._sigmoid_attn_bias = sigmoid_attn_bias
|
|
254
|
+
self._linformer_dim = linformer_dim
|
|
255
|
+
self._linformer_shared_kv_projection = linformer_shared_kv_projection
|
|
256
|
+
self._lowrank_query_seq_proj_dim = lowrank_query_seq_proj_dim
|
|
257
|
+
self._enable_talking_heads = enable_talking_heads
|
|
258
|
+
self._enable_gqa_optimization = enable_gqa_optimization
|
|
259
|
+
self._softmax_robust_masking = softmax_robust_masking
|
|
260
|
+
if (
|
|
261
|
+
self._src_block_size is not None
|
|
262
|
+
and self._num_kv_heads is not None
|
|
263
|
+
and self._num_kv_heads != 1
|
|
264
|
+
):
|
|
226
265
|
raise ValueError(
|
|
227
|
-
"Block sparse attention
|
|
228
|
-
"
|
|
266
|
+
"Block sparse attention only supports Multi-query attention.Please"
|
|
267
|
+
" set num_kv_heads to 1 to enable MQA with block sparse attention."
|
|
229
268
|
)
|
|
230
269
|
if attention_initializer:
|
|
231
270
|
self._attention_initializer = tf_keras.initializers.get(
|
|
232
|
-
attention_initializer
|
|
271
|
+
attention_initializer
|
|
272
|
+
)
|
|
233
273
|
else:
|
|
234
274
|
self._attention_initializer = tf_utils.clone_initializer(
|
|
235
|
-
self._kernel_initializer
|
|
275
|
+
self._kernel_initializer
|
|
276
|
+
)
|
|
236
277
|
self._attention_axes = attention_axes
|
|
237
278
|
|
|
238
279
|
if self._diff_q_kv_att_layer_norm and not self._norm_first:
|
|
239
|
-
raise ValueError(
|
|
240
|
-
|
|
280
|
+
raise ValueError(
|
|
281
|
+
"Setting `diff_q_and_kv_attention_layer_norm` to True"
|
|
282
|
+
"when `norm_first` is False is invalid."
|
|
283
|
+
)
|
|
241
284
|
|
|
242
285
|
def build(self, input_shape):
|
|
243
286
|
if isinstance(input_shape, tf.TensorShape):
|
|
244
287
|
input_tensor_shape = input_shape
|
|
245
288
|
elif isinstance(input_shape, (list, tuple)):
|
|
246
289
|
input_tensor_shape = tf.TensorShape(input_shape[0])
|
|
290
|
+
elif isinstance(input_shape, dict):
|
|
291
|
+
input_tensor_shape = tf.TensorShape(input_shape["input_tensor"])
|
|
247
292
|
else:
|
|
248
293
|
raise ValueError(
|
|
249
294
|
"The type of input shape argument is not supported, got: %s" %
|
|
@@ -273,6 +318,7 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
273
318
|
bias_initializer=tf_utils.clone_initializer(self._bias_initializer),
|
|
274
319
|
attention_axes=self._attention_axes,
|
|
275
320
|
output_shape=self._output_last_dim,
|
|
321
|
+
softmax_robust_masking=self._softmax_robust_masking,
|
|
276
322
|
name="self_attention",
|
|
277
323
|
)
|
|
278
324
|
common_kwargs = dict(
|
|
@@ -282,18 +328,39 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
282
328
|
bias_constraint=self._bias_constraint,
|
|
283
329
|
)
|
|
284
330
|
if self._src_block_size is not None:
|
|
331
|
+
if self._enable_talking_heads:
|
|
332
|
+
raise ValueError(
|
|
333
|
+
"Block sparse attention does not support talking heads. Please"
|
|
334
|
+
" set enable_talking_heads to False."
|
|
335
|
+
)
|
|
285
336
|
attention_layer_kwargs.update(
|
|
286
337
|
src_block_size=self._src_block_size,
|
|
287
338
|
tgt_block_size=self._tgt_block_size,
|
|
339
|
+
use_sigmoid_attn=self._use_sigmoid_attn,
|
|
340
|
+
sigmoid_attn_bias=self._sigmoid_attn_bias,
|
|
341
|
+
num_kv_heads=self._num_kv_heads,
|
|
288
342
|
name="block_sparse_attention",
|
|
289
343
|
)
|
|
290
344
|
attention_fn = block_sparse_attention.MultiHeadAttention
|
|
291
345
|
elif self._num_kv_heads is not None:
|
|
292
346
|
attention_layer_kwargs.update(
|
|
293
347
|
num_kv_heads=self._num_kv_heads,
|
|
348
|
+
enable_gqa_optimization=self._enable_gqa_optimization,
|
|
294
349
|
name="multi_query_attention",
|
|
295
350
|
)
|
|
296
|
-
|
|
351
|
+
if self._enable_talking_heads:
|
|
352
|
+
attention_fn = (
|
|
353
|
+
multi_query_attention.TalkingHeadsMultiQueryAttention
|
|
354
|
+
)
|
|
355
|
+
else:
|
|
356
|
+
attention_fn = multi_query_attention.MultiHeadAttention
|
|
357
|
+
elif self._enable_talking_heads:
|
|
358
|
+
attention_layer_kwargs.update(
|
|
359
|
+
name="talking_heads_attention",
|
|
360
|
+
)
|
|
361
|
+
attention_fn = (
|
|
362
|
+
talking_heads_attention.TalkingHeadsAttention
|
|
363
|
+
)
|
|
297
364
|
else:
|
|
298
365
|
attention_fn = tf_keras.layers.MultiHeadAttention
|
|
299
366
|
self._attention_layer = attention_fn(
|
|
@@ -356,16 +423,48 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
356
423
|
name="output",
|
|
357
424
|
kernel_initializer=tf_utils.clone_initializer(self._kernel_initializer),
|
|
358
425
|
bias_initializer=tf_utils.clone_initializer(self._bias_initializer),
|
|
359
|
-
**common_kwargs
|
|
426
|
+
**common_kwargs,
|
|
427
|
+
)
|
|
360
428
|
self._output_dropout = tf_keras.layers.Dropout(
|
|
361
|
-
rate=self._output_dropout_rate
|
|
429
|
+
rate=self._output_dropout_rate
|
|
430
|
+
)
|
|
362
431
|
# Use float32 in layernorm for numeric stability.
|
|
363
432
|
self._output_layer_norm = tf_keras.layers.LayerNormalization(
|
|
364
433
|
name="output_layer_norm",
|
|
365
434
|
axis=-1,
|
|
366
435
|
epsilon=self._norm_epsilon,
|
|
367
|
-
dtype=tf.float32
|
|
368
|
-
|
|
436
|
+
dtype=tf.float32,
|
|
437
|
+
)
|
|
438
|
+
if self._linformer_dim is not None:
|
|
439
|
+
if self._linformer_shared_kv_projection:
|
|
440
|
+
low_rank_dim = self._linformer_dim
|
|
441
|
+
else:
|
|
442
|
+
low_rank_dim = 2 * self._linformer_dim
|
|
443
|
+
self._lowrank_kv_projection = tf_keras.layers.EinsumDense(
|
|
444
|
+
"...bc,cd->...bd",
|
|
445
|
+
output_shape=(None, low_rank_dim),
|
|
446
|
+
kernel_initializer=tf_utils.clone_initializer(
|
|
447
|
+
self._kernel_initializer
|
|
448
|
+
),
|
|
449
|
+
bias_initializer=tf_utils.clone_initializer(self._bias_initializer),
|
|
450
|
+
name="lowrank_kv_projection",
|
|
451
|
+
**common_kwargs,
|
|
452
|
+
)
|
|
453
|
+
if self._lowrank_query_seq_proj_dim is not None:
|
|
454
|
+
self._lowrank_query_seq_projection = tf_keras.layers.EinsumDense(
|
|
455
|
+
# Squash the sequence-length dimension; keep embedding as is.
|
|
456
|
+
"...ij,ik->...kj",
|
|
457
|
+
output_shape=(
|
|
458
|
+
self._lowrank_query_seq_proj_dim,
|
|
459
|
+
hidden_size,
|
|
460
|
+
),
|
|
461
|
+
kernel_initializer=tf_utils.clone_initializer(
|
|
462
|
+
self._kernel_initializer
|
|
463
|
+
),
|
|
464
|
+
bias_initializer=tf_utils.clone_initializer(self._bias_initializer),
|
|
465
|
+
name="constformer_projection",
|
|
466
|
+
**common_kwargs,
|
|
467
|
+
)
|
|
369
468
|
super().build(input_shape)
|
|
370
469
|
|
|
371
470
|
def get_config(self):
|
|
@@ -413,19 +512,82 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
413
512
|
"num_kv_heads": self._num_kv_heads,
|
|
414
513
|
"src_block_size": self._src_block_size,
|
|
415
514
|
"tgt_block_size": self._tgt_block_size,
|
|
515
|
+
"use_sigmoid_attn": self._use_sigmoid_attn,
|
|
516
|
+
"sigmoid_attn_bias": self._sigmoid_attn_bias,
|
|
517
|
+
"linformer_dim": self._linformer_dim,
|
|
518
|
+
"linformer_shared_kv_projection": self._linformer_shared_kv_projection,
|
|
519
|
+
"lowrank_query_seq_proj_dim": self._lowrank_query_seq_proj_dim,
|
|
520
|
+
"softmax_robust_masking": self._softmax_robust_masking
|
|
416
521
|
}
|
|
417
522
|
base_config = super().get_config()
|
|
418
523
|
return dict(list(base_config.items()) + list(config.items()))
|
|
419
524
|
|
|
525
|
+
def _apply_lowrank_query_projection(
|
|
526
|
+
self,
|
|
527
|
+
query: tf.Tensor,
|
|
528
|
+
attention_mask: tf.Tensor | None,
|
|
529
|
+
):
|
|
530
|
+
"""Applies constformer projection to the source tensor."""
|
|
531
|
+
|
|
532
|
+
# Don't project the source tensor if the `lowrank_query_seq_projection`
|
|
533
|
+
# (constformer) dimension is the same as the input
|
|
534
|
+
# sequence dimension.
|
|
535
|
+
if (
|
|
536
|
+
self._lowrank_query_seq_proj_dim is None
|
|
537
|
+
or query.shape[1] == self._lowrank_query_seq_proj_dim
|
|
538
|
+
):
|
|
539
|
+
return query
|
|
540
|
+
# Don't overwrite the attention mask.
|
|
541
|
+
query = self._apply_query_mask(attention_mask, query)
|
|
542
|
+
dtype = query.dtype
|
|
543
|
+
query = self._lowrank_query_seq_projection(query)
|
|
544
|
+
query = tf.cast(query, dtype)
|
|
545
|
+
return query
|
|
546
|
+
|
|
547
|
+
def _apply_query_mask(
|
|
548
|
+
self,
|
|
549
|
+
attention_mask: tf.Tensor | None,
|
|
550
|
+
query: tf.Tensor,
|
|
551
|
+
):
|
|
552
|
+
"""Applying mask before the low rank factorization so that padding is accounted for.
|
|
553
|
+
|
|
554
|
+
Applies mask to query only if the dimension of query matches the mask. This
|
|
555
|
+
is to avoid the projection from happening multiple times while stacking
|
|
556
|
+
the transformer layers.
|
|
557
|
+
|
|
558
|
+
Args:
|
|
559
|
+
attention_mask: The attention_mask tensor.
|
|
560
|
+
query: The query tensor.
|
|
561
|
+
|
|
562
|
+
Returns:
|
|
563
|
+
query: The query tensor after applying the mask.
|
|
564
|
+
"""
|
|
565
|
+
if attention_mask is None:
|
|
566
|
+
return query
|
|
567
|
+
if attention_mask.shape[1] != query.shape[1]:
|
|
568
|
+
# Skip the mask application for query.
|
|
569
|
+
logging.info(
|
|
570
|
+
"Skipping mask application on query. Shape mismatch: %s vs %s",
|
|
571
|
+
attention_mask.shape,
|
|
572
|
+
query.shape,
|
|
573
|
+
)
|
|
574
|
+
return query
|
|
575
|
+
|
|
576
|
+
query_mask = tf.cast(attention_mask[:, :, 0], dtype=query.dtype)
|
|
577
|
+
query = query * tf.expand_dims(query_mask, axis=-1)
|
|
578
|
+
return query
|
|
579
|
+
|
|
420
580
|
def call(self, inputs: Any, output_range: Optional[tf.Tensor] = None) -> Any:
|
|
421
581
|
"""Transformer self-attention encoder block call.
|
|
422
582
|
|
|
423
583
|
Args:
|
|
424
|
-
inputs: a single tensor or a list of tensors. `input
|
|
425
|
-
sequence of embeddings. [`input tensor`,
|
|
426
|
-
additional attention mask. [`query
|
|
427
|
-
`attention mask`] to have separate input
|
|
428
|
-
key/value to the multi-head attention.
|
|
584
|
+
inputs: a single tensor or a list of tensors, or a dictionary. `input
|
|
585
|
+
tensor` as the single sequence of embeddings. [`input tensor`,
|
|
586
|
+
`attention mask`] to have the additional attention mask. [`query
|
|
587
|
+
tensor`, `key value tensor`, `attention mask`] to have separate input
|
|
588
|
+
streams for the query, and key/value to the multi-head attention. If
|
|
589
|
+
dictionary is provided, it must contain the following keys:
|
|
590
|
+
`input_tensor`, `attention_mask`, `key_value_tensor`.
|
|
429
591
|
output_range: the sequence output range, [0, output_range) for slicing the
|
|
430
592
|
target sequence. `None` means the target sequence is not sliced. If you
|
|
431
593
|
would like to have no change to the model training, it is better to only
|
|
@@ -443,6 +605,21 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
443
605
|
else:
|
|
444
606
|
raise ValueError("Unexpected inputs to %s with length at %d" %
|
|
445
607
|
(self.__class__, len(inputs)))
|
|
608
|
+
elif isinstance(inputs, dict):
|
|
609
|
+
if not set(inputs.keys()).issubset(
|
|
610
|
+
set(["input_tensor", "key_value_tensor", "attention_mask"])
|
|
611
|
+
):
|
|
612
|
+
raise ValueError(
|
|
613
|
+
f"Unexpected keys in input dictionary to: {inputs.keys()}"
|
|
614
|
+
)
|
|
615
|
+
try:
|
|
616
|
+
input_tensor = inputs["input_tensor"]
|
|
617
|
+
except KeyError as e:
|
|
618
|
+
raise ValueError(
|
|
619
|
+
"Missing required key `input_tensor` in input dictionary."
|
|
620
|
+
) from e
|
|
621
|
+
key_value = inputs.get("key_value_tensor", None)
|
|
622
|
+
attention_mask = inputs.get("attention_mask", None)
|
|
446
623
|
else:
|
|
447
624
|
input_tensor, key_value, attention_mask = (inputs, None, None)
|
|
448
625
|
|
|
@@ -451,6 +628,12 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
451
628
|
if output_range:
|
|
452
629
|
if self._norm_first:
|
|
453
630
|
source_tensor = input_tensor[:, 0:output_range, :]
|
|
631
|
+
if self._use_query_residual:
|
|
632
|
+
# `source_tensor` is only used for the residual connection.
|
|
633
|
+
source_tensor = self._apply_lowrank_query_projection(
|
|
634
|
+
source_tensor, attention_mask
|
|
635
|
+
)
|
|
636
|
+
|
|
454
637
|
input_tensor = self._attention_layer_norm(input_tensor)
|
|
455
638
|
if key_value is not None:
|
|
456
639
|
key_value = self._attention_layer_norm_kv(key_value)
|
|
@@ -460,23 +643,61 @@ class TransformerEncoderBlock(tf_keras.layers.Layer):
|
|
|
460
643
|
else:
|
|
461
644
|
if self._norm_first:
|
|
462
645
|
source_tensor = input_tensor
|
|
646
|
+
if self._use_query_residual:
|
|
647
|
+
# `source_tensor` is only used for the residual connection.
|
|
648
|
+
source_tensor = self._apply_lowrank_query_projection(
|
|
649
|
+
source_tensor, attention_mask
|
|
650
|
+
)
|
|
463
651
|
input_tensor = self._attention_layer_norm(input_tensor)
|
|
464
652
|
if key_value is not None:
|
|
465
653
|
key_value = self._attention_layer_norm_kv(key_value)
|
|
466
654
|
target_tensor = input_tensor
|
|
467
655
|
|
|
656
|
+
# Project the query to the constformer dimension.
|
|
657
|
+
target_tensor = self._apply_lowrank_query_projection(
|
|
658
|
+
target_tensor, attention_mask
|
|
659
|
+
)
|
|
660
|
+
|
|
468
661
|
if key_value is None:
|
|
469
662
|
key_value = input_tensor
|
|
470
663
|
|
|
664
|
+
key = key_value
|
|
665
|
+
value = key_value
|
|
666
|
+
if self._linformer_dim is not None:
|
|
667
|
+
if attention_mask is not None:
|
|
668
|
+
# Applying mask before the low rank factorization so that padding is
|
|
669
|
+
# accounted for.
|
|
670
|
+
query_mask = tf.cast(attention_mask[:, :, 0], dtype=target_tensor.dtype)
|
|
671
|
+
if self._lowrank_query_seq_proj_dim is None:
|
|
672
|
+
target_tensor = target_tensor * tf.expand_dims(query_mask, axis=-1)
|
|
673
|
+
key_mask = tf.cast(attention_mask[:, 0, :], dtype=target_tensor.dtype)
|
|
674
|
+
key_value = key_value * tf.expand_dims(key_mask, axis=-1)
|
|
675
|
+
attention_mask = None
|
|
676
|
+
key_value = tf.transpose(key_value, [0, 2, 1])
|
|
677
|
+
key_value = self._lowrank_kv_projection(key_value)
|
|
678
|
+
if self._linformer_shared_kv_projection:
|
|
679
|
+
key_value = tf.transpose(key_value, [0, 2, 1])
|
|
680
|
+
key = key_value
|
|
681
|
+
value = key_value
|
|
682
|
+
else:
|
|
683
|
+
key = tf.transpose(key_value[:, :, : self._linformer_dim], [0, 2, 1])
|
|
684
|
+
value = tf.transpose(key_value[:, :, self._linformer_dim :], [0, 2, 1])
|
|
685
|
+
|
|
471
686
|
if self._return_attention_scores:
|
|
472
687
|
attention_output, attention_scores = self._attention_layer(
|
|
473
688
|
query=target_tensor,
|
|
474
|
-
|
|
689
|
+
key=key,
|
|
690
|
+
value=value,
|
|
475
691
|
attention_mask=attention_mask,
|
|
476
|
-
return_attention_scores=True
|
|
692
|
+
return_attention_scores=True,
|
|
693
|
+
)
|
|
477
694
|
else:
|
|
478
695
|
attention_output = self._attention_layer(
|
|
479
|
-
query=target_tensor,
|
|
696
|
+
query=target_tensor,
|
|
697
|
+
key=key,
|
|
698
|
+
value=value,
|
|
699
|
+
attention_mask=attention_mask,
|
|
700
|
+
)
|
|
480
701
|
attention_output = self._attention_dropout(attention_output)
|
|
481
702
|
|
|
482
703
|
if self._norm_first:
|