mindspore 2.0.0a0__cp37-none-any.whl → 2.0.0rc1__cp37-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mindspore might be problematic. Click here for more details.
- mindspore/.commit_id +1 -1
- mindspore/Third_Party_Open_Source_Software_Notice +9064 -0
- mindspore/__init__.py +4 -2
- mindspore/_akg/akg/composite/build_module.py +11 -0
- mindspore/_akg/akg/config/repository_cuda.json +11 -0
- mindspore/_akg/akg/tvm/contrib/nvcc.py +4 -3
- mindspore/_c_dataengine.cpython-37m-aarch64-linux-gnu.so +0 -0
- mindspore/_c_expression.cpython-37m-aarch64-linux-gnu.so +0 -0
- mindspore/_c_mindrecord.cpython-37m-aarch64-linux-gnu.so +0 -0
- mindspore/_check_jit_forbidden_api.py +102 -0
- mindspore/_checkparam.py +1066 -1001
- mindspore/_extends/parallel_compile/akg_compiler/akg_process.py +4 -3
- mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +50 -48
- mindspore/_extends/parallel_compile/akg_compiler/util.py +9 -4
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_adapter.py +4 -4
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +9 -4
- mindspore/_extends/parse/__init__.py +5 -3
- mindspore/_extends/parse/namespace.py +16 -1
- mindspore/_extends/parse/parser.py +107 -22
- mindspore/_extends/parse/resources.py +0 -7
- mindspore/_extends/parse/standard_method.py +885 -413
- mindspore/_mindspore_offline_debug.cpython-37m-aarch64-linux-gnu.so +0 -0
- mindspore/amp.py +52 -57
- mindspore/bin/cache_admin +0 -0
- mindspore/bin/cache_server +0 -0
- mindspore/boost/boost.py +2 -2
- mindspore/boost/boost_cell_wrapper.py +38 -20
- mindspore/boost/dim_reduce.py +3 -3
- mindspore/boost/group_loss_scale_manager.py +1 -1
- mindspore/common/__init__.py +4 -6
- mindspore/common/_decorator.py +2 -0
- mindspore/common/_register_for_adapter.py +55 -0
- mindspore/common/_stub_tensor.py +201 -0
- mindspore/common/_utils.py +41 -7
- mindspore/common/api.py +215 -141
- mindspore/common/dtype.py +8 -1
- mindspore/common/dump.py +2 -2
- mindspore/common/initializer.py +4 -2
- mindspore/common/jit_config.py +17 -13
- mindspore/common/mutable.py +33 -13
- mindspore/common/parameter.py +23 -21
- mindspore/common/seed.py +8 -24
- mindspore/common/sparse_tensor.py +62 -41
- mindspore/common/tensor.py +852 -1154
- mindspore/communication/__init__.py +2 -2
- mindspore/communication/_comm_helper.py +11 -4
- mindspore/communication/management.py +22 -21
- mindspore/config/op_info.config +501 -1008
- mindspore/config/super_bar_config.json +512 -0
- mindspore/context.py +201 -23
- mindspore/dataset/__init__.py +6 -6
- mindspore/dataset/audio/__init__.py +7 -7
- mindspore/dataset/audio/transforms.py +670 -30
- mindspore/dataset/audio/utils.py +47 -4
- mindspore/dataset/audio/validators.py +223 -1
- mindspore/dataset/callback/ds_callback.py +2 -2
- mindspore/dataset/core/config.py +210 -14
- mindspore/dataset/core/validator_helpers.py +2 -2
- mindspore/{parallel/nn/layers.py → dataset/debug/__init__.py} +7 -8
- mindspore/dataset/debug/debug_hook.py +65 -0
- mindspore/dataset/debug/pre_defined_hook.py +67 -0
- mindspore/dataset/engine/__init__.py +7 -3
- mindspore/dataset/engine/cache_client.py +1 -1
- mindspore/dataset/engine/datasets.py +322 -66
- mindspore/dataset/engine/datasets_audio.py +80 -76
- mindspore/dataset/engine/datasets_standard_format.py +51 -38
- mindspore/dataset/engine/datasets_text.py +232 -118
- mindspore/dataset/engine/datasets_user_defined.py +41 -17
- mindspore/dataset/engine/datasets_vision.py +746 -225
- mindspore/dataset/engine/graphdata.py +75 -10
- mindspore/dataset/engine/iterators.py +45 -5
- mindspore/dataset/engine/offload.py +48 -28
- mindspore/dataset/engine/validators.py +117 -8
- mindspore/dataset/text/__init__.py +6 -5
- mindspore/dataset/text/transforms.py +86 -3
- mindspore/dataset/text/utils.py +6 -4
- mindspore/dataset/text/validators.py +25 -0
- mindspore/dataset/transforms/__init__.py +3 -2
- mindspore/dataset/transforms/c_transforms.py +1 -1
- mindspore/dataset/transforms/transforms.py +2 -2
- mindspore/dataset/utils/__init__.py +2 -1
- mindspore/dataset/utils/line_reader.py +121 -0
- mindspore/dataset/vision/__init__.py +2 -3
- mindspore/dataset/vision/c_transforms.py +9 -9
- mindspore/dataset/vision/py_transforms.py +5 -5
- mindspore/dataset/vision/py_transforms_util.py +2 -0
- mindspore/dataset/vision/transforms.py +160 -161
- mindspore/dataset/vision/utils.py +3 -3
- mindspore/experimental/map_parameter.py +38 -26
- mindspore/include/OWNERS +0 -1
- mindspore/include/api/callback/callback.h +9 -13
- mindspore/include/api/callback/ckpt_saver.h +2 -2
- mindspore/include/api/callback/loss_monitor.h +2 -2
- mindspore/include/api/callback/lr_scheduler.h +5 -5
- mindspore/include/api/callback/time_monitor.h +2 -2
- mindspore/include/api/callback/train_accuracy.h +4 -6
- mindspore/include/api/cfg.h +19 -6
- mindspore/include/api/context.h +44 -9
- mindspore/include/api/delegate.h +1 -1
- mindspore/include/api/metrics/accuracy.h +2 -2
- mindspore/include/api/metrics/metrics.h +4 -3
- mindspore/include/api/model.h +9 -4
- mindspore/include/api/model_parallel_runner.h +2 -2
- mindspore/include/api/net.h +12 -11
- mindspore/include/api/serialization.h +19 -3
- mindspore/include/api/types.h +3 -3
- mindspore/include/dataset/constants.h +7 -0
- mindspore/include/dataset/text.h +59 -0
- mindspore/include/mindapi/base/type_id.h +1 -0
- mindspore/lib/libdnnl.so.2 +0 -0
- mindspore/lib/libicudata.so.69 +0 -0
- mindspore/lib/libicui18n.so.69 +0 -0
- mindspore/lib/libicuuc.so.69 +0 -0
- mindspore/lib/libmindspore.so +0 -0
- mindspore/lib/libmindspore_backend.so +0 -0
- mindspore/lib/libmindspore_common.so +0 -0
- mindspore/lib/libmindspore_core.so +0 -0
- mindspore/lib/libmindspore_glog.so.0 +0 -0
- mindspore/lib/libmindspore_gpr.so.15 +0 -0
- mindspore/lib/libmindspore_grpc++.so.1 +0 -0
- mindspore/lib/libmindspore_grpc.so.15 +0 -0
- mindspore/lib/libmindspore_shared_lib.so +0 -0
- mindspore/lib/libmpi_adapter.so +0 -0
- mindspore/lib/libmpi_collective.so +0 -0
- mindspore/lib/libnnacl.so +0 -0
- mindspore/lib/libopencv_core.so.4.5 +0 -0
- mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
- mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
- mindspore/lib/libps_cache.so +0 -0
- mindspore/lib/plugin/ascend/libakg.so +0 -0
- mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
- mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
- mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
- mindspore/lib/plugin/ascend/libmindspore_aicpu_kernels.so +0 -0
- mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
- mindspore/lib/plugin/cpu/libakg.so +0 -0
- mindspore/lib/plugin/libmindspore_ascend.so.1 +0 -0
- mindspore/lib/plugin/{libmindspore_ascend.so → libmindspore_ascend.so.2} +0 -0
- mindspore/log.py +1 -1
- mindspore/mindrecord/filereader.py +18 -0
- mindspore/mindrecord/filewriter.py +197 -34
- mindspore/mindrecord/shardreader.py +9 -0
- mindspore/mindrecord/shardwriter.py +1 -1
- mindspore/mindrecord/tools/cifar100_to_mr.py +3 -3
- mindspore/mindrecord/tools/cifar10_to_mr.py +3 -3
- mindspore/mindrecord/tools/csv_to_mr.py +3 -3
- mindspore/mindrecord/tools/imagenet_to_mr.py +16 -11
- mindspore/mindrecord/tools/mnist_to_mr.py +2 -2
- mindspore/mindrecord/tools/tfrecord_to_mr.py +6 -6
- mindspore/nn/__init__.py +0 -4
- mindspore/nn/cell.py +204 -132
- mindspore/nn/dynamic_lr.py +1 -1
- mindspore/nn/grad/cell_grad.py +7 -6
- mindspore/nn/layer/__init__.py +5 -4
- mindspore/nn/layer/activation.py +40 -89
- mindspore/nn/layer/basic.py +255 -624
- mindspore/nn/layer/channel_shuffle.py +7 -6
- mindspore/nn/layer/combined.py +1 -1
- mindspore/nn/layer/container.py +41 -4
- mindspore/nn/layer/conv.py +64 -28
- mindspore/nn/layer/dense.py +9 -8
- mindspore/nn/layer/embedding.py +27 -25
- mindspore/nn/layer/image.py +53 -46
- mindspore/nn/layer/math.py +97 -105
- mindspore/nn/layer/normalization.py +117 -86
- mindspore/nn/layer/padding.py +185 -95
- mindspore/nn/layer/pooling.py +817 -414
- mindspore/nn/layer/rnn_cells.py +10 -15
- mindspore/nn/layer/rnns.py +37 -38
- mindspore/nn/layer/thor_layer.py +11 -12
- mindspore/nn/layer/timedistributed.py +5 -5
- mindspore/nn/layer/transformer.py +701 -0
- mindspore/nn/learning_rate_schedule.py +8 -8
- mindspore/nn/loss/__init__.py +5 -4
- mindspore/nn/loss/loss.py +334 -199
- mindspore/nn/optim/ada_grad.py +6 -6
- mindspore/nn/optim/adadelta.py +2 -3
- mindspore/nn/optim/adafactor.py +4 -5
- mindspore/nn/optim/adam.py +126 -62
- mindspore/nn/optim/adamax.py +3 -4
- mindspore/nn/optim/adasum.py +6 -6
- mindspore/nn/optim/asgd.py +2 -2
- mindspore/nn/optim/ftrl.py +67 -38
- mindspore/nn/optim/lamb.py +4 -5
- mindspore/nn/optim/lars.py +2 -2
- mindspore/nn/optim/lazyadam.py +43 -4
- mindspore/nn/optim/momentum.py +6 -5
- mindspore/nn/optim/optimizer.py +3 -1
- mindspore/nn/optim/proximal_ada_grad.py +2 -2
- mindspore/nn/optim/rmsprop.py +1 -1
- mindspore/nn/optim/rprop.py +8 -9
- mindspore/nn/optim/sgd.py +19 -13
- mindspore/nn/optim/thor.py +10 -15
- mindspore/nn/probability/__init__.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +4 -4
- mindspore/nn/probability/bijector/invert.py +1 -1
- mindspore/nn/probability/bijector/softplus.py +2 -2
- mindspore/nn/probability/bnn_layers/dense_variational.py +1 -1
- mindspore/nn/probability/bnn_layers/layer_distribution.py +2 -2
- mindspore/nn/probability/distribution/_utils/utils.py +9 -15
- mindspore/nn/probability/distribution/bernoulli.py +3 -3
- mindspore/nn/probability/distribution/beta.py +1 -1
- mindspore/nn/probability/distribution/categorical.py +5 -7
- mindspore/nn/probability/distribution/cauchy.py +3 -3
- mindspore/nn/probability/distribution/distribution.py +2 -2
- mindspore/nn/probability/distribution/exponential.py +2 -2
- mindspore/nn/probability/distribution/gamma.py +3 -3
- mindspore/nn/probability/distribution/geometric.py +1 -1
- mindspore/nn/probability/distribution/gumbel.py +3 -3
- mindspore/nn/probability/distribution/half_normal.py +15 -11
- mindspore/nn/probability/distribution/laplace.py +16 -13
- mindspore/nn/probability/distribution/logistic.py +2 -2
- mindspore/nn/probability/distribution/normal.py +1 -1
- mindspore/nn/probability/distribution/poisson.py +1 -1
- mindspore/nn/probability/distribution/student_t.py +20 -15
- mindspore/nn/probability/distribution/transformed_distribution.py +4 -4
- mindspore/nn/probability/distribution/uniform.py +2 -2
- mindspore/nn/reinforcement/_tensors_queue.py +3 -3
- mindspore/nn/reinforcement/tensor_array.py +2 -2
- mindspore/nn/sparse/sparse.py +2 -2
- mindspore/nn/wrap/cell_wrapper.py +27 -10
- mindspore/nn/wrap/grad_reducer.py +2 -2
- mindspore/nn/wrap/loss_scale.py +40 -24
- mindspore/numpy/array_creations.py +33 -22
- mindspore/numpy/array_ops.py +35 -30
- mindspore/numpy/logic_ops.py +6 -27
- mindspore/numpy/math_ops.py +22 -19
- mindspore/numpy/utils.py +1 -1
- mindspore/numpy/utils_const.py +108 -58
- mindspore/ops/_constants.py +0 -6
- mindspore/ops/_grad/__init__.py +2 -1
- mindspore/ops/_grad/grad_array_ops.py +86 -117
- mindspore/ops/_grad/grad_base.py +23 -1
- mindspore/ops/_grad/grad_clip_ops.py +2 -3
- mindspore/ops/_grad/grad_comm_ops.py +34 -24
- mindspore/ops/_grad/grad_implementations.py +9 -45
- mindspore/ops/_grad/grad_inner_ops.py +47 -4
- mindspore/ops/_grad/grad_math_ops.py +142 -117
- mindspore/ops/_grad/grad_nn_ops.py +71 -165
- mindspore/ops/_grad/grad_sequence_ops.py +296 -0
- mindspore/ops/_grad/grad_sparse.py +7 -6
- mindspore/ops/_grad_experimental/__init__.py +1 -0
- mindspore/ops/_grad_experimental/grad_array_ops.py +150 -15
- mindspore/ops/_grad_experimental/grad_image_ops.py +16 -7
- mindspore/ops/_grad_experimental/grad_inner_ops.py +1 -22
- mindspore/ops/_grad_experimental/grad_linalg_ops.py +4 -11
- mindspore/ops/_grad_experimental/grad_math_ops.py +210 -89
- mindspore/ops/_grad_experimental/grad_nn_ops.py +26 -22
- mindspore/ops/_grad_experimental/grad_scalar_ops.py +112 -0
- mindspore/ops/_grad_experimental/grad_sparse_ops.py +49 -8
- mindspore/ops/_op_impl/_custom_op/batch_matmul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad_reduce.py +4 -4
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold_grad.py +3 -3
- mindspore/ops/_op_impl/_custom_op/cholesky_trsm_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/correction_mul.py +2 -2
- mindspore/ops/_op_impl/_custom_op/correction_mul_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/dsd_back_impl.py +1 -5
- mindspore/ops/_op_impl/_custom_op/dsd_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fused_abs_max1_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/img2col_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_left_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_right_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_left_cast_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_right_mul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_dds_impl.py +0 -4
- mindspore/ops/_op_impl/_custom_op/matrix_combine_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/minmax_update_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/minmax_update_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/transpose02314_impl.py +1 -1
- mindspore/ops/_op_impl/aicpu/__init__.py +236 -4
- mindspore/ops/_op_impl/aicpu/abs.py +36 -0
- mindspore/ops/_op_impl/aicpu/{adaptive_avg_pool_2d_v1.py → adaptive_avg_pool_2d.py} +6 -5
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/add.py +43 -0
- mindspore/ops/_op_impl/aicpu/addcdiv.py +0 -32
- mindspore/ops/_op_impl/aicpu/addcmul.py +0 -84
- mindspore/ops/_op_impl/aicpu/affine_grid_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/batch_matmul.py +43 -43
- mindspore/ops/_op_impl/aicpu/bernoulli.py +48 -0
- mindspore/{compression/common/__init__.py → ops/_op_impl/aicpu/bessel_i0.py} +15 -8
- mindspore/ops/_op_impl/aicpu/channel_shuffle.py +40 -0
- mindspore/ops/_op_impl/aicpu/conj.py +11 -0
- mindspore/ops/_op_impl/aicpu/cumulative_logsumexp.py +0 -3
- mindspore/ops/_op_impl/aicpu/deformable_offsets.py +38 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets_grad.py +43 -0
- mindspore/ops/_op_impl/aicpu/{adaptive_avg_pool_2d_grad_v1.py → digamma.py} +7 -9
- mindspore/ops/_op_impl/aicpu/flatten.py +1 -0
- mindspore/ops/_op_impl/aicpu/fmax.py +36 -0
- mindspore/ops/_op_impl/aicpu/fmin.py +37 -0
- mindspore/ops/_op_impl/aicpu/fractional_max_pool3d_with_fixed_ksize.py +1 -1
- mindspore/ops/_op_impl/aicpu/fse_decode.py +43 -0
- mindspore/ops/_op_impl/aicpu/greater.py +41 -0
- mindspore/ops/_op_impl/aicpu/greater_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/index_put.py +50 -0
- mindspore/ops/_op_impl/aicpu/less.py +41 -0
- mindspore/{nn/probability/infer/variational/__init__.py → ops/_op_impl/aicpu/lgamma.py} +16 -10
- mindspore/ops/_op_impl/aicpu/mirror_pad.py +0 -4
- mindspore/ops/_op_impl/aicpu/mirror_pad_grad.py +0 -4
- mindspore/ops/_op_impl/aicpu/mul.py +3 -1
- mindspore/ops/_op_impl/aicpu/multinomial.py +14 -6
- mindspore/ops/_op_impl/aicpu/nllloss.py +38 -0
- mindspore/ops/_op_impl/aicpu/nllloss_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/ones_like.py +0 -2
- mindspore/ops/_op_impl/aicpu/polar.py +32 -0
- mindspore/ops/_op_impl/aicpu/polygamma.py +34 -0
- mindspore/ops/_op_impl/aicpu/quant_dtype_cast.py +40 -0
- mindspore/ops/_op_impl/aicpu/quantile.py +35 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_sparse.py +73 -0
- mindspore/ops/_op_impl/aicpu/randperm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/resize_bicubic.py +2 -8
- mindspore/ops/_op_impl/aicpu/resize_bicubic_grad.py +1 -1
- mindspore/ops/_op_impl/aicpu/resize_v2.py +68 -0
- mindspore/ops/_op_impl/aicpu/resize_v2_grad.py +68 -0
- mindspore/ops/_op_impl/aicpu/scatter_elements.py +4 -0
- mindspore/ops/_op_impl/aicpu/scatter_nd_update.py +2 -0
- mindspore/ops/_op_impl/aicpu/sequence_add.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add_offset.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_addn.py +38 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss.py +35 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/sparse_apply_adagrad_da.py +0 -24
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +42 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice.py +4 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice_grad.py +6 -0
- mindspore/ops/_op_impl/aicpu/tensor_scatter_update.py +59 -0
- mindspore/ops/_op_impl/aicpu/trans_data.py +1 -0
- mindspore/ops/_op_impl/aicpu/tril_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform_candidate_sampler.py +1 -0
- mindspore/ops/_op_impl/aicpu/unique_consecutive.py +10 -2
- mindspore/ops/_op_impl/cpu/dynamic_shape.py +5 -1
- mindspore/ops/_op_impl/cpu/sparse_slice.py +4 -0
- mindspore/ops/_op_impl/cpu/sparse_slice_grad.py +6 -0
- mindspore/ops/_op_impl/cpu/tensor_shape.py +5 -1
- mindspore/ops/_op_impl/tbe/__init__.py +27 -611
- mindspore/ops/_op_impl/tbe/assign_add_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/avg_pool_3d_grad.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_matmul_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/batch_to_space.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/bn_infer_grad.py +4 -2
- mindspore/ops/_op_impl/tbe/bn_training_update.py +0 -1
- mindspore/ops/_op_impl/tbe/bn_training_update_ds.py +0 -1
- mindspore/ops/_op_impl/tbe/broadcast_to_ds.py +6 -4
- mindspore/ops/_op_impl/tbe/cast.py +0 -2
- mindspore/ops/_op_impl/tbe/cast_ds.py +3 -3
- mindspore/ops/_op_impl/tbe/data_format_dim_map_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/depthwise_conv2d.py +2 -2
- mindspore/ops/_op_impl/tbe/dynamic_atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/gather_nd.py +1 -0
- mindspore/ops/_op_impl/tbe/{index_add.py → inplace_index_add.py} +3 -6
- mindspore/ops/_op_impl/tbe/matmul_ds.py +2 -0
- mindspore/ops/_op_impl/tbe/npu_clear_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/npu_get_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/scatter_mul.py +2 -0
- mindspore/ops/_op_impl/tbe/scatter_nd_add.py +0 -2
- mindspore/ops/_op_impl/tbe/space_to_batch.py +1 -1
- mindspore/ops/_op_impl/tbe/space_to_batch_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/trans_data_ds.py +15 -5
- mindspore/ops/_register_for_op.py +1 -0
- mindspore/ops/_utils/__init__.py +1 -2
- mindspore/ops/_utils/utils.py +19 -40
- mindspore/ops/_vmap/vmap_array_ops.py +116 -38
- mindspore/ops/_vmap/vmap_base.py +16 -9
- mindspore/ops/_vmap/vmap_convolution_ops.py +7 -10
- mindspore/ops/_vmap/vmap_grad_math_ops.py +4 -4
- mindspore/ops/_vmap/vmap_grad_nn_ops.py +7 -5
- mindspore/ops/_vmap/vmap_image_ops.py +12 -5
- mindspore/ops/_vmap/vmap_math_ops.py +46 -5
- mindspore/ops/_vmap/vmap_nn_ops.py +15 -21
- mindspore/ops/_vmap/vmap_random_ops.py +1 -1
- mindspore/ops/bprop_mindir/AdaptiveAvgPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/AdaptiveMaxPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/AvgPool3D_bprop.mindir +150 -0
- mindspore/ops/bprop_mindir/AvgPool_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/BCEWithLogitsLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BatchNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BiasAddGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BinaryCrossEntropy_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/BroadcastTo_bprop.mindir +220 -106
- mindspore/ops/bprop_mindir/CTCLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropFilter_bprop.mindir +240 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropInput_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv2DTranspose_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv3DTranspose_bprop.mindir +315 -0
- mindspore/ops/bprop_mindir/Conv3D_bprop.mindir +278 -0
- mindspore/ops/bprop_mindir/DeformableOffsets_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/DepthwiseConv2dNative_bprop.mindir +138 -0
- mindspore/ops/bprop_mindir/Dropout2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Dropout3D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DropoutDoMask_bprop.mindir +22 -23
- mindspore/ops/bprop_mindir/DropoutGenMask_bprop.mindir +16 -17
- mindspore/ops/bprop_mindir/DropoutGrad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Dropout_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicGRUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicRNN_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Elu_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/EmbeddingLookup_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ExpandDims_bprop.mindir +39 -41
- mindspore/ops/bprop_mindir/FastGeLU_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Flatten_bprop.mindir +41 -43
- mindspore/ops/bprop_mindir/GatherNd_bprop.mindir +51 -57
- mindspore/ops/bprop_mindir/Gather_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/HSigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/HSwish_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/InstanceNorm_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/KLDivLoss_bprop.mindir +126 -0
- mindspore/ops/bprop_mindir/L2Loss_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/L2Normalize_bprop.mindir +30 -0
- mindspore/ops/bprop_mindir/LRN_bprop.mindir +43 -0
- mindspore/ops/bprop_mindir/LayerNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/LogSoftmax_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/MaxPool3DGradGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3DGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3D_bprop.mindir +75 -0
- mindspore/ops/bprop_mindir/MaxPoolGradGrad_bprop.mindir +65 -0
- mindspore/ops/bprop_mindir/MaxPoolWithArgmax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/MirrorPad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Mish_bprop.mindir +35 -0
- mindspore/ops/bprop_mindir/MulNoNan_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NLLLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/OneHot_bprop.mindir +24 -25
- mindspore/ops/bprop_mindir/PReLU_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Pad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Padding_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/RNNTLoss_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ROIAlign_bprop.mindir +82 -0
- mindspore/ops/bprop_mindir/ReLU6_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/ReLUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ReluGrad_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Reshape_bprop.mindir +53 -53
- mindspore/ops/bprop_mindir/ResizeBilinear_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ResizeNearestNeighbor_bprop.mindir +77 -85
- mindspore/ops/bprop_mindir/SeLU_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/SigmoidCrossEntropyWithLogits_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/SigmoidGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Sigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/SmoothL1Loss_bprop.mindir +36 -0
- mindspore/ops/bprop_mindir/SoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Softplus_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Softsign_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/SparseSoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Squeeze_bprop.mindir +37 -39
- mindspore/ops/bprop_mindir/StridedSlice_bprop.mindir +70 -72
- mindspore/ops/bprop_mindir/TanhGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Tanh_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/Tile_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TopK_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TupleGetItem_bprop.mindir +17 -17
- mindspore/ops/bprop_mindir/UpsampleNearest3D_bprop.mindir +32 -0
- mindspore/ops/bprop_mindir/UpsampleTrilinear3D_bprop.mindir +38 -0
- mindspore/ops/bprop_mindir/generate_mindir.py +2 -0
- mindspore/ops/composite/__init__.py +7 -8
- mindspore/ops/composite/base.py +101 -47
- mindspore/ops/composite/math_ops.py +188 -158
- mindspore/ops/composite/multitype_ops/_compile_utils.py +415 -170
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +142 -87
- mindspore/ops/composite/multitype_ops/add_impl.py +6 -1
- mindspore/ops/composite/multitype_ops/div_impl.py +2 -3
- mindspore/ops/composite/multitype_ops/getitem_impl.py +31 -3
- mindspore/ops/composite/multitype_ops/greater_equal_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/greater_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/in_impl.py +9 -0
- mindspore/ops/composite/multitype_ops/less_equal_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/less_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/mul_impl.py +21 -5
- mindspore/ops/composite/multitype_ops/not_in_impl.py +9 -0
- mindspore/ops/composite/multitype_ops/ones_like_impl.py +2 -4
- mindspore/ops/composite/multitype_ops/setitem_impl.py +21 -3
- mindspore/ops/composite/multitype_ops/sub_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/zeros_like_impl.py +35 -4
- mindspore/ops/function/__init__.py +152 -8
- mindspore/ops/function/array_func.py +2555 -674
- mindspore/ops/function/clip_func.py +209 -13
- mindspore/ops/function/debug_func.py +2 -2
- mindspore/ops/function/grad/__init__.py +2 -1
- mindspore/ops/function/grad/grad_func.py +147 -62
- mindspore/ops/function/image_func.py +54 -38
- mindspore/ops/function/linalg_func.py +167 -16
- mindspore/ops/function/math_func.py +4849 -1492
- mindspore/ops/function/nn_func.py +2573 -988
- mindspore/ops/function/other_func.py +115 -0
- mindspore/ops/function/parameter_func.py +3 -3
- mindspore/ops/function/random_func.py +790 -73
- mindspore/ops/function/sparse_func.py +98 -78
- mindspore/ops/function/sparse_unary_func.py +54 -53
- mindspore/ops/function/spectral_func.py +27 -24
- mindspore/ops/function/vmap_func.py +22 -2
- mindspore/ops/functional.py +97 -37
- mindspore/ops/op_info_register.py +70 -28
- mindspore/ops/operations/__init__.py +47 -14
- mindspore/ops/operations/_csr_ops.py +7 -7
- mindspore/ops/operations/_embedding_cache_ops.py +5 -5
- mindspore/ops/operations/_grad_ops.py +276 -187
- mindspore/ops/operations/_inner_ops.py +319 -113
- mindspore/ops/operations/_ms_kernel.py +10 -8
- mindspore/ops/operations/_ocr_ops.py +9 -9
- mindspore/ops/operations/_opaque_predicate_registry.py +4 -0
- mindspore/ops/operations/_quant_ops.py +137 -102
- mindspore/ops/operations/_rl_inner_ops.py +121 -60
- mindspore/ops/operations/_scalar_ops.py +466 -0
- mindspore/ops/operations/_sequence_ops.py +1004 -2
- mindspore/ops/operations/_tensor_array.py +10 -11
- mindspore/ops/operations/_thor_ops.py +1 -1
- mindspore/ops/operations/array_ops.py +801 -466
- mindspore/ops/operations/comm_ops.py +51 -49
- mindspore/ops/operations/control_ops.py +2 -2
- mindspore/ops/operations/custom_ops.py +123 -44
- mindspore/ops/operations/debug_ops.py +24 -24
- mindspore/ops/operations/image_ops.py +240 -153
- mindspore/ops/operations/inner_ops.py +34 -50
- mindspore/ops/operations/linalg_ops.py +31 -9
- mindspore/ops/operations/math_ops.py +988 -757
- mindspore/ops/operations/nn_ops.py +965 -819
- mindspore/ops/operations/other_ops.py +51 -40
- mindspore/ops/operations/random_ops.py +204 -122
- mindspore/ops/operations/rl_ops.py +8 -9
- mindspore/ops/operations/sparse_ops.py +254 -93
- mindspore/ops/operations/spectral_ops.py +35 -3
- mindspore/ops/primitive.py +111 -9
- mindspore/parallel/_auto_parallel_context.py +189 -83
- mindspore/parallel/_offload_context.py +185 -0
- mindspore/parallel/_parallel_serialization.py +99 -7
- mindspore/parallel/_ps_context.py +9 -5
- mindspore/parallel/_recovery_context.py +1 -1
- mindspore/parallel/_tensor.py +7 -1
- mindspore/{nn/transformer → parallel/_transformer}/__init__.py +6 -6
- mindspore/{nn/transformer → parallel/_transformer}/layers.py +6 -37
- mindspore/{nn/transformer → parallel/_transformer}/loss.py +4 -7
- mindspore/{nn/transformer → parallel/_transformer}/moe.py +20 -16
- mindspore/{nn/transformer → parallel/_transformer}/op_parallel_config.py +3 -3
- mindspore/{nn/transformer → parallel/_transformer}/transformer.py +48 -111
- mindspore/parallel/_utils.py +1 -2
- mindspore/parallel/algo_parameter_config.py +1 -1
- mindspore/parallel/checkpoint_transform.py +37 -34
- mindspore/parallel/shard.py +17 -18
- mindspore/profiler/common/validator/validate_path.py +2 -2
- mindspore/profiler/envprofiling.py +69 -47
- mindspore/profiler/parser/ascend_timeline_generator.py +49 -42
- mindspore/profiler/parser/base_timeline_generator.py +49 -56
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +98 -78
- mindspore/profiler/parser/hwts_log_parser.py +1 -1
- mindspore/profiler/parser/integrator.py +15 -14
- mindspore/profiler/parser/minddata_analyzer.py +2 -2
- mindspore/profiler/parser/msadvisor_analyzer.py +12 -25
- mindspore/profiler/parser/msadvisor_parser.py +2 -4
- mindspore/profiler/parser/optime_parser.py +17 -18
- mindspore/profiler/parser/profiler_info.py +2 -1
- mindspore/profiler/profiling.py +218 -186
- mindspore/rewrite/__init__.py +3 -1
- mindspore/rewrite/api/node.py +1 -114
- mindspore/rewrite/api/node_type.py +3 -0
- mindspore/rewrite/api/pattern_engine.py +31 -1
- mindspore/rewrite/api/scoped_value.py +4 -4
- mindspore/rewrite/api/symbol_tree.py +3 -78
- mindspore/rewrite/api/tree_node_helper.py +1 -1
- mindspore/rewrite/ast_creator_register.py +1 -0
- mindspore/rewrite/ast_helpers/__init__.py +2 -2
- mindspore/rewrite/ast_helpers/ast_creator.py +1 -2
- mindspore/rewrite/ast_helpers/ast_finder.py +65 -0
- mindspore/rewrite/ast_helpers/ast_modifier.py +11 -3
- mindspore/rewrite/ast_transformers/flatten_recursive_stmt.py +18 -2
- mindspore/rewrite/namespace.py +0 -2
- mindspore/rewrite/node.py +157 -11
- mindspore/rewrite/parsers/assign_parser.py +231 -53
- mindspore/rewrite/parsers/class_def_parser.py +187 -109
- mindspore/rewrite/parsers/for_parser.py +24 -14
- mindspore/rewrite/parsers/function_def_parser.py +21 -4
- mindspore/rewrite/parsers/if_parser.py +6 -2
- mindspore/rewrite/sparsify/__init__.py +0 -0
- mindspore/rewrite/sparsify/sparse_transformer.py +448 -0
- mindspore/rewrite/sparsify/sparsify.py +109 -0
- mindspore/rewrite/sparsify/utils.py +173 -0
- mindspore/rewrite/symbol_tree.py +256 -133
- mindspore/rewrite/symbol_tree_builder.py +38 -1
- mindspore/run_check/_check_version.py +69 -63
- mindspore/run_check/run_check.py +2 -1
- mindspore/scipy/linalg.py +10 -114
- mindspore/scipy/ops.py +2 -2
- mindspore/scipy/ops_wrapper.py +1 -1
- mindspore/scipy/optimize/_bfgs.py +1 -1
- mindspore/scipy/optimize/_lagrange.py +200 -0
- mindspore/scipy/optimize/line_search.py +3 -2
- mindspore/scipy/optimize/minimize.py +41 -2
- mindspore/scipy/sparse/__init__.py +2 -2
- mindspore/scipy/sparse/linalg.py +4 -464
- mindspore/scipy/utils.py +1 -1
- mindspore/scipy/utils_const.py +7 -1
- mindspore/train/__init__.py +1 -1
- mindspore/train/_utils.py +28 -5
- mindspore/train/amp.py +273 -102
- mindspore/train/callback/_backup_and_restore.py +5 -5
- mindspore/train/callback/_callback.py +2 -2
- mindspore/train/callback/_checkpoint.py +3 -3
- mindspore/train/callback/_early_stop.py +3 -3
- mindspore/train/callback/_lambda_callback.py +2 -2
- mindspore/train/callback/_landscape.py +29 -31
- mindspore/train/callback/_loss_monitor.py +3 -3
- mindspore/train/callback/_on_request_exit.py +3 -3
- mindspore/train/callback/_reduce_lr_on_plateau.py +4 -4
- mindspore/train/callback/_summary_collector.py +23 -16
- mindspore/train/callback/_time_monitor.py +3 -3
- mindspore/train/checkpoint_pb2.py +68 -8
- mindspore/train/data_sink.py +15 -3
- mindspore/train/dataset_helper.py +10 -15
- mindspore/train/loss_scale_manager.py +8 -11
- mindspore/train/metrics/__init__.py +1 -1
- mindspore/train/metrics/bleu_score.py +1 -1
- mindspore/train/metrics/confusion_matrix.py +1 -1
- mindspore/train/metrics/cosine_similarity.py +1 -1
- mindspore/train/metrics/dice.py +2 -2
- mindspore/train/metrics/fbeta.py +1 -1
- mindspore/train/metrics/hausdorff_distance.py +4 -3
- mindspore/train/metrics/mean_surface_distance.py +2 -2
- mindspore/train/metrics/occlusion_sensitivity.py +1 -1
- mindspore/train/metrics/perplexity.py +1 -1
- mindspore/train/metrics/precision.py +1 -1
- mindspore/train/metrics/recall.py +1 -1
- mindspore/train/metrics/roc.py +2 -2
- mindspore/train/metrics/root_mean_square_surface_distance.py +2 -2
- mindspore/train/mind_ir_pb2.py +116 -37
- mindspore/train/model.py +45 -28
- mindspore/train/serialization.py +295 -188
- mindspore/train/summary/_summary_adapter.py +1 -1
- mindspore/train/summary/summary_record.py +43 -13
- mindspore/train/train_thor/convert_utils.py +2 -2
- mindspore/train/train_thor/dataset_helper.py +3 -3
- mindspore/version.py +1 -1
- {mindspore-2.0.0a0.dist-info → mindspore-2.0.0rc1.dist-info}/METADATA +3 -2
- {mindspore-2.0.0a0.dist-info → mindspore-2.0.0rc1.dist-info}/RECORD +648 -574
- mindspore/compression/__init__.py +0 -19
- mindspore/compression/common/constant.py +0 -124
- mindspore/compression/export/__init__.py +0 -19
- mindspore/compression/export/quant_export.py +0 -515
- mindspore/compression/quant/__init__.py +0 -28
- mindspore/compression/quant/qat.py +0 -634
- mindspore/compression/quant/quant_utils.py +0 -462
- mindspore/compression/quant/quantizer.py +0 -68
- mindspore/nn/layer/quant.py +0 -1868
- mindspore/nn/layer/rnn_utils.py +0 -90
- mindspore/nn/probability/dpn/__init__.py +0 -22
- mindspore/nn/probability/dpn/vae/__init__.py +0 -25
- mindspore/nn/probability/dpn/vae/cvae.py +0 -140
- mindspore/nn/probability/dpn/vae/vae.py +0 -124
- mindspore/nn/probability/infer/__init__.py +0 -22
- mindspore/nn/probability/infer/variational/elbo.py +0 -70
- mindspore/nn/probability/infer/variational/svi.py +0 -84
- mindspore/nn/probability/toolbox/__init__.py +0 -22
- mindspore/nn/probability/toolbox/anomaly_detection.py +0 -99
- mindspore/nn/probability/toolbox/uncertainty_evaluation.py +0 -364
- mindspore/nn/probability/transforms/__init__.py +0 -22
- mindspore/nn/probability/transforms/transform_bnn.py +0 -262
- mindspore/nn/probability/zhusuan/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/bn.py +0 -95
- mindspore/nn/probability/zhusuan/variational/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/variational/elbo.py +0 -46
- mindspore/ops/_op_impl/aicpu/parallel_concat.py +0 -42
- mindspore/ops/_op_impl/tbe/gather_v2.py +0 -56
- mindspore/ops/bprop_mindir/AssignAdd_bprop.mindir +0 -19
- mindspore/ops/bprop_mindir/Cast_bprop.mindir +0 -19
- mindspore/ops/bprop_mindir/LogicalOr_bprop.mindir +0 -19
- mindspore/ops/bprop_mindir/MatMul_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ReLU_bprop.mindir +0 -17
- mindspore/ops/bprop_mindir/Transpose_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/UpdateState_bprop.mindir +0 -15
- mindspore/ops/composite/array_ops.py +0 -241
- mindspore/ops/composite/clip_ops.py +0 -134
- mindspore/ops/composite/random_ops.py +0 -426
- mindspore/ops/composite/vmap_ops.py +0 -38
- mindspore/parallel/nn/__init__.py +0 -42
- mindspore/parallel/nn/loss.py +0 -22
- mindspore/parallel/nn/moe.py +0 -21
- mindspore/parallel/nn/op_parallel_config.py +0 -22
- mindspore/parallel/nn/transformer.py +0 -31
- {mindspore-2.0.0a0.dist-info → mindspore-2.0.0rc1.dist-info}/WHEEL +0 -0
- {mindspore-2.0.0a0.dist-info → mindspore-2.0.0rc1.dist-info}/entry_points.txt +0 -0
- {mindspore-2.0.0a0.dist-info → mindspore-2.0.0rc1.dist-info}/top_level.txt +0 -0
|
@@ -14,11 +14,10 @@
|
|
|
14
14
|
# ============================================================================
|
|
15
15
|
|
|
16
16
|
"""Define the grad rules of neural network related operations."""
|
|
17
|
-
import numpy as np
|
|
18
17
|
from mindspore import context
|
|
19
18
|
from mindspore.common import dtype as mstype
|
|
20
19
|
from mindspore.common.tensor import Tensor
|
|
21
|
-
from mindspore.ops.primitive import
|
|
20
|
+
from mindspore.ops.primitive import _primexpr
|
|
22
21
|
from mindspore.ops.operations import nn_ops as nps
|
|
23
22
|
from mindspore.ops._grad.grad_base import bprop_getters, dyn_size, create_tensor_by_element, dyn_rank
|
|
24
23
|
from mindspore.ops import functional as F
|
|
@@ -27,38 +26,29 @@ from mindspore.ops.composite.multitype_ops.zeros_like_impl import zeros_like
|
|
|
27
26
|
from mindspore.ops.operations import _grad_ops as G
|
|
28
27
|
from mindspore.ops.operations import _inner_ops as inner
|
|
29
28
|
from mindspore.ops.operations import _rl_inner_ops as rl_ops
|
|
30
|
-
from mindspore.ops._utils.utils import range_op, get_1d_shape
|
|
29
|
+
from mindspore.ops._utils.utils import range_op, get_1d_shape
|
|
31
30
|
|
|
32
31
|
|
|
33
|
-
@
|
|
34
|
-
def
|
|
35
|
-
"""
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
def bprop(x, w, out, dout):
|
|
39
|
-
return dout, bias_grad(dout)
|
|
32
|
+
@_primexpr
|
|
33
|
+
def bias_add_gradgrad_helper(shape, bias_shape, data_format):
|
|
34
|
+
"""Helper function of BiasGradGrad to calculate expanded shape."""
|
|
35
|
+
new_shape = list(shape)
|
|
36
|
+
new_bias_shape = list(bias_shape)
|
|
40
37
|
|
|
41
|
-
|
|
38
|
+
ones_1 = []
|
|
39
|
+
ones_2 = []
|
|
40
|
+
for _ in new_shape[2:]:
|
|
41
|
+
ones_1.append(1)
|
|
42
42
|
|
|
43
|
+
for _ in new_shape[:-1]:
|
|
44
|
+
ones_2.append(1)
|
|
43
45
|
|
|
44
|
-
@constexpr
|
|
45
|
-
def bias_add_gradgrad_helper(shape, bias_shape, data_format):
|
|
46
|
-
"""Helper function of BiasGradGrad to calculate expanded shape."""
|
|
47
|
-
shape = np.array(shape).astype(np.int)
|
|
48
|
-
bias_shape = np.array(bias_shape).astype(np.int)
|
|
49
46
|
if data_format == "NCHW":
|
|
50
|
-
expanded_shape =
|
|
51
|
-
|
|
52
|
-
bias_shape,
|
|
53
|
-
np.ones_like(shape[2:])
|
|
54
|
-
], axis=0)
|
|
55
|
-
tile_mults = np.concatenate([shape[:1], [1], shape[2:]], axis=0)
|
|
47
|
+
expanded_shape = [1] + new_bias_shape + ones_1
|
|
48
|
+
tile_mults = [new_shape[0]] + [1] + new_shape[2:]
|
|
56
49
|
else:
|
|
57
|
-
expanded_shape =
|
|
58
|
-
|
|
59
|
-
bias_shape
|
|
60
|
-
], axis=0)
|
|
61
|
-
tile_mults = np.concatenate([shape[:-1], [1]], axis=0)
|
|
50
|
+
expanded_shape = ones_2 + new_bias_shape
|
|
51
|
+
tile_mults = new_shape[:-1] + [1]
|
|
62
52
|
return tuple(expanded_shape), tuple(tile_mults)
|
|
63
53
|
|
|
64
54
|
|
|
@@ -85,7 +75,7 @@ def get_bprop_bias_add_grad(self):
|
|
|
85
75
|
dyn_shape = P.TensorShape()
|
|
86
76
|
dy_shape = dy.shape
|
|
87
77
|
dout_shape = dout.shape
|
|
88
|
-
if
|
|
78
|
+
if F.is_sequence_value_unknown(dy_shape) or F.is_sequence_value_unknown(dout_shape):
|
|
89
79
|
dy_shape = dyn_shape(dy)
|
|
90
80
|
dout_shape = dyn_shape(dout)
|
|
91
81
|
expanded_shape, tile_mults = bias_add_gradgrad_helper_dynamic(dy_shape, dout_shape, data_format)
|
|
@@ -100,38 +90,6 @@ def get_bprop_bias_add_grad(self):
|
|
|
100
90
|
return bprop
|
|
101
91
|
|
|
102
92
|
|
|
103
|
-
@bprop_getters.register(P.Conv2D)
|
|
104
|
-
def get_bprop_conv2d(self):
|
|
105
|
-
"""Grad definition for `Conv2D` operation."""
|
|
106
|
-
self.out_channel = self.get_attr_dict()["out_channel"]
|
|
107
|
-
self.pad_list = self.get_attr_dict()["pad_list"]
|
|
108
|
-
input_grad = P.Conv2DBackpropInput(
|
|
109
|
-
self.out_channel, self.kernel_size, self.pad_mode, self.pad, self.pad_list, mode=self.mode,
|
|
110
|
-
dilation=self.dilation, stride=self.stride, group=self.group, data_format=self.format
|
|
111
|
-
)
|
|
112
|
-
filter_grad = G.Conv2DBackpropFilter(
|
|
113
|
-
self.out_channel, self.kernel_size, self.pad_mode, self.pad, self.pad_list, mode=self.mode,
|
|
114
|
-
dilation=self.dilation, stride=self.stride, group=self.group, data_format=self.format
|
|
115
|
-
)
|
|
116
|
-
get_shape = P.Shape()
|
|
117
|
-
get_dyn_shape = P.TensorShape()
|
|
118
|
-
cast_type = P.Cast()
|
|
119
|
-
|
|
120
|
-
def bprop(x, w, out, dout):
|
|
121
|
-
x_shape = get_shape(x)
|
|
122
|
-
w_shape = get_shape(w)
|
|
123
|
-
if is_shape_unknown(x_shape):
|
|
124
|
-
x_shape = get_dyn_shape(x)
|
|
125
|
-
if is_shape_unknown(w_shape):
|
|
126
|
-
w_shape = get_dyn_shape(w)
|
|
127
|
-
w_shape = cast_type(w_shape, mstype.int32)
|
|
128
|
-
dx = input_grad(dout, w, x_shape)
|
|
129
|
-
dw = filter_grad(dout, x, w_shape)
|
|
130
|
-
return dx, dw
|
|
131
|
-
|
|
132
|
-
return bprop
|
|
133
|
-
|
|
134
|
-
|
|
135
93
|
@bprop_getters.register(nps.Conv3D)
|
|
136
94
|
def get_bprop_conv3d(self):
|
|
137
95
|
"""Grad definition for `Conv3D` operation."""
|
|
@@ -145,15 +103,17 @@ def get_bprop_conv3d(self):
|
|
|
145
103
|
)
|
|
146
104
|
get_shape = P.Shape()
|
|
147
105
|
get_dyn_shape = P.TensorShape()
|
|
106
|
+
cast = P.Cast()
|
|
107
|
+
get_dtype = P.DType()
|
|
148
108
|
|
|
149
109
|
def bprop(x, w, out, dout):
|
|
150
|
-
if
|
|
110
|
+
if F.is_sequence_value_unknown(get_shape(x)) or F.is_sequence_value_unknown(get_shape(w)):
|
|
151
111
|
dx = input_grad(w, dout, get_dyn_shape(x))
|
|
152
|
-
dw = filter_grad(x, dout, get_dyn_shape(w))
|
|
112
|
+
dw = cast(filter_grad(x, dout, get_dyn_shape(w)), get_dtype(x))
|
|
153
113
|
return dx, dw
|
|
154
114
|
|
|
155
115
|
dx = input_grad(w, dout, get_shape(x))
|
|
156
|
-
dw = filter_grad(x, dout, get_shape(w))
|
|
116
|
+
dw = cast(filter_grad(x, dout, get_shape(w)), get_dtype(x))
|
|
157
117
|
return dx, dw
|
|
158
118
|
|
|
159
119
|
return bprop
|
|
@@ -176,7 +136,7 @@ def get_bprop_conv3d_transpose(self):
|
|
|
176
136
|
get_dyn_shape = P.TensorShape()
|
|
177
137
|
|
|
178
138
|
def bprop(x, w, out, dout):
|
|
179
|
-
if
|
|
139
|
+
if F.is_sequence_value_unknown(F.shape(w)):
|
|
180
140
|
dx = input_grad(dout, w)
|
|
181
141
|
dw = filter_grad(dout, x, get_dyn_shape(w))
|
|
182
142
|
return dx, dw
|
|
@@ -249,7 +209,7 @@ def get_bprop_extract_image_patches(self):
|
|
|
249
209
|
def bprop(x, out, dout):
|
|
250
210
|
x_shape = get_shape(x)
|
|
251
211
|
out_shape = get_shape(out)
|
|
252
|
-
if
|
|
212
|
+
if F.is_sequence_value_unknown(x_shape) or F.is_sequence_value_unknown(out_shape):
|
|
253
213
|
return _dyn_extract_image_patched(x, out, dout)
|
|
254
214
|
x_batch, x_depth, x_row, x_col = x_shape
|
|
255
215
|
x_indices_num = x_row * x_col + 1
|
|
@@ -348,6 +308,7 @@ def get_bprop_max_pool_grad_grad(self):
|
|
|
348
308
|
op_range = P.Range()
|
|
349
309
|
dyn_broadcast_op = inner.DynamicBroadcastTo()
|
|
350
310
|
|
|
311
|
+
|
|
351
312
|
def bprop(x1, x2, grad, out, dout):
|
|
352
313
|
dx1 = zeros_like(x1)
|
|
353
314
|
dx2 = zeros_like(x2)
|
|
@@ -355,7 +316,7 @@ def get_bprop_max_pool_grad_grad(self):
|
|
|
355
316
|
dgrad = maxpool_grad_grad(x1, x2, dout)
|
|
356
317
|
else:
|
|
357
318
|
shape_x2 = shape_op(x2)
|
|
358
|
-
if
|
|
319
|
+
if F.is_sequence_value_unknown(shape_x2):
|
|
359
320
|
shape_x2 = dyn_shape_op(x2)
|
|
360
321
|
b, c, h, w = shape_x2
|
|
361
322
|
_, ind = maxpool_with_argmax(x1)
|
|
@@ -394,22 +355,6 @@ def get_bprop_max_pool_grad_grad_grad(self):
|
|
|
394
355
|
return bprop
|
|
395
356
|
|
|
396
357
|
|
|
397
|
-
@bprop_getters.register(P.MaxPool)
|
|
398
|
-
def get_bprop_max_pool_grad(self):
|
|
399
|
-
"""Grad definition for `MaxPool` operation."""
|
|
400
|
-
maxpool_grad = G.MaxPoolGrad(
|
|
401
|
-
kernel_size=self.kernel_size,
|
|
402
|
-
strides=self.strides,
|
|
403
|
-
pad_mode=self.pad_mode,
|
|
404
|
-
data_format=self.format)
|
|
405
|
-
|
|
406
|
-
def bprop(x, out, dout):
|
|
407
|
-
dx = maxpool_grad(x, out, dout)
|
|
408
|
-
return (dx,)
|
|
409
|
-
|
|
410
|
-
return bprop
|
|
411
|
-
|
|
412
|
-
|
|
413
358
|
@bprop_getters.register(P.MaxPool3D)
|
|
414
359
|
def get_bprop_max_pool3d_grad(self):
|
|
415
360
|
"""Grad definition for `MaxPool3D` operation."""
|
|
@@ -494,9 +439,10 @@ def get_bprop_avg_pool_grad(self):
|
|
|
494
439
|
def get_bprop_adaptive_avg_pool2d_grad(self):
|
|
495
440
|
"""Grad definition for `AdaptiveAvgPool2D` operation."""
|
|
496
441
|
adaptive_avgpool_grad = G.AdaptiveAvgPool2DGrad()
|
|
442
|
+
shape = P.TensorShape()
|
|
497
443
|
|
|
498
444
|
def bprop(x, out, dout):
|
|
499
|
-
dx = adaptive_avgpool_grad(
|
|
445
|
+
dx = adaptive_avgpool_grad(dout, shape(x))
|
|
500
446
|
return (dx,)
|
|
501
447
|
|
|
502
448
|
return bprop
|
|
@@ -518,7 +464,7 @@ def get_bprop_avg_pool_3d_grad(self):
|
|
|
518
464
|
|
|
519
465
|
def bprop(x, out, dout):
|
|
520
466
|
x_shape = F.shape(x)
|
|
521
|
-
if
|
|
467
|
+
if F.is_sequence_value_unknown(x_shape):
|
|
522
468
|
x_shape = P.TensorShape()(x)
|
|
523
469
|
dx = avgpool3d_grad(x_shape, dout)
|
|
524
470
|
return (dx,)
|
|
@@ -599,18 +545,6 @@ def get_bprop_mul_no_nan(self):
|
|
|
599
545
|
return bprop
|
|
600
546
|
|
|
601
547
|
|
|
602
|
-
@bprop_getters.register(P.ReLU)
|
|
603
|
-
def get_bprop_relu(self):
|
|
604
|
-
"""Grad definition for `ReLU` operation."""
|
|
605
|
-
input_grad = G.ReluGrad()
|
|
606
|
-
|
|
607
|
-
def bprop(x, out, dout):
|
|
608
|
-
dx = input_grad(dout, out)
|
|
609
|
-
return (dx,)
|
|
610
|
-
|
|
611
|
-
return bprop
|
|
612
|
-
|
|
613
|
-
|
|
614
548
|
@bprop_getters.register(G.ReluGrad)
|
|
615
549
|
def get_bprop_relu_grad(self):
|
|
616
550
|
"""Grad definition for `ReLUGrad` operation."""
|
|
@@ -709,7 +643,7 @@ def get_bprop_sigmoid_grad(self):
|
|
|
709
643
|
return bprop
|
|
710
644
|
|
|
711
645
|
|
|
712
|
-
@
|
|
646
|
+
@_primexpr
|
|
713
647
|
def _get_transpose_axis(x_shp, axis):
|
|
714
648
|
rank = len(x_shp)
|
|
715
649
|
if axis < 0:
|
|
@@ -722,7 +656,7 @@ def _get_transpose_axis(x_shp, axis):
|
|
|
722
656
|
|
|
723
657
|
def _get_dyn_transpose_axis(x, axis, is_ascend):
|
|
724
658
|
"""Get transpose axis"""
|
|
725
|
-
if
|
|
659
|
+
if F.is_sequence_shape_unknown(P.Shape()(x)):
|
|
726
660
|
rank = dyn_rank(x)
|
|
727
661
|
start = Tensor(0, dtype=mstype.int64)
|
|
728
662
|
delta = Tensor(1, dtype=mstype.int64)
|
|
@@ -764,13 +698,13 @@ def get_bprop_softmax(self):
|
|
|
764
698
|
is_ascend = (device_target == "Ascend")
|
|
765
699
|
|
|
766
700
|
def bprop(x, out, dout):
|
|
767
|
-
# dx
|
|
701
|
+
# dx can be expressed as (dout - sum(dout * out)) * out
|
|
768
702
|
# This formula is correct only when the `axis` is the last dimension.
|
|
769
703
|
# In order to support the scenario where the `axis` is other values,
|
|
770
704
|
# we transpose the data of the `axis` dimension to the last dimension for calculation,
|
|
771
705
|
# and then transpose it back after the calculation.
|
|
772
706
|
shp = get_shape(x)
|
|
773
|
-
if
|
|
707
|
+
if F.is_sequence_value_unknown(shp):
|
|
774
708
|
reverse_axis = _get_dyn_transpose_axis(x, axis, is_ascend)
|
|
775
709
|
if is_ascend:
|
|
776
710
|
reverse_axis = P.Cast()(reverse_axis, mstype.int32)
|
|
@@ -855,19 +789,6 @@ def get_bprop_tanh_grad(self):
|
|
|
855
789
|
return bprop
|
|
856
790
|
|
|
857
791
|
|
|
858
|
-
@bprop_getters.register(P.Gelu)
|
|
859
|
-
@bprop_getters.register(P.GeLU)
|
|
860
|
-
def get_bprop_gelu(self):
|
|
861
|
-
"""Grad definition for `GeLU` operation."""
|
|
862
|
-
input_grad = G.GeLUGrad()
|
|
863
|
-
|
|
864
|
-
def bprop(x, out, dout):
|
|
865
|
-
dx = input_grad(dout, x, out)
|
|
866
|
-
return (dx,)
|
|
867
|
-
|
|
868
|
-
return bprop
|
|
869
|
-
|
|
870
|
-
|
|
871
792
|
@bprop_getters.register(P.FastGeLU)
|
|
872
793
|
def get_bprop_fast_gelu(self):
|
|
873
794
|
"""Grad definition for `FastGeLU` operation."""
|
|
@@ -909,30 +830,6 @@ def get_bprop_instance_norm(self):
|
|
|
909
830
|
return bprop
|
|
910
831
|
|
|
911
832
|
|
|
912
|
-
@bprop_getters.register(P.BatchNorm)
|
|
913
|
-
def get_bprop_batch_norm(self):
|
|
914
|
-
"""Grad definition for `BatchNorm` operation."""
|
|
915
|
-
is_training = self.is_training
|
|
916
|
-
input_grad = G.BatchNormGrad(is_training, self.epsilon, self.data_format)
|
|
917
|
-
|
|
918
|
-
def bprop(x, scale, b, mean, variance, out, dout):
|
|
919
|
-
if is_training:
|
|
920
|
-
saved_mean = out[3]
|
|
921
|
-
saved_variance = out[4]
|
|
922
|
-
reserve = out[2]
|
|
923
|
-
else:
|
|
924
|
-
saved_mean = mean
|
|
925
|
-
saved_variance = variance
|
|
926
|
-
reserve = out[2]
|
|
927
|
-
out = input_grad(dout[0], x, scale, saved_mean, saved_variance, reserve)
|
|
928
|
-
dx = out[0]
|
|
929
|
-
dscale = out[1]
|
|
930
|
-
dbias = out[2]
|
|
931
|
-
return dx, dscale, dbias, zeros_like(mean), zeros_like(variance)
|
|
932
|
-
|
|
933
|
-
return bprop
|
|
934
|
-
|
|
935
|
-
|
|
936
833
|
@bprop_getters.register(G.BatchNormGrad)
|
|
937
834
|
def get_bprop_batch_norm_grad(self):
|
|
938
835
|
"""Grad definition for `BatchNorm` operation."""
|
|
@@ -945,19 +842,6 @@ def get_bprop_batch_norm_grad(self):
|
|
|
945
842
|
return bprop
|
|
946
843
|
|
|
947
844
|
|
|
948
|
-
@bprop_getters.register(P.LayerNorm)
|
|
949
|
-
def get_bprop_layer_norm(self):
|
|
950
|
-
"""Grad definition for `LayerNorm` operation."""
|
|
951
|
-
layer_norm_grad = G.LayerNormGrad(self.begin_norm_axis, self.begin_params_axis)
|
|
952
|
-
|
|
953
|
-
def bprop(x, gamma, beta, out, dout):
|
|
954
|
-
dx, d_gamma, d_beta = layer_norm_grad(
|
|
955
|
-
x, dout[0], out[2], out[1], gamma)
|
|
956
|
-
return dx, d_gamma, d_beta
|
|
957
|
-
|
|
958
|
-
return bprop
|
|
959
|
-
|
|
960
|
-
|
|
961
845
|
@bprop_getters.register(G.LayerNormGrad)
|
|
962
846
|
def get_bprop_layer_norm_grad(self):
|
|
963
847
|
"""Grad definition for `LayerNormGrad` operation."""
|
|
@@ -1072,7 +956,7 @@ def get_bprop_top_kv2(self):
|
|
|
1072
956
|
ind_2d = reshape_op(indices, (-1, ind_lastdim))
|
|
1073
957
|
outerdim = shape_op(ind_2d)[0]
|
|
1074
958
|
|
|
1075
|
-
# [0, outterdim, 2*outerdim, ..., (k-1)*outerdim]
|
|
959
|
+
# range_flatten_index can be expressed as: [0, outterdim, 2*outerdim, ..., (k-1)*outerdim]
|
|
1076
960
|
indices_dtype = dtype(indices)
|
|
1077
961
|
range_flatten_index = range_op(0, outerdim * in_lastdim, in_lastdim, indices_dtype)
|
|
1078
962
|
|
|
@@ -1099,7 +983,7 @@ def get_bprop_top_kv2(self):
|
|
|
1099
983
|
ind_2d = reshape_op(indices, create_tensor_by_element((-1, ind_lastdim)))
|
|
1100
984
|
outerdim = dyn_shape(ind_2d)[0]
|
|
1101
985
|
|
|
1102
|
-
# [0, outterdim, 2*outerdim, ..., (k-1)*outerdim]
|
|
986
|
+
# range_flatten_index can be expressed as: [0, outterdim, 2*outerdim, ..., (k-1)*outerdim]
|
|
1103
987
|
range_flatten_index = P.Range()(cast(0, mstype.int64), outerdim * in_lastdim, in_lastdim)
|
|
1104
988
|
|
|
1105
989
|
# expand_dims to (k, 1), then broadcast
|
|
@@ -1115,7 +999,7 @@ def get_bprop_top_kv2(self):
|
|
|
1115
999
|
return out_grad, zeros_like(k)
|
|
1116
1000
|
|
|
1117
1001
|
def bprop(input_x, k, out, dout):
|
|
1118
|
-
if
|
|
1002
|
+
if F.is_sequence_value_unknown(shape_op(input_x)):
|
|
1119
1003
|
return _bprop_dynshape(input_x, k, out, dout)
|
|
1120
1004
|
return _bprop_static(input_x, k, out, dout)
|
|
1121
1005
|
|
|
@@ -1219,6 +1103,27 @@ def get_bprop_lstm(self):
|
|
|
1219
1103
|
return bprop
|
|
1220
1104
|
|
|
1221
1105
|
|
|
1106
|
+
@bprop_getters.register(rl_ops.GRUV2)
|
|
1107
|
+
def get_bppro_gru_v2(self):
|
|
1108
|
+
"""Grad definition for `GRUV2` operation."""
|
|
1109
|
+
gru_grad_v2 = G.GRUV2Grad(
|
|
1110
|
+
self.input_size,
|
|
1111
|
+
self.hidden_size,
|
|
1112
|
+
self.num_layers,
|
|
1113
|
+
self.has_bias,
|
|
1114
|
+
self.bidirectional,
|
|
1115
|
+
self.dropout
|
|
1116
|
+
)
|
|
1117
|
+
|
|
1118
|
+
def bpro(x, hx, w, seq_length, out, dout):
|
|
1119
|
+
y, hy, reverse, _ = out
|
|
1120
|
+
dy, dhy, _, _ = dout
|
|
1121
|
+
dx, dhx, dw = gru_grad_v2(x, hx, w, seq_length, y, hy, dy, dhy, reverse)
|
|
1122
|
+
return dx, dhx, dw, (0)
|
|
1123
|
+
|
|
1124
|
+
return bpro
|
|
1125
|
+
|
|
1126
|
+
|
|
1222
1127
|
@bprop_getters.register(rl_ops.CudnnGRU)
|
|
1223
1128
|
def get_bprop_gru(self):
|
|
1224
1129
|
"""Grad definition for `GRU` operation."""
|
|
@@ -1321,7 +1226,7 @@ def get_bprop_pad(self):
|
|
|
1321
1226
|
for item in paddings:
|
|
1322
1227
|
begin += (item[0],)
|
|
1323
1228
|
shp = shape_op(x)
|
|
1324
|
-
if
|
|
1229
|
+
if F.is_sequence_value_unknown(shp):
|
|
1325
1230
|
shp = dyn_shape_op(x)
|
|
1326
1231
|
dx = P.Slice()(dout, begin, shp)
|
|
1327
1232
|
return (dx,)
|
|
@@ -1353,7 +1258,7 @@ def get_bprop_roi_align(self):
|
|
|
1353
1258
|
|
|
1354
1259
|
def bprop(inputs, rois, out, dout):
|
|
1355
1260
|
inputs_shape = shape_op(inputs)
|
|
1356
|
-
if
|
|
1261
|
+
if F.is_sequence_value_unknown(inputs_shape):
|
|
1357
1262
|
inputs_shape = dyn_shape(inputs)
|
|
1358
1263
|
dx = G.ROIAlignGrad(pooled_height, pooled_width, spatial_scale, sample_num)(dout, rois, inputs_shape)
|
|
1359
1264
|
return dx, zeros_like(rois)
|
|
@@ -1380,7 +1285,7 @@ def get_bprop_conv2d_backprop_input(self):
|
|
|
1380
1285
|
|
|
1381
1286
|
def bprop(x, w, f_sizes, out, dout):
|
|
1382
1287
|
w_shape = get_shape(w)
|
|
1383
|
-
if
|
|
1288
|
+
if F.is_sequence_value_unknown(w_shape):
|
|
1384
1289
|
w_shape = get_dyn_shape(w)
|
|
1385
1290
|
dx = input_grad(dout, w)
|
|
1386
1291
|
dw = filter_grad(x, dout, w_shape)
|
|
@@ -1427,8 +1332,8 @@ def get_bprop_bce_with_logits_loss(self):
|
|
|
1427
1332
|
dx = mul(dx, weight)
|
|
1428
1333
|
grad_target = mul(grad_target, weight)
|
|
1429
1334
|
if reduction == 'mean':
|
|
1430
|
-
dx_size = dyn_size(dx) if
|
|
1431
|
-
target_size = dyn_size(target) if
|
|
1335
|
+
dx_size = dyn_size(dx) if F.is_sequence_value_unknown(shape(dx)) else size(dx)
|
|
1336
|
+
target_size = dyn_size(target) if F.is_sequence_value_unknown(shape(target)) else size(target)
|
|
1432
1337
|
dx = dx / dx_size
|
|
1433
1338
|
grad_target = grad_target / target_size
|
|
1434
1339
|
return dx, grad_target, zeros_like(weight), zeros_like(pos_weight)
|
|
@@ -1439,18 +1344,19 @@ def get_bprop_bce_with_logits_loss(self):
|
|
|
1439
1344
|
@bprop_getters.register(P.KLDivLoss)
|
|
1440
1345
|
def get_bprop_kl_div_loss(self):
|
|
1441
1346
|
"""Grad definition for `KLDivLoss` operation."""
|
|
1442
|
-
|
|
1443
|
-
|
|
1444
|
-
else:
|
|
1445
|
-
grad = G.KLDivLossGrad(self.reduction)
|
|
1347
|
+
reduce_type = self.reduction
|
|
1348
|
+
|
|
1446
1349
|
size = P.Size()
|
|
1447
1350
|
shape = P.Shape()
|
|
1448
|
-
reduce_type = self.reduction
|
|
1449
1351
|
|
|
1450
1352
|
def bprop(x, y, out, dout):
|
|
1353
|
+
if reduce_type == "mean":
|
|
1354
|
+
grad = G.KLDivLossGrad("sum")
|
|
1355
|
+
else:
|
|
1356
|
+
grad = G.KLDivLossGrad(self.reduction)
|
|
1451
1357
|
dx = grad(dout, x, y)
|
|
1452
1358
|
if reduce_type == "mean":
|
|
1453
|
-
x_size = dyn_size(x) if
|
|
1359
|
+
x_size = dyn_size(x) if F.is_sequence_value_unknown(shape(x)) else size(x)
|
|
1454
1360
|
return dx / x_size, zeros_like(y)
|
|
1455
1361
|
return dx, zeros_like(y)
|
|
1456
1362
|
|
|
@@ -1583,7 +1489,7 @@ def get_bprop_conv2d_backprop_filter(self):
|
|
|
1583
1489
|
|
|
1584
1490
|
def bprop(dy, x, filter_size, out, dout):
|
|
1585
1491
|
x_shape = get_shape(x)
|
|
1586
|
-
if
|
|
1492
|
+
if F.is_sequence_value_unknown(x_shape):
|
|
1587
1493
|
x_shape = get_dyn_shape(x)
|
|
1588
1494
|
dw_dx = input_grad(dy, dout, x_shape)
|
|
1589
1495
|
dw_dy = filter_grad(x, dout)
|