mindspore 1.10.0__cp38-cp38-win_amd64.whl → 2.0.0rc1__cp38-cp38-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mindspore might be problematic. Click here for more details.
- mindspore/.commit_id +1 -1
- mindspore/ConcurrencyCheck.dll +0 -0
- mindspore/CppBuildInsights.dll +0 -0
- mindspore/CppCoreCheck.dll +0 -0
- mindspore/EnumIndex.dll +0 -0
- mindspore/EspXEngine.dll +0 -0
- mindspore/HResultCheck.dll +0 -0
- mindspore/KernelTraceControl.dll +0 -0
- mindspore/LocalESPC.dll +0 -0
- mindspore/Microsoft.Diagnostics.Tracing.EventSource.dll +0 -0
- mindspore/Microsoft.VisualStudio.RemoteControl.dll +0 -0
- mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
- mindspore/Microsoft.VisualStudio.Utilities.Internal.dll +0 -0
- mindspore/Newtonsoft.Json.dll +0 -0
- mindspore/System.Runtime.CompilerServices.Unsafe.dll +0 -0
- mindspore/VariantClear.dll +0 -0
- mindspore/__init__.py +9 -4
- mindspore/_c_dataengine.cp38-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp38-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp38-win_amd64.pyd +0 -0
- mindspore/_check_jit_forbidden_api.py +102 -0
- mindspore/_checkparam.py +1066 -1001
- mindspore/_extends/builtin_operations.py +32 -4
- mindspore/_extends/graph_kernel/model/graph_split.py +66 -222
- mindspore/_extends/parallel_compile/akg_compiler/akg_process.py +12 -9
- mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +119 -26
- mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +50 -50
- mindspore/_extends/parallel_compile/akg_compiler/util.py +9 -6
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_adapter.py +4 -25
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +9 -4
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_job_manager.py +1 -27
- mindspore/_extends/parse/__init__.py +5 -3
- mindspore/_extends/parse/namespace.py +17 -2
- mindspore/_extends/parse/parser.py +193 -34
- mindspore/_extends/parse/resources.py +7 -8
- mindspore/_extends/parse/standard_method.py +1780 -435
- mindspore/_extends/parse/trope.py +3 -1
- mindspore/amp.py +53 -58
- mindspore/atlprov.dll +0 -0
- mindspore/boost/adasum.py +3 -2
- mindspore/boost/boost.py +2 -2
- mindspore/boost/boost_cell_wrapper.py +46 -26
- mindspore/boost/dim_reduce.py +6 -5
- mindspore/boost/grad_accumulation.py +2 -1
- mindspore/boost/group_loss_scale_manager.py +1 -1
- mindspore/c1.dll +0 -0
- mindspore/c1xx.dll +0 -0
- mindspore/c2.dll +0 -0
- mindspore/cfgpersist.dll +0 -0
- mindspore/clang_rt.asan_dbg_dynamic-x86_64.dll +0 -0
- mindspore/clang_rt.asan_dynamic-x86_64.dll +0 -0
- mindspore/common/__init__.py +11 -10
- mindspore/common/_decorator.py +2 -0
- mindspore/common/_register_for_adapter.py +55 -0
- mindspore/common/_stub_tensor.py +201 -0
- mindspore/common/_utils.py +57 -0
- mindspore/common/api.py +582 -297
- mindspore/common/dtype.py +66 -18
- mindspore/common/dump.py +2 -2
- mindspore/common/initializer.py +38 -1
- mindspore/common/jit_config.py +25 -13
- mindspore/common/mutable.py +53 -24
- mindspore/common/parameter.py +60 -37
- mindspore/common/seed.py +8 -24
- mindspore/common/sparse_tensor.py +927 -0
- mindspore/common/tensor.py +1627 -3900
- mindspore/communication/__init__.py +10 -5
- mindspore/communication/_comm_helper.py +78 -214
- mindspore/communication/_hccl_management.py +2 -1
- mindspore/communication/management.py +136 -47
- mindspore/config/op_info.config +501 -1008
- mindspore/context.py +291 -56
- mindspore/d3dcompiler_47.dll +0 -0
- mindspore/dataset/__init__.py +12 -8
- mindspore/dataset/audio/__init__.py +9 -9
- mindspore/dataset/audio/transforms.py +1090 -228
- mindspore/dataset/audio/utils.py +87 -39
- mindspore/dataset/audio/validators.py +223 -1
- mindspore/dataset/callback/ds_callback.py +17 -15
- mindspore/dataset/core/config.py +246 -17
- mindspore/dataset/core/py_util_helpers.py +4 -3
- mindspore/dataset/core/validator_helpers.py +10 -10
- mindspore/{parallel/nn/layers.py → dataset/debug/__init__.py} +7 -8
- mindspore/dataset/debug/debug_hook.py +65 -0
- mindspore/dataset/debug/pre_defined_hook.py +67 -0
- mindspore/dataset/engine/__init__.py +7 -3
- mindspore/dataset/engine/cache_client.py +9 -9
- mindspore/dataset/engine/datasets.py +648 -477
- mindspore/dataset/engine/datasets_audio.py +165 -167
- mindspore/dataset/engine/datasets_standard_format.py +93 -67
- mindspore/dataset/engine/datasets_text.py +492 -342
- mindspore/dataset/engine/datasets_user_defined.py +85 -50
- mindspore/dataset/engine/datasets_vision.py +1224 -699
- mindspore/dataset/engine/graphdata.py +134 -69
- mindspore/dataset/engine/iterators.py +50 -9
- mindspore/dataset/engine/offload.py +52 -31
- mindspore/dataset/engine/samplers.py +27 -24
- mindspore/dataset/engine/serializer_deserializer.py +14 -15
- mindspore/dataset/engine/validators.py +213 -52
- mindspore/dataset/text/__init__.py +10 -8
- mindspore/dataset/text/transforms.py +152 -57
- mindspore/dataset/text/utils.py +98 -49
- mindspore/dataset/text/validators.py +25 -0
- mindspore/dataset/transforms/__init__.py +4 -2
- mindspore/dataset/transforms/c_transforms.py +11 -13
- mindspore/dataset/transforms/py_transforms.py +2 -2
- mindspore/dataset/transforms/py_transforms_util.py +10 -0
- mindspore/dataset/transforms/transforms.py +13 -15
- mindspore/dataset/transforms/validators.py +7 -7
- mindspore/dataset/utils/__init__.py +2 -1
- mindspore/dataset/utils/browse_dataset.py +13 -13
- mindspore/dataset/utils/line_reader.py +121 -0
- mindspore/dataset/vision/__init__.py +8 -7
- mindspore/dataset/vision/c_transforms.py +125 -126
- mindspore/dataset/vision/py_transforms.py +37 -37
- mindspore/dataset/vision/py_transforms_util.py +23 -20
- mindspore/dataset/vision/transforms.py +316 -315
- mindspore/dataset/vision/utils.py +313 -17
- mindspore/dataset/vision/validators.py +6 -6
- mindspore/default_config.py +0 -1
- mindspore/dpcmi.dll +0 -0
- mindspore/{compression → experimental}/__init__.py +6 -5
- mindspore/experimental/map_parameter.py +275 -0
- mindspore/include/OWNERS +0 -1
- mindspore/include/api/callback/callback.h +9 -13
- mindspore/include/api/callback/ckpt_saver.h +2 -2
- mindspore/include/api/callback/loss_monitor.h +2 -2
- mindspore/include/api/callback/lr_scheduler.h +5 -5
- mindspore/include/api/callback/time_monitor.h +2 -2
- mindspore/include/api/callback/train_accuracy.h +4 -6
- mindspore/include/api/cfg.h +19 -6
- mindspore/include/api/context.h +70 -9
- mindspore/include/api/delegate.h +8 -1
- mindspore/include/api/dual_abi_helper.h +8 -24
- mindspore/include/api/metrics/accuracy.h +2 -2
- mindspore/include/api/metrics/metrics.h +4 -3
- mindspore/include/api/model.h +9 -4
- mindspore/include/api/model_group.h +68 -0
- mindspore/include/api/model_parallel_runner.h +17 -17
- mindspore/include/api/net.h +12 -11
- mindspore/include/api/serialization.h +20 -4
- mindspore/include/api/status.h +7 -1
- mindspore/include/api/types.h +25 -21
- mindspore/include/api/visible.h +4 -0
- mindspore/include/c_api/model_c.h +5 -0
- mindspore/include/c_api/status_c.h +1 -1
- mindspore/include/dataset/config.h +1 -1
- mindspore/include/dataset/constants.h +14 -0
- mindspore/include/dataset/text.h +59 -0
- mindspore/include/dataset/vision.h +56 -117
- mindspore/include/dataset/vision_lite.h +102 -0
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +28 -28
- mindspore/mindrecord/common/exceptions.py +2 -4
- mindspore/mindrecord/filereader.py +19 -1
- mindspore/mindrecord/filewriter.py +250 -88
- mindspore/mindrecord/mindpage.py +13 -13
- mindspore/mindrecord/shardheader.py +15 -15
- mindspore/mindrecord/shardreader.py +9 -0
- mindspore/mindrecord/shardwriter.py +29 -29
- mindspore/mindrecord/tools/cifar100_to_mr.py +9 -9
- mindspore/mindrecord/tools/cifar10_to_mr.py +9 -9
- mindspore/mindrecord/tools/csv_to_mr.py +4 -4
- mindspore/mindrecord/tools/imagenet_to_mr.py +70 -65
- mindspore/mindrecord/tools/mnist_to_mr.py +41 -41
- mindspore/mindrecord/tools/tfrecord_to_mr.py +6 -6
- mindspore/{libmindspore_backend.dll → mindspore_backend.dll} +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/msobj140.dll +0 -0
- mindspore/mspdb140.dll +0 -0
- mindspore/mspdbcore.dll +0 -0
- mindspore/mspdbst.dll +0 -0
- mindspore/mspft140.dll +0 -0
- mindspore/msvcdis140.dll +0 -0
- mindspore/msvcp140_1.dll +0 -0
- mindspore/msvcp140_2.dll +0 -0
- mindspore/msvcp140_atomic_wait.dll +0 -0
- mindspore/msvcp140_codecvt_ids.dll +0 -0
- mindspore/nn/__init__.py +1 -5
- mindspore/nn/cell.py +297 -234
- mindspore/nn/dynamic_lr.py +1 -1
- mindspore/nn/grad/cell_grad.py +17 -42
- mindspore/nn/layer/__init__.py +7 -4
- mindspore/nn/layer/activation.py +131 -88
- mindspore/nn/layer/basic.py +313 -613
- mindspore/nn/layer/channel_shuffle.py +103 -0
- mindspore/nn/layer/combined.py +1 -1
- mindspore/nn/layer/container.py +52 -6
- mindspore/nn/layer/conv.py +112 -43
- mindspore/nn/layer/dense.py +10 -9
- mindspore/nn/layer/embedding.py +36 -34
- mindspore/nn/layer/image.py +123 -27
- mindspore/nn/layer/math.py +108 -107
- mindspore/nn/layer/normalization.py +212 -366
- mindspore/nn/layer/padding.py +370 -42
- mindspore/nn/layer/pooling.py +1443 -219
- mindspore/nn/layer/rnn_cells.py +11 -16
- mindspore/nn/layer/rnns.py +38 -39
- mindspore/nn/layer/thor_layer.py +24 -25
- mindspore/nn/layer/timedistributed.py +5 -5
- mindspore/nn/layer/transformer.py +701 -0
- mindspore/nn/learning_rate_schedule.py +8 -8
- mindspore/nn/loss/__init__.py +9 -6
- mindspore/nn/loss/loss.py +678 -142
- mindspore/nn/metrics.py +53 -0
- mindspore/nn/optim/_dist_optimizer_registry.py +2 -2
- mindspore/nn/optim/ada_grad.py +8 -8
- mindspore/nn/optim/adadelta.py +2 -3
- mindspore/nn/optim/adafactor.py +18 -14
- mindspore/nn/optim/adam.py +429 -87
- mindspore/nn/optim/adamax.py +5 -6
- mindspore/nn/optim/adasum.py +10 -8
- mindspore/nn/optim/asgd.py +7 -7
- mindspore/nn/optim/ftrl.py +81 -11
- mindspore/nn/optim/lamb.py +7 -8
- mindspore/nn/optim/lars.py +4 -4
- mindspore/nn/optim/lazyadam.py +82 -7
- mindspore/nn/optim/momentum.py +8 -7
- mindspore/nn/optim/optimizer.py +19 -10
- mindspore/nn/optim/proximal_ada_grad.py +6 -5
- mindspore/nn/optim/rmsprop.py +3 -3
- mindspore/nn/optim/rprop.py +20 -16
- mindspore/nn/optim/sgd.py +21 -15
- mindspore/nn/optim/thor.py +23 -21
- mindspore/nn/probability/__init__.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +7 -6
- mindspore/nn/probability/bijector/invert.py +4 -2
- mindspore/nn/probability/bijector/softplus.py +2 -2
- mindspore/nn/probability/bnn_layers/dense_variational.py +1 -1
- mindspore/nn/probability/bnn_layers/layer_distribution.py +2 -2
- mindspore/nn/probability/distribution/__init__.py +6 -0
- mindspore/nn/probability/distribution/_utils/custom_ops.py +3 -2
- mindspore/nn/probability/distribution/_utils/utils.py +11 -17
- mindspore/nn/probability/distribution/bernoulli.py +6 -6
- mindspore/nn/probability/distribution/beta.py +1 -1
- mindspore/nn/probability/distribution/categorical.py +9 -9
- mindspore/nn/probability/distribution/cauchy.py +8 -8
- mindspore/nn/probability/distribution/distribution.py +12 -6
- mindspore/nn/probability/distribution/exponential.py +5 -5
- mindspore/nn/probability/distribution/gamma.py +3 -3
- mindspore/nn/probability/distribution/geometric.py +6 -5
- mindspore/nn/probability/distribution/gumbel.py +5 -5
- mindspore/nn/probability/distribution/half_normal.py +133 -0
- mindspore/nn/probability/distribution/laplace.py +128 -0
- mindspore/nn/probability/distribution/log_normal.py +0 -1
- mindspore/nn/probability/distribution/logistic.py +4 -5
- mindspore/nn/probability/distribution/normal.py +11 -15
- mindspore/nn/probability/distribution/poisson.py +6 -2
- mindspore/nn/probability/distribution/student_t.py +150 -0
- mindspore/nn/probability/distribution/transformed_distribution.py +4 -4
- mindspore/nn/probability/distribution/uniform.py +5 -5
- mindspore/nn/reinforcement/_tensors_queue.py +3 -3
- mindspore/nn/reinforcement/tensor_array.py +2 -2
- mindspore/nn/sparse/sparse.py +8 -1
- mindspore/nn/wrap/cell_wrapper.py +55 -27
- mindspore/nn/wrap/grad_reducer.py +20 -11
- mindspore/nn/wrap/loss_scale.py +47 -30
- mindspore/numpy/array_creations.py +33 -22
- mindspore/numpy/array_ops.py +46 -42
- mindspore/numpy/logic_ops.py +6 -27
- mindspore/numpy/math_ops.py +26 -19
- mindspore/numpy/utils.py +1 -8
- mindspore/numpy/utils_const.py +112 -62
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +6 -3
- mindspore/ops/_constants.py +0 -6
- mindspore/ops/_grad/__init__.py +2 -1
- mindspore/ops/_grad/grad_array_ops.py +209 -152
- mindspore/ops/_grad/grad_base.py +55 -17
- mindspore/ops/_grad/grad_clip_ops.py +11 -3
- mindspore/ops/_grad/grad_comm_ops.py +58 -47
- mindspore/ops/_grad/grad_implementations.py +21 -61
- mindspore/ops/_grad/grad_inner_ops.py +48 -6
- mindspore/ops/_grad/grad_math_ops.py +306 -161
- mindspore/ops/_grad/grad_nn_ops.py +192 -181
- mindspore/ops/_grad/grad_other_ops.py +1 -1
- mindspore/ops/_grad/grad_quant_ops.py +5 -5
- mindspore/ops/_grad/grad_sequence_ops.py +296 -0
- mindspore/ops/_grad/grad_sparse.py +15 -9
- mindspore/ops/_grad_experimental/__init__.py +1 -0
- mindspore/ops/_grad_experimental/grad_array_ops.py +441 -55
- mindspore/ops/_grad_experimental/grad_image_ops.py +25 -7
- mindspore/ops/_grad_experimental/grad_inner_ops.py +3 -44
- mindspore/ops/_grad_experimental/grad_linalg_ops.py +16 -21
- mindspore/ops/_grad_experimental/grad_math_ops.py +979 -49
- mindspore/ops/_grad_experimental/grad_nn_ops.py +78 -8
- mindspore/ops/_grad_experimental/grad_scalar_ops.py +112 -0
- mindspore/ops/_grad_experimental/grad_sparse_ops.py +197 -13
- mindspore/ops/_op_impl/__init__.py +3 -3
- mindspore/ops/_op_impl/_custom_op/__init__.py +0 -1
- mindspore/ops/_op_impl/_custom_op/_basic.py +0 -1
- mindspore/ops/_op_impl/_custom_op/batch_matmul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold.py +4 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad_reduce.py +5 -5
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold_grad.py +3 -3
- mindspore/ops/_op_impl/_custom_op/cholesky_trsm_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/correction_mul.py +3 -3
- mindspore/ops/_op_impl/_custom_op/correction_mul_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/dsd_back_impl.py +4 -8
- mindspore/ops/_op_impl/_custom_op/dsd_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fused_abs_max1_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/img2col_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_left_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_right_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_left_cast_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_right_mul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_dds_grad_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matmul_dds_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matrix_combine_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/minmax_update_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/minmax_update_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/transpose02314_impl.py +1 -1
- mindspore/ops/_op_impl/aicpu/__init__.py +238 -3
- mindspore/ops/_op_impl/aicpu/abs.py +36 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_2d_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d.py +42 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d_grad.py +152 -0
- mindspore/ops/_op_impl/aicpu/add.py +43 -0
- mindspore/ops/_op_impl/aicpu/addcdiv.py +0 -32
- mindspore/ops/_op_impl/aicpu/addcmul.py +0 -84
- mindspore/ops/_op_impl/aicpu/affine_grid_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/arg_max.py +75 -0
- mindspore/ops/_op_impl/aicpu/arg_min.py +75 -0
- mindspore/ops/_op_impl/aicpu/argmin_with_value.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_matmul.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_norm_grad_grad.py +49 -0
- mindspore/ops/_op_impl/aicpu/bernoulli.py +48 -0
- mindspore/ops/_op_impl/aicpu/bessel_i0.py +31 -0
- mindspore/ops/_op_impl/aicpu/bias_add.py +44 -0
- mindspore/ops/_op_impl/aicpu/bias_add_grad.py +43 -0
- mindspore/ops/_op_impl/aicpu/bincount.py +33 -0
- mindspore/{nn/probability/infer/variational/__init__.py → ops/_op_impl/aicpu/cauchy.py} +17 -10
- mindspore/ops/_op_impl/aicpu/channel_shuffle.py +40 -0
- mindspore/ops/_op_impl/aicpu/cholesky.py +1 -1
- mindspore/ops/_op_impl/{cpu/bias_add.py → aicpu/choleskygrad.py} +9 -7
- mindspore/ops/_op_impl/aicpu/combined_non_max_suppression.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset_v1.py +31 -0
- mindspore/ops/_op_impl/aicpu/conj.py +11 -0
- mindspore/ops/_op_impl/aicpu/crop_and_resize_grad_image.py +38 -0
- mindspore/ops/_op_impl/aicpu/cumulative_logsumexp.py +36 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets.py +38 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets_grad.py +2 -2
- mindspore/ops/_op_impl/aicpu/dense_to_sparse_set_operation.py +48 -0
- mindspore/ops/_op_impl/aicpu/diag.py +36 -0
- mindspore/ops/_op_impl/aicpu/diag_part.py +36 -0
- mindspore/ops/_op_impl/aicpu/diagonal.py +35 -0
- mindspore/ops/_op_impl/{cpu/bias_add_grad.py → aicpu/digamma.py} +9 -7
- mindspore/ops/_op_impl/aicpu/eig.py +35 -0
- mindspore/ops/_op_impl/aicpu/fft_with_size.py +41 -0
- mindspore/ops/_op_impl/aicpu/flatten.py +1 -0
- mindspore/ops/_op_impl/aicpu/fmax.py +36 -0
- mindspore/ops/_op_impl/aicpu/fmin.py +37 -0
- mindspore/ops/_op_impl/aicpu/fractional_max_pool3d_with_fixed_ksize.py +1 -1
- mindspore/ops/_op_impl/aicpu/fse_decode.py +43 -0
- mindspore/ops/_op_impl/aicpu/glu.py +33 -0
- mindspore/ops/_op_impl/aicpu/glu_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/greater.py +41 -0
- mindspore/ops/_op_impl/aicpu/greater_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/index_put.py +50 -0
- mindspore/ops/_op_impl/{tbe/scatter_add_ds.py → aicpu/inplace_index_add.py} +17 -21
- mindspore/ops/_op_impl/aicpu/instance_norm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/instance_norm_v2_grad.py +44 -0
- mindspore/ops/_op_impl/aicpu/layer_norm_grad_grad.py +47 -0
- mindspore/ops/_op_impl/aicpu/less.py +41 -0
- mindspore/ops/_op_impl/aicpu/less_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/lgamma.py +32 -0
- mindspore/ops/_op_impl/aicpu/log_normal_reverse.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/masked_fill.py +42 -0
- mindspore/ops/_op_impl/aicpu/masked_scatter.py +39 -0
- mindspore/ops/_op_impl/aicpu/matmul.py +39 -0
- mindspore/ops/_op_impl/aicpu/matrix_logarithm.py +31 -0
- mindspore/ops/_op_impl/aicpu/matrix_power.py +32 -0
- mindspore/ops/_op_impl/aicpu/matrix_solve_ls.py +36 -0
- mindspore/ops/_op_impl/aicpu/matrix_triangular_solve.py +36 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad.py +2 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad_grad.py +0 -4
- mindspore/ops/_op_impl/aicpu/mul.py +3 -1
- mindspore/ops/_op_impl/aicpu/multinomial.py +14 -6
- mindspore/ops/_op_impl/aicpu/multinomial_with_replacement.py +35 -0
- mindspore/ops/_op_impl/aicpu/nan_to_num.py +34 -0
- mindspore/ops/_op_impl/aicpu/nllloss.py +38 -0
- mindspore/ops/_op_impl/aicpu/nllloss_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/ones_like.py +0 -2
- mindspore/ops/_op_impl/aicpu/polar.py +32 -0
- mindspore/ops/_op_impl/aicpu/polygamma.py +34 -0
- mindspore/ops/_op_impl/aicpu/qr.py +36 -0
- mindspore/ops/_op_impl/aicpu/quant_dtype_cast.py +40 -0
- mindspore/ops/_op_impl/aicpu/quantile.py +35 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_sparse.py +73 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_tensor.py +74 -0
- mindspore/ops/_op_impl/aicpu/random_shuffle.py +3 -0
- mindspore/ops/_op_impl/aicpu/randperm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/range.py +36 -0
- mindspore/ops/_op_impl/aicpu/reciprocal.py +34 -0
- mindspore/ops/_op_impl/aicpu/reciprocal_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/reduce_sum.py +57 -0
- mindspore/ops/_op_impl/aicpu/resize_bicubic.py +2 -8
- mindspore/ops/_op_impl/aicpu/resize_bicubic_grad.py +1 -1
- mindspore/ops/_op_impl/aicpu/resize_v2.py +68 -0
- mindspore/ops/_op_impl/aicpu/resize_v2_grad.py +68 -0
- mindspore/ops/_op_impl/aicpu/scatter_elements.py +4 -0
- mindspore/ops/_op_impl/aicpu/scatter_nd_update.py +2 -0
- mindspore/ops/_op_impl/aicpu/search_sorted.py +12 -6
- mindspore/ops/_op_impl/aicpu/self_adjoint_eig.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add_offset.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_addn.py +38 -0
- mindspore/ops/_op_impl/aicpu/slice_grad.py +76 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss.py +35 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/sort.py +39 -0
- mindspore/ops/_op_impl/aicpu/sparse_apply_adagrad_da.py +0 -24
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +42 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows_grad.py +45 -0
- mindspore/ops/_op_impl/aicpu/sparse_matrix_mat_mul.py +56 -0
- mindspore/ops/_op_impl/{tbe/slice_ds.py → aicpu/sparse_segment_sum.py} +16 -24
- mindspore/ops/_op_impl/aicpu/sparse_segment_sum_with_num_segments.py +68 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice_grad.py +61 -0
- mindspore/ops/_op_impl/aicpu/squared_difference.py +2 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +93 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +66 -0
- mindspore/ops/_op_impl/aicpu/tensor_scatter_update.py +59 -0
- mindspore/ops/_op_impl/{tbe/gather_v2.py → aicpu/tile.py} +24 -24
- mindspore/ops/_op_impl/aicpu/tridiagonal_solve.py +35 -0
- mindspore/ops/_op_impl/aicpu/tril_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/triu_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform_candidate_sampler.py +1 -0
- mindspore/ops/_op_impl/aicpu/unique_consecutive.py +10 -2
- mindspore/ops/_op_impl/cpu/__init__.py +1 -2
- mindspore/ops/_op_impl/cpu/dynamic_shape.py +5 -1
- mindspore/ops/_op_impl/cpu/maximum_grad.py +2 -0
- mindspore/{compression/common/__init__.py → ops/_op_impl/cpu/pyexecute.py} +13 -8
- mindspore/ops/_op_impl/cpu/reduce_sum.py +8 -0
- mindspore/ops/_op_impl/cpu/sparse_slice.py +62 -0
- mindspore/ops/_op_impl/cpu/sparse_slice_grad.py +60 -0
- mindspore/ops/_op_impl/cpu/tensor_shape.py +5 -1
- mindspore/ops/_op_impl/tbe/__init__.py +27 -608
- mindspore/ops/_op_impl/tbe/addcdiv_ds.py +42 -0
- mindspore/ops/_op_impl/tbe/addcmul_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/assign_add_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/avg_pool_3d_grad.py +1 -1
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_c_state_grad_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/batch_to_space.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd_v2.py +41 -0
- mindspore/ops/_op_impl/tbe/bce_with_logits_loss.py +1 -0
- mindspore/ops/_op_impl/tbe/bias_add_grad.py +2 -0
- mindspore/ops/_op_impl/tbe/bn_infer_grad.py +4 -2
- mindspore/ops/_op_impl/tbe/bn_infer_grad_ds.py +40 -0
- mindspore/ops/_op_impl/tbe/bn_training_update.py +0 -1
- mindspore/ops/_op_impl/tbe/bn_training_update_ds.py +0 -1
- mindspore/ops/_op_impl/tbe/broadcast_to_ds.py +6 -4
- mindspore/ops/_op_impl/tbe/cast.py +0 -2
- mindspore/ops/_op_impl/tbe/cast_ds.py +3 -3
- mindspore/ops/_op_impl/tbe/ctc_loss_v2.py +0 -2
- mindspore/ops/_op_impl/tbe/ctc_loss_v2_grad.py +0 -2
- mindspore/ops/_op_impl/tbe/data_format_dim_map_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/deformable_offsets.py +1 -0
- mindspore/ops/_op_impl/tbe/depthwise_conv2d.py +1 -1
- mindspore/ops/_op_impl/tbe/dynamic_atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/gather_nd.py +1 -0
- mindspore/ops/_op_impl/tbe/greater.py +2 -0
- mindspore/ops/_op_impl/tbe/{index_add.py → inplace_index_add.py} +3 -6
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/npu_clear_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/npu_get_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/one_hot_ds.py +0 -6
- mindspore/ops/_op_impl/tbe/{greater_ds.py → reduce_all_ds.py} +13 -16
- mindspore/ops/_op_impl/tbe/reduce_any_ds.py +39 -0
- mindspore/ops/_op_impl/tbe/roi_align_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/roi_align_grad_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/scatter_add.py +2 -0
- mindspore/ops/_op_impl/tbe/scatter_nd_add.py +2 -2
- mindspore/ops/_op_impl/tbe/slice.py +26 -15
- mindspore/ops/_op_impl/tbe/space_to_batch.py +1 -1
- mindspore/ops/_op_impl/tbe/space_to_batch_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/strided_slice_grad_d.py +1 -0
- mindspore/ops/_op_impl/tbe/trans_data_ds.py +15 -5
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum.py +1 -1
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum_ds.py +2 -0
- mindspore/ops/_primitive_cache.py +3 -2
- mindspore/ops/_register_for_op.py +11 -0
- mindspore/ops/_utils/__init__.py +1 -1
- mindspore/ops/_utils/utils.py +20 -41
- mindspore/ops/_vmap/__init__.py +2 -2
- mindspore/ops/_vmap/vmap_array_ops.py +170 -78
- mindspore/ops/_vmap/vmap_base.py +24 -10
- mindspore/ops/_vmap/vmap_convolution_ops.py +7 -10
- mindspore/ops/_vmap/vmap_grad_math_ops.py +4 -4
- mindspore/ops/_vmap/vmap_grad_nn_ops.py +41 -9
- mindspore/ops/_vmap/vmap_image_ops.py +52 -0
- mindspore/ops/_vmap/vmap_math_ops.py +77 -6
- mindspore/ops/_vmap/vmap_nn_ops.py +78 -29
- mindspore/ops/_vmap/vmap_other_ops.py +3 -1
- mindspore/ops/_vmap/vmap_random_ops.py +55 -3
- mindspore/ops/_vmap/vmap_sparse_ops.py +1 -0
- mindspore/ops/bprop_mindir/AdaptiveAvgPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/AdaptiveMaxPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ApproximateEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Argmax_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Argmin_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/AssignSub_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Assign_bprop.mindir +16 -16
- mindspore/ops/bprop_mindir/AvgPool3D_bprop.mindir +150 -0
- mindspore/ops/bprop_mindir/AvgPool_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/BCEWithLogitsLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BNTrainingReduce_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/BatchNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BatchToSpaceND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/BiasAddGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BinaryCrossEntropy_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/BroadcastTo_bprop.mindir +306 -0
- mindspore/ops/bprop_mindir/Broadcast_bprop.mindir +12 -8
- mindspore/ops/bprop_mindir/CTCLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Concat_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropFilter_bprop.mindir +240 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropInput_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv2DTranspose_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv3DTranspose_bprop.mindir +315 -0
- mindspore/ops/bprop_mindir/Conv3D_bprop.mindir +278 -0
- mindspore/ops/bprop_mindir/DType_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/DeformableOffsets_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/Depend_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/DepthToSpace_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/DepthwiseConv2dNative_bprop.mindir +138 -0
- mindspore/ops/bprop_mindir/DiagPart_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/Dropout2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Dropout3D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DropoutDoMask_bprop.mindir +22 -24
- mindspore/ops/bprop_mindir/DropoutGenMask_bprop.mindir +16 -14
- mindspore/ops/bprop_mindir/DropoutGrad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Dropout_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicGRUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicRNN_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicShape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/Elu_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/EmbeddingLookup_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Equal_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/ExpandDims_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/FastGeLU_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Flatten_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/FloorDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/GatherD_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/GatherNd_bprop.mindir +57 -0
- mindspore/ops/bprop_mindir/Gather_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/GreaterEqual_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Greater_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/HSigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/HSwish_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/IOU_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/InstanceNorm_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/IsFinite_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/IsInf_bprop.mindir +13 -10
- mindspore/ops/bprop_mindir/IsNan_bprop.mindir +14 -11
- mindspore/ops/bprop_mindir/KLDivLoss_bprop.mindir +126 -0
- mindspore/ops/bprop_mindir/L2Loss_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/L2Normalize_bprop.mindir +30 -0
- mindspore/ops/bprop_mindir/LRN_bprop.mindir +43 -0
- mindspore/ops/bprop_mindir/LayerNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/LessEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Less_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LinSpace_bprop.mindir +22 -19
- mindspore/ops/bprop_mindir/Load_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/LogSoftmax_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/LogicalAnd_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LogicalNot_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/MaskedSelect_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/MaxPool3DGradGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3DGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3D_bprop.mindir +75 -0
- mindspore/ops/bprop_mindir/MaxPoolGradGrad_bprop.mindir +65 -0
- mindspore/ops/bprop_mindir/MaxPoolWithArgmax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Maximum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Minimum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/MirrorPad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Mish_bprop.mindir +35 -0
- mindspore/ops/bprop_mindir/MulNoNan_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NLLLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NonZero_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/NotEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/OneHot_bprop.mindir +25 -23
- mindspore/ops/bprop_mindir/OnesLike_bprop.mindir +13 -13
- mindspore/ops/bprop_mindir/PReLU_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Pad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Padding_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/RNNTLoss_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ROIAlign_bprop.mindir +82 -0
- mindspore/ops/bprop_mindir/Range_bprop.mindir +21 -19
- mindspore/ops/bprop_mindir/Rank_bprop.mindir +11 -11
- mindspore/ops/bprop_mindir/ReLU6_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/ReLUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ReduceAll_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReduceAny_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReluGrad_bprop.mindir +19 -23
- mindspore/ops/bprop_mindir/Reshape_bprop.mindir +60 -0
- mindspore/ops/bprop_mindir/ResizeBilinear_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ResizeNearestNeighbor_bprop.mindir +89 -0
- mindspore/ops/bprop_mindir/ReverseSequence_bprop.mindir +52 -0
- mindspore/ops/bprop_mindir/ReverseV2_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Round_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/ScatterMax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterMin_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterNdUpdate_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterNd_bprop.mindir +24 -0
- mindspore/ops/bprop_mindir/ScatterNonAliasingAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterUpdate_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SeLU_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/Select_bprop.mindir +30 -34
- mindspore/ops/bprop_mindir/Shape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/SigmoidCrossEntropyWithLogits_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/SigmoidGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Sigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Sign_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Slice_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/SmoothL1Loss_bprop.mindir +36 -0
- mindspore/ops/bprop_mindir/SoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Softplus_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Softsign_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/Sort_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SpaceToBatchND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/SpaceToDepth_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/SparseGatherV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SparseSoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Split_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Squeeze_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/StridedSliceGrad_bprop.mindir +95 -0
- mindspore/ops/bprop_mindir/StridedSlice_bprop.mindir +98 -0
- mindspore/ops/bprop_mindir/Switch_bprop.mindir +28 -32
- mindspore/ops/bprop_mindir/TanhGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Tanh_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/TensorScatterAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/TensorScatterUpdate_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/TensorShape_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/Tile_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TopK_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TransShape_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/TruncateDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/TupleGetItem_bprop.mindir +11 -13
- mindspore/ops/bprop_mindir/Unique_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Unstack_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/UpsampleNearest3D_bprop.mindir +32 -0
- mindspore/ops/bprop_mindir/UpsampleTrilinear3D_bprop.mindir +38 -0
- mindspore/ops/bprop_mindir/ZerosLike_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/__init__.py +1 -4
- mindspore/ops/bprop_mindir/generate_mindir.py +32 -20
- mindspore/ops/composite/__init__.py +12 -13
- mindspore/ops/composite/base.py +261 -254
- mindspore/ops/composite/env_ops.py +41 -0
- mindspore/ops/composite/math_ops.py +197 -156
- mindspore/ops/composite/multitype_ops/_compile_utils.py +428 -176
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +188 -87
- mindspore/ops/composite/multitype_ops/add_impl.py +23 -1
- mindspore/ops/composite/multitype_ops/div_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/equal_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/floordiv_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/getitem_impl.py +52 -5
- mindspore/ops/composite/multitype_ops/greater_equal_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/greater_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/less_equal_impl.py +33 -2
- mindspore/ops/composite/multitype_ops/less_impl.py +33 -0
- mindspore/ops/composite/multitype_ops/logical_and_impl.py +2 -2
- mindspore/ops/composite/multitype_ops/logical_or_impl.py +2 -1
- mindspore/ops/composite/multitype_ops/mod_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/mul_impl.py +21 -7
- mindspore/ops/composite/multitype_ops/not_in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/ones_like_impl.py +2 -4
- mindspore/ops/composite/multitype_ops/pow_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/setitem_impl.py +62 -70
- mindspore/ops/composite/multitype_ops/sub_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/zeros_like_impl.py +41 -4
- mindspore/ops/function/__init__.py +323 -8
- mindspore/ops/function/array_func.py +3511 -780
- mindspore/ops/function/clip_func.py +329 -0
- mindspore/ops/function/debug_func.py +6 -6
- mindspore/ops/function/grad/__init__.py +5 -1
- mindspore/ops/function/grad/grad_func.py +736 -65
- mindspore/ops/function/image_func.py +270 -0
- mindspore/ops/function/linalg_func.py +268 -8
- mindspore/ops/function/math_func.py +8032 -3164
- mindspore/ops/function/nn_func.py +5619 -1855
- mindspore/ops/function/other_func.py +115 -0
- mindspore/ops/function/parameter_func.py +11 -10
- mindspore/ops/function/random_func.py +939 -77
- mindspore/ops/function/sparse_func.py +249 -84
- mindspore/ops/function/sparse_unary_func.py +2303 -0
- mindspore/ops/function/spectral_func.py +146 -0
- mindspore/ops/function/vmap_func.py +114 -0
- mindspore/ops/functional.py +182 -254
- mindspore/ops/op_info_register.py +79 -34
- mindspore/ops/operations/__init__.py +210 -118
- mindspore/ops/operations/_csr_ops.py +7 -7
- mindspore/ops/operations/_embedding_cache_ops.py +25 -15
- mindspore/ops/operations/_grad_ops.py +447 -322
- mindspore/ops/operations/_inner_ops.py +547 -176
- mindspore/ops/operations/_map_tensor_ops.py +112 -0
- mindspore/ops/operations/_ms_kernel.py +29 -27
- mindspore/ops/operations/_ocr_ops.py +11 -11
- mindspore/ops/operations/_opaque_predicate_registry.py +41 -0
- mindspore/ops/operations/_quant_ops.py +186 -101
- mindspore/ops/operations/_rl_inner_ops.py +122 -61
- mindspore/ops/operations/_scalar_ops.py +466 -0
- mindspore/ops/operations/_sequence_ops.py +1047 -0
- mindspore/ops/operations/_tensor_array.py +10 -11
- mindspore/ops/operations/_thor_ops.py +4 -4
- mindspore/ops/operations/array_ops.py +1428 -1226
- mindspore/ops/operations/comm_ops.py +180 -117
- mindspore/ops/operations/control_ops.py +4 -2
- mindspore/ops/operations/custom_ops.py +185 -98
- mindspore/ops/operations/debug_ops.py +92 -54
- mindspore/ops/operations/image_ops.py +406 -211
- mindspore/ops/operations/inner_ops.py +42 -53
- mindspore/ops/operations/linalg_ops.py +32 -29
- mindspore/ops/operations/math_ops.py +2076 -897
- mindspore/ops/operations/nn_ops.py +1282 -1252
- mindspore/ops/operations/other_ops.py +124 -278
- mindspore/ops/operations/random_ops.py +345 -178
- mindspore/ops/operations/rl_ops.py +8 -9
- mindspore/ops/operations/sparse_ops.py +502 -157
- mindspore/ops/operations/spectral_ops.py +107 -0
- mindspore/ops/primitive.py +192 -15
- mindspore/ops/vm_impl_registry.py +23 -2
- mindspore/parallel/__init__.py +6 -1
- mindspore/parallel/_auto_parallel_context.py +199 -92
- mindspore/parallel/_cell_wrapper.py +4 -2
- mindspore/parallel/_cost_model_context.py +3 -0
- mindspore/parallel/_dp_allreduce_fusion.py +2 -1
- mindspore/parallel/_offload_context.py +185 -0
- mindspore/parallel/_parallel_serialization.py +167 -28
- mindspore/parallel/_ps_context.py +9 -5
- mindspore/parallel/_recovery_context.py +1 -1
- mindspore/parallel/_tensor.py +9 -1
- mindspore/{nn/transformer → parallel/_transformer}/__init__.py +6 -6
- mindspore/{nn/transformer → parallel/_transformer}/layers.py +59 -37
- mindspore/{nn/transformer → parallel/_transformer}/loss.py +4 -7
- mindspore/{nn/transformer → parallel/_transformer}/moe.py +160 -35
- mindspore/{nn/transformer → parallel/_transformer}/op_parallel_config.py +3 -3
- mindspore/{nn/transformer → parallel/_transformer}/transformer.py +235 -196
- mindspore/parallel/_utils.py +47 -7
- mindspore/parallel/algo_parameter_config.py +5 -1
- mindspore/parallel/checkpoint_transform.py +329 -0
- mindspore/parallel/shard.py +229 -0
- mindspore/perf_msvcbuildinsights.dll +0 -0
- mindspore/pgodb140.dll +0 -0
- mindspore/pgort140.dll +0 -0
- mindspore/profiler/__init__.py +2 -1
- mindspore/profiler/common/util.py +4 -3
- mindspore/profiler/common/validator/validate_path.py +2 -2
- mindspore/profiler/envprofiling.py +249 -0
- mindspore/profiler/parser/aicpu_data_parser.py +38 -39
- mindspore/profiler/parser/ascend_timeline_generator.py +497 -0
- mindspore/profiler/parser/base_timeline_generator.py +471 -0
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +684 -0
- mindspore/profiler/parser/framework_parser.py +42 -16
- mindspore/profiler/parser/hccl_parser.py +158 -158
- mindspore/profiler/parser/hwts_log_parser.py +7 -6
- mindspore/profiler/parser/integrator.py +18 -1579
- mindspore/profiler/parser/minddata_analyzer.py +8 -8
- mindspore/profiler/parser/msadvisor_analyzer.py +14 -27
- mindspore/profiler/parser/msadvisor_parser.py +2 -4
- mindspore/profiler/parser/optime_parser.py +17 -18
- mindspore/profiler/parser/profiler_info.py +108 -0
- mindspore/profiler/parser/step_trace_parser.py +1 -1
- mindspore/profiler/profiling.py +396 -194
- mindspore/rewrite/__init__.py +6 -2
- mindspore/rewrite/api/node.py +51 -110
- mindspore/rewrite/api/node_type.py +10 -6
- mindspore/rewrite/api/pattern_engine.py +51 -7
- mindspore/rewrite/api/scoped_value.py +64 -53
- mindspore/rewrite/api/symbol_tree.py +108 -61
- mindspore/rewrite/api/tree_node_helper.py +2 -3
- mindspore/{compression/quant/__init__.py → rewrite/ast_creator_register.py} +20 -11
- mindspore/rewrite/ast_helpers/__init__.py +6 -3
- mindspore/rewrite/ast_helpers/ast_creator.py +115 -0
- mindspore/rewrite/ast_helpers/ast_finder.py +99 -1
- mindspore/rewrite/ast_helpers/ast_modifier.py +17 -4
- mindspore/rewrite/ast_helpers/ast_replacer.py +1 -1
- mindspore/rewrite/ast_transformers/__init__.py +0 -1
- mindspore/rewrite/ast_transformers/flatten_recursive_stmt.py +46 -5
- mindspore/rewrite/ast_transformers/remove_return_out_of_if.py +6 -3
- mindspore/rewrite/common/__init__.py +2 -0
- mindspore/rewrite/common/event.py +1 -1
- mindspore/rewrite/common/observable.py +1 -1
- mindspore/rewrite/common/observer.py +1 -1
- mindspore/rewrite/common/rewrite_elog.py +35 -0
- mindspore/rewrite/namer.py +2 -2
- mindspore/rewrite/namespace.py +14 -4
- mindspore/rewrite/node.py +161 -13
- mindspore/rewrite/parser.py +0 -1
- mindspore/rewrite/parser_register.py +0 -1
- mindspore/rewrite/parsers/arguments_parser.py +3 -2
- mindspore/rewrite/parsers/assign_parser.py +267 -67
- mindspore/rewrite/parsers/attribute_parser.py +56 -0
- mindspore/rewrite/parsers/class_def_parser.py +191 -108
- mindspore/rewrite/parsers/constant_parser.py +101 -0
- mindspore/rewrite/parsers/container_parser.py +88 -0
- mindspore/rewrite/parsers/for_parser.py +28 -15
- mindspore/rewrite/parsers/function_def_parser.py +21 -5
- mindspore/rewrite/parsers/if_parser.py +11 -28
- mindspore/rewrite/parsers/module_parser.py +9 -6
- mindspore/rewrite/parsers/return_parser.py +3 -2
- mindspore/rewrite/sparsify/__init__.py +0 -0
- mindspore/rewrite/sparsify/sparse_transformer.py +448 -0
- mindspore/rewrite/sparsify/sparsify.py +109 -0
- mindspore/rewrite/sparsify/utils.py +173 -0
- mindspore/rewrite/symbol_tree.py +322 -109
- mindspore/rewrite/symbol_tree_builder.py +45 -8
- mindspore/rewrite/symbol_tree_dumper.py +0 -1
- mindspore/rewrite/topological_manager.py +1 -2
- mindspore/run_check/_check_version.py +209 -112
- mindspore/run_check/run_check.py +2 -1
- mindspore/tbbmalloc.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +6 -4
- mindspore/train/_utils.py +28 -5
- mindspore/train/amp.py +321 -50
- mindspore/train/callback/__init__.py +3 -1
- mindspore/train/callback/_backup_and_restore.py +120 -0
- mindspore/train/callback/_callback.py +8 -8
- mindspore/train/callback/_checkpoint.py +12 -9
- mindspore/train/callback/_early_stop.py +13 -7
- mindspore/train/callback/_history.py +8 -8
- mindspore/train/callback/_lambda_callback.py +6 -6
- mindspore/train/callback/_landscape.py +36 -38
- mindspore/train/callback/_loss_monitor.py +12 -6
- mindspore/train/callback/_lr_scheduler_callback.py +2 -4
- mindspore/train/callback/_on_request_exit.py +212 -0
- mindspore/train/callback/_reduce_lr_on_plateau.py +13 -7
- mindspore/train/callback/_summary_collector.py +27 -19
- mindspore/train/callback/_time_monitor.py +13 -7
- mindspore/train/checkpoint_pb2.py +68 -8
- mindspore/train/data_sink.py +122 -33
- mindspore/train/dataset_helper.py +28 -87
- mindspore/train/loss_scale_manager.py +4 -7
- mindspore/{nn → train}/metrics/__init__.py +20 -20
- mindspore/{nn → train}/metrics/accuracy.py +12 -10
- mindspore/{nn → train}/metrics/auc.py +4 -4
- mindspore/{nn → train}/metrics/bleu_score.py +4 -4
- mindspore/{nn → train}/metrics/confusion_matrix.py +10 -8
- mindspore/{nn → train}/metrics/cosine_similarity.py +4 -4
- mindspore/{nn → train}/metrics/dice.py +6 -5
- mindspore/{nn → train}/metrics/error.py +7 -5
- mindspore/{nn → train}/metrics/fbeta.py +9 -7
- mindspore/{nn → train}/metrics/hausdorff_distance.py +8 -6
- mindspore/{nn → train}/metrics/loss.py +4 -3
- mindspore/{nn → train}/metrics/mean_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/metric.py +6 -5
- mindspore/{nn → train}/metrics/occlusion_sensitivity.py +4 -3
- mindspore/{nn → train}/metrics/perplexity.py +5 -4
- mindspore/{nn → train}/metrics/precision.py +5 -4
- mindspore/{nn → train}/metrics/recall.py +5 -4
- mindspore/{nn → train}/metrics/roc.py +7 -6
- mindspore/{nn → train}/metrics/root_mean_square_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/topk.py +7 -5
- mindspore/train/mind_ir_pb2.py +339 -32
- mindspore/train/model.py +113 -84
- mindspore/train/serialization.py +547 -167
- mindspore/train/summary/_summary_adapter.py +1 -1
- mindspore/train/summary/summary_record.py +43 -12
- mindspore/train/train_thor/convert_utils.py +7 -1
- mindspore/train/train_thor/dataset_helper.py +3 -3
- mindspore/train/train_thor/model_thor.py +0 -4
- mindspore/turbojpeg.dll +0 -0
- mindspore/vcmeta.dll +0 -0
- mindspore/vcruntime140.dll +0 -0
- mindspore/vcruntime140_1.dll +0 -0
- mindspore/version.py +1 -1
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/METADATA +4 -3
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/RECORD +901 -660
- mindspore/compression/common/constant.py +0 -124
- mindspore/compression/export/__init__.py +0 -19
- mindspore/compression/export/quant_export.py +0 -514
- mindspore/compression/quant/qat.py +0 -636
- mindspore/compression/quant/quant_utils.py +0 -462
- mindspore/compression/quant/quantizer.py +0 -68
- mindspore/libatomic-1.dll +0 -0
- mindspore/libgcc_s_seh-1.dll +0 -0
- mindspore/libgfortran-4.dll +0 -0
- mindspore/libgomp-1.dll +0 -0
- mindspore/libjpeg-62.dll +0 -0
- mindspore/libmindspore.dll +0 -0
- mindspore/libmindspore_common.dll +0 -0
- mindspore/libmindspore_core.dll +0 -0
- mindspore/libmindspore_glog.dll +0 -0
- mindspore/libnnacl.dll +0 -0
- mindspore/libopencv_core452.dll +0 -0
- mindspore/libopencv_imgcodecs452.dll +0 -0
- mindspore/libopencv_imgproc452.dll +0 -0
- mindspore/libquadmath-0.dll +0 -0
- mindspore/libsqlite3.dll +0 -0
- mindspore/libssp-0.dll +0 -0
- mindspore/libstdc++-6.dll +0 -0
- mindspore/libtinyxml2.dll +0 -0
- mindspore/libturbojpeg.dll +0 -0
- mindspore/libwinpthread-1.dll +0 -0
- mindspore/nn/layer/quant.py +0 -1868
- mindspore/nn/layer/rnn_utils.py +0 -90
- mindspore/nn/probability/dpn/__init__.py +0 -22
- mindspore/nn/probability/dpn/vae/__init__.py +0 -25
- mindspore/nn/probability/dpn/vae/cvae.py +0 -138
- mindspore/nn/probability/dpn/vae/vae.py +0 -122
- mindspore/nn/probability/infer/__init__.py +0 -22
- mindspore/nn/probability/infer/variational/elbo.py +0 -70
- mindspore/nn/probability/infer/variational/svi.py +0 -84
- mindspore/nn/probability/toolbox/__init__.py +0 -22
- mindspore/nn/probability/toolbox/anomaly_detection.py +0 -99
- mindspore/nn/probability/toolbox/uncertainty_evaluation.py +0 -363
- mindspore/nn/probability/transforms/__init__.py +0 -22
- mindspore/nn/probability/transforms/transform_bnn.py +0 -262
- mindspore/nn/probability/zhusuan/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/bn.py +0 -95
- mindspore/nn/probability/zhusuan/variational/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/variational/elbo.py +0 -46
- mindspore/ops/_op_impl/tbe/bias_add_grad_ds.py +0 -52
- mindspore/ops/_op_impl/tbe/scatter_nd_add_ds.py +0 -43
- mindspore/ops/bprop_mindir/AssignAdd_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/Identity_bprop.mindir +0 -9
- mindspore/ops/bprop_mindir/LogicalOr_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/ReLU_bprop.mindir +0 -16
- mindspore/ops/bprop_mindir/UpdateState_bprop.mindir +0 -17
- mindspore/ops/bprop_mindir/stop_gradient_bprop.mindir +0 -12
- mindspore/ops/composite/array_ops.py +0 -210
- mindspore/ops/composite/clip_ops.py +0 -238
- mindspore/ops/composite/random_ops.py +0 -426
- mindspore/ops/composite/vmap_ops.py +0 -38
- mindspore/ops/operations/sponge_ops.py +0 -3531
- mindspore/ops/operations/sponge_update_ops.py +0 -2546
- mindspore/parallel/nn/__init__.py +0 -42
- mindspore/parallel/nn/loss.py +0 -22
- mindspore/parallel/nn/moe.py +0 -21
- mindspore/parallel/nn/op_parallel_config.py +0 -22
- mindspore/parallel/nn/transformer.py +0 -31
- mindspore/run_check/_check_deps_version.py +0 -84
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/WHEEL +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/entry_points.txt +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/top_level.txt +0 -0
|
@@ -20,6 +20,7 @@ from mindspore.ops import composite as C
|
|
|
20
20
|
from mindspore.common.tensor import Tensor
|
|
21
21
|
import mindspore.common.dtype as mstype
|
|
22
22
|
from mindspore.common.dtype import dtype_to_nptype, get_py_obj_dtype
|
|
23
|
+
from mindspore._c_expression import Tensor as CTensor
|
|
23
24
|
|
|
24
25
|
|
|
25
26
|
def ScalarAdd(x, y):
|
|
@@ -103,8 +104,11 @@ def zeros_like_tensor(x):
|
|
|
103
104
|
|
|
104
105
|
def OnesLike(x):
|
|
105
106
|
"""Implement `oneslike`."""
|
|
106
|
-
x
|
|
107
|
-
|
|
107
|
+
if isinstance(x, (Tensor, CTensor)):
|
|
108
|
+
x = x.asnumpy()
|
|
109
|
+
value = Tensor(np.ones(x.shape).astype(x.dtype))
|
|
110
|
+
else:
|
|
111
|
+
value = Tensor(1.0)
|
|
108
112
|
return value
|
|
109
113
|
|
|
110
114
|
|
|
@@ -176,11 +180,35 @@ def tuple_to_array(x):
|
|
|
176
180
|
return Tensor(np.array(x))
|
|
177
181
|
|
|
178
182
|
|
|
179
|
-
def
|
|
180
|
-
"""Implement `
|
|
183
|
+
def StopGradient(x):
|
|
184
|
+
"""Implement `StopGradient`."""
|
|
181
185
|
return x
|
|
182
186
|
|
|
183
187
|
|
|
188
|
+
def TensorShape(x):
|
|
189
|
+
"""Implement `TensorShape`."""
|
|
190
|
+
return Tensor(F.shape(x))
|
|
191
|
+
|
|
192
|
+
|
|
193
|
+
def DynamicBroadcastGradientArgs(x, y):
|
|
194
|
+
"""Implement `DynamicBroadcastGradientArgs`."""
|
|
195
|
+
return -1, -1
|
|
196
|
+
|
|
197
|
+
|
|
198
|
+
def StridedSlice(x, begin, end, stride):
|
|
199
|
+
"""Implement `StridedSlice`."""
|
|
200
|
+
if isinstance(x, Tensor):
|
|
201
|
+
x = x.asnumpy()
|
|
202
|
+
ret = x
|
|
203
|
+
for i in range(len(x)):
|
|
204
|
+
ret[i:] = x[begin[i], end[i], stride[i]]
|
|
205
|
+
return Tensor(ret)
|
|
206
|
+
ret = x
|
|
207
|
+
for i in range(len(x)):
|
|
208
|
+
ret[i:] = x[begin[i], end[i], stride[i]]
|
|
209
|
+
return ret
|
|
210
|
+
|
|
211
|
+
|
|
184
212
|
hyper_map = C.HyperMap()
|
|
185
213
|
|
|
186
214
|
|
|
@@ -15,9 +15,7 @@
|
|
|
15
15
|
"""Cost model splitter"""
|
|
16
16
|
from functools import reduce as prod_reduce
|
|
17
17
|
from functools import partial
|
|
18
|
-
from mindspore import log as logger
|
|
19
18
|
from .model import PrimLib, Graph, Tensor, Operator
|
|
20
|
-
from .model import DataFormat as DF
|
|
21
19
|
|
|
22
20
|
|
|
23
21
|
def tensor_size(tensor):
|
|
@@ -175,7 +173,7 @@ class ReshapeElimChecker:
|
|
|
175
173
|
def _get_remap_axis(in_shape, out_shape):
|
|
176
174
|
rin, rout = [], []
|
|
177
175
|
in_prod, out_prod, out_idx = 1, out_shape[-1], -1
|
|
178
|
-
in_ext, out_ext = -len(in_shape)-1, -len(out_shape)-1
|
|
176
|
+
in_ext, out_ext = -len(in_shape) - 1, -len(out_shape) - 1
|
|
179
177
|
for in_idx in range(-1, in_ext, -1):
|
|
180
178
|
in_prod = in_prod * in_shape[in_idx]
|
|
181
179
|
while out_prod < in_prod:
|
|
@@ -191,6 +189,7 @@ class ReshapeElimChecker:
|
|
|
191
189
|
if out_idx > out_ext:
|
|
192
190
|
rout.extend([i for i in range(out_idx, out_ext, -1)])
|
|
193
191
|
return rin, rout
|
|
192
|
+
|
|
194
193
|
remap_in, remap_out = _get_remap_axis(reshape.inputs[0].shape, reshape.output.shape)
|
|
195
194
|
self.exc_fwd = self._collect_exc_ops(reshape, remap_in, True)
|
|
196
195
|
self.exc_bwd = self._collect_exc_ops(reshape, remap_out, False)
|
|
@@ -198,10 +197,11 @@ class ReshapeElimChecker:
|
|
|
198
197
|
@staticmethod
|
|
199
198
|
def _collect_exc_ops(reshape, remap_axis, is_fwd):
|
|
200
199
|
"""collect exclude ops of reshape"""
|
|
200
|
+
|
|
201
201
|
def _propagate(remap, src, des):
|
|
202
202
|
out_remap = []
|
|
203
203
|
src_prod, des_prod, des_idx = 1, 1, 0
|
|
204
|
-
for src_idx in range(-1, -len(src)-1, -1):
|
|
204
|
+
for src_idx in range(-1, -len(src) - 1, -1):
|
|
205
205
|
src_prod = src_prod * src[src_idx]
|
|
206
206
|
if src_idx in remap:
|
|
207
207
|
while des_prod < src_prod:
|
|
@@ -256,6 +256,7 @@ class ReshapeElimChecker:
|
|
|
256
256
|
push_stack(op, remap)
|
|
257
257
|
else:
|
|
258
258
|
exc_ops.add(op)
|
|
259
|
+
|
|
259
260
|
exc_ops, stack, visited = set(), [], {reshape}
|
|
260
261
|
if is_fwd:
|
|
261
262
|
_visit_fwd(reshape, remap_axis)
|
|
@@ -296,7 +297,7 @@ class ReduceOutFuseChecker:
|
|
|
296
297
|
for to in op.output.to_ops:
|
|
297
298
|
idx = to.inputs.index(op.output)
|
|
298
299
|
if PrimLib.iter_type(to) > PrimLib.ELEMWISE or \
|
|
299
|
-
|
|
300
|
+
tensor_size(to.inputs[idx]) != tensor_size(to.output):
|
|
300
301
|
self.output_excluded.add(to)
|
|
301
302
|
else:
|
|
302
303
|
recursion_stack.append(to)
|
|
@@ -384,7 +385,7 @@ class GraphSplitByPattern:
|
|
|
384
385
|
self.unique_id = unique_id
|
|
385
386
|
self.reach_tab = reach_tab
|
|
386
387
|
self.checkers = []
|
|
387
|
-
if self.pattern == PrimLib.RESHAPE and init_op.inputs:
|
|
388
|
+
if self.pattern == PrimLib.RESHAPE and init_op.inputs: # reshape's input may be empty (const value)
|
|
388
389
|
self.checkers.append(ReshapeElimChecker(init_op))
|
|
389
390
|
elif self.pattern == PrimLib.REDUCE:
|
|
390
391
|
self.checkers.append(ReduceOutFuseChecker(init_op))
|
|
@@ -430,6 +431,7 @@ class GraphSplitByPattern:
|
|
|
430
431
|
|
|
431
432
|
def fuse_confirm(self, area):
|
|
432
433
|
"""confirm if area can be fused"""
|
|
434
|
+
|
|
433
435
|
def _check(a, b, res, fwd):
|
|
434
436
|
for checker in a.checkers:
|
|
435
437
|
r = checker.check(b.ops, fwd)
|
|
@@ -441,6 +443,7 @@ class GraphSplitByPattern:
|
|
|
441
443
|
def _commit(a, res):
|
|
442
444
|
for i, checker in enumerate(a.checkers):
|
|
443
445
|
checker.commit(res[i])
|
|
446
|
+
|
|
444
447
|
res1, res2 = [], []
|
|
445
448
|
if not _check(self, area, res1, True) or not _check(area, self, res2, False):
|
|
446
449
|
return False
|
|
@@ -645,7 +648,7 @@ class GraphSplitByPattern:
|
|
|
645
648
|
area.mode = self.get_default_mode(area.ops[0])
|
|
646
649
|
|
|
647
650
|
@staticmethod
|
|
648
|
-
def limit_area_size(dominant, fuse_areas, limit_size
|
|
651
|
+
def limit_area_size(dominant, fuse_areas, limit_size):
|
|
649
652
|
"""Remove some areas if the size is too large"""
|
|
650
653
|
area_sizes = map(lambda area: len(area.ops), fuse_areas)
|
|
651
654
|
dom_size = len(dominant.ops)
|
|
@@ -671,7 +674,7 @@ class GraphSplitByPattern:
|
|
|
671
674
|
continue
|
|
672
675
|
fuse_areas, is_forward = result
|
|
673
676
|
if not is_stitch:
|
|
674
|
-
fuse_areas = self.limit_area_size(dominant, fuse_areas)
|
|
677
|
+
fuse_areas = self.limit_area_size(dominant, fuse_areas, self.flags['composite_op_limit_size'])
|
|
675
678
|
if not fuse_areas:
|
|
676
679
|
continue
|
|
677
680
|
changed = False
|
|
@@ -703,6 +706,7 @@ class GraphSplitByPattern:
|
|
|
703
706
|
|
|
704
707
|
def hfuse(self, selector):
|
|
705
708
|
"""Fuse horizontal areas with same input tensor"""
|
|
709
|
+
|
|
706
710
|
def _do_fuse(areas):
|
|
707
711
|
for i in range(len(areas) - 1):
|
|
708
712
|
dom = areas[i]
|
|
@@ -748,7 +752,7 @@ class GraphSplitByPattern:
|
|
|
748
752
|
result = selector(dominant)
|
|
749
753
|
if result and result[0]:
|
|
750
754
|
fuse_areas, _ = result
|
|
751
|
-
fuse_areas = self.limit_area_size(dominant, fuse_areas)
|
|
755
|
+
fuse_areas = self.limit_area_size(dominant, fuse_areas, self.flags['composite_op_limit_size'])
|
|
752
756
|
if not fuse_areas:
|
|
753
757
|
continue
|
|
754
758
|
if fuse_areas[0] in [self.recom_area, user] and user.fuse_confirm(self.recom_area):
|
|
@@ -788,9 +792,47 @@ class GraphSplitByPattern:
|
|
|
788
792
|
self.pattern_fuse()
|
|
789
793
|
if self.enable_recompute:
|
|
790
794
|
self.recompute_fuse()
|
|
795
|
+
# The reshape should not be output node
|
|
796
|
+
# Note: after this function, the input output relation is not maintained.
|
|
797
|
+
self.split_output_reshapes()
|
|
791
798
|
subgraphs, graphmodes = self.to_subgraphs()
|
|
792
799
|
return subgraphs, graphmodes
|
|
793
800
|
|
|
801
|
+
def split_output_reshapes(self):
|
|
802
|
+
"""Force split the output Reshapes into other new area"""
|
|
803
|
+
|
|
804
|
+
def _remove_output_reshape(reshape_ops, other_ops):
|
|
805
|
+
def _run():
|
|
806
|
+
for op in reshape_ops:
|
|
807
|
+
if any((to_op in other_ops for to_op in op.output.to_ops)):
|
|
808
|
+
reshape_ops.remove(op)
|
|
809
|
+
other_ops.append(op)
|
|
810
|
+
return True
|
|
811
|
+
return False
|
|
812
|
+
|
|
813
|
+
while _run():
|
|
814
|
+
pass
|
|
815
|
+
|
|
816
|
+
new_areas = []
|
|
817
|
+
for area in self.areas:
|
|
818
|
+
reshape_ops = list(op for op in area.ops if PrimLib.iter_type(op) == PrimLib.RESHAPE)
|
|
819
|
+
other_ops = list(op for op in area.ops if op not in reshape_ops)
|
|
820
|
+
if not other_ops or not reshape_ops:
|
|
821
|
+
continue
|
|
822
|
+
# remove the output reshape from "reshape_ops" and add it into "other_ops"
|
|
823
|
+
_remove_output_reshape(reshape_ops, other_ops)
|
|
824
|
+
if not reshape_ops:
|
|
825
|
+
continue
|
|
826
|
+
for op in reshape_ops:
|
|
827
|
+
a = self.Area(op, False, 0, self.reach_tab)
|
|
828
|
+
self.set_default_mode(a)
|
|
829
|
+
new_areas.append(a)
|
|
830
|
+
area.ops = other_ops
|
|
831
|
+
if len(other_ops) == 1:
|
|
832
|
+
self.set_default_mode(area)
|
|
833
|
+
if new_areas:
|
|
834
|
+
self.areas += new_areas
|
|
835
|
+
|
|
794
836
|
def recompute_fuse(self):
|
|
795
837
|
"""find recompute regions and copy them out to new Areas"""
|
|
796
838
|
|
|
@@ -959,10 +1001,21 @@ class GraphSplitGpu(GraphSplitByPattern):
|
|
|
959
1001
|
return reduce_size >= 1024
|
|
960
1002
|
return True
|
|
961
1003
|
|
|
1004
|
+
def _may_multi_filter(dom_ops):
|
|
1005
|
+
count = 1
|
|
1006
|
+
stack = [dom_ops[0]]
|
|
1007
|
+
while stack:
|
|
1008
|
+
op = stack.pop()
|
|
1009
|
+
for t in op.inputs:
|
|
1010
|
+
if t.op and t.op in dom_ops:
|
|
1011
|
+
count = count + 1
|
|
1012
|
+
stack.append(t.op)
|
|
1013
|
+
return count < len(dom_ops)
|
|
1014
|
+
|
|
962
1015
|
def _reduce_output(dom):
|
|
963
1016
|
if dom.pattern != PrimLib.REDUCE:
|
|
964
1017
|
return []
|
|
965
|
-
if
|
|
1018
|
+
if _may_multi_filter(dom.ops):
|
|
966
1019
|
return []
|
|
967
1020
|
if _is_atomic_add_available(dom):
|
|
968
1021
|
return []
|
|
@@ -1122,6 +1175,7 @@ class GraphSplitGpu(GraphSplitByPattern):
|
|
|
1122
1175
|
|
|
1123
1176
|
def _broadcast_tot(dom):
|
|
1124
1177
|
"""Fuse rule for TensorScatterAdd and UnsortedSegmentSum."""
|
|
1178
|
+
|
|
1125
1179
|
def _same_input(op1, op2):
|
|
1126
1180
|
return bool(set(op1.inputs) & set(op2.inputs))
|
|
1127
1181
|
|
|
@@ -1182,7 +1236,7 @@ class GraphSplitGpu(GraphSplitByPattern):
|
|
|
1182
1236
|
if dom.is_output or len(to_ops) != 1 or len(dom.out_relations) != 1:
|
|
1183
1237
|
return []
|
|
1184
1238
|
to_area = list(dom.out_relations.keys())[0]
|
|
1185
|
-
if (to_area.pattern
|
|
1239
|
+
if (to_area.pattern >= PrimLib.REDUCE and to_area.dom_op().prim not in injective_ops) or \
|
|
1186
1240
|
to_ops[0] not in to_area.ops:
|
|
1187
1241
|
return []
|
|
1188
1242
|
if len(to_area.ops) > self.TRANSPOSE_FUSE_DEPTH:
|
|
@@ -1214,6 +1268,7 @@ class GraphSplitGpu(GraphSplitByPattern):
|
|
|
1214
1268
|
def _link_csr(dom):
|
|
1215
1269
|
def _same_input(op1, op2):
|
|
1216
1270
|
return bool(set(op1.inputs.copy()) & set(op2.inputs.copy()))
|
|
1271
|
+
|
|
1217
1272
|
fuse_arg = {"CSRReduceSum": slice(1, 3), "CSRGather": slice(2, 3)}
|
|
1218
1273
|
arg_idx = fuse_arg.get(dom.dom_op().prim, -1)
|
|
1219
1274
|
if arg_idx == -1:
|
|
@@ -1275,220 +1330,9 @@ class GraphSplitGpu(GraphSplitByPattern):
|
|
|
1275
1330
|
_fuse_once(fuse_func)
|
|
1276
1331
|
|
|
1277
1332
|
|
|
1278
|
-
class GraphSplitAscend(GraphSplitByPattern):
|
|
1279
|
-
"""Graph splitter"""
|
|
1280
|
-
BROADCAST_FUSE_DEPTH = 6
|
|
1281
|
-
|
|
1282
|
-
def __init__(self, graph, flags):
|
|
1283
|
-
super().__init__(graph, flags)
|
|
1284
|
-
self.reduce_fuse_depth = 10 if self.reduce_fuse_depth < 0 else self.reduce_fuse_depth
|
|
1285
|
-
|
|
1286
|
-
def get_default_mode(self, op):
|
|
1287
|
-
"""Get default mode for Ascend"""
|
|
1288
|
-
|
|
1289
|
-
def _dtype_same(tensors):
|
|
1290
|
-
dtype = tensors[0].dtype
|
|
1291
|
-
for tensor_ in tensors:
|
|
1292
|
-
if tensor_.dtype != dtype:
|
|
1293
|
-
return False
|
|
1294
|
-
return True
|
|
1295
|
-
|
|
1296
|
-
if op.prim == "MatMul":
|
|
1297
|
-
if op.inputs[0].dtype == "float16" and not _dtype_same(op.inputs):
|
|
1298
|
-
return self.Area.MODE_COMPOSITE
|
|
1299
|
-
if op.prim in ("Tile", "BroadcastTo", "ExpandDims"):
|
|
1300
|
-
return self.Area.MODE_COMPOSITE
|
|
1301
|
-
return self.Area.MODE_BASIC
|
|
1302
|
-
|
|
1303
|
-
def pattern_fuse(self, fuse_func=None):
|
|
1304
|
-
"""fuse Areas by pattern"""
|
|
1305
|
-
|
|
1306
|
-
def _likely_multicore(dom):
|
|
1307
|
-
op = dom.dom_op()
|
|
1308
|
-
iter_size = tensor_size(op.output if not PrimLib.is_reduce(op) else op.inputs[0])
|
|
1309
|
-
return iter_size > 1024
|
|
1310
|
-
|
|
1311
|
-
def _broadcast_pat_exclude(dom, a, r):
|
|
1312
|
-
if _likely_multicore(a) and (dom.is_output or len(dom.ops) > self.BROADCAST_FUSE_DEPTH):
|
|
1313
|
-
return True
|
|
1314
|
-
return a.pattern > PrimLib.REDUCE or r > PrimLib.BROADCAST
|
|
1315
|
-
|
|
1316
|
-
def _broadcast_bwd_depth(dom):
|
|
1317
|
-
if dom.pattern not in (PrimLib.ELEMWISE, PrimLib.BROADCAST) or len(dom.out_relations) != 1:
|
|
1318
|
-
return []
|
|
1319
|
-
a, r = list(dom.out_relations.items())[0]
|
|
1320
|
-
if _broadcast_pat_exclude(dom, a, r) or len(a.in_relations) != 1:
|
|
1321
|
-
return []
|
|
1322
|
-
return [a], False
|
|
1323
|
-
|
|
1324
|
-
def _broadcast_bwd_width(dom):
|
|
1325
|
-
if dom.pattern not in (PrimLib.ELEMWISE, PrimLib.BROADCAST):
|
|
1326
|
-
return []
|
|
1327
|
-
fused = []
|
|
1328
|
-
for a, r in dom.out_relations.items():
|
|
1329
|
-
if _broadcast_pat_exclude(dom, a, r) or not dom.check_acyclic(a) or \
|
|
1330
|
-
(fused and tensor_size(fused[0].dom_op().output) != tensor_size(a.dom_op().output)):
|
|
1331
|
-
return []
|
|
1332
|
-
fused.append(a)
|
|
1333
|
-
return fused, False
|
|
1334
|
-
|
|
1335
|
-
def _reduce_pat_exclude(dom, a, r):
|
|
1336
|
-
if len(a.ops) > self.reduce_fuse_depth:
|
|
1337
|
-
return True
|
|
1338
|
-
if r == PrimLib.BROADCAST and _likely_multicore(dom) and \
|
|
1339
|
-
(dom.is_output or len(dom.ops) > self.BROADCAST_FUSE_DEPTH):
|
|
1340
|
-
return True
|
|
1341
|
-
return a.pattern > PrimLib.BROADCAST or r > PrimLib.REDUCE
|
|
1342
|
-
|
|
1343
|
-
def _reduce_depth(dom):
|
|
1344
|
-
if dom.pattern != PrimLib.REDUCE or len(dom.in_relations) != 1:
|
|
1345
|
-
return []
|
|
1346
|
-
a, r = list(dom.in_relations.items())[0]
|
|
1347
|
-
if _reduce_pat_exclude(dom, a, r) or len(a.out_relations) != 1:
|
|
1348
|
-
return []
|
|
1349
|
-
return [a], True
|
|
1350
|
-
|
|
1351
|
-
def _reduce_width(dom):
|
|
1352
|
-
if dom.pattern != PrimLib.REDUCE:
|
|
1353
|
-
return []
|
|
1354
|
-
fused = []
|
|
1355
|
-
for a, r in dom.in_relations.items():
|
|
1356
|
-
if not _reduce_pat_exclude(dom, a, r) and a.check_acyclic(dom):
|
|
1357
|
-
fused.append(a)
|
|
1358
|
-
return fused, True
|
|
1359
|
-
|
|
1360
|
-
def _matmul_depth(dom):
|
|
1361
|
-
if dom.dom_op().prim != "MatMul" and dom.dom_op().prim != "BatchMatMul":
|
|
1362
|
-
return []
|
|
1363
|
-
fused = []
|
|
1364
|
-
for a, _ in dom.out_relations.items():
|
|
1365
|
-
if (((a.dom_op().prim == "AddN" or a.dom_op().prim == "Add" or a.dom_op().prim == "Cast")
|
|
1366
|
-
and dom.dom_op().prim == "MatMul")
|
|
1367
|
-
or (a.pattern == PrimLib.ELEMWISE and dom.dom_op().prim == "BatchMatMul")) \
|
|
1368
|
-
and a.check_acyclic(dom):
|
|
1369
|
-
fused.append(a)
|
|
1370
|
-
return fused, False
|
|
1371
|
-
|
|
1372
|
-
def _reduce_output(dom):
|
|
1373
|
-
if dom.pattern != PrimLib.REDUCE:
|
|
1374
|
-
return []
|
|
1375
|
-
op_attrs = dom.dom_op().attrs
|
|
1376
|
-
if not op_attrs.get('reduce_output_fuse'):
|
|
1377
|
-
return []
|
|
1378
|
-
fused = []
|
|
1379
|
-
for a, r in dom.out_relations.items():
|
|
1380
|
-
if a.pattern <= PrimLib.BROADCAST and r <= PrimLib.BROADCAST and \
|
|
1381
|
-
dom.check_acyclic(a):
|
|
1382
|
-
fused.append(a)
|
|
1383
|
-
return fused, False
|
|
1384
|
-
|
|
1385
|
-
def _reduce_stitch(dom):
|
|
1386
|
-
if dom.pattern != PrimLib.REDUCE:
|
|
1387
|
-
return []
|
|
1388
|
-
if tensor_size(dom.ops[0].output) == 1:
|
|
1389
|
-
return []
|
|
1390
|
-
if tensor_size(dom.ops[0].inputs[0]) < 32 * 16 * 16:
|
|
1391
|
-
return []
|
|
1392
|
-
|
|
1393
|
-
fused = []
|
|
1394
|
-
for a, r in dom.out_relations.items():
|
|
1395
|
-
if not may_stitch(dom, a, r, 32, 32 * 16 * 16):
|
|
1396
|
-
continue
|
|
1397
|
-
if a.pattern == PrimLib.REDUCE:
|
|
1398
|
-
if a.ops[0].attrs['reduce_axis'] == dom.ops[0].attrs['reduce_axis']:
|
|
1399
|
-
dom.stitch_info.stitch_ops.add(dom.ops[0].output.name)
|
|
1400
|
-
fused.append(a)
|
|
1401
|
-
elif a.pattern <= PrimLib.BROADCAST:
|
|
1402
|
-
dom.stitch_info.stitch_ops.add(dom.ops[0].output.name)
|
|
1403
|
-
fused.append(a)
|
|
1404
|
-
return fused, False
|
|
1405
|
-
|
|
1406
|
-
def _transdata_pattern_support(dom, a):
|
|
1407
|
-
transdata_op = dom.dom_op()
|
|
1408
|
-
|
|
1409
|
-
# Currently, if transdata has the pad, it is not used to fuse
|
|
1410
|
-
def _has_pad():
|
|
1411
|
-
res = False
|
|
1412
|
-
input_shape = transdata_op.inputs[0].shape
|
|
1413
|
-
output_shape = transdata_op.output.shape
|
|
1414
|
-
cube_size = 16
|
|
1415
|
-
for dim in input_shape[-2:]:
|
|
1416
|
-
if dim % cube_size != 0:
|
|
1417
|
-
res = True
|
|
1418
|
-
for dim in output_shape[-2:]:
|
|
1419
|
-
if dim % cube_size != 0:
|
|
1420
|
-
res = True
|
|
1421
|
-
return res
|
|
1422
|
-
|
|
1423
|
-
has_pad = _has_pad()
|
|
1424
|
-
if has_pad:
|
|
1425
|
-
return False
|
|
1426
|
-
|
|
1427
|
-
if a.dom_op().prim == "MatMul" and len(dom.ops) == 1:
|
|
1428
|
-
return True
|
|
1429
|
-
|
|
1430
|
-
# reshape/elewise/broadcast + transdata
|
|
1431
|
-
if a.pattern <= PrimLib.BROADCAST and len(dom.ops) == 1:
|
|
1432
|
-
op_attrs = dom.dom_op().attrs
|
|
1433
|
-
if 'src_format' not in op_attrs.keys() \
|
|
1434
|
-
or 'dst_format' not in op_attrs.keys():
|
|
1435
|
-
logger.error("For 'TransData', can not find the attr 'src_format' or 'dst_format'")
|
|
1436
|
-
return False
|
|
1437
|
-
src_format, dst_format = op_attrs['src_format'], op_attrs['dst_format']
|
|
1438
|
-
if src_format == DF.FRAC_NZ and dst_format in (DF.DEFAULT, DF.NCHW):
|
|
1439
|
-
return True
|
|
1440
|
-
# For the Default/NCHW to FRAC_NZ, currently only the Cast+Transdata is supported
|
|
1441
|
-
if src_format in (DF.DEFAULT, DF.NCHW) and dst_format == DF.FRAC_NZ \
|
|
1442
|
-
and len(a.ops) == 1 and a.dom_op().prim == "Cast" and not a.is_output:
|
|
1443
|
-
return True
|
|
1444
|
-
return False
|
|
1445
|
-
|
|
1446
|
-
def _transdata(dom):
|
|
1447
|
-
if dom.dom_op().prim != "TransData":
|
|
1448
|
-
return []
|
|
1449
|
-
fused = []
|
|
1450
|
-
for a, _ in dom.in_relations.items():
|
|
1451
|
-
if _transdata_pattern_support(dom, a) and a.check_acyclic(dom):
|
|
1452
|
-
fused.append(a)
|
|
1453
|
-
return fused, True
|
|
1454
|
-
|
|
1455
|
-
def _fuse_loop():
|
|
1456
|
-
self.fuse(CommonPattern.reshape)
|
|
1457
|
-
self.fuse(CommonPattern.assign)
|
|
1458
|
-
self.fuse(CommonPattern.elemwise_depth)
|
|
1459
|
-
self.fuse(CommonPattern.elemwise_width)
|
|
1460
|
-
self.fuse(CommonPattern.broadcast_depth)
|
|
1461
|
-
self.fuse(CommonPattern.broadcast_width)
|
|
1462
|
-
self.fuse(_reduce_depth)
|
|
1463
|
-
self.fuse(_reduce_width)
|
|
1464
|
-
self.fuse(_broadcast_bwd_depth)
|
|
1465
|
-
self.fuse(_broadcast_bwd_width)
|
|
1466
|
-
self.fuse(_matmul_depth)
|
|
1467
|
-
self.fuse(_reduce_output)
|
|
1468
|
-
if self.enable_stitch_fusion:
|
|
1469
|
-
self.fuse(_reduce_stitch, True)
|
|
1470
|
-
self.fuse(_transdata)
|
|
1471
|
-
|
|
1472
|
-
def _fuse_once(fuse_func):
|
|
1473
|
-
if fuse_func(CommonPattern.reshape) or \
|
|
1474
|
-
fuse_func(CommonPattern.elemwise_depth) or fuse_func(CommonPattern.elemwise_width) or \
|
|
1475
|
-
fuse_func(CommonPattern.broadcast_depth) or fuse_func(CommonPattern.broadcast_width) or \
|
|
1476
|
-
fuse_func(_reduce_depth) or fuse_func(_reduce_width) or \
|
|
1477
|
-
fuse_func(_broadcast_bwd_depth) or fuse_func(_broadcast_bwd_width) or \
|
|
1478
|
-
fuse_func(_matmul_depth) or fuse_func(_reduce_output) or fuse_func(_transdata):
|
|
1479
|
-
pass
|
|
1480
|
-
|
|
1481
|
-
if fuse_func is None:
|
|
1482
|
-
_fuse_loop()
|
|
1483
|
-
else:
|
|
1484
|
-
_fuse_once(fuse_func)
|
|
1485
|
-
|
|
1486
|
-
|
|
1487
1333
|
def split(graph, target, flags):
|
|
1488
1334
|
"""Split graph"""
|
|
1489
1335
|
result = None
|
|
1490
1336
|
if target == "cuda":
|
|
1491
1337
|
result = GraphSplitGpu(graph, flags).split()
|
|
1492
|
-
else:
|
|
1493
|
-
result = GraphSplitAscend(graph, flags).split()
|
|
1494
1338
|
return result
|
|
@@ -21,7 +21,7 @@ from multiprocessing import Pool, cpu_count
|
|
|
21
21
|
from mindspore import log as logger
|
|
22
22
|
from mindspore._extends.parallel_compile.akg_compiler.get_file_path import get_akg_path
|
|
23
23
|
from mindspore._extends.parallel_compile.akg_compiler.util import get_ascend_compile_dirs, create_compile_dirs, \
|
|
24
|
-
get_log_level, update_attr, select_best, print_compile_log, check_tbe_support
|
|
24
|
+
get_log_level, update_attr, select_best, print_compile_log, check_tbe_support, get_kernel_meta_parent_dir
|
|
25
25
|
|
|
26
26
|
|
|
27
27
|
def _compile_akg_task_default(json_strs, attrs):
|
|
@@ -35,6 +35,7 @@ def _compile_akg_task_default(json_strs, attrs):
|
|
|
35
35
|
sys.path.insert(0, get_akg_path())
|
|
36
36
|
p = __import__("akg", globals(), locals(), ['ms'], 0)
|
|
37
37
|
func = getattr(p.ms, "compilewithjson")
|
|
38
|
+
os.environ["MS_COMPILER_CACHE_PATH"] = get_kernel_meta_parent_dir(attrs)
|
|
38
39
|
|
|
39
40
|
for json_str in json_strs:
|
|
40
41
|
res = func(json_str, attrs)
|
|
@@ -66,12 +67,12 @@ def _compile_akg_task_ascend(json_strs, attrs):
|
|
|
66
67
|
return
|
|
67
68
|
log_level = get_log_level(attrs)
|
|
68
69
|
compiler = os.path.join(os.path.split(os.path.realpath(__file__))[0], "compiler.py")
|
|
69
|
-
compile_dirs = get_ascend_compile_dirs()
|
|
70
|
+
compile_dirs = get_ascend_compile_dirs(attrs)
|
|
70
71
|
kernel_meta_dir = compile_dirs.get("kernel_meta_dir")
|
|
71
72
|
akg_compile_dir = compile_dirs.get("akg_compile_dir")
|
|
72
73
|
tbe_compile_dir = compile_dirs.get("tbe_compile_dir")
|
|
73
74
|
composite_graph_dir = compile_dirs.get("composite_graph_dir")
|
|
74
|
-
attrs = update_attr(attrs, {"dump_composite_graph": composite_graph_dir})
|
|
75
|
+
attrs = update_attr(attrs, {"dump_composite_graph": composite_graph_dir, "optimize_for_tbe": True})
|
|
75
76
|
for json_str in json_strs:
|
|
76
77
|
json_desc = json.loads(json_str)
|
|
77
78
|
op_name = json_desc["op"]
|
|
@@ -87,11 +88,13 @@ def _compile_akg_task_ascend(json_strs, attrs):
|
|
|
87
88
|
_compile_subprocess(compiler, akg_compile_dir, info_path, "AKG", attrs, compile_log, log_level)
|
|
88
89
|
|
|
89
90
|
# Load composite optimized json str and compile it with TBE
|
|
90
|
-
|
|
91
|
-
if
|
|
92
|
-
composite_graph_path =
|
|
93
|
-
|
|
94
|
-
|
|
91
|
+
composite_graph_path = os.path.join(composite_graph_dir, op_name + ".info")
|
|
92
|
+
if not os.path.isfile(composite_graph_path):
|
|
93
|
+
composite_graph_path = info_path
|
|
94
|
+
with open(composite_graph_path, 'r') as f:
|
|
95
|
+
composite_graph = f.read()
|
|
96
|
+
if "buffer_stitch" not in json_desc and "parallel_fusion" not in json_desc and \
|
|
97
|
+
check_tbe_support(json.loads(composite_graph)):
|
|
95
98
|
_compile_subprocess(compiler, tbe_compile_dir, composite_graph_path, "TBE", attrs, compile_log, log_level)
|
|
96
99
|
|
|
97
100
|
print_compile_log(compile_log)
|
|
@@ -149,7 +152,7 @@ class AkgProcess:
|
|
|
149
152
|
"not be zero.")
|
|
150
153
|
args = list((arg, attrs) for arg in self.args)
|
|
151
154
|
if self.platform == "ASCEND":
|
|
152
|
-
create_compile_dirs(get_ascend_compile_dirs())
|
|
155
|
+
create_compile_dirs(get_ascend_compile_dirs(attrs))
|
|
153
156
|
with Pool(processes=self.process_num) as pool:
|
|
154
157
|
res = pool.starmap_async(_compile_akg_task_ascend, args)
|
|
155
158
|
res.get(timeout=self.wait_time)
|