mindspore-2.2.14-cp39-cp39-win_amd64.whl → mindspore-2.4.0-cp39-cp39-win_amd64.whl
This diff represents the changes between publicly available package versions as they appear in their respective public registries, and is provided for informational purposes only.
Potentially problematic release: the registry has flagged this version of mindspore as potentially problematic.
- mindspore/.commit_id +1 -1
- mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
- mindspore/Newtonsoft.Json.dll +0 -0
- mindspore/__init__.py +8 -5
- mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
- mindspore/_checkparam.py +124 -25
- mindspore/_extends/builtin_operations.py +2 -1
- mindspore/_extends/graph_kernel/model/graph_parallel.py +16 -6
- mindspore/_extends/parallel_compile/akg_compiler/akg_process.py +3 -16
- mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +16 -4
- mindspore/_extends/parallel_compile/akg_compiler/compiler.py +1 -0
- mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +96 -0
- mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +2 -1
- mindspore/_extends/parallel_compile/akg_compiler/util.py +5 -2
- mindspore/_extends/parse/__init__.py +18 -14
- mindspore/_extends/parse/compile_config.py +299 -0
- mindspore/_extends/parse/namespace.py +2 -2
- mindspore/_extends/parse/parser.py +182 -68
- mindspore/_extends/parse/resources.py +45 -14
- mindspore/_extends/parse/standard_method.py +192 -252
- mindspore/{ops/_op_impl/tbe/atomic_addr_clean.py → _extends/pijit/__init__.py} +6 -16
- mindspore/_extends/pijit/pijit_func_white_list.py +669 -0
- mindspore/_extends/remote/kernel_build_server.py +2 -0
- mindspore/_profiler.py +30 -0
- mindspore/amp.py +67 -26
- mindspore/atlprov.dll +0 -0
- mindspore/avcodec-59.dll +0 -0
- mindspore/avdevice-59.dll +0 -0
- mindspore/avfilter-8.dll +0 -0
- mindspore/avformat-59.dll +0 -0
- mindspore/avutil-57.dll +0 -0
- mindspore/boost/adasum.py +1 -1
- mindspore/boost/base.py +1 -1
- mindspore/boost/boost_cell_wrapper.py +2 -2
- mindspore/boost/grad_freeze.py +2 -2
- mindspore/boost/group_loss_scale_manager.py +1 -1
- mindspore/boost/less_batch_normalization.py +9 -6
- mindspore/c1.dll +0 -0
- mindspore/c1xx.dll +0 -0
- mindspore/c2.dll +0 -0
- mindspore/common/__init__.py +20 -7
- mindspore/common/_jit_fallback_utils.py +2 -3
- mindspore/common/_pijit_context.py +190 -0
- mindspore/common/_register_for_adapter.py +7 -0
- mindspore/common/_register_for_recompute.py +48 -0
- mindspore/common/_register_for_tensor.py +10 -10
- mindspore/common/_stub_tensor.py +7 -1
- mindspore/common/_tensor_overload.py +139 -0
- mindspore/common/_utils.py +5 -17
- mindspore/common/api.py +449 -129
- mindspore/common/auto_dynamic_shape.py +27 -14
- mindspore/common/dtype.py +17 -10
- mindspore/common/dump.py +8 -11
- mindspore/common/file_system.py +48 -0
- mindspore/common/generator.py +254 -0
- mindspore/common/hook_handle.py +65 -30
- mindspore/common/initializer.py +1 -1
- mindspore/common/jit_config.py +34 -14
- mindspore/common/lazy_inline.py +72 -19
- mindspore/common/mindir_util.py +12 -2
- mindspore/common/mutable.py +79 -14
- mindspore/common/no_inline.py +54 -0
- mindspore/common/np_dtype.py +25 -0
- mindspore/common/parameter.py +73 -21
- mindspore/common/recompute.py +292 -0
- mindspore/common/seed.py +9 -9
- mindspore/common/sparse_tensor.py +276 -24
- mindspore/common/symbol.py +122 -0
- mindspore/common/tensor.py +668 -514
- mindspore/communication/__init__.py +6 -11
- mindspore/communication/_comm_helper.py +43 -3
- mindspore/communication/comm_func.py +1395 -0
- mindspore/communication/management.py +117 -104
- mindspore/config/op_info.config +22 -54
- mindspore/context.py +455 -71
- mindspore/dataset/__init__.py +5 -5
- mindspore/dataset/audio/__init__.py +6 -6
- mindspore/dataset/audio/transforms.py +711 -158
- mindspore/dataset/callback/ds_callback.py +2 -2
- mindspore/dataset/core/config.py +7 -0
- mindspore/dataset/core/validator_helpers.py +7 -0
- mindspore/dataset/engine/cache_client.py +2 -2
- mindspore/dataset/engine/datasets.py +201 -116
- mindspore/dataset/engine/datasets_audio.py +14 -14
- mindspore/dataset/engine/datasets_standard_format.py +83 -3
- mindspore/dataset/engine/datasets_text.py +39 -39
- mindspore/dataset/engine/datasets_user_defined.py +230 -141
- mindspore/dataset/engine/datasets_vision.py +78 -74
- mindspore/dataset/engine/iterators.py +29 -0
- mindspore/dataset/engine/obs/util.py +7 -0
- mindspore/dataset/engine/offload.py +5 -7
- mindspore/dataset/engine/queue.py +138 -66
- mindspore/dataset/engine/serializer_deserializer.py +2 -2
- mindspore/dataset/engine/validators.py +41 -15
- mindspore/dataset/text/__init__.py +2 -5
- mindspore/dataset/text/transforms.py +408 -121
- mindspore/dataset/text/utils.py +9 -9
- mindspore/dataset/transforms/__init__.py +0 -3
- mindspore/dataset/transforms/transforms.py +261 -76
- mindspore/dataset/utils/browse_dataset.py +9 -9
- mindspore/dataset/utils/line_reader.py +2 -0
- mindspore/dataset/vision/__init__.py +7 -10
- mindspore/dataset/vision/c_transforms.py +10 -10
- mindspore/dataset/vision/py_transforms_util.py +1 -1
- mindspore/dataset/vision/transforms.py +2844 -549
- mindspore/dataset/vision/utils.py +161 -10
- mindspore/dataset/vision/validators.py +16 -3
- mindspore/dnnl.dll +0 -0
- mindspore/dpcmi.dll +0 -0
- mindspore/{rewrite/ast_creator_register.py → experimental/es/__init__.py} +5 -20
- mindspore/experimental/es/embedding_service.py +883 -0
- mindspore/experimental/es/embedding_service_layer.py +581 -0
- mindspore/experimental/llm_boost/__init__.py +21 -0
- mindspore/experimental/llm_boost/atb/__init__.py +23 -0
- mindspore/experimental/llm_boost/atb/boost_base.py +211 -0
- mindspore/experimental/llm_boost/atb/llama_boost.py +115 -0
- mindspore/experimental/llm_boost/atb/qwen_boost.py +101 -0
- mindspore/experimental/llm_boost/register.py +129 -0
- mindspore/experimental/llm_boost/utils.py +31 -0
- mindspore/experimental/optim/__init__.py +12 -2
- mindspore/experimental/optim/adadelta.py +161 -0
- mindspore/experimental/optim/adagrad.py +168 -0
- mindspore/experimental/optim/adam.py +35 -34
- mindspore/experimental/optim/adamax.py +170 -0
- mindspore/experimental/optim/adamw.py +124 -15
- mindspore/experimental/optim/asgd.py +153 -0
- mindspore/experimental/optim/lr_scheduler.py +66 -121
- mindspore/experimental/optim/nadam.py +157 -0
- mindspore/experimental/optim/optimizer.py +18 -8
- mindspore/experimental/optim/radam.py +194 -0
- mindspore/experimental/optim/rmsprop.py +154 -0
- mindspore/experimental/optim/rprop.py +164 -0
- mindspore/experimental/optim/sgd.py +28 -19
- mindspore/hal/__init__.py +40 -0
- mindspore/hal/_ascend.py +57 -0
- mindspore/hal/_base.py +57 -0
- mindspore/hal/_cpu.py +56 -0
- mindspore/hal/_gpu.py +57 -0
- mindspore/hal/contiguous_tensors_handle.py +175 -0
- mindspore/hal/device.py +356 -0
- mindspore/hal/event.py +179 -0
- mindspore/hal/memory.py +326 -0
- mindspore/hal/stream.py +357 -0
- mindspore/include/api/data_type.h +2 -2
- mindspore/include/api/dual_abi_helper.h +16 -3
- mindspore/include/api/model.h +4 -3
- mindspore/include/api/model_group.h +13 -1
- mindspore/include/api/status.h +14 -0
- mindspore/include/api/types.h +10 -10
- mindspore/include/c_api/model_c.h +173 -0
- mindspore/include/c_api/types_c.h +19 -0
- mindspore/include/dataset/config.h +2 -2
- mindspore/include/dataset/constants.h +2 -2
- mindspore/include/dataset/execute.h +3 -5
- mindspore/include/dataset/vision.h +58 -2
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +3 -3
- mindspore/mindrecord/__init__.py +5 -1
- mindspore/mindrecord/config.py +809 -0
- mindspore/mindrecord/filereader.py +25 -0
- mindspore/mindrecord/filewriter.py +138 -103
- mindspore/mindrecord/mindpage.py +40 -6
- mindspore/mindrecord/shardutils.py +3 -2
- mindspore/mindrecord/shardwriter.py +7 -0
- mindspore/mindrecord/tools/cifar100_to_mr.py +8 -13
- mindspore/mindrecord/tools/cifar10_to_mr.py +9 -15
- mindspore/mindrecord/tools/csv_to_mr.py +4 -9
- mindspore/mindrecord/tools/imagenet_to_mr.py +3 -8
- mindspore/mindrecord/tools/mnist_to_mr.py +7 -12
- mindspore/mindrecord/tools/tfrecord_to_mr.py +1 -6
- mindspore/mindspore_backend.dll +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_np_dtype.dll +0 -0
- mindspore/mindspore_ops.dll +0 -0
- mindspore/mint/__init__.py +1586 -0
- mindspore/mint/distributed/__init__.py +31 -0
- mindspore/mint/distributed/distributed.py +254 -0
- mindspore/{rewrite/ast_transformers → mint/linalg}/__init__.py +9 -4
- mindspore/mint/nn/__init__.py +757 -0
- mindspore/mint/nn/functional.py +679 -0
- mindspore/mint/nn/layer/__init__.py +39 -0
- mindspore/mint/nn/layer/activation.py +133 -0
- mindspore/mint/nn/layer/normalization.py +477 -0
- mindspore/mint/nn/layer/pooling.py +110 -0
- mindspore/mint/optim/__init__.py +24 -0
- mindspore/mint/optim/adamw.py +206 -0
- mindspore/mint/special/__init__.py +63 -0
- mindspore/msobj140.dll +0 -0
- mindspore/mspdb140.dll +0 -0
- mindspore/mspdbcore.dll +0 -0
- mindspore/mspdbst.dll +0 -0
- mindspore/mspft140.dll +0 -0
- mindspore/msvcdis140.dll +0 -0
- mindspore/msvcp140_1.dll +0 -0
- mindspore/msvcp140_2.dll +0 -0
- mindspore/msvcp140_atomic_wait.dll +0 -0
- mindspore/msvcp140_codecvt_ids.dll +0 -0
- mindspore/multiprocessing/__init__.py +73 -0
- mindspore/nn/cell.py +461 -323
- mindspore/nn/dynamic_lr.py +2 -2
- mindspore/nn/layer/activation.py +292 -135
- mindspore/nn/layer/basic.py +288 -83
- mindspore/nn/layer/channel_shuffle.py +3 -16
- mindspore/nn/layer/container.py +3 -3
- mindspore/nn/layer/conv.py +75 -66
- mindspore/nn/layer/embedding.py +221 -45
- mindspore/nn/layer/image.py +4 -7
- mindspore/nn/layer/math.py +1 -1
- mindspore/nn/layer/normalization.py +150 -68
- mindspore/nn/layer/padding.py +64 -87
- mindspore/nn/layer/pooling.py +175 -12
- mindspore/nn/layer/rnn_cells.py +6 -16
- mindspore/nn/layer/rnns.py +6 -5
- mindspore/nn/layer/thor_layer.py +1 -2
- mindspore/nn/layer/timedistributed.py +1 -1
- mindspore/nn/layer/transformer.py +55 -53
- mindspore/nn/learning_rate_schedule.py +6 -5
- mindspore/nn/loss/__init__.py +2 -2
- mindspore/nn/loss/loss.py +145 -88
- mindspore/nn/optim/__init__.py +2 -1
- mindspore/nn/optim/ada_grad.py +4 -2
- mindspore/nn/optim/adadelta.py +4 -2
- mindspore/nn/optim/adafactor.py +1 -1
- mindspore/nn/optim/adam.py +102 -181
- mindspore/nn/optim/adamax.py +4 -2
- mindspore/nn/optim/adasum.py +3 -3
- mindspore/nn/optim/asgd.py +4 -2
- mindspore/nn/optim/ftrl.py +31 -61
- mindspore/nn/optim/lamb.py +5 -3
- mindspore/nn/optim/lars.py +2 -2
- mindspore/nn/optim/lazyadam.py +6 -4
- mindspore/nn/optim/momentum.py +13 -25
- mindspore/nn/optim/optimizer.py +6 -3
- mindspore/nn/optim/proximal_ada_grad.py +4 -2
- mindspore/nn/optim/rmsprop.py +9 -3
- mindspore/nn/optim/rprop.py +4 -2
- mindspore/nn/optim/sgd.py +5 -3
- mindspore/nn/optim/tft_wrapper.py +127 -0
- mindspore/nn/optim/thor.py +2 -2
- mindspore/nn/probability/distribution/_utils/custom_ops.py +2 -2
- mindspore/nn/probability/distribution/beta.py +2 -2
- mindspore/nn/probability/distribution/categorical.py +4 -6
- mindspore/nn/probability/distribution/cauchy.py +2 -2
- mindspore/nn/probability/distribution/exponential.py +2 -2
- mindspore/nn/probability/distribution/geometric.py +1 -1
- mindspore/nn/probability/distribution/gumbel.py +2 -2
- mindspore/nn/probability/distribution/logistic.py +1 -1
- mindspore/nn/probability/distribution/poisson.py +2 -2
- mindspore/nn/probability/distribution/uniform.py +2 -2
- mindspore/nn/reinforcement/_tensors_queue.py +13 -1
- mindspore/nn/wrap/__init__.py +2 -1
- mindspore/nn/wrap/cell_wrapper.py +46 -12
- mindspore/nn/wrap/grad_reducer.py +148 -8
- mindspore/nn/wrap/loss_scale.py +44 -7
- mindspore/numpy/__init__.py +2 -0
- mindspore/numpy/array_creations.py +67 -68
- mindspore/numpy/array_ops.py +70 -66
- mindspore/numpy/dtypes.py +3 -3
- mindspore/numpy/fft.py +966 -0
- mindspore/numpy/logic_ops.py +11 -10
- mindspore/numpy/math_ops.py +147 -152
- mindspore/numpy/utils.py +3 -0
- mindspore/numpy/utils_const.py +4 -4
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +9 -6
- mindspore/ops/_grad_experimental/grad_array_ops.py +4 -129
- mindspore/ops/_grad_experimental/grad_comm_ops.py +135 -36
- mindspore/ops/_grad_experimental/grad_math_ops.py +61 -298
- mindspore/ops/_grad_experimental/grad_nn_ops.py +0 -53
- mindspore/ops/_grad_experimental/grad_quant_ops.py +3 -3
- mindspore/ops/_grad_experimental/grad_sparse.py +1 -1
- mindspore/ops/_grad_experimental/grad_sparse_ops.py +3 -3
- mindspore/ops/_op_impl/__init__.py +0 -1
- mindspore/ops/_op_impl/aicpu/gamma.py +2 -0
- mindspore/ops/_op_impl/aicpu/generate_eod_mask.py +1 -1
- mindspore/ops/_op_impl/aicpu/log_uniform_candidate_sampler.py +1 -3
- mindspore/ops/_op_impl/aicpu/poisson.py +2 -0
- mindspore/ops/_op_impl/cpu/__init__.py +1 -3
- mindspore/ops/_op_impl/cpu/adam.py +2 -2
- mindspore/ops/_op_impl/cpu/adam_weight_decay.py +3 -2
- mindspore/ops/_op_impl/cpu/maximum_grad.py +16 -14
- mindspore/ops/_op_impl/cpu/minimum_grad.py +8 -0
- mindspore/ops/_vmap/vmap_array_ops.py +162 -101
- mindspore/ops/_vmap/vmap_base.py +8 -1
- mindspore/ops/_vmap/vmap_grad_math_ops.py +95 -9
- mindspore/ops/_vmap/vmap_grad_nn_ops.py +143 -58
- mindspore/ops/_vmap/vmap_image_ops.py +70 -13
- mindspore/ops/_vmap/vmap_math_ops.py +147 -59
- mindspore/ops/_vmap/vmap_nn_ops.py +292 -117
- mindspore/ops/_vmap/vmap_other_ops.py +1 -1
- mindspore/ops/auto_generate/__init__.py +31 -0
- mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +309 -0
- mindspore/ops/auto_generate/gen_arg_dtype_cast.py +252 -0
- mindspore/ops/auto_generate/gen_arg_handler.py +197 -0
- mindspore/ops/auto_generate/gen_extend_func.py +1701 -0
- mindspore/ops/auto_generate/gen_ops_def.py +8482 -0
- mindspore/ops/auto_generate/gen_ops_prim.py +16704 -0
- mindspore/ops/auto_generate/pyboost_inner_prim.py +549 -0
- mindspore/ops/composite/__init__.py +5 -2
- mindspore/ops/composite/base.py +201 -66
- mindspore/ops/composite/math_ops.py +10 -49
- mindspore/ops/composite/multitype_ops/_compile_utils.py +192 -618
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +25 -134
- mindspore/ops/composite/multitype_ops/add_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/bitwise_and_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/bitwise_or_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/bitwise_xor_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/div_impl.py +8 -0
- mindspore/ops/composite/multitype_ops/equal_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/floordiv_impl.py +8 -0
- mindspore/ops/composite/multitype_ops/getitem_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/greater_equal_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/greater_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/in_impl.py +8 -2
- mindspore/ops/composite/multitype_ops/left_shift_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/less_equal_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/less_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/logic_not_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/logical_and_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/logical_or_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/mod_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/mul_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/negative_impl.py +9 -3
- mindspore/ops/composite/multitype_ops/not_equal_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/not_in_impl.py +8 -3
- mindspore/ops/composite/multitype_ops/ones_like_impl.py +2 -2
- mindspore/ops/composite/multitype_ops/pow_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/right_shift_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/setitem_impl.py +32 -21
- mindspore/ops/composite/multitype_ops/sub_impl.py +6 -0
- mindspore/ops/composite/multitype_ops/zeros_like_impl.py +6 -3
- mindspore/ops/deprecated.py +14 -3
- mindspore/ops/function/__init__.py +53 -11
- mindspore/ops/function/array_func.py +1269 -1821
- mindspore/ops/function/clip_func.py +19 -31
- mindspore/ops/function/debug_func.py +114 -5
- mindspore/ops/function/fft_func.py +44 -0
- mindspore/ops/function/grad/grad_func.py +30 -22
- mindspore/ops/function/image_func.py +27 -21
- mindspore/ops/function/linalg_func.py +35 -68
- mindspore/ops/function/math_func.py +1170 -2697
- mindspore/ops/function/nn_func.py +2116 -1128
- mindspore/ops/function/other_func.py +8 -8
- mindspore/ops/function/parameter_func.py +5 -93
- mindspore/ops/function/random_func.py +435 -113
- mindspore/ops/function/reshard_func.py +104 -0
- mindspore/ops/function/sparse_func.py +4 -4
- mindspore/ops/function/sparse_unary_func.py +9 -16
- mindspore/ops/function/spectral_func.py +1 -1
- mindspore/ops/function/vmap_func.py +16 -15
- mindspore/ops/functional.py +355 -346
- mindspore/ops/op_info_register.py +18 -45
- mindspore/ops/operations/__init__.py +38 -24
- mindspore/ops/operations/_grad_ops.py +21 -927
- mindspore/ops/operations/_infer_ops.py +19 -0
- mindspore/ops/operations/_inner_ops.py +173 -607
- mindspore/ops/operations/_rl_inner_ops.py +2 -2
- mindspore/ops/operations/_scalar_ops.py +5 -480
- mindspore/ops/operations/_sequence_ops.py +6 -36
- mindspore/ops/operations/_tensor_array.py +8 -8
- mindspore/ops/operations/array_ops.py +106 -2837
- mindspore/ops/operations/comm_ops.py +799 -127
- mindspore/ops/operations/custom_ops.py +124 -119
- mindspore/ops/operations/debug_ops.py +142 -41
- mindspore/ops/operations/image_ops.py +1 -217
- mindspore/ops/operations/inner_ops.py +5 -40
- mindspore/ops/operations/linalg_ops.py +1 -49
- mindspore/ops/operations/manually_defined/__init__.py +24 -0
- mindspore/ops/operations/manually_defined/_inner.py +73 -0
- mindspore/ops/operations/manually_defined/ops_def.py +2271 -0
- mindspore/ops/operations/math_ops.py +666 -4972
- mindspore/ops/operations/nn_ops.py +205 -2213
- mindspore/ops/operations/other_ops.py +60 -49
- mindspore/ops/operations/random_ops.py +50 -54
- mindspore/ops/operations/reshard_ops.py +53 -0
- mindspore/ops/operations/sparse_ops.py +4 -4
- mindspore/ops/primitive.py +216 -103
- mindspore/ops_generate/__init__.py +27 -0
- mindspore/ops_generate/arg_dtype_cast.py +252 -0
- mindspore/ops_generate/arg_handler.py +197 -0
- mindspore/ops_generate/gen_aclnn_implement.py +263 -0
- mindspore/ops_generate/gen_constants.py +36 -0
- mindspore/ops_generate/gen_ops.py +1099 -0
- mindspore/ops_generate/gen_ops_inner_prim.py +131 -0
- mindspore/ops_generate/gen_pyboost_func.py +1052 -0
- mindspore/ops_generate/gen_utils.py +209 -0
- mindspore/ops_generate/op_proto.py +145 -0
- mindspore/ops_generate/pyboost_utils.py +367 -0
- mindspore/ops_generate/template.py +261 -0
- mindspore/parallel/__init__.py +8 -4
- mindspore/parallel/_auto_parallel_context.py +100 -10
- mindspore/parallel/_cell_wrapper.py +99 -9
- mindspore/parallel/_cost_model_context.py +1 -1
- mindspore/parallel/_dp_allreduce_fusion.py +159 -159
- mindspore/parallel/_parallel_serialization.py +67 -23
- mindspore/parallel/_ps_context.py +1 -1
- mindspore/parallel/_recovery_context.py +1 -1
- mindspore/parallel/_tensor.py +99 -22
- mindspore/parallel/_transformer/__init__.py +1 -1
- mindspore/parallel/_transformer/layers.py +1 -1
- mindspore/parallel/_transformer/loss.py +1 -1
- mindspore/parallel/_transformer/moe.py +1 -1
- mindspore/parallel/_transformer/op_parallel_config.py +1 -1
- mindspore/parallel/_transformer/transformer.py +2 -2
- mindspore/parallel/_utils.py +173 -6
- mindspore/parallel/algo_parameter_config.py +8 -10
- mindspore/parallel/checkpoint_transform.py +204 -38
- mindspore/parallel/cluster/__init__.py +15 -0
- mindspore/parallel/cluster/process_entity/__init__.py +18 -0
- mindspore/parallel/cluster/process_entity/_api.py +352 -0
- mindspore/parallel/cluster/process_entity/_utils.py +101 -0
- mindspore/parallel/cluster/run.py +136 -0
- mindspore/parallel/mpi/__init__.py +1 -1
- mindspore/parallel/mpi/_mpi_config.py +1 -1
- mindspore/parallel/parameter_broadcast.py +151 -0
- mindspore/parallel/shard.py +279 -37
- mindspore/parallel/transform_safetensors.py +993 -0
- mindspore/pgodb140.dll +0 -0
- mindspore/pgort140.dll +0 -0
- mindspore/profiler/__init__.py +4 -2
- mindspore/profiler/common/constant.py +29 -0
- mindspore/profiler/common/process_pool.py +41 -0
- mindspore/profiler/common/registry.py +47 -0
- mindspore/profiler/common/singleton.py +28 -0
- mindspore/profiler/common/util.py +153 -0
- mindspore/profiler/dynamic_profiler.py +694 -0
- mindspore/profiler/envprofiling.py +18 -20
- mindspore/{_extends/parallel_compile/tbe_compiler → profiler/parser/ascend_analysis}/__init__.py +1 -1
- mindspore/profiler/parser/ascend_analysis/constant.py +71 -0
- mindspore/profiler/parser/ascend_analysis/file_manager.py +180 -0
- mindspore/profiler/parser/ascend_analysis/function_event.py +185 -0
- mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +136 -0
- mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +131 -0
- mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +104 -0
- mindspore/profiler/parser/ascend_analysis/path_manager.py +313 -0
- mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +123 -0
- mindspore/profiler/parser/ascend_analysis/tlv_decoder.py +86 -0
- mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +75 -0
- mindspore/profiler/parser/ascend_cluster_generator.py +14 -9
- mindspore/profiler/parser/ascend_communicate_generator.py +0 -1
- mindspore/profiler/parser/ascend_flops_generator.py +20 -4
- mindspore/profiler/parser/ascend_hccl_generator.py +29 -278
- mindspore/profiler/parser/ascend_integrate_generator.py +42 -0
- mindspore/profiler/parser/ascend_memory_generator.py +185 -0
- mindspore/profiler/parser/ascend_msprof_exporter.py +148 -146
- mindspore/profiler/parser/ascend_msprof_generator.py +73 -283
- mindspore/profiler/parser/ascend_op_generator.py +92 -42
- mindspore/profiler/parser/ascend_timeline_generator.py +298 -133
- mindspore/profiler/parser/base_timeline_generator.py +25 -25
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +25 -12
- mindspore/profiler/parser/framework_parser.py +4 -393
- mindspore/profiler/parser/gpu_analysis/__init__.py +14 -0
- mindspore/profiler/parser/gpu_analysis/function_event.py +44 -0
- mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +89 -0
- mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +72 -0
- mindspore/profiler/parser/integrator.py +3 -1
- mindspore/profiler/parser/memory_usage_parser.py +0 -154
- mindspore/profiler/parser/minddata_parser.py +72 -3
- mindspore/profiler/parser/profiler_info.py +94 -7
- mindspore/profiler/profiler.py +153 -0
- mindspore/profiler/profiling.py +631 -508
- mindspore/rewrite/__init__.py +2 -14
- mindspore/rewrite/api/node.py +122 -36
- mindspore/rewrite/api/pattern_engine.py +2 -3
- mindspore/rewrite/api/scoped_value.py +16 -15
- mindspore/rewrite/api/symbol_tree.py +45 -29
- mindspore/rewrite/ast_helpers/__init__.py +3 -6
- mindspore/rewrite/ast_helpers/ast_converter.py +143 -0
- mindspore/rewrite/ast_helpers/ast_finder.py +48 -0
- mindspore/rewrite/ast_helpers/ast_flattener.py +268 -0
- mindspore/rewrite/ast_helpers/ast_modifier.py +160 -92
- mindspore/rewrite/common/__init__.py +1 -2
- mindspore/rewrite/common/config.py +24 -0
- mindspore/rewrite/common/{rewrite_elog.py → error_log.py} +39 -39
- mindspore/rewrite/{namer.py → common/namer.py} +63 -18
- mindspore/rewrite/common/namespace.py +118 -0
- mindspore/rewrite/node/__init__.py +5 -5
- mindspore/rewrite/node/call_function.py +23 -7
- mindspore/rewrite/node/cell_container.py +7 -3
- mindspore/rewrite/node/control_flow.py +53 -28
- mindspore/rewrite/node/node.py +212 -196
- mindspore/rewrite/node/node_manager.py +51 -22
- mindspore/rewrite/node/node_topological_manager.py +3 -23
- mindspore/rewrite/parsers/__init__.py +12 -0
- mindspore/rewrite/parsers/arguments_parser.py +8 -9
- mindspore/rewrite/parsers/assign_parser.py +637 -413
- mindspore/rewrite/parsers/attribute_parser.py +3 -4
- mindspore/rewrite/parsers/class_def_parser.py +115 -148
- mindspore/rewrite/parsers/constant_parser.py +5 -5
- mindspore/rewrite/parsers/container_parser.py +4 -6
- mindspore/rewrite/parsers/expr_parser.py +55 -0
- mindspore/rewrite/parsers/for_parser.py +31 -98
- mindspore/rewrite/parsers/function_def_parser.py +13 -5
- mindspore/rewrite/parsers/if_parser.py +28 -10
- mindspore/rewrite/parsers/module_parser.py +8 -182
- mindspore/rewrite/parsers/parser.py +1 -5
- mindspore/rewrite/parsers/parser_register.py +1 -1
- mindspore/rewrite/parsers/return_parser.py +5 -10
- mindspore/rewrite/parsers/while_parser.py +59 -0
- mindspore/rewrite/sparsify/utils.py +1 -1
- mindspore/rewrite/symbol_tree/__init__.py +20 -0
- mindspore/rewrite/{symbol_tree.py → symbol_tree/symbol_tree.py} +705 -186
- mindspore/rewrite/{symbol_tree_builder.py → symbol_tree/symbol_tree_builder.py} +8 -8
- mindspore/rewrite/{symbol_tree_dumper.py → symbol_tree/symbol_tree_dumper.py} +4 -4
- mindspore/run_check/_check_version.py +40 -115
- mindspore/run_check/run_check.py +1 -1
- mindspore/safeguard/rewrite_obfuscation.py +597 -263
- mindspore/swresample-4.dll +0 -0
- mindspore/swscale-6.dll +0 -0
- mindspore/tbbmalloc.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +7 -5
- mindspore/train/_utils.py +204 -4
- mindspore/train/amp.py +335 -295
- mindspore/train/anf_ir_pb2.py +14 -2
- mindspore/train/callback/__init__.py +5 -2
- mindspore/train/callback/_backup_and_restore.py +5 -5
- mindspore/train/callback/_callback.py +4 -4
- mindspore/train/callback/_checkpoint.py +220 -43
- mindspore/train/callback/_cluster_monitor.py +201 -0
- mindspore/train/callback/_early_stop.py +2 -2
- mindspore/train/callback/_flops_collector.py +239 -0
- mindspore/train/callback/_landscape.py +15 -9
- mindspore/train/callback/_loss_monitor.py +5 -5
- mindspore/train/callback/_on_request_exit.py +136 -33
- mindspore/train/callback/_reduce_lr_on_plateau.py +2 -2
- mindspore/train/callback/_summary_collector.py +12 -12
- mindspore/train/callback/_tft_register.py +352 -0
- mindspore/train/callback/_time_monitor.py +3 -3
- mindspore/train/data_sink.py +6 -5
- mindspore/train/dataset_helper.py +66 -23
- mindspore/train/loss_scale_manager.py +2 -2
- mindspore/train/metrics/accuracy.py +7 -7
- mindspore/train/metrics/confusion_matrix.py +8 -6
- mindspore/train/metrics/cosine_similarity.py +6 -4
- mindspore/train/metrics/error.py +2 -2
- mindspore/train/metrics/metric.py +3 -3
- mindspore/train/metrics/perplexity.py +2 -1
- mindspore/train/metrics/roc.py +4 -4
- mindspore/train/metrics/topk.py +2 -2
- mindspore/train/mind_ir_pb2.py +116 -37
- mindspore/train/model.py +382 -76
- mindspore/train/serialization.py +787 -288
- mindspore/train/summary/_summary_adapter.py +1 -1
- mindspore/train/summary/summary_record.py +51 -28
- mindspore/train/train_thor/convert_utils.py +3 -3
- mindspore/turbojpeg.dll +0 -0
- mindspore/utils/__init__.py +21 -0
- mindspore/utils/utils.py +60 -0
- mindspore/vcmeta.dll +0 -0
- mindspore/vcruntime140.dll +0 -0
- mindspore/vcruntime140_1.dll +0 -0
- mindspore/version.py +1 -1
- {mindspore-2.2.14.dist-info → mindspore-2.4.0.dist-info}/METADATA +8 -4
- mindspore-2.4.0.dist-info/RECORD +1406 -0
- {mindspore-2.2.14.dist-info → mindspore-2.4.0.dist-info}/entry_points.txt +1 -0
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_adapter.py +0 -662
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +0 -377
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_job.py +0 -201
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_job_manager.py +0 -515
- mindspore/gen_ops.py +0 -273
- mindspore/include/c_api/ms/abstract.h +0 -67
- mindspore/include/c_api/ms/attribute.h +0 -197
- mindspore/include/c_api/ms/base/handle_types.h +0 -43
- mindspore/include/c_api/ms/base/macros.h +0 -32
- mindspore/include/c_api/ms/base/status.h +0 -33
- mindspore/include/c_api/ms/base/types.h +0 -282
- mindspore/include/c_api/ms/context.h +0 -102
- mindspore/include/c_api/ms/graph.h +0 -160
- mindspore/include/c_api/ms/node.h +0 -606
- mindspore/include/c_api/ms/tensor.h +0 -161
- mindspore/include/c_api/ms/value.h +0 -84
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/nn/layer/flash_attention.py +0 -189
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +0 -93
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +0 -66
- mindspore/ops/_op_impl/cpu/concat.py +0 -39
- mindspore/ops/_op_impl/cpu/tensor_shape.py +0 -42
- mindspore/ops/_op_impl/tbe/__init__.py +0 -47
- mindspore/ops/_op_impl/tbe/abs.py +0 -38
- mindspore/ops/_op_impl/tbe/abs_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/abs_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/abs_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/accumulate_n_v2.py +0 -41
- mindspore/ops/_op_impl/tbe/accumulate_n_v2_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/acos.py +0 -37
- mindspore/ops/_op_impl/tbe/acos_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/acos_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/acos_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/acosh.py +0 -37
- mindspore/ops/_op_impl/tbe/acosh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/acosh_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/acosh_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/act_ulq_clamp_max_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/act_ulq_clamp_min_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/acts_ulq.py +0 -45
- mindspore/ops/_op_impl/tbe/acts_ulq_input_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/adam_apply_one.py +0 -50
- mindspore/ops/_op_impl/tbe/adam_apply_one_assign.py +0 -53
- mindspore/ops/_op_impl/tbe/adam_apply_one_ds.py +0 -51
- mindspore/ops/_op_impl/tbe/adam_apply_one_with_decay.py +0 -54
- mindspore/ops/_op_impl/tbe/adam_apply_one_with_decay_assign.py +0 -54
- mindspore/ops/_op_impl/tbe/adam_apply_one_with_decay_ds.py +0 -55
- mindspore/ops/_op_impl/tbe/adaptive_max_pool2d.py +0 -37
- mindspore/ops/_op_impl/tbe/add.py +0 -42
- mindspore/ops/_op_impl/tbe/add_ds.py +0 -43
- mindspore/ops/_op_impl/tbe/add_n.py +0 -39
- mindspore/ops/_op_impl/tbe/add_n_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/addcdiv.py +0 -41
- mindspore/ops/_op_impl/tbe/addcdiv_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/addcmul.py +0 -43
- mindspore/ops/_op_impl/tbe/addcmul_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/apply_ada_max.py +0 -68
- mindspore/ops/_op_impl/tbe/apply_ada_max_ds.py +0 -69
- mindspore/ops/_op_impl/tbe/apply_adadelta.py +0 -66
- mindspore/ops/_op_impl/tbe/apply_adadelta_ds.py +0 -67
- mindspore/ops/_op_impl/tbe/apply_adagrad.py +0 -55
- mindspore/ops/_op_impl/tbe/apply_adagrad_d_a.py +0 -67
- mindspore/ops/_op_impl/tbe/apply_adagrad_ds.py +0 -56
- mindspore/ops/_op_impl/tbe/apply_adagrad_v2.py +0 -48
- mindspore/ops/_op_impl/tbe/apply_adagrad_v2_ds.py +0 -49
- mindspore/ops/_op_impl/tbe/apply_adam.py +0 -79
- mindspore/ops/_op_impl/tbe/apply_adam_ds.py +0 -80
- mindspore/ops/_op_impl/tbe/apply_adam_with_amsgrad.py +0 -60
- mindspore/ops/_op_impl/tbe/apply_adam_with_amsgrad_ds.py +0 -61
- mindspore/ops/_op_impl/tbe/apply_add_sign.py +0 -65
- mindspore/ops/_op_impl/tbe/apply_add_sign_ds.py +0 -66
- mindspore/ops/_op_impl/tbe/apply_centered_rms_prop.py +0 -77
- mindspore/ops/_op_impl/tbe/apply_centered_rms_prop_ds.py +0 -78
- mindspore/ops/_op_impl/tbe/apply_ftrl.py +0 -67
- mindspore/ops/_op_impl/tbe/apply_ftrl_ds.py +0 -68
- mindspore/ops/_op_impl/tbe/apply_gradient_descent.py +0 -44
- mindspore/ops/_op_impl/tbe/apply_gradient_descent_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/apply_keras_momentum.py +0 -49
- mindspore/ops/_op_impl/tbe/apply_momentum.py +0 -64
- mindspore/ops/_op_impl/tbe/apply_momentum_ds.py +0 -65
- mindspore/ops/_op_impl/tbe/apply_power_sign.py +0 -65
- mindspore/ops/_op_impl/tbe/apply_power_sign_ds.py +0 -66
- mindspore/ops/_op_impl/tbe/apply_proximal_adagrad.py +0 -57
- mindspore/ops/_op_impl/tbe/apply_proximal_adagrad_ds.py +0 -58
- mindspore/ops/_op_impl/tbe/apply_proximal_gradient_descent.py +0 -54
- mindspore/ops/_op_impl/tbe/apply_proximal_gradient_descent_ds.py +0 -55
- mindspore/ops/_op_impl/tbe/apply_rms_prop.py +0 -52
- mindspore/ops/_op_impl/tbe/approximate_equal.py +0 -39
- mindspore/ops/_op_impl/tbe/approximate_equal_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/arg_max.py +0 -38
- mindspore/ops/_op_impl/tbe/arg_max_with_value.py +0 -38
- mindspore/ops/_op_impl/tbe/arg_max_with_value_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/arg_min.py +0 -38
- mindspore/ops/_op_impl/tbe/arg_min_v2_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/arg_min_with_value.py +0 -38
- mindspore/ops/_op_impl/tbe/arg_min_with_value_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/asin.py +0 -37
- mindspore/ops/_op_impl/tbe/asin_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/asin_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/asin_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/asinh.py +0 -37
- mindspore/ops/_op_impl/tbe/asinh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/asinh_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/asinh_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/assign.py +0 -79
- mindspore/ops/_op_impl/tbe/assign_add.py +0 -59
- mindspore/ops/_op_impl/tbe/assign_add_ds.py +0 -60
- mindspore/ops/_op_impl/tbe/assign_ds.py +0 -80
- mindspore/ops/_op_impl/tbe/assign_sub.py +0 -55
- mindspore/ops/_op_impl/tbe/assign_sub_ds.py +0 -56
- mindspore/ops/_op_impl/tbe/atan.py +0 -37
- mindspore/ops/_op_impl/tbe/atan2.py +0 -38
- mindspore/ops/_op_impl/tbe/atan2_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/atan_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/atan_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/atan_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/atanh.py +0 -37
- mindspore/ops/_op_impl/tbe/atanh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/avg_pool.py +0 -43
- mindspore/ops/_op_impl/tbe/avg_pool_3d.py +0 -44
- mindspore/ops/_op_impl/tbe/avg_pool_3d_grad.py +0 -45
- mindspore/ops/_op_impl/tbe/avg_pool_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/avg_pool_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/avg_pool_grad_vm.py +0 -42
- mindspore/ops/_op_impl/tbe/basic_lstm_cell.py +0 -57
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_c_state_grad.py +0 -50
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_c_state_grad_v2.py +0 -51
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_input_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_weight_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/batch_matmul.py +0 -42
- mindspore/ops/_op_impl/tbe/batch_matmul_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/batch_matmul_v2.py +0 -47
- mindspore/ops/_op_impl/tbe/batch_to_space.py +0 -38
- mindspore/ops/_op_impl/tbe/batch_to_space_nd.py +0 -38
- mindspore/ops/_op_impl/tbe/batch_to_space_nd_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/batch_to_space_nd_v2.py +0 -41
- mindspore/ops/_op_impl/tbe/batchnorm.py +0 -58
- mindspore/ops/_op_impl/tbe/batchnorm_grad.py +0 -58
- mindspore/ops/_op_impl/tbe/bce_with_logits_loss.py +0 -42
- mindspore/ops/_op_impl/tbe/bessel_i0e.py +0 -37
- mindspore/ops/_op_impl/tbe/bessel_i0e_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/bessel_i1e.py +0 -37
- mindspore/ops/_op_impl/tbe/bessel_i1e_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/bias_add.py +0 -38
- mindspore/ops/_op_impl/tbe/bias_add_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/bias_add_grad.py +0 -53
- mindspore/ops/_op_impl/tbe/binary_cross_entropy.py +0 -39
- mindspore/ops/_op_impl/tbe/binary_cross_entropy_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/binary_cross_entropy_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/binary_cross_entropy_grad_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/bitwise_and.py +0 -39
- mindspore/ops/_op_impl/tbe/bitwise_and_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/bitwise_or.py +0 -39
- mindspore/ops/_op_impl/tbe/bitwise_or_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/bitwise_xor.py +0 -39
- mindspore/ops/_op_impl/tbe/bitwise_xor_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/bn_infer.py +0 -43
- mindspore/ops/_op_impl/tbe/bn_infer_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/bn_infer_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/bn_infer_grad_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/bn_inference.py +0 -50
- mindspore/ops/_op_impl/tbe/bn_training_reduce.py +0 -38
- mindspore/ops/_op_impl/tbe/bn_training_reduce_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/bn_training_reduce_grad.py +0 -46
- mindspore/ops/_op_impl/tbe/bn_training_reduce_grad_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/bn_training_update.py +0 -52
- mindspore/ops/_op_impl/tbe/bn_training_update_ds.py +0 -53
- mindspore/ops/_op_impl/tbe/bn_training_update_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/bn_training_update_grad_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/bn_training_update_v2.py +0 -48
- mindspore/ops/_op_impl/tbe/bn_training_update_v3.py +0 -51
- mindspore/ops/_op_impl/tbe/bounding_box_decode.py +0 -41
- mindspore/ops/_op_impl/tbe/bounding_box_decode_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/bounding_box_encode.py +0 -38
- mindspore/ops/_op_impl/tbe/broadcast_to.py +0 -40
- mindspore/ops/_op_impl/tbe/broadcast_to_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/cast.py +0 -55
- mindspore/ops/_op_impl/tbe/cast_ds.py +0 -58
- mindspore/ops/_op_impl/tbe/cdist.py +0 -38
- mindspore/ops/_op_impl/tbe/cdist_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/ceil.py +0 -37
- mindspore/ops/_op_impl/tbe/ceil_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/celu.py +0 -39
- mindspore/ops/_op_impl/tbe/centralization.py +0 -39
- mindspore/ops/_op_impl/tbe/check_valid.py +0 -38
- mindspore/ops/_op_impl/tbe/check_valid_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/clip_by_norm_no_div_sum.py +0 -41
- mindspore/ops/_op_impl/tbe/clip_by_norm_no_div_sum_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/clip_by_value.py +0 -41
- mindspore/ops/_op_impl/tbe/clip_by_value_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/concat.py +0 -40
- mindspore/ops/_op_impl/tbe/concat_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/confusion_matrix.py +0 -63
- mindspore/ops/_op_impl/tbe/confusion_mul_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/confusion_softmax_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/confusion_transpose_d.py +0 -39
- mindspore/ops/_op_impl/tbe/conv2d.py +0 -47
- mindspore/ops/_op_impl/tbe/conv2d_backprop_filter.py +0 -42
- mindspore/ops/_op_impl/tbe/conv2d_backprop_filter_ds.py +0 -43
- mindspore/ops/_op_impl/tbe/conv2d_backprop_input.py +0 -42
- mindspore/ops/_op_impl/tbe/conv2d_backprop_input_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/conv2d_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/conv2d_transpose.py +0 -48
- mindspore/ops/_op_impl/tbe/conv3d.py +0 -45
- mindspore/ops/_op_impl/tbe/conv3d_backprop_filter.py +0 -42
- mindspore/ops/_op_impl/tbe/conv3d_backprop_input.py +0 -42
- mindspore/ops/_op_impl/tbe/conv3d_transpose.py +0 -47
- mindspore/ops/_op_impl/tbe/conv3d_transpose_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/cos.py +0 -37
- mindspore/ops/_op_impl/tbe/cos_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/cosh.py +0 -37
- mindspore/ops/_op_impl/tbe/cosh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/ctc_loss_v2.py +0 -42
- mindspore/ops/_op_impl/tbe/ctc_loss_v2_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/cum_sum.py +0 -42
- mindspore/ops/_op_impl/tbe/cum_sum_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/cummin.py +0 -41
- mindspore/ops/_op_impl/tbe/cumprod.py +0 -42
- mindspore/ops/_op_impl/tbe/data_format_dim_map.py +0 -38
- mindspore/ops/_op_impl/tbe/data_format_dim_map_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/deformable_offsets.py +0 -45
- mindspore/ops/_op_impl/tbe/deformable_offsets_grad.py +0 -48
- mindspore/ops/_op_impl/tbe/depth_to_space_ds.py +0 -49
- mindspore/ops/_op_impl/tbe/depthwise_conv2d.py +0 -44
- mindspore/ops/_op_impl/tbe/depthwise_conv2d_backprop_filter.py +0 -41
- mindspore/ops/_op_impl/tbe/depthwise_conv2d_backprop_input.py +0 -41
- mindspore/ops/_op_impl/tbe/diag.py +0 -38
- mindspore/ops/_op_impl/tbe/diag_part.py +0 -38
- mindspore/ops/_op_impl/tbe/dilation.py +0 -40
- mindspore/ops/_op_impl/tbe/div.py +0 -41
- mindspore/ops/_op_impl/tbe/div_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/div_no_nan.py +0 -41
- mindspore/ops/_op_impl/tbe/div_no_nan_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/dropout_do_mask.py +0 -38
- mindspore/ops/_op_impl/tbe/dropout_do_mask_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/dropout_do_mask_v3.py +0 -39
- mindspore/ops/_op_impl/tbe/dynamic_atomic_addr_clean.py +0 -34
- mindspore/ops/_op_impl/tbe/dynamic_gru_v2.py +0 -95
- mindspore/ops/_op_impl/tbe/dynamic_rnn.py +0 -82
- mindspore/ops/_op_impl/tbe/elu.py +0 -38
- mindspore/ops/_op_impl/tbe/elu_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/elu_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/elu_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/equal.py +0 -42
- mindspore/ops/_op_impl/tbe/equal_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/erf.py +0 -37
- mindspore/ops/_op_impl/tbe/erf_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/erfc.py +0 -37
- mindspore/ops/_op_impl/tbe/erfc_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/erfinv.py +0 -36
- mindspore/ops/_op_impl/tbe/exp.py +0 -40
- mindspore/ops/_op_impl/tbe/exp_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/expand_dims.py +0 -38
- mindspore/ops/_op_impl/tbe/expm1.py +0 -37
- mindspore/ops/_op_impl/tbe/expm1_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/extract_image_patches.py +0 -41
- mindspore/ops/_op_impl/tbe/extract_volume_patches.py +0 -39
- mindspore/ops/_op_impl/tbe/fake_quant_with_min_max_vars.py +0 -39
- mindspore/ops/_op_impl/tbe/fake_quant_with_min_max_vars_gradient.py +0 -43
- mindspore/ops/_op_impl/tbe/fake_quant_with_min_max_vars_per_channel.py +0 -39
- mindspore/ops/_op_impl/tbe/fake_quant_with_min_max_vars_per_channel_gradient.py +0 -43
- mindspore/ops/_op_impl/tbe/fast_gelu.py +0 -37
- mindspore/ops/_op_impl/tbe/fast_gelu_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/fast_gelu_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/fast_gelu_grad_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/fill.py +0 -56
- mindspore/ops/_op_impl/tbe/fill_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/flatten.py +0 -48
- mindspore/ops/_op_impl/tbe/floor.py +0 -37
- mindspore/ops/_op_impl/tbe/floor_div.py +0 -41
- mindspore/ops/_op_impl/tbe/floor_div_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/floor_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/floor_mod.py +0 -39
- mindspore/ops/_op_impl/tbe/floor_mod_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/fused_dbn_dw.py +0 -52
- mindspore/ops/_op_impl/tbe/fused_mul_add.py +0 -38
- mindspore/ops/_op_impl/tbe/fused_mul_add_n.py +0 -48
- mindspore/ops/_op_impl/tbe/fused_mul_add_n_l2loss.py +0 -53
- mindspore/ops/_op_impl/tbe/fused_mul_apply_momentum.py +0 -57
- mindspore/ops/_op_impl/tbe/fused_mul_apply_momentum_extern.py +0 -67
- mindspore/ops/_op_impl/tbe/gather_nd.py +0 -52
- mindspore/ops/_op_impl/tbe/gather_nd_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/gather_v2.py +0 -56
- mindspore/ops/_op_impl/tbe/gather_v2_ds.py +0 -68
- mindspore/ops/_op_impl/tbe/gelu.py +0 -37
- mindspore/ops/_op_impl/tbe/gelu_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/gelu_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/gelu_grad_ds.py +0 -43
- mindspore/ops/_op_impl/tbe/ger.py +0 -43
- mindspore/ops/_op_impl/tbe/ger_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/greater.py +0 -43
- mindspore/ops/_op_impl/tbe/greater_equal.py +0 -41
- mindspore/ops/_op_impl/tbe/greater_equal_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/gru_v2_hidden_grad.py +0 -51
- mindspore/ops/_op_impl/tbe/gru_v2_hidden_grad_cell.py +0 -52
- mindspore/ops/_op_impl/tbe/hard_swish.py +0 -37
- mindspore/ops/_op_impl/tbe/hard_swish_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/hard_swish_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/hard_swish_grad_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/histogram_fixed_width.py +0 -40
- mindspore/ops/_op_impl/tbe/hshrink.py +0 -33
- mindspore/ops/_op_impl/tbe/hshrink_grad.py +0 -37
- mindspore/ops/_op_impl/tbe/hsigmoid.py +0 -45
- mindspore/ops/_op_impl/tbe/hsigmoid_grad.py +0 -39
- mindspore/ops/_op_impl/tbe/ifmr.py +0 -47
- mindspore/ops/_op_impl/tbe/ifmr_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/im2col.py +0 -42
- mindspore/ops/_op_impl/tbe/in_top_k.py +0 -37
- mindspore/ops/_op_impl/tbe/inplace_add.py +0 -39
- mindspore/ops/_op_impl/tbe/inplace_index_add.py +0 -46
- mindspore/ops/_op_impl/tbe/inplace_sub.py +0 -39
- mindspore/ops/_op_impl/tbe/inplace_update.py +0 -39
- mindspore/ops/_op_impl/tbe/inplace_update_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/inv.py +0 -38
- mindspore/ops/_op_impl/tbe/inv_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/inv_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/inv_grad_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/invert.py +0 -37
- mindspore/ops/_op_impl/tbe/invert_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/iou.py +0 -38
- mindspore/ops/_op_impl/tbe/iou_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/is_close.py +0 -40
- mindspore/ops/_op_impl/tbe/kl_div_loss.py +0 -38
- mindspore/ops/_op_impl/tbe/kl_div_loss_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/kl_div_loss_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/l2_loss.py +0 -36
- mindspore/ops/_op_impl/tbe/l2_loss_ds.py +0 -37
- mindspore/ops/_op_impl/tbe/l2_normalize.py +0 -38
- mindspore/ops/_op_impl/tbe/l2_normalize_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/lamb_apply_optimizer_assign.py +0 -55
- mindspore/ops/_op_impl/tbe/lamb_apply_weight_assign.py +0 -42
- mindspore/ops/_op_impl/tbe/lamb_next_mv.py +0 -59
- mindspore/ops/_op_impl/tbe/lamb_next_mv_with_decay.py +0 -59
- mindspore/ops/_op_impl/tbe/lamb_next_right.py +0 -44
- mindspore/ops/_op_impl/tbe/lamb_update_with_lr.py +0 -48
- mindspore/ops/_op_impl/tbe/lamb_update_with_lr_v2.py +0 -44
- mindspore/ops/_op_impl/tbe/lars_update.py +0 -50
- mindspore/ops/_op_impl/tbe/lars_update_ds.py +0 -51
- mindspore/ops/_op_impl/tbe/layer_norm.py +0 -46
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop.py +0 -44
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_v2.py +0 -40
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_v2_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/layer_norm_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/layer_norm_grad.py +0 -48
- mindspore/ops/_op_impl/tbe/layer_norm_x_backprop.py +0 -43
- mindspore/ops/_op_impl/tbe/layer_norm_x_backprop_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/layer_norm_x_backprop_v2.py +0 -45
- mindspore/ops/_op_impl/tbe/layer_norm_x_backprop_v2_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/lerp.py +0 -38
- mindspore/ops/_op_impl/tbe/less.py +0 -41
- mindspore/ops/_op_impl/tbe/less_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/less_equal.py +0 -41
- mindspore/ops/_op_impl/tbe/less_equal_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/log.py +0 -40
- mindspore/ops/_op_impl/tbe/log1p.py +0 -37
- mindspore/ops/_op_impl/tbe/log1p_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/log_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/logical_and.py +0 -37
- mindspore/ops/_op_impl/tbe/logical_and_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/logical_not.py +0 -36
- mindspore/ops/_op_impl/tbe/logical_not_ds.py +0 -37
- mindspore/ops/_op_impl/tbe/logical_or.py +0 -37
- mindspore/ops/_op_impl/tbe/logical_or_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/logsoftmax.py +0 -37
- mindspore/ops/_op_impl/tbe/logsoftmax_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/logsoftmax_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/logsoftmax_grad_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/lp_norm.py +0 -40
- mindspore/ops/_op_impl/tbe/lp_norm_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/lrn.py +0 -41
- mindspore/ops/_op_impl/tbe/lrn_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/lstm_input_grad.py +0 -51
- mindspore/ops/_op_impl/tbe/masked_fill.py +0 -40
- mindspore/ops/_op_impl/tbe/masked_fill_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/matmul.py +0 -53
- mindspore/ops/_op_impl/tbe/matmul_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/matmul_v2.py +0 -50
- mindspore/ops/_op_impl/tbe/matrix_diag.py +0 -45
- mindspore/ops/_op_impl/tbe/matrix_diag_part.py +0 -45
- mindspore/ops/_op_impl/tbe/matrix_set_diag.py +0 -46
- mindspore/ops/_op_impl/tbe/max_pool.py +0 -39
- mindspore/ops/_op_impl/tbe/max_pool3d.py +0 -44
- mindspore/ops/_op_impl/tbe/max_pool3d_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/max_pool3d_grad_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/max_pool_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/max_pool_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/max_pool_grad_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/max_pool_grad_grad_with_argmax.py +0 -41
- mindspore/ops/_op_impl/tbe/max_pool_grad_with_argmax.py +0 -42
- mindspore/ops/_op_impl/tbe/max_pool_with_argmax.py +0 -40
- mindspore/ops/_op_impl/tbe/maximum.py +0 -39
- mindspore/ops/_op_impl/tbe/maximum_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/maximum_grad.py +0 -46
- mindspore/ops/_op_impl/tbe/maximum_grad_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/mem_set.py +0 -38
- mindspore/ops/_op_impl/tbe/minimum.py +0 -40
- mindspore/ops/_op_impl/tbe/minimum_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/minimum_grad.py +0 -46
- mindspore/ops/_op_impl/tbe/minimum_grad_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/mish.py +0 -37
- mindspore/ops/_op_impl/tbe/mod.py +0 -41
- mindspore/ops/_op_impl/tbe/mod_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/mul.py +0 -37
- mindspore/ops/_op_impl/tbe/mul_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/mul_no_nan.py +0 -39
- mindspore/ops/_op_impl/tbe/mul_no_nan_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/multilabel_margin_loss.py +0 -39
- mindspore/ops/_op_impl/tbe/neg.py +0 -39
- mindspore/ops/_op_impl/tbe/neg_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/new_im2col.py +0 -40
- mindspore/ops/_op_impl/tbe/nll_loss.py +0 -41
- mindspore/ops/_op_impl/tbe/nll_loss_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/nms_with_mask.py +0 -39
- mindspore/ops/_op_impl/tbe/not_equal.py +0 -41
- mindspore/ops/_op_impl/tbe/not_equal_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/npu_alloc_float_status.py +0 -34
- mindspore/ops/_op_impl/tbe/npu_clear_float_status.py +0 -35
- mindspore/ops/_op_impl/tbe/npu_clear_float_status_v2.py +0 -35
- mindspore/ops/_op_impl/tbe/npu_get_float_status.py +0 -35
- mindspore/ops/_op_impl/tbe/npu_get_float_status_v2.py +0 -35
- mindspore/ops/_op_impl/tbe/one_hot.py +0 -48
- mindspore/ops/_op_impl/tbe/one_hot_ds.py +0 -45
- mindspore/ops/_op_impl/tbe/ones_like.py +0 -40
- mindspore/ops/_op_impl/tbe/ones_like_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/p_s_r_o_i_pooling.py +0 -40
- mindspore/ops/_op_impl/tbe/p_s_r_o_i_pooling_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/pack.py +0 -58
- mindspore/ops/_op_impl/tbe/pack_ds.py +0 -59
- mindspore/ops/_op_impl/tbe/pad_d.py +0 -40
- mindspore/ops/_op_impl/tbe/pad_d_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/parallel_concat.py +0 -70
- mindspore/ops/_op_impl/tbe/parallel_resize_bilinear.py +0 -45
- mindspore/ops/_op_impl/tbe/parallel_resize_bilinear_grad.py +0 -44
- mindspore/ops/_op_impl/tbe/pdist.py +0 -36
- mindspore/ops/_op_impl/tbe/pooling.py +0 -46
- mindspore/ops/_op_impl/tbe/population_count.py +0 -38
- mindspore/ops/_op_impl/tbe/pow.py +0 -41
- mindspore/ops/_op_impl/tbe/pow_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/prelu.py +0 -37
- mindspore/ops/_op_impl/tbe/prelu_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/prelu_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/range.py +0 -39
- mindspore/ops/_op_impl/tbe/real_div.py +0 -38
- mindspore/ops/_op_impl/tbe/real_div_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/reciprocal.py +0 -36
- mindspore/ops/_op_impl/tbe/reciprocal_ds.py +0 -37
- mindspore/ops/_op_impl/tbe/reciprocal_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/reciprocal_grad_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/reduce_all.py +0 -38
- mindspore/ops/_op_impl/tbe/reduce_all_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/reduce_any.py +0 -38
- mindspore/ops/_op_impl/tbe/reduce_any_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/reduce_max.py +0 -43
- mindspore/ops/_op_impl/tbe/reduce_max_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/reduce_mean.py +0 -40
- mindspore/ops/_op_impl/tbe/reduce_mean_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/reduce_min.py +0 -41
- mindspore/ops/_op_impl/tbe/reduce_min_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/reduce_prod.py +0 -42
- mindspore/ops/_op_impl/tbe/reduce_prod_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/reduce_std.py +0 -44
- mindspore/ops/_op_impl/tbe/reduce_sum.py +0 -39
- mindspore/ops/_op_impl/tbe/reduce_sum_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/relu.py +0 -39
- mindspore/ops/_op_impl/tbe/relu6.py +0 -38
- mindspore/ops/_op_impl/tbe/relu6_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/relu6_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/relu6_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/relu_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/relu_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/relu_grad_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/relu_grad_v2.py +0 -40
- mindspore/ops/_op_impl/tbe/relu_grad_v2_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/relu_v2.py +0 -40
- mindspore/ops/_op_impl/tbe/relu_v2_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/renorm.py +0 -39
- mindspore/ops/_op_impl/tbe/resize_bilinear.py +0 -40
- mindspore/ops/_op_impl/tbe/resize_bilinear_grad.py +0 -41
- mindspore/ops/_op_impl/tbe/resize_bilinear_v2.py +0 -43
- mindspore/ops/_op_impl/tbe/resize_nearest_neighbor.py +0 -40
- mindspore/ops/_op_impl/tbe/resize_nearest_neighbor_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/resize_nearest_neighbor_grad.py +0 -39
- mindspore/ops/_op_impl/tbe/resize_nearest_neighbor_grad_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/reverse_v2_d.py +0 -37
- mindspore/ops/_op_impl/tbe/rint.py +0 -37
- mindspore/ops/_op_impl/tbe/rint_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/roi_align.py +0 -43
- mindspore/ops/_op_impl/tbe/roi_align_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/roi_align_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/roi_align_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/roll.py +0 -42
- mindspore/ops/_op_impl/tbe/round.py +0 -38
- mindspore/ops/_op_impl/tbe/round_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/rsqrt.py +0 -37
- mindspore/ops/_op_impl/tbe/rsqrt_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/rsqrt_grad.py +0 -40
- mindspore/ops/_op_impl/tbe/rsqrt_grad_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/scatter_add.py +0 -44
- mindspore/ops/_op_impl/tbe/scatter_div.py +0 -46
- mindspore/ops/_op_impl/tbe/scatter_max.py +0 -45
- mindspore/ops/_op_impl/tbe/scatter_min.py +0 -45
- mindspore/ops/_op_impl/tbe/scatter_mul.py +0 -44
- mindspore/ops/_op_impl/tbe/scatter_nd.py +0 -41
- mindspore/ops/_op_impl/tbe/scatter_nd_add.py +0 -45
- mindspore/ops/_op_impl/tbe/scatter_nd_d.py +0 -41
- mindspore/ops/_op_impl/tbe/scatter_nd_ds.py +0 -49
- mindspore/ops/_op_impl/tbe/scatter_nd_sub.py +0 -47
- mindspore/ops/_op_impl/tbe/scatter_nd_sub_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/scatter_nd_update.py +0 -47
- mindspore/ops/_op_impl/tbe/scatter_nd_update_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/scatter_non_aliasing_add.py +0 -39
- mindspore/ops/_op_impl/tbe/scatter_non_aliasing_add_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/scatter_sub.py +0 -47
- mindspore/ops/_op_impl/tbe/scatter_sub_ds.py +0 -48
- mindspore/ops/_op_impl/tbe/scatter_update.py +0 -43
- mindspore/ops/_op_impl/tbe/select.py +0 -38
- mindspore/ops/_op_impl/tbe/select_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/selu.py +0 -39
- mindspore/ops/_op_impl/tbe/selu_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/sgd.py +0 -62
- mindspore/ops/_op_impl/tbe/sigmoid.py +0 -37
- mindspore/ops/_op_impl/tbe/sigmoid_cross_entropy_with_logits.py +0 -41
- mindspore/ops/_op_impl/tbe/sigmoid_cross_entropy_with_logits_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/sigmoid_cross_entropy_with_logits_grad.py +0 -42
- mindspore/ops/_op_impl/tbe/sigmoid_cross_entropy_with_logits_grad_ds.py +0 -43
- mindspore/ops/_op_impl/tbe/sigmoid_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/sigmoid_grad.py +0 -39
- mindspore/ops/_op_impl/tbe/sigmoid_grad_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/sign.py +0 -38
- mindspore/ops/_op_impl/tbe/sign_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/sin.py +0 -37
- mindspore/ops/_op_impl/tbe/sin_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/sinh.py +0 -37
- mindspore/ops/_op_impl/tbe/sinh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/slice.py +0 -58
- mindspore/ops/_op_impl/tbe/smooth_l1_loss.py +0 -45
- mindspore/ops/_op_impl/tbe/smooth_l1_loss_ds.py +0 -46
- mindspore/ops/_op_impl/tbe/smooth_l1_loss_grad.py +0 -46
- mindspore/ops/_op_impl/tbe/smooth_l1_loss_grad_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/soft_margin_loss.py +0 -38
- mindspore/ops/_op_impl/tbe/soft_margin_loss_grad.py +0 -39
- mindspore/ops/_op_impl/tbe/soft_shrink.py +0 -36
- mindspore/ops/_op_impl/tbe/soft_shrink_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/softmax.py +0 -37
- mindspore/ops/_op_impl/tbe/softmax_cross_entropy_with_logits.py +0 -38
- mindspore/ops/_op_impl/tbe/softmax_cross_entropy_with_logits_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/softmax_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/softmax_grad_ext.py +0 -42
- mindspore/ops/_op_impl/tbe/softmax_v2_with_dropout_do_mask_v3.py +0 -39
- mindspore/ops/_op_impl/tbe/softplus.py +0 -37
- mindspore/ops/_op_impl/tbe/softplus_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/softplus_grad.py +0 -38
- mindspore/ops/_op_impl/tbe/softplus_grad_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/softsign.py +0 -37
- mindspore/ops/_op_impl/tbe/softsign_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/sort.py +0 -38
- mindspore/ops/_op_impl/tbe/sort_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/space_to_batch.py +0 -38
- mindspore/ops/_op_impl/tbe/space_to_batch_nd.py +0 -38
- mindspore/ops/_op_impl/tbe/space_to_depth.py +0 -47
- mindspore/ops/_op_impl/tbe/sparse_apply_adadelta.py +0 -56
- mindspore/ops/_op_impl/tbe/sparse_apply_adagrad.py +0 -45
- mindspore/ops/_op_impl/tbe/sparse_apply_adagrad_ds.py +0 -46
- mindspore/ops/_op_impl/tbe/sparse_apply_adagrad_v2.py +0 -46
- mindspore/ops/_op_impl/tbe/sparse_apply_adagrad_v2_ds.py +0 -47
- mindspore/ops/_op_impl/tbe/sparse_apply_ftrl_d.py +0 -53
- mindspore/ops/_op_impl/tbe/sparse_apply_ftrl_d_ds.py +0 -50
- mindspore/ops/_op_impl/tbe/sparse_apply_ftrl_v2.py +0 -50
- mindspore/ops/_op_impl/tbe/sparse_apply_proximal_adagrad.py +0 -66
- mindspore/ops/_op_impl/tbe/sparse_apply_proximal_adagrad_ds.py +0 -67
- mindspore/ops/_op_impl/tbe/sparse_apply_r_m_s_prop.py +0 -57
- mindspore/ops/_op_impl/tbe/sparse_apply_r_m_s_prop_ds.py +0 -58
- mindspore/ops/_op_impl/tbe/sparse_gather_v2.py +0 -56
- mindspore/ops/_op_impl/tbe/sparse_gather_v2_ds.py +0 -58
- mindspore/ops/_op_impl/tbe/split_d.py +0 -38
- mindspore/ops/_op_impl/tbe/split_d_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/split_v.py +0 -39
- mindspore/ops/_op_impl/tbe/splitv.py +0 -39
- mindspore/ops/_op_impl/tbe/sqrt.py +0 -37
- mindspore/ops/_op_impl/tbe/sqrt_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/sqrt_grad.py +0 -43
- mindspore/ops/_op_impl/tbe/sqrt_grad_ds.py +0 -44
- mindspore/ops/_op_impl/tbe/square.py +0 -38
- mindspore/ops/_op_impl/tbe/square_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/square_sum_all.py +0 -40
- mindspore/ops/_op_impl/tbe/square_sum_all_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/square_sum_v1.py +0 -38
- mindspore/ops/_op_impl/tbe/square_sum_v1_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/square_sum_v2.py +0 -39
- mindspore/ops/_op_impl/tbe/squared_difference.py +0 -39
- mindspore/ops/_op_impl/tbe/squared_difference_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/squeeze.py +0 -37
- mindspore/ops/_op_impl/tbe/strided_read.py +0 -38
- mindspore/ops/_op_impl/tbe/strided_slice_d.py +0 -44
- mindspore/ops/_op_impl/tbe/strided_slice_ds.py +0 -71
- mindspore/ops/_op_impl/tbe/strided_slice_grad_d.py +0 -51
- mindspore/ops/_op_impl/tbe/strided_slice_grad_ds.py +0 -57
- mindspore/ops/_op_impl/tbe/strided_write.py +0 -38
- mindspore/ops/_op_impl/tbe/sub.py +0 -39
- mindspore/ops/_op_impl/tbe/sub_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/tan.py +0 -38
- mindspore/ops/_op_impl/tbe/tan_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/tanh.py +0 -37
- mindspore/ops/_op_impl/tbe/tanh_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/tanh_grad.py +0 -39
- mindspore/ops/_op_impl/tbe/tanh_grad_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/tensor_move.py +0 -49
- mindspore/ops/_op_impl/tbe/tensor_move_ds.py +0 -50
- mindspore/ops/_op_impl/tbe/tensor_scatter_update.py +0 -41
- mindspore/ops/_op_impl/tbe/tile.py +0 -37
- mindspore/ops/_op_impl/tbe/tile_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/top_k.py +0 -42
- mindspore/ops/_op_impl/tbe/top_k_ds.py +0 -43
- mindspore/ops/_op_impl/tbe/trans_data.py +0 -167
- mindspore/ops/_op_impl/tbe/trans_data_ds.py +0 -180
- mindspore/ops/_op_impl/tbe/trans_data_rnn.py +0 -44
- mindspore/ops/_op_impl/tbe/transpose.py +0 -60
- mindspore/ops/_op_impl/tbe/transpose_d.py +0 -47
- mindspore/ops/_op_impl/tbe/transpose_nod.py +0 -60
- mindspore/ops/_op_impl/tbe/trunc.py +0 -39
- mindspore/ops/_op_impl/tbe/truncate_div.py +0 -41
- mindspore/ops/_op_impl/tbe/truncate_div_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/truncate_mod.py +0 -41
- mindspore/ops/_op_impl/tbe/truncate_mod_ds.py +0 -42
- mindspore/ops/_op_impl/tbe/unpack.py +0 -38
- mindspore/ops/_op_impl/tbe/unpack_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/unsorted_segment_max.py +0 -49
- mindspore/ops/_op_impl/tbe/unsorted_segment_max_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/unsorted_segment_min.py +0 -49
- mindspore/ops/_op_impl/tbe/unsorted_segment_min_ds.py +0 -40
- mindspore/ops/_op_impl/tbe/unsorted_segment_prod.py +0 -49
- mindspore/ops/_op_impl/tbe/unsorted_segment_prod_ds.py +0 -38
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum.py +0 -38
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum_ds.py +0 -41
- mindspore/ops/_op_impl/tbe/wts_arq.py +0 -40
- mindspore/ops/_op_impl/tbe/xdivy.py +0 -38
- mindspore/ops/_op_impl/tbe/xdivy_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/xlogy.py +0 -38
- mindspore/ops/_op_impl/tbe/xlogy_ds.py +0 -39
- mindspore/ops/_op_impl/tbe/zeros_like.py +0 -41
- mindspore/ops/_op_impl/tbe/zeros_like_ds.py +0 -42
- mindspore/ops/_tracefunc.py +0 -241
- mindspore/ops/arg_dtype_cast.py +0 -54
- mindspore/ops/silent_check.py +0 -162
- mindspore/profiler/parser/msadvisor_analyzer.py +0 -82
- mindspore/profiler/parser/msadvisor_parser.py +0 -240
- mindspore/rewrite/api/tree_node_helper.py +0 -60
- mindspore/rewrite/ast_helpers/ast_creator.py +0 -115
- mindspore/rewrite/ast_transformers/flatten_recursive_stmt.py +0 -267
- mindspore/rewrite/ast_transformers/remove_return_out_of_if.py +0 -228
- mindspore/rewrite/namespace.py +0 -53
- mindspore-2.2.14.dist-info/RECORD +0 -1924
- {mindspore-2.2.14.dist-info → mindspore-2.4.0.dist-info}/WHEEL +0 -0
- {mindspore-2.2.14.dist-info → mindspore-2.4.0.dist-info}/top_level.txt +0 -0
mindspore/context.py
CHANGED
@@ -1,4 +1,4 @@
-# Copyright 2020-
+# Copyright 2020-2024 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -34,6 +34,8 @@ from mindspore.parallel._auto_parallel_context import _set_auto_parallel_context
 from mindspore.parallel._ps_context import _set_ps_context, _get_ps_context, _reset_ps_context, \
     _need_reset_device_target_for_ps
 from mindspore.parallel._offload_context import _set_offload_context, _get_offload_context
+from mindspore.hal.device import is_initialized
+from mindspore.common import api

 __all__ = ['GRAPH_MODE', 'PYNATIVE_MODE', 'STRICT', 'COMPATIBLE', 'LAX', 'set_context', 'get_context',
            'set_auto_parallel_context', 'get_auto_parallel_context', 'reset_auto_parallel_context', 'ParallelMode',
@@ -50,6 +52,10 @@ STRICT = 0
 COMPATIBLE = 1
 LAX = 2

+# Enumerate for the property 'debug_level'.
+RELEASE = 0
+DEBUG = 1
+

 def _make_directory(path):
     """Make directory."""
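The `RELEASE`/`DEBUG` constants added above back the new `debug_level` context property. A minimal usage sketch (my own illustration, not part of the diff; assumes a MindSpore 2.4.0 install):

    import mindspore as ms
    from mindspore import context

    # DEBUG records extra information while compiling graphs, which helps when
    # locating compile-time errors; RELEASE (the default) discards it for speed.
    ms.set_context(debug_level=context.DEBUG)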
@@ -63,7 +69,7 @@ def _make_directory(path):
     if not os.path.exists(path):
         logger.debug("The directory(%s) doesn't exist, will create it", path)
         try:
-            os.makedirs(path)
+            os.makedirs(path, mode=0o700)
         except FileExistsError:
             logger.debug("The directory(%s) already exist.", path)
         except PermissionError as e:
@@ -161,6 +167,12 @@ class _Context:
         self._context_switches = _ContextSwitchInfo(False)
         self._context_handle = MSContext.get_instance()
         self._support_binary = False
+        self.enable_compile_cache = None
+        self._mode = PYNATIVE_MODE
+        self.aoe_config = {}
+        self.jit_config = {}
+        self.ascend_config = {}
+        self.gpu_config = {}

     def __getattribute__(self, attr):
         value = object.__getattribute__(self, attr)
@@ -176,7 +188,11 @@ class _Context:

     def get_mode(self):
         """Get current mode."""
-        return self.
+        return self._mode
+
+    def get_jit_config(self):
+        """Get current jit_config."""
+        return self.jit_config

     def set_mode(self, mode):
         """
@@ -204,6 +220,7 @@ class _Context:
             raise ValueError(f"For 'context.set_context', the argument 'mode' should be context.GRAPH_MODE (0) "
                              f"or context.PYNATIVE_MODE (1), but got {mode}.")
         self.set_param(ms_ctx_param.mode, mode)
+        self._mode = mode

     def set_jit_syntax_level(self, level):
         """"Set the JIT syntax level for graph compiling"""
@@ -212,6 +229,13 @@ class _Context:
                              f"or context.LAX, but got {level}.")
         self.set_param(ms_ctx_param.jit_syntax_level, level)

+    def set_debug_level(self, level):
+        """"Set the debug level for graph compiling"""
+        if level != RELEASE and level != DEBUG:
+            raise ValueError(f"For 'context.set_debug_level', the argument 'level' should be context.RELEASE "
+                             f"or context.DEBUG, but got {level}.")
+        self.set_param(ms_ctx_param.debug_level, level)
+
     def set_memory_optimize_level(self, memory_optimize_level):
         """
         The memory optimize level, support "O0", "O1".
@@ -228,6 +252,16 @@ class _Context:
         else:
             self.set_param(ms_ctx_param.memory_optimize_level, 1)

+    def set_exec_order(self, exec_order):
+        """
+        The execution order mode, support "bfs", "dfs", "gpto".
+        """
+        exec_order_modes = ["bfs", "dfs", "gpto"]
+        if exec_order not in exec_order_modes:
+            raise ValueError(f"For 'context.set_context', the argument 'exec_order' must be one of "
+                             f"{exec_order_modes}, but got {exec_order}.")
+        self.set_param(ms_ctx_param.exec_order, exec_order)
+
     def set_memory_offload(self, memory_offload):
         """
         Enable memory offload or not, support "ON", "OFF".
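`set_exec_order` above is wired into `set_context` later in this diff (it is registered in the setter map and listed as an Ascend-only row in the `set_context` table). A usage sketch under those assumptions:

    import mindspore as ms

    # Only "bfs", "dfs" and "gpto" pass the validation in set_exec_order.
    ms.set_context(exec_order="dfs")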
@@ -257,6 +291,29 @@ class _Context:
                              f"{deterministic_options}, but got {deterministic}.")
         self.set_param(ms_ctx_param.deterministic, deterministic)

+        hccl_deterministic = os.getenv("HCCL_DETERMINISTIC")
+        te_parallel_compiler = os.getenv("TE_PARALLEL_COMPILER")
+        if deterministic == "ON":
+            if hccl_deterministic and hccl_deterministic != "true":
+                logger.warning(f"Environment 'HCCL_DETERMINISTIC' should be 'true' when set deterministic='ON', but "
+                               f"got '{hccl_deterministic}'. 'HCCL_DETERMINISTIC' will be set to 'true'.")
+            if te_parallel_compiler and te_parallel_compiler != "1":
+                logger.warning(f"Environment 'TE_PARALLEL_COMPILER' should be '1' when set deterministic='ON', but "
+                               f"got '{te_parallel_compiler}'. 'TE_PARALLEL_COMPILER' will be set to '1'.")
+            os.environ["HCCL_DETERMINISTIC"] = "true"
+            os.environ["TE_PARALLEL_COMPILER"] = "1"
+        if deterministic == "OFF":
+            if hccl_deterministic and hccl_deterministic != "false":
+                logger.warning(f"Environment 'HCCL_DETERMINISTIC' should not be set or be 'false' when set "
+                               f"deterministic='OFF', but got '{hccl_deterministic}'. 'HCCL_DETERMINISTIC' "
+                               f"will be unset.")
+                del os.environ["HCCL_DETERMINISTIC"]
+            if te_parallel_compiler and te_parallel_compiler != "0":
+                logger.warning(f"Environment 'TE_PARALLEL_COMPILER' should not be set or be '0' when set "
+                               f"deterministic='OFF', but got '{te_parallel_compiler}'. 'TE_PARALLEL_COMPILER' "
+                               f"will be unset.")
+                del os.environ["TE_PARALLEL_COMPILER"]
+
     def set_ascend_config(self, ascend_config):
         """
         Enable ascend config.
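A sketch of the observable effect of the deterministic hunk above (my own example): turning determinism on now exports the two environment variables on the caller's behalf.

    import os
    import mindspore as ms

    ms.set_context(deterministic="ON")
    # Synced by the setter shown above.
    assert os.environ["HCCL_DETERMINISTIC"] == "true"
    assert os.environ["TE_PARALLEL_COMPILER"] == "1"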
@@ -268,11 +325,18 @@ class _Context:
               "allow_mix_precision_fp16" and "allow_mix_precision_bf16".
             - jit_compile (bool): ``False`` and ``True``.
             - atomic_clean_policy (int): ``0`` and ``1``. Default: ``1`` .
+            - op_precision_mode (str): precision mode config file path.
+            - op_debug_option (str): Enable debugging options for Ascend operators,
+              default not enabled, only supports ``"oom"`` currently.
+              ``"oom"``: Detect memory out of bounds.
+            - ge_options (dict): Global or session CANN options.
             - exception_dump (str): Enable exception dump for Ascend operators. ``"0"`` , ``"1"`` and ``"2"``.
               Default: ``"2"`` .
-            - op_precision_mode (str): config file path.
             - parallel_speed_up_json_path(Union[str, None]): The path to the parallel speed up json file.
               If its value is None or '', it does not take effect. Default None.
+            - host_scheduling_max_threshold(int): The host scheduling max threshold.
+            - hccl_watchdog (bool): Enable a thread to monitor the failure of collective communication.
+              Default: ``True`` .
         """
         ascend_cfg_modes = {
             'precision_mode': ["force_fp16", "allow_fp32_to_fp16", "allow_mix_precision", "must_keep_origin_dtype",
@@ -284,8 +348,16 @@ class _Context:
             'conv_allow_hf32': [True, False],
             'exception_dump': ["0", "1", "2"],
             'op_precision_mode': (str,),
+            'ge_options': (dict,),
             'parallel_speed_up_json_path': (str, None),
-            '
+            'host_scheduling_max_threshold': (int,),
+            'cur_step_num': (int,),
+            'save_checkpoint_steps': (int,),
+            'need_ckpt': (bool,),
+            'last_triggered_step': (int,),
+            'hccl_watchdog': (bool,),
+            'topo_order': (dict,),
+            'op_debug_option': (str, None),
         }
         ascend_cfg_setters = {
             'precision_mode': self._get_ascend_config_setter('precision_mode'),
@@ -294,8 +366,16 @@ class _Context:
             'matmul_allow_hf32': self._get_ascend_config_setter('matmul_allow_hf32', lambda v: "1" if v else "0"),
             'conv_allow_hf32': self._get_ascend_config_setter('conv_allow_hf32', lambda v: "1" if v else "0"),
             'exception_dump': self._get_ascend_config_setter('exception_dump'),
+            'op_debug_option': self._set_op_debug_option,
             'op_precision_mode': self._set_op_precision_mode,
+            'ge_options': self._set_ge_options,
             'parallel_speed_up_json_path': self._set_speedup_config_path,
+            'host_scheduling_max_threshold': self._get_ascend_config_setter('host_scheduling_max_threshold', str),
+            'cur_step_num': self._set_cur_step_num,
+            'save_checkpoint_steps': self._set_save_checkpoint_steps,
+            'need_ckpt': self._set_need_ckpt,
+            'last_triggered_step': self._set_last_triggered_step,
+            'hccl_watchdog': self._set_hccl_watchdog,
             'topo_order': self._set_topo_order
         }
         ascend_cfg_set = tuple(ascend_cfg_modes.keys())
@@ -312,6 +392,7 @@ class _Context:
                                 f"{supported_modes}, but got {type(ascend_value)}.")
             cfg_setter = ascend_cfg_setters.get(ascend_key)
             cfg_setter(ascend_value)
+        self.ascend_config = ascend_config

     def set_gpu_config(self, gpu_config):
         """
@@ -353,6 +434,33 @@ class _Context:
                 self.set_param(ms_ctx_param.conv_allow_tf32, gpu_config[gpu_key])
             if gpu_key == 'matmul_allow_tf32':
                 self.set_param(ms_ctx_param.matmul_allow_tf32, gpu_config[gpu_key])
+        self.gpu_config = gpu_config
+
+    def set_jit_config(self, jit_config):
+        """
+        Enable jit config.
+
+        Args:
+            jit_config (dict):
+
+                - jit_level (str): "O0", "O1" or "O2" to control the compilation optimization level.
+        """
+        jit_cfgs = {'jit_level': ["O0", "O1", "O2"], 'infer_boost': ["on", "off"]}
+        key_args_map = {'jit_level': ms_ctx_param.jit_level, 'infer_boost': ms_ctx_param.infer_boost}
+        for jit_key in jit_config:
+            if jit_key not in jit_cfgs:
+                raise ValueError(f"For 'context.set_context', the key of argument 'jit_config' must be one of "
+                                 f"{jit_cfgs}, but got {jit_key}.")
+            supported_value = jit_cfgs.get(jit_key)
+            if jit_config[jit_key] not in supported_value:
+                raise ValueError(f"For 'jit_config', the value of argument {jit_key} must be one of "
+                                 f"{supported_value}, but got {jit_config[jit_key]}.")
+            self.set_param(key_args_map[jit_key], jit_config[jit_key])
+        self.jit_config = jit_config
+
+        jit_level = jit_config.get("jit_level", None)
+        if jit_config.get("infer_boost", None) == "on" and (jit_level == "O1" or jit_level == "O2"):
+            raise ValueError(f"Only jit_level set O0 can set infer_boost to on.")

     def set_backend_policy(self, policy):
         success = self._context_handle.set_backend_policy(policy)
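A sketch of the new `jit_config` validation above (my own example): only the keys `jit_level` and `infer_boost` are accepted, and `infer_boost="on"` is rejected unless `jit_level` is `"O0"`.

    import mindspore as ms

    ms.set_context(jit_config={"jit_level": "O0", "infer_boost": "on"})  # accepted
    # ms.set_context(jit_config={"jit_level": "O2", "infer_boost": "on"})  # ValueError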
@@ -424,6 +532,7 @@ class _Context:
                                 f"{supported_value}, but got {aoe_config[aoe_config_key]}.")
             if aoe_config_key == 'job_type':
                 self.set_param(ms_ctx_param.aoe_job_type, aoe_config[aoe_config_key])
+        self.aoe_config = aoe_config

     def set_device_id(self, device_id):
         if device_id < 0 or device_id > 4095:
@@ -475,9 +584,13 @@ class _Context:

     def set_mempool_block_size(self, mempool_block_size):
         """Set the block size of memory pool."""
-
+        global_jit_config = get_jit_config()
+        is_force_kbk = False
+        if global_jit_config:
+            is_force_kbk = global_jit_config.get('jit_level') == "O0" or global_jit_config.get('jit_level') == "O1"
+        if _get_mode() == GRAPH_MODE and not is_force_kbk:
             logger.warning("Graph mode doesn't support to set parameter 'mempool_block_size' of context currently, "
-                           "you can use context.set_context to set pynative mode.")
+                           "you can use context.set_context to set pynative mode or set jit_level=O0/O1.")
             return
         if not Validator.check_str_by_regular(mempool_block_size, _RE_PATTERN):
             raise ValueError("For 'context.set_context', the argument 'mempool_block_size' should be in "
@@ -558,13 +671,16 @@ class _Context:
             'inter_op_parallel_num': set_inter_op_parallel_num,
             'runtime_num_threads': set_runtime_num_threads,
             'memory_optimize_level': set_memory_optimize_level,
+            'exec_order': set_exec_order,
             'op_timeout': set_op_timeout,
             'memory_offload': set_memory_offload,
             'deterministic': set_deterministic,
             'ascend_config': set_ascend_config,
             'jit_syntax_level': set_jit_syntax_level,
+            'debug_level': set_debug_level,
             'gpu_config': set_gpu_config,
             'aoe_config': set_aoe_config,
+            'jit_config': set_jit_config,
         }

     @property
@@ -612,6 +728,16 @@ class _Context:
             trans_fn = lambda x: x
         return _config_setter

+    def _set_op_debug_option(self, option_value):
+        valid_order = {'oom'}
+        if not isinstance(option_value, str):
+            raise TypeError(f"For 'ascend_config', the type of 'op_debug_option' must be str, "
+                            f"but got {type(option_value)}.")
+        if option_value not in valid_order:
+            raise ValueError(f"For 'ascend_config', the 'op_debug_option' supports being set to 'oom' currently, "
+                             f"but got {option_value}.")
+        self.set_param(ms_ctx_param.op_debug_option, option_value)
+
     def _set_op_precision_mode(self, ascend_value):
         op_precision_path = ascend_value
         real_path = os.path.realpath(op_precision_path)
@@ -620,6 +746,28 @@ class _Context:
                              f"got '{op_precision_path}'.")
         self.set_param(ms_ctx_param.op_precision_mode, ascend_value)

+    def _set_ge_options(self, ge_options):
+        """Set ge options."""
+        for level, options in ge_options.items():
+            if level not in ['global', 'session']:
+                raise ValueError(f"For 'ascend_config', the key of ge_options must be one of "
+                                 f"('global', 'session'), but got {level}.")
+
+            if not isinstance(options, dict):
+                raise TypeError(f"For 'ge_options', the type of {level} options must be dict, "
+                                f"but got {type(options)}. The error options: {options}.")
+
+            for key, value in options.items():
+                if not isinstance(key, str):
+                    raise TypeError(f"For 'ge_options', the type of key and value must be str, "
+                                    f"but got {type(key)}. The error key is {key}.")
+                if not isinstance(value, str):
+                    raise TypeError(f"For 'ge_options', the type of key and value must be str, "
+                                    f"but got {type(value)}. The error value is {value}")
+
+        options_str = json.dumps(ge_options)
+        self.set_param(ms_ctx_param.ge_options, options_str)
+
     def _set_topo_order(self, topo_order):
         """
         Set topo order.
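A sketch of how `_set_ge_options` is reached through the public API (my own example; the CANN option name is illustrative, not taken from this diff): the outer keys must be 'global' or 'session', and every inner key/value must be a string, since the dict is serialized with json.dumps before being handed to the backend.

    import mindspore as ms

    ms.set_context(ascend_config={
        "ge_options": {
            "global": {"ge.exec.someOption": "1"},  # hypothetical option name
            "session": {},
        }
    })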
@@ -642,33 +790,81 @@ class _Context:
         options_str = json.dumps(topo_order)
         self.set_param(ms_ctx_param.topo_order, options_str)

+    def _set_hccl_watchdog(self, flag):
+        """set hccl watchdog"""
+        if not isinstance(flag, bool):
+            raise TypeError(f"For 'ascend_config', the type of 'hccl_watchdog' must be bool, but got {type(flag)}.")
+        self.set_param(ms_ctx_param.hccl_watchdog, flag)
+
+    def _set_need_ckpt(self, need_ckpt):
+        """Set need ckpt flag"""
+        if not isinstance(need_ckpt, bool):
+            raise TypeError(f"For step num, the value type should be int, but got {type(need_ckpt)}, {need_ckpt}")
+        self.set_param(ms_ctx_param.need_ckpt, need_ckpt)
+
+    def _set_cur_step_num(self, step_num):
+        """set current step num at every step begin"""
+        if not isinstance(step_num, int):
+            raise TypeError(f"For step num, the value type should be int, but got {type(step_num)}, {step_num}")
+        self.set_param(ms_ctx_param.cur_step_num, step_num)
+
+    def _set_save_checkpoint_steps(self, steps):
+        """set save checkpoint steps before run"""
+        if not isinstance(steps, int):
+            raise TypeError(f"For step num, the value type should be int, but got {type(steps)}, {steps}")
+        self.set_param(ms_ctx_param.save_checkpoint_steps, steps)
+
+    def _set_last_triggered_step(self, step):
+        """set last triggered save ckpt steps before run"""
+        if not isinstance(step, int):
+            raise TypeError(f"For step num, the value type should be int, but got {type(step)}, {step}")
+        self.set_param(ms_ctx_param.last_triggered_step, step)
+
     def _set_speedup_config_path(self, speedup_config_path):
         """"Check and set speedup config for auto parallel."""
         if speedup_config_path is None or speedup_config_path == "":
             return
-        speedup_config_real_path = os.path.
+        speedup_config_real_path = os.path.realpath(speedup_config_path)
         if not os.path.exists(speedup_config_real_path):
             raise ValueError(f"For 'ascend_config', the path to parallel_speed_up_json: "
                              f"{speedup_config_real_path} does not exist, please check whether the "
                              f"'parallel_speed_up_json_path' is correct.")
         try:
-            valid_option = {"recompute_comm_overlap": ms_ctx_param.recompute_comm_overlap,
-                            "matmul_grad_comm_overlap": ms_ctx_param.matmul_grad_comm_overlap,
-                            "enable_task_opt": ms_ctx_param.enable_task_opt,
-                            "enable_grad_comm_opt": ms_ctx_param.enable_grad_comm_opt,
-                            "
-
-                            "
+            valid_option = {"recompute_comm_overlap": (ms_ctx_param.recompute_comm_overlap, bool),
+                            "matmul_grad_comm_overlap": (ms_ctx_param.matmul_grad_comm_overlap, bool),
+                            "enable_task_opt": (ms_ctx_param.enable_task_opt, bool),
+                            "enable_grad_comm_opt": (ms_ctx_param.enable_grad_comm_opt, bool),
+                            "recompute_allgather_overlap_fagrad":
+                                (ms_ctx_param.recompute_allgather_overlap_fagrad, bool),
+                            "interleaved_matmul_comm": (ms_ctx_param.interleaved_matmul_comm, bool),
+                            "bias_add_comm_swap": (ms_ctx_param.bias_add_comm_swap, bool),
+                            "enable_opt_shard_comm_opt": (ms_ctx_param.enable_opt_shard_comm_opt, bool),
+                            "enable_begin_end_inline_opt": (ms_ctx_param.enable_begin_end_inline_opt, bool),
+                            "enable_concat_eliminate_opt": (ms_ctx_param.enable_concat_eliminate_opt, bool),
+                            "interleaved_layernorm_comm": (ms_ctx_param.interleaved_layernorm_comm, bool),
+                            "enable_allreduce_slice_to_reducescatter":
+                                (ms_ctx_param.enable_allreduce_slice_to_reducescatter, bool),
+                            "enable_interleave_split_concat_branch":
+                                (ms_ctx_param.enable_interleave_split_concat_branch, bool),
+                            "enable_offloading_packed_experts": (ms_ctx_param.enable_offloading_packed_experts, bool),
+                            "compute_communicate_fusion_level":
+                                (ms_ctx_param.compute_communicate_fusion_level, int),
+                            "enable_flash_attention_load_balance":
+                                (ms_ctx_param.enable_flash_attention_load_balance, bool),
+                            "dataset_broadcast_opt_level":
+                                (ms_ctx_param.dataset_broadcast_opt_level, int)}
             with open(speedup_config_real_path, 'r') as f:
                 speedup_config = json.load(f)
-            for
-            if not isinstance(
-            raise TypeError("key {} is not a str".format(
-            if
-            raise ValueError("key {} should be one of {}.".format(
-
-
-
+            for key, value in speedup_config.items():
+                if not isinstance(key, str):
+                    raise TypeError("key {} is not a str".format(key))
+                if key not in valid_option:
+                    raise ValueError("key {} should be one of {}.".format(key, valid_option.keys()))
+                set_func, valid_type = valid_option.get(key)
+                if not isinstance(value, valid_type):
+                    raise TypeError(f"The value type of {key} must be {valid_type}, "
+                                    f"but got value is {value} and type is {type(value)}.")
+                self.set_param(set_func, value)
         except (TypeError, ValueError) as exo:
             raise ValueError(str(exo) + "\nFor 'context.set_context', "
                              "open or load the 'speedup_config_path' file {} "
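A sketch of feeding `_set_speedup_config_path` through `ascend_config` (my own example): each JSON key must come from `valid_option` and must match its declared type (bool or int), otherwise the TypeError/ValueError above is raised.

    import json
    import mindspore as ms

    config = {
        "recompute_comm_overlap": True,         # bool-typed option
        "compute_communicate_fusion_level": 1,  # int-typed option
    }
    with open("parallel_speed_up.json", "w") as f:
        json.dump(config, f)

    ms.set_context(ascend_config={"parallel_speed_up_json_path": "parallel_speed_up.json"})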
@@ -705,8 +901,9 @@ def _context():
                  auto_parallel_search_mode=str, search_mode=str, parameter_broadcast=bool, strategy_ckpt_load_file=str,
                  strategy_ckpt_save_file=str, full_batch=bool, enable_parallel_optimizer=bool, enable_alltoall=bool,
                  all_reduce_fusion_config=list, pipeline_stages=int, pipeline_segments=int,
-
-
+                 pipeline_result_broadcast=bool, parallel_optimizer_config=dict,
+                 pipeline_config=dict,
+                 comm_fusion=dict, strategy_ckpt_config=dict, force_fp32_communication=bool)
 def set_auto_parallel_context(**kwargs):
     r"""
     Set auto parallel context, only data parallel supported on CPU.
@@ -733,8 +930,12 @@ def set_auto_parallel_context(**kwargs):
              parallel_optimizer_config    dataset_strategy
              enable_alltoall              pipeline_stages
              pipeline_config              auto_parallel_search_mode
+             force_fp32_communication     pipeline_result_broadcast
              \                            comm_fusion
              \                            strategy_ckpt_config
+             \                            group_ckpt_save_file
+             \                            auto_pipeline
+             \                            dump_local_norm
     ===========================  ===========================

     Args:
@@ -744,6 +945,8 @@ def set_auto_parallel_context(**kwargs):
                        "stand_alone" do not support gradients_mean. Default: ``False`` .
         gradient_fp32_sync (bool): Run allreduce of gradients in fp32. "stand_alone", "data_parallel"
                        and "hybrid_parallel" do not support gradient_fp32_sync. Default: ``True`` .
+        loss_repeated_mean (bool) - Indicates whether the mean operator is executed backwards when the
+                       calculation is repeated. Default: ``True`` .
         parallel_mode (str): There are five kinds of parallel modes, ``"stand_alone"`` , ``"data_parallel"`` ,
                      ``"hybrid_parallel"`` , ``"semi_auto_parallel"`` and ``"auto_parallel"`` . Note the pynative mode
                      only supports the ``"stand_alone"`` and ``"data_parallel"`` mode. Default: ``"stand_alone"`` .
@@ -758,15 +961,16 @@ def set_auto_parallel_context(**kwargs):

             - auto_parallel: Achieving parallelism automatically.
         search_mode (str): There are three kinds of shard strategy search modes: ``"recursive_programming"`` ,
-            ``"
+            ``"sharding_propagation"`` and ``"dynamic_programming"`` (Not recommended).
+            Default: ``"recursive_programming"`` .

             - recursive_programming: Recursive programming search mode. In order to obtain optimal performance,
               it is recommended that users set the batch size to be greater than or equal to the product of
               the number of devices and the number of multi-copy parallelism.

-            - dynamic_programming: Dynamic programming search mode.
-
             - sharding_propagation: Propagate shardings from configured ops to non-configured ops.
+
+            - dynamic_programming: Dynamic programming search mode.
         auto_parallel_search_mode (str): This is the old version of 'search_mode'. Here, remaining this attribute is
             for forward compatibility, and this attribute will be deleted in a future MindSpore version.
         parameter_broadcast (bool): Whether to broadcast parameters before training. Before training, in order to have
@@ -792,6 +996,9 @@ def set_auto_parallel_context(**kwargs):
                        data parallel training in the benefit of time and memory saving. Currently, auto and semi auto
                        parallel mode support all optimizers in both Ascend and GPU. Data parallel mode only supports
                        `Lamb` and `AdamWeightDecay` in Ascend . Default: ``False`` .
+        force_fp32_communication (bool): A switch that determines whether reduce operators (AllReduce, ReduceScatter)
+                       are forced to use the fp32 data type for communication during communication. True is the enable
+                       switch. Default: ``False`` .
         enable_alltoall (bool): A switch that allows AllToAll operators to be generated during communication. If its
                        value is ``False`` , there will be a combination of operators such as AllGather, Split and
                        Concat instead of AllToAll. Default: ``False`` .
@@ -801,6 +1008,8 @@ def set_auto_parallel_context(**kwargs):
                        distributed alone in the pipeline. The total devices will be divided into 'pipeline_stags'
                        stages.
                        Default: ``1`` .
+        pipeline_result_broadcast (bool): A switch that broadcast the last stage result to all other stage in pipeline
+                       parallel inference. Default: ``False`` .
         pipeline_config (dict): A dict contains the keys and values for setting the pipeline parallelism configuration.
                        It supports the following keys:

@@ -866,14 +1075,21 @@ def set_auto_parallel_context(**kwargs):
             - load_file (str): The path to load parallel strategy checkpoint. If the file name extension is
               `.json`, the file is loaded in JSON format. Otherwise, the file is loaded in ProtoBuf
               format.
-              Default: ''
+              Default: ``''``

             - save_file (str): The path to save parallel strategy checkpoint. If the file name extension is
               `.json`, the file is saved in JSON format. Otherwise, the file is saved in ProtoBuf format.
-              Default: ''
+              Default: ``''``

             - only_trainable_params (bool): Only save/load the strategy information for trainable parameter.
               Default: ``True`` .
+        group_ckpt_save_file (str): The path to save parallel group checkpoint.
+        auto_pipeline (bool): Set the pipeline stage number to automatic. Its value will be selected between 1 and the
+            parameter `pipeline_stages`. This option requires the `parallel_mode` to be ``auto_parallel``
+            and the `search_mode` to be ``recursive_programming``. Default: ``False`` .
+        dump_local_norm (bool): Whether to dump local_norm value, when the `parallel_mode` is set to
+            ``semi_auto_parallel`` or ``auto_parallel``.
+            Default: ``False`` .

     Raises:
         ValueError: If input key is not attribute in auto parallel context.
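A sketch that combines the newly documented keyword arguments (my own example; it assumes a launched multi-device Ascend job, and the file path is illustrative):

    import mindspore as ms

    ms.set_auto_parallel_context(
        parallel_mode="auto_parallel",
        search_mode="recursive_programming",   # required by auto_pipeline
        pipeline_stages=4,
        auto_pipeline=True,                    # pick a stage count in [1, pipeline_stages]
        force_fp32_communication=True,         # AllReduce/ReduceScatter in fp32
        dump_local_norm=True,
        group_ckpt_save_file="./group_info.pb",  # hypothetical path
    )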
@@ -885,8 +1101,8 @@ def set_auto_parallel_context(**kwargs):
         >>> ms.set_auto_parallel_context(gradients_mean=True)
         >>> ms.set_auto_parallel_context(gradient_fp32_sync=False)
         >>> ms.set_auto_parallel_context(parallel_mode="auto_parallel")
-        >>> ms.set_auto_parallel_context(search_mode="
-        >>> ms.set_auto_parallel_context(auto_parallel_search_mode="
+        >>> ms.set_auto_parallel_context(search_mode="recursive_programming")
+        >>> ms.set_auto_parallel_context(auto_parallel_search_mode="recursive_programming")
         >>> ms.set_auto_parallel_context(parameter_broadcast=False)
         >>> ms.set_auto_parallel_context(strategy_ckpt_load_file="./strategy_stage1.ckpt")
         >>> ms.set_auto_parallel_context(strategy_ckpt_save_file="./strategy_stage1.ckpt")
@@ -895,6 +1111,7 @@ def set_auto_parallel_context(**kwargs):
         >>> ms.set_auto_parallel_context(enable_alltoall=False)
         >>> ms.set_auto_parallel_context(all_reduce_fusion_config=[8, 160])
         >>> ms.set_auto_parallel_context(pipeline_stages=2)
+        >>> ms.set_auto_parallel_context(pipeline_stages=2, pipeline_result_broadcast=True)
         >>> parallel_config = {"gradient_accumulation_shard": True, "parallel_optimizer_threshold": 24,
         ...                    "optimizer_weight_shard_size": 2}
         >>> ms.set_auto_parallel_context(parallel_optimizer_config=parallel_config, enable_parallel_optimizer=True)
@@ -943,15 +1160,20 @@ def reset_auto_parallel_context():
     - strategy_ckpt_save_file: ''.
     - full_batch: False.
     - enable_parallel_optimizer: False.
+    - force_fp32_communication: False.
     - enable_alltoall: False.
     - pipeline_stages: 1.
+    - pipeline_result_broadcast: False.
     - fusion_threshold: 64.
+    - dump_local_norm: False.
+    - auto_pipeline: False.

     Examples:
         >>> import mindspore as ms
         >>> ms.reset_auto_parallel_context()
     """
     _reset_auto_parallel_context()
+    api.ms_compile_cache.clear()


 @args_type_check(offload_config=dict)
@@ -961,7 +1183,8 @@ def set_offload_context(offload_config):

     Note:
         The offload configuration is only used if the memory offload feature is enabled
-        via mindspore.set_context(memory_offload="ON").
+        via mindspore.set_context(memory_offload="ON"), and the memory_optimize_level must be set to O0. On the Ascend
+        hardware platform, the graph compilation level must be O0.

     Args:
         offload_config (dict): A dict contains the keys and values for setting the offload context
@@ -1035,6 +1258,23 @@ def _check_target_specific_cfgs(device, arg_key):
     return False


+def _check_ascend_device_context_initialized(device_target, settings):
+    if device_target == 'Ascend' and is_initialized(device_target):
+        for key, _ in settings.items():
+            if key in ('ascend_config', 'deterministic', 'jit_compile', 'exception_dump', 'device_id'):
+                logger.warning(f"For 'context.set_context' in Ascend backend, the backend is already initialized, "
+                               "please set it before the definition of any Tensor and Parameter, and the "
+                               "instantiation and execution of any operation and net, otherwise the settings may not "
+                               "take effect. ")
+                break
+
+
+def _check_key(key):
+    if key in ('precision_mode', 'jit_compile', 'atomic_clean_policy', 'matmul_allow_hf32', 'conv_allow_hf32',
+               'op_precision_mode', 'host_scheduling_max_threshold', 'ge_options', 'op_debug_option'):
+        raise ValueError(f"Please set '{key}' through parameter ascend_config")
+
+
 @args_type_check(mode=int, precompile_only=bool, device_target=str, device_id=int, save_graphs=(bool, int),
                  save_graphs_path=str, enable_dump=bool, aoe_tune_mode=str, aoe_config=dict,
                  save_dump_path=str, enable_reduce_precision=bool, variable_memory_max_size=str,
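A sketch of the ordering that `_check_ascend_device_context_initialized` enforces (my own example): on Ascend, backend-level settings should be applied before any Tensor or Parameter is created, otherwise the warning above fires and the settings may be ignored.

    import mindspore as ms

    # Correct order: configure first ...
    ms.set_context(device_target="Ascend", device_id=0, deterministic="ON")
    # ... then create tensors / build the network.
    x = ms.Tensor([1.0, 2.0])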
@@ -1043,8 +1283,8 @@ def _check_target_specific_cfgs(device, arg_key):
                  max_device_memory=str, print_file_path=str, max_call_depth=int, env_config_path=str,
                  graph_kernel_flags=str, save_compile_cache=bool, runtime_num_threads=int, load_compile_cache=bool,
                  grad_for_scalar=bool, pynative_synchronize=bool, mempool_block_size=str, disable_format_transform=bool,
-                 op_timeout=int, deterministic=str, ascend_config=dict, jit_syntax_level=int,
-                 jit_enable_inplace_ops=bool, gpu_config=dict)
+                 op_timeout=int, deterministic=str, ascend_config=dict, jit_syntax_level=int, debug_level=int,
+                 jit_enable_inplace_ops=bool, gpu_config=dict, jit_config=dict, enable_compile_cache=bool)
 def set_context(**kwargs):
     """
     Set context for running environment.
@@ -1093,6 +1333,8 @@ def set_context(**kwargs):
     |                         |  reserve_class_name_in_scope |  CPU/GPU/Ascend            |
     |                         +------------------------------+----------------------------+
     |                         |  pynative_synchronize       |  CPU/GPU/Ascend            |
+    |                         +------------------------------+----------------------------+
+    |                         |  debug_level                 |  CPU/GPU/Ascend            |
     +-------------------------+------------------------------+----------------------------+
     | Executive Control       |  mode                        |  CPU/GPU/Ascend            |
     |                         +------------------------------+----------------------------+
@@ -1133,6 +1375,10 @@ def set_context(**kwargs):
     |                         |  jit_syntax_level            |  CPU/GPU/Ascend            |
     |                         +------------------------------+----------------------------+
     |                         |  gpu_config                  |  GPU                       |
+    |                         +------------------------------+----------------------------+
+    |                         |  jit_config                  |  CPU/GPU/Ascend            |
+    |                         +------------------------------+----------------------------+
+    |                         |  exec_order                  |  Ascend                    |
     +-------------------------+------------------------------+----------------------------+

     Args:
@@ -1142,15 +1388,21 @@ def set_context(**kwargs):
             If device target is not set, the version of MindSpore package is used.
         max_device_memory (str): Set the maximum memory available for devices. The format is "xxGB".
             Default: ``"1024GB"`` . The actual used memory size is the minimum of the available memory of the device
-            and max_device_memory. 'max_device_memory' should be set before the program runs.
+            and max_device_memory. 'max_device_memory' should be set before the program runs. When virtual memory is
+            enabled, a too small 'max_device_memory' will cause frequent defragmentation, affecting performance.
         variable_memory_max_size (str): This parameter is deprecated, and will be removed in a future version.
             Please use parameter 'max_device_memory' instead.
-        mempool_block_size (str):
-            The format is "xxGB". Default: ``"1GB"`` . Minimum size is "1G". The actual used memory
-            minimum of the available memory of the device and mempool_block_size.
+        mempool_block_size (str): It takes effect when virtual memory is turned off, set the size of the memory pool
+            block for devices. The format is "xxGB". Default: ``"1GB"`` . Minimum size is "1G". The actual used memory
+            block size is the minimum of the available memory of the device and mempool_block_size. When there is
+            enough memory, the memory will be expanded by this value.
         op_timeout (int): Set the maximum duration of executing an operator in seconds.
-            If the execution time exceeds this value, system will terminate the task.
-
+            If the execution time exceeds this value, system will terminate the task.
+            0 means endless wait. The defaults for AI Core and AICPU operators vary on different hardware.
+            For more information,
+            please refer to `Ascend Community document about aclrtSetOpExecuteTimeOut
+            <https://www.hiascend.com/document/detail/en/CANNCommunityEdition/600alphaX/infacldevg/aclcppdevg/aclcppdevg_03_0069.html>`_.
+            Default: ``900`` .
         save_graphs (bool or int): Whether to save intermediate compilation graphs. Default: ``0`` .
             Available values are:

@@ -1159,10 +1411,13 @@ def set_context(**kwargs):
             - True or 2: Generate more ir files related to backend process.
             - 3: Generate visualization computing graphs and detailed frontend ir graphs.

+            When the network structure is complex, setting `save_graphs` attribute to ``2`` or ``3`` may take too long.
+            If you need quick problem locating, you can switch to ``1`` first.
+
             When the `save_graphs` attribute is set as ``True`` , ``1`` , ``2`` or ``3`` , attribute of
             `save_graphs_path` is used to set the intermediate compilation graph storage path. By default, the graphs
             are saved in the current directory.
-        save_graphs_path (str): Path to save graphs. Default: "."
+        save_graphs_path (str): Path to save graphs. Default: ``"."``.
             If the specified directory does not exist, the system will automatically create the directory.
             During distributed training, graphs will be saved to the directory of
             `save_graphs_path/rank_${rank_id}/`. `rank_id` is the ID of the current device in the cluster.
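A sketch of the save_graphs guidance above (my own example): start with level ``1`` for quick problem locating, and move to ``2``/``3`` only when the extra backend/visualization detail is worth the longer dump time.

    import mindspore as ms

    # Frontend IR only; files land under ./ir_dump (rank_${rank_id}/ when distributed).
    ms.set_context(save_graphs=1, save_graphs_path="./ir_dump")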
@@ -1182,6 +1437,8 @@ def set_context(**kwargs):
             If the saved file already exists, the timestamp suffix will be added to the file. Saving data to a file
             solves the problem of data loss in screen printing when a large amount of data is generated.
             If it is not set, an error will be reported: prompt to set the upper absolute path.
+            When print data to file, the total output bytes of single print must be less then 2GB(limited by
+            protobuf).
         env_config_path (str): Config path for DFX.
             Through mindspore.set_context(env_config_path="./mindspore_config.json")

@@ -1226,7 +1483,7 @@ def set_context(**kwargs):
             If enable_graph_kernel is set to ``True`` , acceleration can be enabled.
             For details of graph kernel fusion, please check
             `Enabling Graph Kernel Fusion
-            <https://www.mindspore.cn/
+            <https://www.mindspore.cn/docs/en/master/model_train/optimize/graph_fusion_engine.html>`_.
         graph_kernel_flags (str):
             Optimization options of graph kernel fusion, and the priority is higher when it conflicts
             with enable_graph_kernel. Only for experienced users.
@@ -1251,6 +1508,11 @@ def set_context(**kwargs):
               Be caution when using this level.

             - dump_as_text: dumps detail info as text files. Default: ``False`` .
+            - enable_cluster_ops: Add user-specified operator to the set of operators involved in fusion. For example,
+              by setting ``--enable_cluster_ops=MatMul``, MatMul operator can be included in the fusion process.
+            - enable_pass/disable_pass: Enable/disable user-specified custom fusion passes. See details in
+              `Custom Fusion Pass
+              <https://www.mindspore.cn/docs/en/master/model_train/custom_program/fusion_pass.html>`_.

         enable_reduce_precision (bool): Whether to enable precision reduction.
             If the operator does not support the user-specified precision, the precision will
@@ -1281,8 +1543,9 @@ def set_context(**kwargs):
             if enable_compile_cache is still set to ``True`` and the network scripts are not changed,
             the compile cache is loaded. Note that only limited automatic detection for the changes of
             python scripts is supported by now, which means that there is a correctness risk. Default: ``False`` .
+            Currently, do not support the graph which is larger than 2G after compiled.
             This is an experimental prototype that is subject to change and/or deletion.
-        compile_cache_path (str): Path to save the compile cache. Default: "."
+        compile_cache_path (str): Path to save the compile cache. Default: ``"."``.
             If the specified directory does not exist, the system will automatically create the directory.
             The cache will be saved to the directory of `compile_cache_path/rank_${rank_id}/`. The `rank_id` is
             the ID of the current device in the cluster.
@@ -1290,7 +1553,8 @@ def set_context(**kwargs):
             which means use the default num.
         runtime_num_threads(int): The thread pool number of cpu kernel used in runtime,
             which must bigger than or equal to 0. Default value is ``30`` , if you run many processes at
-            the same time, you should set the value smaller to avoid thread contention.
+            the same time, you should set the value smaller to avoid thread contention. If set runtime_num_threads to 1,
+            the runtime asynchronous pipeline capability cannot be enabled, which may affect performance.
         disable_format_transform (bool): Whether to disable the automatic format transform function from NCHW to NHWC.
             When the network training performance of fp16 is worse than fp32, `disable_format_transform` can be set to
             ``True`` to try to improve training performance. Default: ``False`` .
@@ -1299,16 +1563,18 @@ def set_context(**kwargs):
             of the interfaces would be compiled by MindSpore to the interfaces definition .py file that should be
             guaranteed to be writable. Then compile the .py file to the .pyc or .so file, and could run in Graph mode.
         memory_optimize_level (str): The memory optimize level.
-
+            On Ascend hardware platform, default: ``O1``, on other hardware platforms, default: ``O0``.
+            The value must be in ['O0', 'O1'].

-            - O0: priority performance option, disable SOMAS (Safe Optimized Memory Allocation Solver)
-
+            - O0: priority performance option, disable SOMAS (Safe Optimized Memory Allocation Solver)
+              and some other memory optimizations.
+            - O1: priority memory option, enable SOMAS and some other memory optimizations.
         memory_offload (str): Whether to enable the memory offload function. When it is enabled, the idle data will be
             temporarily copied to the host side in the case of insufficient device memory. The value must be in the
             range of ['ON', 'OFF'], and the default value is ``'OFF'`` .

             - ON: Enable the memory Offload function. On Ascend hardware platform, this parameter does not take effect
-              when the
+              when the graph compilation level is not 'O0'; This parameter does not take effect when
              memory_optimize_level is set 'O1'.
             - OFF: Turn off the memory Offload function.
         ascend_config (dict): Set the parameters specific to Ascend hardware platform. It is not set by default.
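A sketch combining the memory knobs documented above (my own example; sizes are illustrative): memory offload requires `memory_optimize_level="O0"`, and on Ascend the graph compilation level must also be O0.

    import mindspore as ms

    ms.set_context(
        max_device_memory="28GB",     # upper bound actually usable on the device
        mempool_block_size="4GB",     # pool growth granularity when virtual memory is off
        memory_optimize_level="O0",   # required for memory_offload
        memory_offload="ON",
    )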
@@ -1319,22 +1585,27 @@ def set_context(**kwargs):
|
|
|
1319
1585
|
is ``force_fp16`` . The value range is as follows:
|
|
1320
1586
|
|
|
1321
1587
|
- force_fp16: When the operator supports both float16 and float32, select float16 directly.
|
|
1322
|
-
- allow_fp32_to_fp16:
|
|
1323
|
-
the
|
|
1588
|
+
- allow_fp32_to_fp16: For cube operators, use the float16. For vector operators,
|
|
1589
|
+
prefer to keep the origin dtype, if the operator in model can support float32,
|
|
1590
|
+
it will keep original dtype, otherwise it will reduce to float16.
|
|
1324
1591
|
- allow_mix_precision: Automatic mixing precision, facing the whole network operator, according
|
|
1325
1592
|
to the built-in optimization strategy, automatically reduces the precision of some operators
|
|
1326
1593
|
to float16 or bfloat16.
|
|
1327
1594
|
- must_keep_origin_dtype: Keep the accuracy of the original drawing.
|
|
1328
1595
|
- force_fp32: When the input of the matrix calculation operator is float16 and the output supports
|
|
1329
1596
|
float16 and float32, output is forced to float32.
|
|
1330
|
-
- allow_fp32_to_bf16:
|
|
1331
|
-
the
|
|
1597
|
+
- allow_fp32_to_bf16: For cube operators, use the bfloat16. For vector operators,
|
|
1598
|
+
prefer to keep the origin dtype, if the operator in model can support float32,
|
|
1599
|
+
it will keep original dtype, otherwise it will reduce to bfloat16.
|
|
1332
1600
|
- allow_mix_precision_fp16: Automatic mixing precision, facing the whole network operator, automatically
|
|
1333
1601
|
reduces the precision of some operators to float16 according to the built-in optimization strategy.
|
|
1334
1602
|
- allow_mix_precision_bf16: Automatic mixing precision, facing the whole network operator, according to
|
|
1335
1603
|
the built-in optimization strategy, automatically reduces the precision of some operators to bfloat16.
|
|
1336
1604
|
|
|
1337
|
-
- jit_compile (bool): Whether to select online compilation.
|
|
1605
|
+
- jit_compile (bool): Whether to select online compilation. When set to 'True', online compilation is
|
|
1606
|
+
prioritized. When set to 'False', compiled operator binary files are prioritized to improve compilation
|
|
1607
|
+
performance. The default settings are online compilation for static shape, and compiled operator binary
|
|
1608
|
+
files for dynamic shape.
|
|
1338
1609
|
- atomic_clean_policy (int): The policy for cleaning memory occupied by atomic operators in the network.
|
|
1339
1610
|
Default: ``1`` .
|
|
1340
1611
|
|
|
@@ -1350,24 +1621,76 @@ def set_context(**kwargs):
|
|
|
1350
1621
|
For detailed information, please refer to `Ascend community <https://www.hiascend.com/>`_ .
|
|
1351
1622
|
- exception_dump (str): Enable exception dump for Ascend operators, providing the input and output data for
|
|
1352
1623
|
failing Ascend operators. The value can be ``"0"`` , ``"1"`` and ``"2"``. For ``"0"`` , exception dump is
|
|
1353
|
-
turned off; for ``"1"``, all inputs and outputs will be dumped for AICore
|
|
1354
|
-
for ``"2"``, inputs will be dumped for AICore exception operators
|
|
1624
|
+
turned off; for ``"1"``, all inputs and outputs will be dumped for AICore exception operators;
|
|
1625
|
+
for ``"2"``, inputs will be dumped for AICore exception operators, reducing the saved information
|
|
1626
|
+
but improving performance. Default: ``"2"`` .
|
|
1355
1627
|
- op_precision_mode (str): Path to config file of op precision mode. For detailed information, please refer
|
|
1356
1628
|
to `Ascend community <https://www.hiascend.com/>`_ .
|
|
1629
|
+
- op_debug_option (str): Enable debugging options for Ascend operators, default not enabled.
|
|
1630
|
+
The value currently only supports being set to ``"oom"``.
|
|
1631
|
+
|
|
1632
|
+
- ``"oom"``: When there is a memory out of bounds during the execution of an operator,
|
|
1633
|
+
AscendCL will return an error code of ``EZ9999``.
|
|
1634
|
+
|
|
1635
|
+
- ge_options (dict): Set options for CANN. The options are divided into two categories: global and session.
|
|
1636
|
+
This is an experimental prototype that is subject to change and/or deletion.
|
|
1637
|
+
For detailed information, please refer to `Ascend community <https://www.hiascend.com/document/detail/zh/canncommercial/70RC1/inferapplicationdev/graphdevg/atlasgeapi_07_0119.html>`_ .
|
|
1638
|
+
The configuration options in `ge_options` may be duplicated with the options in `ascend_config`. If the
|
|
1639
|
+
same configuration options are set in both `ascend_config` and `ge_options`, the one set in `ge_options`
|
|
1640
|
+
shall prevail.
|
|
1641
|
+
|
|
1642
|
+
- global (dict): Set global options.
|
|
1643
|
+
- session (dict): Set session options.
|
|
1644
|
+
|
|
             - parallel_speed_up_json_path(Union[str, None]): The path to the parallel speed up json file; the configuration
               can refer to `parallel_speed_up.json
-              <https://gitee.com/mindspore/mindspore/blob/
+              <https://gitee.com/mindspore/mindspore/blob/master/config/parallel_speed_up.json>`_ .
               If its value is None or '', it does not take effect. Default: None.

                 - recompute_comm_overlap (bool): Enable overlap between recompute ops and communication ops if True.
                   Default: False.
-                - matmul_grad_comm_overlap (bool): Enable overlap between
+                - matmul_grad_comm_overlap (bool): Enable overlap between dw matmul and
+                  tensor parallel communication ops if True. Default: False.
+                - recompute_allgather_overlap_fagrad (bool): Enable overlap between the allgather operators duplicated
+                  by recompute in sequence parallel and flashattentionscoregrad ops if True. Default: False.
+                - enable_task_opt (bool): Enable communication fusion to optimize the number of communication operator
+                  tasks if True.
                   Default: False.
-                -
+                - enable_grad_comm_opt (bool): Enable overlap between dx ops and data parallel communication ops if True.
+                  Currently, does not support
+                  `LazyInline <https://www.mindspore.cn/docs/en/master/api_python/mindspore/mindspore.lazy_inline.html>`_ .
                   Default: False.
-                -
-
+                - enable_opt_shard_comm_opt (bool): Enable overlap between forward ops
+                  and optimizer parallel allgather communication if True. Currently, does not support
+                  `LazyInline <https://www.mindspore.cn/docs/en/master/api_python/mindspore/mindspore.lazy_inline.html>`_ .
                   Default: False.
+                - compute_communicate_fusion_level (int): Enable fusion between computation and communication.
+                  Default: ``0``. Note: this feature must be used with Ascend Training Solution 24.0.RC2 or later.
+
+                    - 0: Disable fusion.
+
+                    - 1: Apply fusion to forward nodes.
+
+                    - 2: Apply fusion to backward nodes.
+
+                    - 3: Apply fusion to all nodes.
+                - dataset_broadcast_opt_level (int): Optimize the scenario where the dataset is read repeatedly. Only
+                  the O0/O1 jit level is supported; it does not work in O2 mode. Default: ``0``.
+
+                    - 0: Disable this optimization.
+
+                    - 1: Optimize dataset reading between pipeline stages.
+
+                    - 2: Optimize dataset reading within a pipeline stage.
+
+                    - 3: Optimize dataset reading in all scenarios.
+                - bias_add_comm_swap (bool): Enable swapping the execution order of communication operators and add
+                  operators if ``True``. Only 1-dimensional bias nodes are supported. Default: ``False``.
+                - host_scheduling_max_threshold(int): The max threshold to control whether the dynamic shape process is
+                  used when running a static graph; the default value is 0. When the number of operations in the static
+                  graph is less than the max threshold, the graph will be executed in the dynamic shape process. In large
+                  model scenarios, this approach can save stream resources. If the number of operations in the static
+                  graph is greater than the max threshold, the graph will be executed in the original static process.
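Because these sub-options live in the json file rather than in `set_context` kwargs, a sketch of the wiring may help. The json keys below are an assumption based on the bullet names above; the linked parallel_speed_up.json template is the authoritative schema:

```python
import json
import mindspore as ms

# Hypothetical parallel_speed_up.json built from the option names documented
# above (assumed keys; verify against the linked template).
speed_up_conf = {
    "recompute_comm_overlap": False,
    "matmul_grad_comm_overlap": True,
    "compute_communicate_fusion_level": 1,
    "dataset_broadcast_opt_level": 1,
}
with open("parallel_speed_up.json", "w", encoding="utf-8") as f:
    json.dump(speed_up_conf, f)

ms.set_context(ascend_config={"parallel_speed_up_json_path": "./parallel_speed_up.json"})
```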

         jit_syntax_level (int): Set JIT syntax level for graph compiling, triggered by GRAPH_MODE and @jit decorator.
             The value must be ``STRICT`` or ``LAX``. Default: ``LAX``. All levels support all backends.
@@ -1378,6 +1701,12 @@ def set_context(**kwargs):
             affected and not optimal. Cannot be used for MindIR load and export due to some syntax that may not be
             able to be exported.

+        debug_level (int): Set config for debugging. Default value: ``RELEASE``.
+
+            - ``RELEASE``: Used for normal runs; some debug information is discarded to obtain better
+              compiling performance.
+            - ``DEBUG``: Used for debugging when errors occur; more information is recorded during compilation.
+
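The Examples hunk below exercises this option; in practice one would flip it on only while diagnosing a compile-time failure (sketch):

```python
import mindspore as ms

# DEBUG records extra information during compilation at the cost of compile
# speed; RELEASE (the default) discards it for better compiling performance.
ms.set_context(debug_level=ms.context.DEBUG)
```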
         gpu_config (dict): Set the parameters specific to gpu hardware platform. It is not set by default.
             Currently, only setting `conv_fprop_algo`, `conv_dgrad_algo`, `conv_wgrad_algo`, `conv_allow_tf32`,
             and `matmul_allow_tf32` is supported on the GPU hardware platform.
@@ -1449,6 +1778,39 @@
             - matmul_allow_tf32 (bool): This flag controls whether to allow Tensor Core TF32 computation on CUBLAS;
               the default value is ``False``.

+        jit_config (dict): Set the global jit config for compilation; it takes effect for networks defined with
+            Cell or jit decorators. It is not set by default.
+            The setting in context is the global jit config, while JitConfig is the local network's jit config.
+            When both exist simultaneously, the global jit config will not overwrite the local network's jit config.
+
+            - jit_level (str): Used to control the compilation optimization level. Default: ``""``. The framework
+              automatically selects the optimization level based on the product: Atlas training products use O2,
+              and all other products use O0. In addition, dynamic shape requires O0 or O1; O2 is not supported.
+              The value range is as follows:
+
+                - ``"O0"``: Except for optimizations that may affect functionality, all other optimizations are
+                  turned off; adopts KernelByKernel execution mode.
+                - ``"O1"``: Uses commonly applied optimizations and automatic operator fusion optimizations;
+                  adopts KernelByKernel execution mode. This optimization level is experimental and is being improved.
+                - ``"O2"``: Ultimate performance optimization; adopts Sink execution mode.
+
+            - infer_boost (str): Used to control the infer mode. Default: ``"off"``. The value range is as follows:
+
+                - ``"on"``: Enable infer mode to get better inference performance.
+                - ``"off"``: Disable infer mode and use the forward pass to infer; performance is not good.
+
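A hedged sketch of the precedence rule described above, using the `JitConfig` class the docstring refers to (attaching the local config to a particular network is omitted here):

```python
import mindspore as ms
from mindspore import JitConfig

# Global default for every network compiled in this process.
ms.set_context(jit_config={"jit_level": "O1"})

# A network-local JitConfig, where one is set, is not overwritten by the
# global setting above.
local_cfg = JitConfig(jit_level="O0")
```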
+        exec_order (str): Set the sorting method for operator execution in GRAPH_MODE. Currently, three sorting
+            methods are supported: bfs, dfs, and gpto; the default method is bfs.
+
+            - ``"bfs"``: The default sorting method: breadth-first, good communication masking, relatively good
+              performance.
+            - ``"dfs"``: An optional sorting method: depth-first sorting. The performance is relatively worse than
+              that of the bfs execution order, but it occupies less memory. It is recommended to try dfs in
+              scenarios where other execution orders run out of memory (OOM).
+            - ``"gpto"``: An optional sorting method. This method combines multiple execution orders and selects
+              one with relatively good performance. There may be some performance gains in scenarios with multiple
+              replicas running in parallel.
+
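For instance, a memory-constrained run can switch execution order as the dfs bullet suggests (a sketch; the best choice depends on the model):

```python
import mindspore as ms

ms.set_context(mode=ms.GRAPH_MODE)
# The default "bfs" order ran out of device memory for this model, so try
# the memory-friendlier depth-first order.
ms.set_context(exec_order="dfs")
```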
     Raises:
         ValueError: If input key is not an attribute in context.

@@ -1482,16 +1844,24 @@ def set_context(**kwargs):
         >>> ms.set_context(memory_offload='ON')
         >>> ms.set_context(deterministic='ON')
         >>> ms.set_context(ascend_config={"precision_mode": "force_fp16", "jit_compile": True,
-        ...                               "atomic_clean_policy": 1, "op_precision_mode": "./op_precision_config_file"
+        ...                               "atomic_clean_policy": 1, "op_precision_mode": "./op_precision_config_file",
+        ...                               "op_debug_option": "oom",
+        ...                               "ge_options": {"global": {"ge.opSelectImplmode": "high_precision"},
+        ...                                              "session": {"ge.exec.atomicCleanPolicy": "0"}}})
         >>> ms.set_context(jit_syntax_level=ms.STRICT)
+        >>> ms.set_context(debug_level=ms.context.DEBUG)
         >>> ms.set_context(gpu_config={"conv_fprop_algo": "performance", "conv_allow_tf32": True,
         ...                            "matmul_allow_tf32": True})
+        >>> ms.set_context(jit_config={"jit_level": "O0"})
+        >>> ms.set_context(exec_order="gpto")
     """
     ctx = _context()
     # set device target first
     if 'device_target' in kwargs:
         ctx.set_device_target(kwargs['device_target'])
     device = ctx.get_param(ms_ctx_param.device_target)
+    _check_ascend_device_context_initialized(device, kwargs)
+
     for key, value in kwargs.items():
         if key in ('enable_sparse', 'auto_tune_mode'):
             logger.warning(f"For 'context.set_context', '{key}' parameter is deprecated, "
@@ -1501,9 +1871,7 @@ def set_context(**kwargs):
             logger.warning(f"For 'context.set_context', '{key}' parameter is deprecated. "
                            "For details, please see the interface parameter API comments")
             continue
-
-                   'op_precision_mode'):
-            raise ValueError(f"Please set '{key}' through parameter ascend_config")
+        _check_key(key)
         if key == 'save_graphs':
             if value is True:
                 value = 2
@@ -1514,14 +1882,21 @@ def set_context(**kwargs):
         if key == 'jit_syntax_level' and value not in (STRICT, COMPATIBLE, LAX):
             raise ValueError(f"For 'jit_syntax_level', the value should be context.STRICT"
                              f" or context.LAX, but got {value}.")
-        if not
-
-
+        if key == 'debug_level' and value not in (RELEASE, DEBUG):
+            raise ValueError(f"For 'debug_level', the value should be context.DEBUG"
+                             f" or context.RELEASE, but got {value}.")
+        if key == 'enable_compile_cache':
             setattr(ctx, key, value)
+            ctx.set_param(ms_ctx_param.__members__[key], int(value))
+            continue
+        if not _check_target_specific_cfgs(device, key):
             continue
         if key in ctx.setters:
             ctx.setters[key](ctx, value)
             continue
+        if hasattr(ctx, key):
+            setattr(ctx, key, value)
+            continue
         # enum variables beginning with '_' are for internal use
         if key in ms_ctx_param.__members__ and key[0] != '_':
             ctx.set_param(ms_ctx_param.__members__[key], value)
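The rewritten loop gives each keyword a fixed dispatch order. A condensed illustration of that order (derived from the diff above and simplified; not the actual implementation):

```python
# Simplified view of how the new set_context body routes each kwarg.
def _dispatch(ctx, device, key, value):
    _check_key(key)                                   # reject keys that must go via ascend_config
    if key == 'enable_compile_cache':                 # special case: attribute plus raw param
        setattr(ctx, key, value)
        ctx.set_param(ms_ctx_param.__members__[key], int(value))
        return
    if not _check_target_specific_cfgs(device, key):  # skip keys foreign to this backend
        return
    if key in ctx.setters:                            # 1) dedicated setter
        ctx.setters[key](ctx, value)
    elif hasattr(ctx, key):                           # 2) plain attribute (new in 2.4.0)
        setattr(ctx, key, value)
    elif key in ms_ctx_param.__members__ and key[0] != '_':
        ctx.set_param(ms_ctx_param.__members__[key], value)  # 3) raw context param
```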
@@ -1571,6 +1946,17 @@ def _get_mode():
     return ctx.get_mode()


+def get_jit_config():
+    """
+    Get the global jit config.
+
+    Returns:
+        Object: The value of the jit config.
+    """
+    ctx = _context()
+    return ctx.get_jit_config()
+
+
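A short usage sketch for the new helper, assuming it is exposed as `mindspore.context.get_jit_config` (it is defined in this module):

```python
from mindspore import context

context.set_context(jit_config={"jit_level": "O0"})
cfg = context.get_jit_config()   # returns the global jit config set above
print(cfg)
```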
 class ParallelMode:
     """
     Parallel mode options.
@@ -1668,9 +2054,7 @@ def get_ps_context(attr_key):

 def reset_ps_context():
     """
-    Reset parameter server training mode context attributes to the default values
-
-    - enable_ps: False.
+    Reset parameter server training mode context attributes to the default values.

     For the meaning of each field and its default value, refer to :func:`mindspore.set_ps_context`.