PyPI - mindspore - Versions diffs - 2.4.10__cp39-cp39-win_amd64.whl → 2.6.0rc1__cp39-cp39-win_amd64.whl - Mend

mindspore 2.4.10__cp39-cp39-win_amd64.whl → 2.6.0rc1__cp39-cp39-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mindspore might be problematic. Click here for more details.

Files changed (577) hide show

mindspore/.commit_id +1 -1
mindspore/__init__.py +13 -6
mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
mindspore/_check_jit_forbidden_api.py +3 -0
mindspore/_checkparam.py +3 -38
mindspore/_deprecated/__init__.py +17 -0
mindspore/_deprecated/jit.py +198 -0
mindspore/_extends/builtin_operations.py +1 -1
mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
mindspore/_extends/parse/__init__.py +6 -7
mindspore/_extends/parse/compile_config.py +83 -0
mindspore/_extends/parse/deprecated/__init__.py +0 -0
mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +394 -0
mindspore/_extends/parse/jit_fallback_modules/__init__.py +0 -0
mindspore/_extends/parse/jit_fallback_modules/check_utils.py +123 -0
mindspore/_extends/parse/jit_fallback_modules/third_party_modules.py +50 -0
mindspore/_extends/parse/parser.py +46 -197
mindspore/_extends/parse/resources.py +1 -5
mindspore/_extends/parse/standard_method.py +217 -98
mindspore/_extends/pijit/__init__.py +2 -2
mindspore/_extends/pijit/pijit_func_white_list.py +17 -12
mindspore/_extends/pijit/tensor_func_list.py +27 -0
mindspore/_extends/utils.py +1 -1
mindspore/amp.py +11 -5
mindspore/avcodec-59.dll +0 -0
mindspore/avdevice-59.dll +0 -0
mindspore/avfilter-8.dll +0 -0
mindspore/avformat-59.dll +0 -0
mindspore/avutil-57.dll +0 -0
mindspore/boost/__init__.py +2 -2
mindspore/boost/base.py +3 -7
mindspore/boost/boost_cell_wrapper.py +138 -43
mindspore/common/__init__.py +6 -3
mindspore/common/_grad_function.py +56 -0
mindspore/common/_pijit_context.py +14 -5
mindspore/common/_register_for_tensor.py +1 -2
mindspore/common/_stub_tensor.py +30 -14
mindspore/common/_tensor_cpp_method.py +17 -0
mindspore/common/_tensor_docs.py +4760 -0
mindspore/common/api.py +435 -371
mindspore/common/auto_dynamic_shape.py +41 -44
mindspore/common/dtype.py +39 -36
mindspore/common/dump.py +9 -6
mindspore/common/file_system.py +9 -1
mindspore/common/generator.py +2 -0
mindspore/common/hook_handle.py +6 -2
mindspore/common/initializer.py +13 -10
mindspore/common/jit_begin_end.py +94 -0
mindspore/common/jit_config.py +6 -1
mindspore/common/jit_context.py +76 -0
mindspore/common/jit_trace.py +378 -0
mindspore/common/lazy_inline.py +9 -3
mindspore/common/mindir_util.py +10 -2
mindspore/common/mutable.py +5 -4
mindspore/common/parameter.py +135 -52
mindspore/common/seed.py +2 -2
mindspore/common/sparse_tensor.py +23 -17
mindspore/common/tensor.py +951 -1992
mindspore/communication/__init__.py +7 -5
mindspore/communication/_comm_helper.py +52 -2
mindspore/communication/comm_func.py +240 -181
mindspore/communication/management.py +95 -26
mindspore/context.py +314 -566
mindspore/dataset/__init__.py +65 -37
mindspore/dataset/audio/__init__.py +2 -8
mindspore/dataset/audio/transforms.py +3 -17
mindspore/dataset/callback/ds_callback.py +2 -1
mindspore/dataset/core/config.py +87 -6
mindspore/dataset/engine/cache_admin.py +3 -3
mindspore/dataset/engine/cache_client.py +6 -5
mindspore/dataset/engine/datasets.py +292 -267
mindspore/dataset/engine/datasets_audio.py +22 -8
mindspore/dataset/engine/datasets_standard_format.py +46 -27
mindspore/dataset/engine/datasets_text.py +78 -48
mindspore/dataset/engine/datasets_user_defined.py +182 -116
mindspore/dataset/engine/datasets_vision.py +120 -44
mindspore/dataset/engine/iterators.py +283 -63
mindspore/dataset/engine/obs/obs_mindrecord_dataset.py +1 -1
mindspore/dataset/engine/obs/util.py +8 -0
mindspore/dataset/engine/queue.py +40 -0
mindspore/dataset/engine/samplers.py +289 -43
mindspore/dataset/engine/serializer_deserializer.py +3 -2
mindspore/dataset/engine/validators.py +53 -11
mindspore/dataset/text/__init__.py +7 -6
mindspore/dataset/text/transforms.py +6 -5
mindspore/dataset/text/utils.py +3 -3
mindspore/dataset/transforms/__init__.py +0 -9
mindspore/dataset/transforms/py_transforms_util.py +17 -0
mindspore/dataset/transforms/transforms.py +31 -14
mindspore/dataset/utils/browse_dataset.py +1 -1
mindspore/dataset/vision/__init__.py +2 -9
mindspore/dataset/vision/transforms.py +202 -158
mindspore/dataset/vision/utils.py +7 -5
mindspore/dataset/vision/validators.py +1 -2
mindspore/device_context/__init__.py +21 -0
mindspore/device_context/ascend/__init__.py +25 -0
mindspore/device_context/ascend/device.py +72 -0
mindspore/device_context/ascend/op_debug.py +153 -0
mindspore/device_context/ascend/op_precision.py +193 -0
mindspore/device_context/ascend/op_tuning.py +123 -0
mindspore/{ops_generate/gen_constants.py → device_context/cpu/__init__.py} +6 -17
mindspore/device_context/cpu/device.py +62 -0
mindspore/device_context/cpu/op_tuning.py +43 -0
mindspore/device_context/gpu/__init__.py +21 -0
mindspore/device_context/gpu/device.py +70 -0
mindspore/device_context/gpu/op_precision.py +67 -0
mindspore/device_context/gpu/op_tuning.py +175 -0
mindspore/device_manager.py +170 -0
mindspore/experimental/es/embedding_service.py +35 -27
mindspore/experimental/llm_boost/__init__.py +1 -0
mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
mindspore/experimental/llm_boost/register.py +1 -0
mindspore/experimental/map_parameter.py +4 -4
mindspore/experimental/optim/adadelta.py +6 -6
mindspore/experimental/optim/adagrad.py +4 -4
mindspore/experimental/optim/adam.py +7 -0
mindspore/experimental/optim/adamax.py +4 -4
mindspore/experimental/optim/adamw.py +4 -0
mindspore/experimental/optim/asgd.py +1 -1
mindspore/experimental/optim/lr_scheduler.py +73 -46
mindspore/experimental/optim/radam.py +34 -31
mindspore/experimental/optim/rprop.py +1 -1
mindspore/experimental/optim/sgd.py +1 -1
mindspore/hal/contiguous_tensors_handle.py +6 -10
mindspore/hal/device.py +55 -53
mindspore/hal/event.py +52 -52
mindspore/hal/memory.py +157 -117
mindspore/hal/stream.py +150 -109
mindspore/include/api/context.h +0 -1
mindspore/include/dataset/constants.h +7 -4
mindspore/include/dataset/execute.h +2 -2
mindspore/jpeg62.dll +0 -0
mindspore/log.py +50 -0
mindspore/mindrecord/__init__.py +21 -8
mindspore/mindrecord/config.py +17 -316
mindspore/mindrecord/filereader.py +1 -9
mindspore/mindrecord/filewriter.py +5 -15
mindspore/mindrecord/mindpage.py +1 -9
mindspore/mindspore_backend_common.dll +0 -0
mindspore/mindspore_backend_manager.dll +0 -0
mindspore/mindspore_common.dll +0 -0
mindspore/mindspore_core.dll +0 -0
mindspore/mindspore_dump.dll +0 -0
mindspore/mindspore_frontend.dll +0 -0
mindspore/mindspore_memory_pool.dll +0 -0
mindspore/mindspore_ms_backend.dll +0 -0
mindspore/mindspore_ops.dll +0 -0
mindspore/{mindspore_backend.dll → mindspore_ops_host.dll} +0 -0
mindspore/mindspore_ops_kernel_common.dll +0 -0
mindspore/mindspore_profiler.dll +0 -0
mindspore/mindspore_pyboost.dll +0 -0
mindspore/mindspore_pynative.dll +0 -0
mindspore/mindspore_res_manager.dll +0 -0
mindspore/mindspore_runtime_pipeline.dll +0 -0
mindspore/mint/__init__.py +796 -759
mindspore/mint/distributed/__init__.py +70 -4
mindspore/mint/distributed/distributed.py +2679 -44
mindspore/mint/linalg/__init__.py +8 -0
mindspore/mint/nn/__init__.py +743 -22
mindspore/mint/nn/functional.py +716 -23
mindspore/mint/nn/layer/__init__.py +21 -4
mindspore/mint/nn/layer/_functions.py +334 -0
mindspore/mint/nn/layer/activation.py +276 -1
mindspore/mint/nn/layer/basic.py +123 -0
mindspore/mint/nn/layer/conv.py +921 -0
mindspore/mint/nn/layer/normalization.py +223 -28
mindspore/mint/nn/layer/padding.py +797 -0
mindspore/mint/nn/layer/pooling.py +235 -0
mindspore/mint/optim/__init__.py +3 -1
mindspore/mint/optim/adam.py +223 -0
mindspore/mint/optim/adamw.py +26 -19
mindspore/mint/optim/sgd.py +171 -0
mindspore/mint/special/__init__.py +2 -1
mindspore/multiprocessing/__init__.py +5 -0
mindspore/nn/__init__.py +4 -1
mindspore/nn/cell.py +1370 -189
mindspore/nn/dynamic_lr.py +2 -1
mindspore/nn/layer/activation.py +29 -27
mindspore/nn/layer/basic.py +51 -35
mindspore/nn/layer/channel_shuffle.py +3 -3
mindspore/nn/layer/container.py +1 -1
mindspore/nn/layer/conv.py +22 -17
mindspore/nn/layer/embedding.py +12 -11
mindspore/nn/layer/normalization.py +56 -49
mindspore/nn/layer/padding.py +4 -3
mindspore/nn/layer/pooling.py +120 -42
mindspore/nn/layer/rnn_cells.py +1 -1
mindspore/nn/layer/rnns.py +2 -1
mindspore/nn/layer/timedistributed.py +5 -5
mindspore/nn/layer/transformer.py +59 -36
mindspore/nn/learning_rate_schedule.py +8 -4
mindspore/nn/loss/loss.py +58 -55
mindspore/nn/optim/ada_grad.py +7 -5
mindspore/nn/optim/adadelta.py +11 -9
mindspore/nn/optim/adafactor.py +1 -1
mindspore/nn/optim/adam.py +17 -13
mindspore/nn/optim/adamax.py +8 -7
mindspore/nn/optim/adasum.py +5 -5
mindspore/nn/optim/asgd.py +1 -1
mindspore/nn/optim/ftrl.py +11 -9
mindspore/nn/optim/lamb.py +1 -1
mindspore/nn/optim/lars.py +1 -4
mindspore/nn/optim/lazyadam.py +12 -10
mindspore/nn/optim/momentum.py +7 -6
mindspore/nn/optim/optimizer.py +3 -3
mindspore/nn/optim/proximal_ada_grad.py +12 -10
mindspore/nn/optim/rmsprop.py +13 -12
mindspore/nn/optim/rprop.py +11 -9
mindspore/nn/optim/sgd.py +9 -6
mindspore/nn/optim/tft_wrapper.py +5 -2
mindspore/nn/optim/thor.py +2 -1
mindspore/nn/probability/bijector/bijector.py +17 -11
mindspore/nn/probability/bijector/gumbel_cdf.py +5 -5
mindspore/nn/probability/bijector/invert.py +2 -2
mindspore/nn/probability/bijector/scalar_affine.py +3 -3
mindspore/nn/probability/bijector/softplus.py +3 -2
mindspore/nn/probability/distribution/beta.py +3 -3
mindspore/nn/probability/distribution/categorical.py +1 -1
mindspore/nn/probability/distribution/cauchy.py +4 -2
mindspore/nn/probability/distribution/exponential.py +6 -7
mindspore/nn/probability/distribution/gamma.py +2 -2
mindspore/nn/probability/distribution/gumbel.py +2 -2
mindspore/nn/probability/distribution/half_normal.py +5 -3
mindspore/nn/probability/distribution/logistic.py +5 -3
mindspore/nn/probability/distribution/poisson.py +1 -1
mindspore/nn/probability/distribution/uniform.py +5 -3
mindspore/nn/reinforcement/_tensors_queue.py +1 -1
mindspore/nn/reinforcement/tensor_array.py +1 -1
mindspore/nn/utils/init.py +13 -11
mindspore/nn/wrap/__init__.py +6 -6
mindspore/nn/wrap/cell_wrapper.py +181 -122
mindspore/nn/wrap/grad_reducer.py +45 -36
mindspore/nn/wrap/loss_scale.py +6 -7
mindspore/numpy/array_creations.py +63 -65
mindspore/numpy/array_ops.py +149 -144
mindspore/numpy/logic_ops.py +41 -42
mindspore/numpy/math_ops.py +365 -363
mindspore/numpy/utils.py +17 -18
mindspore/numpy/utils_const.py +5 -6
mindspore/opencv_core452.dll +0 -0
mindspore/opencv_imgcodecs452.dll +0 -0
mindspore/opencv_imgproc452.dll +0 -0
mindspore/ops/__init__.py +5 -3
mindspore/ops/_grad_experimental/grad_comm_ops.py +112 -16
mindspore/ops/_grad_experimental/grad_debug_ops.py +14 -2
mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
mindspore/ops/_grad_experimental/taylor_rule.py +29 -0
mindspore/ops/_op_impl/cpu/__init__.py +1 -0
mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
mindspore/ops/_register_for_op.py +0 -11
mindspore/{ops_generate → ops/_utils}/arg_dtype_cast.py +123 -4
mindspore/{ops_generate → ops/_utils}/arg_handler.py +3 -65
mindspore/ops/_vmap/vmap_array_ops.py +27 -25
mindspore/ops/_vmap/vmap_base.py +0 -2
mindspore/ops/_vmap/vmap_grad_nn_ops.py +21 -14
mindspore/ops/_vmap/vmap_math_ops.py +15 -16
mindspore/ops/_vmap/vmap_nn_ops.py +29 -42
mindspore/ops/auto_generate/__init__.py +4 -3
mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +236 -46
mindspore/ops/auto_generate/gen_extend_func.py +764 -124
mindspore/ops/auto_generate/gen_ops_def.py +4018 -2264
mindspore/ops/auto_generate/gen_ops_prim.py +15463 -5037
mindspore/ops/auto_generate/pyboost_inner_prim.py +221 -87
mindspore/ops/composite/__init__.py +2 -1
mindspore/ops/composite/base.py +20 -25
mindspore/ops/composite/math_ops.py +6 -16
mindspore/ops/composite/multitype_ops/__init__.py +5 -2
mindspore/ops/composite/multitype_ops/_compile_utils.py +228 -30
mindspore/ops/composite/multitype_ops/_constexpr_utils.py +1 -2
mindspore/ops/composite/multitype_ops/add_impl.py +2 -1
mindspore/ops/composite/multitype_ops/bitwise_and_impl.py +2 -1
mindspore/ops/composite/multitype_ops/bitwise_or_impl.py +2 -1
mindspore/ops/composite/multitype_ops/bitwise_xor_impl.py +2 -1
mindspore/ops/composite/multitype_ops/div_impl.py +6 -4
mindspore/ops/composite/multitype_ops/equal_impl.py +4 -3
mindspore/ops/composite/multitype_ops/floordiv_impl.py +2 -1
mindspore/ops/composite/multitype_ops/getitem_impl.py +3 -2
mindspore/ops/composite/multitype_ops/greater_equal_impl.py +4 -3
mindspore/ops/composite/multitype_ops/greater_impl.py +4 -3
mindspore/ops/composite/multitype_ops/in_impl.py +2 -1
mindspore/ops/composite/multitype_ops/invert_impl.py +50 -0
mindspore/ops/composite/multitype_ops/left_shift_impl.py +2 -1
mindspore/ops/composite/multitype_ops/less_equal_impl.py +4 -3
mindspore/ops/composite/multitype_ops/less_impl.py +4 -3
mindspore/ops/composite/multitype_ops/logic_not_impl.py +3 -2
mindspore/ops/composite/multitype_ops/logical_and_impl.py +2 -1
mindspore/ops/composite/multitype_ops/logical_or_impl.py +2 -1
mindspore/ops/composite/multitype_ops/mod_impl.py +2 -1
mindspore/ops/composite/multitype_ops/mul_impl.py +3 -2
mindspore/ops/composite/multitype_ops/negative_impl.py +2 -1
mindspore/ops/composite/multitype_ops/not_equal_impl.py +2 -1
mindspore/ops/composite/multitype_ops/not_in_impl.py +2 -1
mindspore/ops/composite/multitype_ops/ones_like_impl.py +18 -0
mindspore/ops/composite/multitype_ops/pow_impl.py +2 -30
mindspore/ops/composite/multitype_ops/right_shift_impl.py +2 -1
mindspore/ops/composite/multitype_ops/setitem_impl.py +2 -1
mindspore/ops/composite/multitype_ops/sub_impl.py +2 -1
mindspore/ops/function/__init__.py +40 -2
mindspore/ops/function/_add_attr_func.py +58 -0
mindspore/ops/function/array_func.py +2089 -2403
mindspore/ops/function/clip_func.py +80 -23
mindspore/ops/function/debug_func.py +57 -57
mindspore/ops/function/grad/__init__.py +1 -0
mindspore/ops/function/grad/grad_func.py +104 -71
mindspore/ops/function/image_func.py +2 -2
mindspore/ops/function/linalg_func.py +47 -78
mindspore/ops/function/math_func.py +4501 -3802
mindspore/ops/function/nn_func.py +1726 -620
mindspore/ops/function/other_func.py +159 -1
mindspore/ops/function/parameter_func.py +18 -84
mindspore/ops/function/random_func.py +440 -387
mindspore/ops/function/reshard_func.py +4 -70
mindspore/ops/function/sparse_func.py +3 -3
mindspore/ops/function/sparse_unary_func.py +6 -6
mindspore/ops/function/spectral_func.py +25 -58
mindspore/ops/function/vmap_func.py +24 -17
mindspore/ops/functional.py +22 -7
mindspore/ops/functional_overload.py +1440 -0
mindspore/ops/op_info_register.py +32 -244
mindspore/ops/operations/__init__.py +13 -7
mindspore/ops/operations/_custom_ops_utils.py +247 -0
mindspore/ops/operations/_embedding_cache_ops.py +4 -4
mindspore/ops/operations/_grad_ops.py +2 -43
mindspore/ops/operations/_infer_ops.py +2 -1
mindspore/ops/operations/_inner_ops.py +43 -84
mindspore/ops/operations/_ms_kernel.py +4 -10
mindspore/ops/operations/_rl_inner_ops.py +1 -1
mindspore/ops/operations/_scalar_ops.py +3 -2
mindspore/ops/operations/_sequence_ops.py +1 -1
mindspore/ops/operations/_tensor_array.py +1 -1
mindspore/ops/operations/array_ops.py +81 -324
mindspore/ops/operations/comm_ops.py +154 -108
mindspore/ops/operations/custom_ops.py +232 -78
mindspore/ops/operations/debug_ops.py +153 -59
mindspore/ops/operations/inner_ops.py +7 -5
mindspore/ops/operations/linalg_ops.py +1 -57
mindspore/ops/operations/manually_defined/_inner.py +1 -1
mindspore/ops/operations/manually_defined/ops_def.py +928 -180
mindspore/ops/operations/math_ops.py +32 -234
mindspore/ops/operations/nn_ops.py +210 -498
mindspore/ops/operations/other_ops.py +62 -9
mindspore/ops/operations/random_ops.py +13 -7
mindspore/ops/operations/reshard_ops.py +1 -1
mindspore/ops/operations/sparse_ops.py +2 -2
mindspore/ops/primitive.py +66 -53
mindspore/ops/tensor_method.py +1888 -0
mindspore/ops_generate/__init__.py +0 -5
mindspore/ops_generate/aclnn/__init__.py +0 -0
mindspore/ops_generate/aclnn/aclnn_kernel_register_auto_cc_generator.py +135 -0
mindspore/ops_generate/aclnn/gen_aclnn_implement.py +257 -0
mindspore/ops_generate/api/__init__.py +0 -0
mindspore/ops_generate/api/add_tensor_docs_generator.py +56 -0
mindspore/ops_generate/api/cpp_create_prim_instance_helper_generator.py +105 -0
mindspore/ops_generate/api/functional_map_cpp_generator.py +504 -0
mindspore/ops_generate/api/functional_overload_py_generator.py +112 -0
mindspore/ops_generate/api/functions_cc_generator.py +237 -0
mindspore/ops_generate/api/gen_api.py +103 -0
mindspore/ops_generate/api/op_api_proto.py +235 -0
mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +461 -0
mindspore/ops_generate/common/__init__.py +0 -0
mindspore/ops_generate/common/base_generator.py +11 -0
mindspore/ops_generate/common/gen_constants.py +91 -0
mindspore/ops_generate/common/gen_utils.py +348 -0
mindspore/ops_generate/common/op_proto.py +473 -0
mindspore/ops_generate/common/template.py +523 -0
mindspore/ops_generate/gen_ops.py +22 -1069
mindspore/ops_generate/op_def/__init__.py +0 -0
mindspore/ops_generate/op_def/gen_op_def.py +90 -0
mindspore/ops_generate/op_def/lite_ops_cpp_generator.py +191 -0
mindspore/ops_generate/op_def/ops_def_cc_generator.py +299 -0
mindspore/ops_generate/op_def/ops_def_h_generator.py +74 -0
mindspore/ops_generate/op_def/ops_name_h_generator.py +83 -0
mindspore/ops_generate/op_def/ops_primitive_h_generator.py +125 -0
mindspore/ops_generate/op_def_py/__init__.py +0 -0
mindspore/ops_generate/op_def_py/gen_op_def_py.py +47 -0
mindspore/ops_generate/op_def_py/op_def_py_generator.py +132 -0
mindspore/ops_generate/op_def_py/op_prim_py_generator.py +489 -0
mindspore/ops_generate/pyboost/__init__.py +0 -0
mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +139 -0
mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +93 -0
mindspore/ops_generate/pyboost/gen_pyboost_func.py +175 -0
mindspore/ops_generate/pyboost/op_template_parser.py +517 -0
mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +407 -0
mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +100 -0
mindspore/ops_generate/pyboost/pyboost_functions_py_generator.py +148 -0
mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +155 -0
mindspore/ops_generate/pyboost/pyboost_inner_prim_generator.py +132 -0
mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +272 -0
mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +938 -0
mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +357 -0
mindspore/ops_generate/{pyboost_utils.py → pyboost/pyboost_utils.py} +179 -36
mindspore/ops_generate/resources/__init__.py +0 -0
mindspore/ops_generate/resources/resource_list.py +30 -0
mindspore/ops_generate/resources/resource_loader.py +36 -0
mindspore/ops_generate/resources/resource_manager.py +64 -0
mindspore/ops_generate/resources/yaml_loader.py +88 -0
mindspore/ops_generate/tensor_py_cc_generator.py +122 -0
mindspore/parallel/__init__.py +7 -3
mindspore/parallel/_auto_parallel_context.py +152 -34
mindspore/parallel/_cell_wrapper.py +130 -15
mindspore/parallel/_parallel_serialization.py +107 -5
mindspore/parallel/_ps_context.py +1 -1
mindspore/parallel/_recovery_context.py +7 -2
mindspore/parallel/_tensor.py +142 -18
mindspore/parallel/_utils.py +199 -23
mindspore/parallel/algo_parameter_config.py +4 -4
mindspore/parallel/auto_parallel.py +732 -0
mindspore/parallel/checkpoint_convert.py +159 -0
mindspore/parallel/checkpoint_transform.py +698 -35
mindspore/parallel/cluster/process_entity/_api.py +276 -50
mindspore/parallel/cluster/process_entity/_utils.py +41 -6
mindspore/parallel/cluster/run.py +21 -4
mindspore/parallel/function/__init__.py +24 -0
mindspore/parallel/function/reshard_func.py +259 -0
mindspore/parallel/nn/__init__.py +25 -0
mindspore/parallel/nn/parallel_cell_wrapper.py +263 -0
mindspore/parallel/nn/parallel_grad_reducer.py +169 -0
mindspore/parallel/parameter_broadcast.py +25 -14
mindspore/parallel/shard.py +137 -58
mindspore/parallel/transform_safetensors.py +363 -305
mindspore/profiler/__init__.py +22 -5
mindspore/profiler/analysis/__init__.py +0 -0
mindspore/profiler/analysis/parser/__init__.py +0 -0
mindspore/profiler/analysis/parser/ascend_cann_parser.py +170 -0
mindspore/profiler/analysis/parser/base_parser.py +158 -0
mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +264 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +106 -0
mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +415 -0
mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
mindspore/profiler/analysis/task_manager.py +131 -0
mindspore/profiler/analysis/time_converter.py +84 -0
mindspore/profiler/analysis/viewer/__init__.py +0 -0
mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +372 -0
mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +250 -0
mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +320 -0
mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +327 -0
mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +376 -0
mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +96 -0
mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
mindspore/profiler/analysis/work_flow.py +73 -0
mindspore/profiler/common/ascend_msprof_exporter.py +139 -0
mindspore/profiler/common/command_executor.py +90 -0
mindspore/profiler/common/constant.py +186 -3
mindspore/profiler/common/file_manager.py +208 -0
mindspore/profiler/common/log.py +130 -0
mindspore/profiler/common/msprof_cmd_tool.py +221 -0
mindspore/profiler/common/path_manager.py +395 -0
mindspore/profiler/common/process_bar.py +168 -0
mindspore/profiler/common/process_pool.py +9 -3
mindspore/profiler/common/profiler_context.py +500 -0
mindspore/profiler/common/profiler_info.py +304 -0
mindspore/profiler/common/profiler_meta_data.py +74 -0
mindspore/profiler/common/profiler_output_path.py +284 -0
mindspore/profiler/common/profiler_parameters.py +251 -0
mindspore/profiler/common/profiler_path_manager.py +179 -0
mindspore/profiler/common/record_function.py +76 -0
mindspore/profiler/common/tlv_decoder.py +76 -0
mindspore/profiler/common/util.py +75 -2
mindspore/profiler/dynamic_profiler.py +341 -75
mindspore/profiler/envprofiler.py +163 -0
mindspore/profiler/experimental_config.py +197 -0
mindspore/profiler/mstx.py +242 -0
mindspore/profiler/platform/__init__.py +21 -0
mindspore/profiler/platform/base_profiler.py +40 -0
mindspore/profiler/platform/cpu_profiler.py +124 -0
mindspore/profiler/platform/gpu_profiler.py +74 -0
mindspore/profiler/platform/npu_profiler.py +335 -0
mindspore/profiler/profiler.py +1073 -90
mindspore/profiler/profiler_action_controller.py +187 -0
mindspore/profiler/profiler_interface.py +118 -0
mindspore/profiler/schedule.py +243 -0
mindspore/rewrite/api/node.py +15 -13
mindspore/rewrite/api/symbol_tree.py +2 -3
mindspore/run_check/_check_version.py +27 -20
mindspore/run_check/run_check.py +1 -1
mindspore/runtime/__init__.py +37 -0
mindspore/runtime/device.py +27 -0
mindspore/runtime/event.py +209 -0
mindspore/runtime/executor.py +177 -0
mindspore/runtime/memory.py +409 -0
mindspore/runtime/stream.py +460 -0
mindspore/runtime/thread_bind_core.py +401 -0
mindspore/safeguard/rewrite_obfuscation.py +12 -9
mindspore/swresample-4.dll +0 -0
mindspore/swscale-6.dll +0 -0
mindspore/tinyxml2.dll +0 -0
mindspore/train/__init__.py +8 -8
mindspore/train/_utils.py +88 -25
mindspore/train/amp.py +9 -5
mindspore/train/callback/__init__.py +2 -2
mindspore/train/callback/_callback.py +2 -16
mindspore/train/callback/_checkpoint.py +53 -55
mindspore/train/callback/_cluster_monitor.py +14 -18
mindspore/train/callback/_early_stop.py +1 -1
mindspore/train/callback/_flops_collector.py +103 -68
mindspore/train/callback/_history.py +8 -5
mindspore/train/callback/_lambda_callback.py +2 -2
mindspore/train/callback/_landscape.py +0 -3
mindspore/train/callback/_loss_monitor.py +2 -1
mindspore/train/callback/_on_request_exit.py +6 -5
mindspore/train/callback/_reduce_lr_on_plateau.py +11 -6
mindspore/train/callback/_summary_collector.py +52 -19
mindspore/train/callback/_time_monitor.py +2 -1
mindspore/train/callback/{_tft_register.py → _train_fault_tolerance.py} +204 -107
mindspore/train/data_sink.py +25 -2
mindspore/train/dataset_helper.py +15 -16
mindspore/train/loss_scale_manager.py +8 -7
mindspore/train/metrics/accuracy.py +3 -3
mindspore/train/metrics/confusion_matrix.py +9 -9
mindspore/train/metrics/error.py +3 -3
mindspore/train/metrics/hausdorff_distance.py +4 -4
mindspore/train/metrics/mean_surface_distance.py +3 -3
mindspore/train/metrics/metric.py +0 -12
mindspore/train/metrics/occlusion_sensitivity.py +4 -2
mindspore/train/metrics/precision.py +11 -10
mindspore/train/metrics/recall.py +9 -9
mindspore/train/metrics/root_mean_square_surface_distance.py +2 -2
mindspore/train/mind_ir_pb2.py +174 -46
mindspore/train/model.py +184 -113
mindspore/train/serialization.py +622 -978
mindspore/train/summary/_summary_adapter.py +2 -2
mindspore/train/summary/summary_record.py +2 -3
mindspore/train/train_thor/model_thor.py +1 -1
mindspore/turbojpeg.dll +0 -0
mindspore/utils/__init__.py +6 -3
mindspore/utils/dryrun.py +140 -0
mindspore/utils/hooks.py +81 -0
mindspore/utils/runtime_execution_order_check.py +550 -0
mindspore/utils/utils.py +138 -4
mindspore/version.py +1 -1
{mindspore-2.4.10.dist-info → mindspore-2.6.0rc1.dist-info}/METADATA +3 -3
{mindspore-2.4.10.dist-info → mindspore-2.6.0rc1.dist-info}/RECORD +562 -393
{mindspore-2.4.10.dist-info → mindspore-2.6.0rc1.dist-info}/entry_points.txt +1 -1
mindspore/_install_custom.py +0 -43
mindspore/common/_register_for_adapter.py +0 -74
mindspore/common/_tensor_overload.py +0 -139
mindspore/mindspore_np_dtype.dll +0 -0
mindspore/ops/auto_generate/gen_arg_dtype_cast.py +0 -252
mindspore/ops/auto_generate/gen_arg_handler.py +0 -197
mindspore/ops/operations/_opaque_predicate_registry.py +0 -41
mindspore/ops_generate/gen_aclnn_implement.py +0 -263
mindspore/ops_generate/gen_ops_inner_prim.py +0 -131
mindspore/ops_generate/gen_pyboost_func.py +0 -1052
mindspore/ops_generate/gen_utils.py +0 -209
mindspore/ops_generate/op_proto.py +0 -145
mindspore/ops_generate/template.py +0 -261
mindspore/profiler/envprofiling.py +0 -254
mindspore/profiler/profiling.py +0 -1926
{mindspore-2.4.10.dist-info → mindspore-2.6.0rc1.dist-info}/WHEEL +0 -0
{mindspore-2.4.10.dist-info → mindspore-2.6.0rc1.dist-info}/top_level.txt +0 -0

mindspore/nn/cell.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Copyright 2020-2024 Huawei Technologies Co., Ltd
+# Copyright 2020-2025 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -15,13 +15,26 @@
 """cell"""
 from __future__ import absolute_import
-import gc
 import inspect
 import os
 import time
-from collections import OrderedDict
-import numpy
+import warnings
+import itertools
+from collections import OrderedDict, namedtuple
+from typing import (
+    Dict,
+    Optional,
+    Set,
+    Callable,
+    List,
+    Tuple,
+    Iterator,
+    Any,
+    TypeVar,
+    Mapping
+)
+import mindspore as ms
 from mindspore._checkparam import args_type_check, check_hook_fn
 from mindspore.common._auto_dynamic import is_auto_dynamic, convert_inputs_to_dynamic
 from mindspore import log as logger
@@ -34,19 +47,62 @@ from mindspore import _checkparam as Validator
 from mindspore.common import dtype as mstype
 from mindspore.common.api import _cell_graph_executor, _pynative_executor, _get_args_for_run, cells_compile_cache, \
     _no_grad
-from mindspore.common.api import _generate_branch_control_input, _convert_python_data, _get_args_for_run_predict
+from mindspore.common.api import _convert_python_data, _get_args_for_run_predict
 from mindspore.common.api import _process_dyn_args, _generate_dyn_compile_args
-from mindspore.common.parameter import Parameter, ParameterTuple
+from mindspore.common.parameter import _Buffer, Parameter, ParameterTuple
 from mindspore.common.tensor import Tensor
 from mindspore.ops.operations import Cast
 from mindspore.ops.primitive import Primitive
 from mindspore.ops.operations import _inner_ops as inner
 from mindspore.parallel.shard import Shard
+from mindspore.parallel._utils import _init_auto_parallel_context, _clear_auto_parallel_context
 from mindspore._check_jit_forbidden_api import jit_forbidden_register
 from mindspore.common._decorator import deprecated
 from mindspore.common._register_for_recompute import recompute_registry
# Names exported by this module for `from ... import *`.
__all__ = [
    "register_cell_buffer_registration_hook",
]
# Module-level registry of global buffer registration hooks. Entries are added by
# `register_cell_buffer_registration_hook`, keyed by the id of the removable handle it
# returns; an OrderedDict is used, so hooks are kept in registration order.
_global_buffer_registration_hooks: Dict[int, Callable] = OrderedDict()
# Key suffix for "extra state" entries.
# NOTE(review): presumably appended to state-dict keys; usage is not visible here - confirm.
_EXTRA_STATE_KEY_SUFFIX = "_extra_state"
+class _IncompatibleKeys(namedtuple("IncompatibleKeys", ["missing_keys", "unexpected_keys"]),):
+    def __repr__(self):
+        if not self.missing_keys and not self.unexpected_keys:
+            return "<All keys matched successfully>"
+        return super().__repr__()
+    __str__ = __repr__
def register_cell_buffer_registration_hook(hook: Callable[..., None],):
    r"""Install a buffer registration hook that is shared by all cells.

    .. warning ::
        This adds global state to the `nn.Cell` cell

    The hook will be called every time :func:`register_buffer` is invoked.
    It should have the following signature::

        hook(cell, name, buffer) -> None or new buffer

    The hook can modify the input or return a single modified value in the hook.

    Args:
        hook (Callable): The callable to store in the global hook registry.

    Returns:
        A handle that can be used to remove the added hook by calling
        `handle.remove()`.
    """
    # Imported at call time rather than at module import time.
    from mindspore.utils.hooks import _RemovableHandle

    registry = _global_buffer_registration_hooks
    removable = _RemovableHandle(registry)
    # The handle's id is the registry key under which the hook is stored.
    registry[removable.id] = hook
    return removable
 class Cell(Cell_):
     """
     The basic building block of neural networks in MindSpore. The model or neural network layer should inherit this
@@ -60,7 +116,7 @@ class Cell(Cell_):
     .. note::
         Cell is the inference mode by default. For a class that inherits a Cell,
         if the training and inference have different structures, the subclass performs the inference branch by default.
-        To set the training mode, refer to `mindspore.nn.Cell.set_train` .
+        To set the training mode, refer to :func:`mindspore.nn.Cell.set_train` .
     .. warning::
         In the subclass of Cell, it's not allowed to define a method named 'cast' and not allowed to define an attribute
@@ -105,8 +161,11 @@ class Cell(Cell_):
                    '_func_graph_flags', '_parameter_layout_dict', '_params_list', '_phase', '_bprop_debug',
                    '_forward_pre_hook', '_forward_hook', '_backward_pre_hook', '_backward_hook',
                    '_cell_backward_pre_hook', '_cell_backward_hook', '_is_run', '_param_prefix',
-                   '_attr_synced', 'pynative', 'requires_grad', 'cell_type']
+                   '_attr_synced', 'pynative', 'requires_grad', 'cell_type',
+                   '_parameters_forward_hook', '_parameters_backward_hook']
     total_instance_count = 0
+    _buffers: Dict[str, Optional[Tensor]]
+    _non_persistent_buffers_set: Set[str]
     def __init__(self, auto_prefix=True, flags=None):
         Cell_.__init__(self, self._cell_tag)
@@ -114,10 +173,17 @@ class Cell(Cell_):
         self.instance_count = Cell.total_instance_count
         self._params = OrderedDict()
         self._cells = OrderedDict()
+        super().__setattr__("_buffers", {})
+        super().__setattr__("_non_persistent_buffers_set", set())
+        super().__setattr__("_state_dict_hooks", OrderedDict())
+        super().__setattr__("_state_dict_pre_hooks", OrderedDict())
+        super().__setattr__("_load_state_dict_pre_hooks", OrderedDict())
+        super().__setattr__("_load_state_dict_post_hooks", OrderedDict())
         self._params_list = OrderedDict()
         self._primitives = OrderedDict()
         self.training = False
         self.requires_grad = False
+        self.is_top_cell = False
         self.pynative = False
         self._attr_synced = False
         self._param_prefix = ''
@@ -134,8 +200,8 @@ class Cell(Cell_):
         cells_compile_cache[id(self)] = self.compile_cache
         self.parameter_broadcast_done = False
         self._id = 1
-        self.exist_names = set("")
-        self.exist_objs = set()
+        self._exist_objs = None
+        self._exist_names = None
         self._recompute_cell = None
         self.mixed_precision_type = None
         self.sig = inspect.signature(self.construct)
@@ -143,7 +209,8 @@ class Cell(Cell_):
         # call gc to release GE session resources used by non-used cell objects
         if os.getenv('GC_COLLECT_IN_CELL') == '1':
-            gc.collect()
+            logger.warning("The convenient environment 'GC_COLLECT_IN_CELL' is deprecated from version 2.5 "
+                           "and will be removed in a future version.")
         if flags:
             self.add_flags(**flags)
@@ -158,6 +225,10 @@ class Cell(Cell_):
         self._cell_backward_hook = None
         self._is_recursion_hook = False
+        # parameters hook
+        self._parameters_forward_hook = None
+        self._parameters_backward_hook = None
         self.cell_type = None
         self.cast = Cast()
         self._has_config_recompute = False
@@ -202,6 +273,21 @@ class Cell(Cell_):
     def cell_init_args(self):
         return self._cell_init_args
+    @property
+    def exist_names(self):
+        """
+        Get the names of existing parameters that were added through a tuple or list of parameters.
+        """
+        if self._exist_names is None:
+            self._exist_names = set("")
+        return self._exist_names
+    @property
+    def exist_objs(self):
+        if self._exist_objs is None:
+            self._exist_objs = set()
+        return self._exist_objs
     @property
     def param_prefix(self):
         """
@@ -230,11 +316,6 @@ class Cell(Cell_):
     def bprop_debug(self):
         """
         Get whether cell custom bprop debug is enabled.
-        Tutorial Examples:
-            - `Custom Neural Network Layers - Custom Cell Reverse
-              <https://mindspore.cn/docs/en/master/model_train/custom_program/network_custom.html
-              #custom-cell-reverse>`_
         """
         return self._bprop_debug
@@ -351,8 +432,6 @@ class Cell(Cell_):
             raise ValueError("For 'Cell', the property 'pipeline_stage' "
                              "can not be less than 0, but got {}".format(value))
         self._pipeline_stage = value
-        for item in self.trainable_params():
-            item.add_pipeline_stage(value)
     @property
     def pipeline_segment(self):
@@ -388,6 +467,374 @@ class Cell(Cell_):
     def enable_backward_hook(self):
         return self._enable_backward_hook
+    @jit_forbidden_register
+    def register_buffer(
+            self, name: str, tensor: Optional[Tensor], persistent: bool = True
+    ) -> None:
+        r"""Add a buffer to the cell.
+        This is typically used to register a buffer that should not be
+        considered a model parameter. For example, BatchNorm's `running_mean`
+        is not a parameter, but is part of the cell's state. Buffers, by
+        default, are persistent and will be saved alongside parameters. This
+        behavior can be changed by setting `persistent` to ``False`` . The
+        only difference between a persistent buffer and a non-persistent buffer
+        is that the latter will not be a part of this cell's :attr:`state_dict` .
+        Buffers can be accessed as attributes using given names.
+        Args:
+            name (str): name of the buffer. The buffer can be accessed
+                from this cell using the given name.
+            tensor (Tensor): Buffer to be registered. If ``None`` ,
+                the buffer is not included in the cell's :attr:`state_dict` .
+            persistent (bool, optional): Whether the buffer is part of this cell's :attr:`state_dict`. Default ``True``.
+        Examples:
+            >>> import mindspore
+            ...
+            >>> class Net(mindspore.nn.Cell):
+            ...    def __init__(self):
+            ...        super().__init__()
+            ...        self.register_buffer("buffer0", mindspore.tensor([1, 2, 3]))
+            ...
+            ...    def construct(self, x):
+            ...        return x + self.buffer0
+            ...
+            >>> net = Net()
+            >>> net.register_buffer("buffer0", mindspore.tensor([4, 5, 6]))
+            >>> print(net.buffer0)
+            [4 5 6]
+        """
+        if "_buffers" not in self.__dict__:
+            raise AttributeError("cannot assign buffer before Cell.__init__() call")
+        if not isinstance(name, str):
+            raise TypeError(
+                f"buffer name should be a string.But got this type: {type(name)}"
+            )
+        if "." in name:
+            raise KeyError('buffer name can\'t contain "."')
+        if name == "":
+            raise KeyError('buffer name can\'t be empty string ""')
+        if hasattr(self, name) and name not in self._buffers:
+            raise KeyError(f"attribute '{name}' already exists")
+        if tensor is not None and not isinstance(tensor, Tensor):
+            raise TypeError(
+                f"cannot assign '{type(tensor)}' object to buffer '{name}' "
+                "(mindspore Tensor or None required)"
+            )
+        for hook in _global_buffer_registration_hooks.values():
+            output = hook(self, name, tensor)
+            if output is not None:
+                tensor = output
+        if tensor is not None:
+            tensor._is_buffer = True
+        self._buffers[name] = tensor
+        if persistent:
+            self._non_persistent_buffers_set.discard(name)
+        else:
+            self._non_persistent_buffers_set.add(name)
+    @jit_forbidden_register
+    def get_buffer(self, target: str) -> "Tensor":
+        """Return the buffer given by `target` if it exists, otherwise throw an error.
+        See the docstring for `get_sub_cell` for a more detailed
+        explanation of this method's functionality as well as how to
+        correctly specify `target` .
+        Args:
+            target (str): The fully-qualified string name of the buffer
+                to look for. (See `get_sub_cell` for how to specify a
+                fully-qualified string.)
+        Returns:
+            Tensor
+        Examples:
+            >>> import mindspore
+            ...
+            ...
+            >>> class NetC(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_c", mindspore.tensor([0, 0, 0]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_c
+            ...
+            ...
+            >>> class NetB(mindspore.nn.Cell):
+            ...     def __init__(self, net_c):
+            ...         super().__init__()
+            ...         self.net_c = net_c
+            ...         self.register_buffer("buffer_b", mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_c(x) + self.buffer_b
+            ...
+            ...
+            >>> class NetA(mindspore.nn.Cell):
+            ...     def __init__(self, net_b):
+            ...         super().__init__()
+            ...         self.net_b = net_b
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_b(x) + self.buffer_a
+            ...
+            ...
+            >>> net_c = NetC()
+            >>> net_b = NetB(net_c)
+            >>> net_a = NetA(net_b)
+            >>> buffer_c = net_a.get_buffer("net_b.net_c.buffer_c")
+            >>> print(f'buffer_c is {buffer_c}')
+            buffer_c is [0 0 0]
+        """
+        cell_path, _, buffer_name = target.rpartition(".")
+        cell = self.get_sub_cell(cell_path)
+        if not hasattr(cell, buffer_name):
+            raise AttributeError(
+                cell._get_name() + " has no attribute `" + buffer_name + "`"
+            )
+        buffer = getattr(cell, buffer_name)
+        if buffer_name not in cell._buffers:
+            raise AttributeError("`" + buffer_name + "` is not a buffer")
+        return buffer
+    @jit_forbidden_register
+    def named_buffers(
+            self, prefix: str = "", recurse: bool = True, remove_duplicate: bool = True
+    ) -> Iterator[Tuple[str, Tensor]]:
+        r"""Return an iterator over cell buffers, yielding both the name of the buffer as well as the buffer itself.
+        Args:
+            prefix (str, optional): prefix to prepend to all buffer names. Default ``""``.
+            recurse (bool, optional): if ``True`` , then yields buffers of this cell
+                and all sub cells. Otherwise, yields only buffers that
+                are direct members of this cell. Default ``True``.
+            remove_duplicate (bool, optional): Whether to remove the duplicated buffers in the result. Default ``True``.
+        Returns:
+            Iterator[Tuple[str, Tensor]], an iterator of tuple containing the name and buffer.
+        Examples:
+            >>> import mindspore
+            ...
+            ...
+            >>> class NetB(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_b", mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_b
+            ...
+            ...
+            >>> class NetA(mindspore.nn.Cell):
+            ...     def __init__(self, net_b):
+            ...         super().__init__()
+            ...         self.net_b = net_b
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_b(x) + self.buffer_a
+            ...
+            ...
+            >>> net_b = NetB()
+            >>> net_a = NetA(net_b)
+            >>>
+            >>> for name, buffer in net_a.named_buffers():
+            ...     print(f'buffer name is {name}, buffer is {buffer}')
+            buffer name is buffer_a, buffer is [4 5 6]
+            buffer name is net_b.buffer_b, buffer is [1 2 3]
+        """
+        gen = self._named_members(
+            lambda cell: cell._buffers.items(),
+            prefix=prefix,
+            recurse=recurse,
+            remove_duplicate=remove_duplicate,
+        )
+        yield from gen
+    @jit_forbidden_register
+    def buffers(self, recurse: bool = True) -> Iterator[Tensor]:
+        r"""Return an iterator over cell buffers.
+        Args:
+            recurse (bool, optional): If ``True`` , then yields buffers of this cell
+                and all sub cells. Otherwise, yields only buffers that
+                are direct members of this cell. Default ``True``.
+        Returns:
+            Iterator[Tensor], an iterator of buffer.
+        Examples:
+            >>> import mindspore
+            ...
+            ...
+            >>> class NetB(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_b", mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_b
+            ...
+            ...
+            >>> class NetA(mindspore.nn.Cell):
+            ...     def __init__(self, net_b):
+            ...         super().__init__()
+            ...         self.net_b = net_b
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_b(x) + self.buffer_a
+            ...
+            ...
+            >>> net_b = NetB()
+            >>> net_a = NetA(net_b)
+            >>>
+            >>> for buffer in net_a.buffers():
+            ...     print(f'buffer is {buffer}')
+            buffer is [4 5 6]
+            buffer is [1 2 3]
+        """
+        for _, buf in self.named_buffers(recurse=recurse):
+            yield buf
+    def _named_members(self, get_members_fn, prefix="", recurse=True, remove_duplicate: bool = True):
+        r"""Help yield various names + members of cells."""
+        memo = set()
+        cells = (
+            self.cells_and_names(name_prefix=prefix)
+            if recurse
+            else [(prefix, self)]
+        )
+        for cell_prefix, cell in cells:
+            members = get_members_fn(cell)
+            for k, v in members:
+                if v is None or v in memo:
+                    continue
+                if remove_duplicate:
+                    memo.add(v)
+                name = cell_prefix + ("." if cell_prefix else "") + k
+                yield name, v
+    @jit_forbidden_register
+    def get_sub_cell(self, target: str) -> "Cell":
+        """Return the sub cell given by `target` if it exists, otherwise throw an error.
+        For example, let's say you have an ``nn.Cell`` ``A`` that
+        looks like this:
+        .. code-block:: text
+            A(
+                (net_b): NetB(
+                    (net_c): NetC(
+                        (conv): Conv2d(16, 33, kernel_size=(3, 3), stride=(2, 2))
+                    )
+                    (dense): Dense(in_features=100, out_features=200, bias=True)
+                )
+            )
+        (The diagram shows an ``nn.Cell`` ``A``. ``A`` has a nested
+        sub cell ``net_b``, which itself has two sub cells ``net_c``
+        and ``dense``. ``net_c`` then has a sub cell ``conv``.)
+        To check whether we have the ``dense`` sub cell, we
+        would call `get_sub_cell("net_b.dense")`. To check whether
+        we have the ``conv`` sub cell, we would call
+        `get_sub_cell("net_b.net_c.conv")`.
+        The runtime of ``get_sub_cell`` is bounded by the degree
+        of cell nesting in `target`. A query against
+        `name_cells` achieves the same result, but it is O(N) in
+        the number of transitive cells. So, for a simple check to see
+        if some sub cells exist, ``get_sub_cell`` should always be
+        used.
+        Args:
+            target (str): The fully-qualified string name of the sub cell
+                to look for. (See above example for how to specify a
+                fully-qualified string.)
+        Returns:
+            Cell
+        Examples:
+            >>> import mindspore
+            ...
+            ...
+            >>> class NetC(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_c", mindspore.tensor([0, 0, 0]))
+            ...         self.dense_c = mindspore.nn.Dense(5, 3)
+            ...
+            ...     def construct(self, x):
+            ...         return self.dense_c(x) + self.buffer_c
+            ...
+            ...
+            >>> class NetB(mindspore.nn.Cell):
+            ...     def __init__(self, net_c):
+            ...         super().__init__()
+            ...         self.net_c = net_c
+            ...         self.register_buffer("buffer_b", mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_c(x) + self.buffer_b
+            ...
+            ...
+            >>> class NetA(mindspore.nn.Cell):
+            ...     def __init__(self, net_b):
+            ...         super().__init__()
+            ...         self.net_b = net_b
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...
+            ...     def construct(self, x):
+            ...         return self.net_b(x) + self.buffer_a
+            ...
+            ...
+            >>> net_c = NetC()
+            >>> net_b = NetB(net_c)
+            >>> net_a = NetA(net_b)
+            >>> net_c = net_a.get_sub_cell("net_b.net_c")
+            >>> print(f'net_c is {net_c}')
+            net_c is NetC(
+                (dense_c): Dense(input_channels=5, output_channels=3, has_bias=True)
+            )
+        """
+        if target == "":
+            return self
+        atoms: List[str] = target.split(".")
+        cell = self
+        for item in atoms:
+            if not hasattr(cell, item):
+                raise AttributeError(
+                    cell._get_name() + " has no " "attribute `" + item + "`"
+                )
+            cell = getattr(cell, item)
+            if not isinstance(cell, Cell):
+                raise AttributeError("`" + item + "` is not " "an nn.Cell")
+        return cell
     def get_func_graph_proto(self):
         """Return graph binary proto."""
         exec_id = ".".join([self.phase, str(self.create_time), str(id(self))])
@@ -398,6 +845,10 @@ class Cell(Cell_):
             params = self.__dict__['_params']
             if name in params:
                 return params[name]
+        if '_buffers' in self.__dict__:
+            buffers = self.__dict__['_buffers']
+            if name in buffers:
+                return buffers[name]
         if '_cells' in self.__dict__:
             cells = self.__dict__['_cells']
             if name in cells:
@@ -420,6 +871,8 @@ class Cell(Cell_):
     def __delattr__(self, name):
         if name in self._params:
             del self._params[name]
+        elif name in self._buffers:
+            del self._buffers[name]
         elif name in self._cells:
             del self._cells[name]
         elif '_params_list' in self.__dict__ and name in self._params_list:
@@ -492,14 +945,17 @@ class Cell(Cell_):
         if self._forward_pre_hook:
             inputs = self._run_forward_pre_hook(inputs)
-        if self._backward_hook:
-            output = self._backward_hook_construct(*inputs, **kwargs)
-        elif self._shard_fn is not None:
+        if self._shard_fn is not None:
             output = self._shard_fn(*inputs, **kwargs)
-        elif self._recompute_cell is not None:
-            output = self._recompute_cell(*inputs, **kwargs)
-        elif self.has_bprop and _pynative_executor.requires_grad():
-            output = self._call_custom_bprop(*inputs, **kwargs)
+        elif _pynative_executor.requires_grad():
+            if self._backward_hook:
+                output = self._backward_hook_construct(*inputs, **kwargs)
+            elif self._recompute_cell is not None:
+                output = self._recompute_cell(*inputs, **kwargs)
+            elif self.has_bprop:
+                output = self._call_custom_bprop(*inputs, **kwargs)
+            else:
+                output = self.construct(*inputs, **kwargs)
         else:
             output = self.construct(*inputs, **kwargs)
@@ -590,6 +1046,89 @@ class Cell(Cell_):
         for prim in all_prims:
             prim.add_prim_attr("strategy_gen_mode", "data_parallel")
+    def offload(self, backward_prefetch="Auto"):
+        """
+        Set the cell offload. All primitive ops in the cell will be set offload. For the intermediate
+        activations calculated by these primitive ops, we will not save them in the forward pass, but
+        offload them and onload them in the backward pass.
+        Note:
+            - If Cell.offload is called, the mode should be set to "GRAPH_MODE".
+            - If Cell.offload is called, lazy inline (the ``lazy_inline`` decorator) should be enabled.
+        Args:
+            backward_prefetch(Union[str, int], optional): The timing for prefetching activations in advance in backward
+                                                          pass. Default: ``"Auto"``. If set it to ``"Auto"``, framework
+                                                          will start to prefetch activations one operator in advance.
+                                                          If set it to a positive int value, framework will start to
+                                                          prefetch activations ``backward_prefetch`` operators in
+                                                          advance, such as 1, 20, 100.
+        Examples:
+            >>> import numpy as np
+            >>> import mindspore.nn as nn
+            >>> from mindspore import ops
+            >>> from mindspore.common import Tensor, Parameter
+            >>> from mindspore.common.lazy_inline import lazy_inline
+            >>>
+            >>> class Block(nn.Cell):
+            ...     def __init__(self):
+            ...         super(Block, self).__init__()
+            ...         self.transpose1 = ops.Transpose()
+            ...         self.transpose2 = ops.Transpose()
+            ...         self.transpose3 = ops.Transpose()
+            ...         self.transpose4 = ops.Transpose()
+            ...         self.real_div1 = ops.RealDiv()
+            ...         self.real_div2 = ops.RealDiv()
+            ...         self.batch_matmul1 = ops.BatchMatMul()
+            ...         self.batch_matmul2 = ops.BatchMatMul()
+            ...         self.softmax = ops.Softmax(-1)
+            ...         self.expand_dims = ops.ExpandDims()
+            ...         self.sub = ops.Sub()
+            ...         self.y = Parameter(Tensor(np.ones((1024, 128, 128)).astype(np.float32)))
+            ...     def construct(self, x):
+            ...         transpose1 = self.transpose1(x, (0, 2, 1, 3))
+            ...         real_div1 = self.real_div1(transpose1, Tensor(2.37891))
+            ...         transpose2 = self.transpose2(x, (0, 2, 3, 1))
+            ...         real_div2 = self.real_div2(transpose2, Tensor(2.37891))
+            ...         batch_matmul1 = self.batch_matmul1(real_div1, real_div2)
+            ...         expand_dims = self.expand_dims(self.y, 1)
+            ...         sub = self.sub(Tensor([1.0]), expand_dims)
+            ...         soft_max = self.softmax(sub)
+            ...         transpose3 = self.transpose3(x, (0, 2, 1, 3))
+            ...         batch_matmul2 = self.batch_matmul2(soft_max[0], transpose3)
+            ...         transpose4 = self.transpose4(batch_matmul2, (0, 2, 1, 3))
+            ...         return transpose4
+            >>>
+            >>> class OuterBlock(nn.Cell):
+            ...     @lazy_inline
+            ...     def __init__(self):
+            ...         super(OuterBlock, self).__init__()
+            ...         self.block = Block()
+            ...     def construct(self, x):
+            ...         return self.block(x)
+            >>>
+            >>> class Nets(nn.Cell):
+            ...     def __init__(self):
+            ...         super(Nets, self).__init__()
+            ...         self.blocks = nn.CellList()
+            ...         for _ in range(3):
+            ...             b = OuterBlock()
+            ...             b.offload()
+            ...             self.blocks.append(b)
+            ...     def construct(self, x):
+            ...         out = x
+            ...         for i in range(3):
+            ...             out = self.blocks[i](out)
+            ...         return out
+        """
+        if context._get_mode() == context.PYNATIVE_MODE:
+            raise ValueError("The Cell offload does not support PyNative mode now.")
+        if isinstance(backward_prefetch, str):
+            Validator.check_string(backward_prefetch, ['Auto'], 'backward_prefetch', self.cls_name)
+        else:
+            Validator.check_non_negative_int(backward_prefetch)
+        for prim in self._get_prims_recursively():
+            prim._offload(backward_prefetch=backward_prefetch)
     def shard(self, in_strategy, out_strategy=None, parameter_plan=None, device="Ascend", level=0):
         """
         Defining the input and output layouts of this cell and the parallel strategies of remaining ops will be
@@ -598,7 +1137,7 @@ class Cell(Cell_):
         strategy for others will be set by sharding propagation.
         in_strategy and out_strategy define the input and output layout respectively.
         in_strategy/out_strategy should be a tuple, each element of which corresponds to the desired layout of
-        this input/output, which can refer to the description of `mindspore.ops.Primitive.shard`.
+        this input/output, which can refer to the description of :func:`mindspore.ops.Primitive.shard`.
         The parallel strategies of remaining operators are derived from the strategy specified by the input and output.
         Note:
@@ -618,7 +1157,7 @@ class Cell(Cell_):
                                                 If the parameter name is incorrect or the corresponding parameter
                                                 has been set, the parameter setting will be ignored.
                                                 Default: ``None`` .
-            device (string): Select a certain device target. It is not in use right now.
+            device (str): Select a certain device target. It is not in use right now.
                              Support [ ``"CPU"`` , ``"GPU"`` , ``"Ascend"`` ]. Default: ``"Ascend"`` .
             level (int): Option for parallel strategy infer algorithm, namely the object function, maximize computation
                          over communication ratio, maximize speed performance, minimize memory usage etc. It is not in
@@ -650,10 +1189,8 @@ class Cell(Cell_):
             ...     x = self.block2_shard(x)
             ...     return x
         """
-        if context.get_auto_parallel_context("parallel_mode") not in ["auto_parallel", "semi_auto_parallel"]:
-            raise AssertionError(f"Cell shard only supports auto parallel or semi_auto_parallel "
-                                 f"Please check the parallel mode in parallel context.")
+        if ms.communication.management.get_group_size() == 1:
+            return self
         shard_fn = Shard()
         fn = shard_fn(self, in_strategy, out_strategy, parameter_plan, device, level)
         self._shard_fn = fn
@@ -756,7 +1293,8 @@ class Cell(Cell_):
         """
         Process cell info before call construct
         """
-        if self.requires_grad:
+        if self.requires_grad and (not _pynative_executor.grad_flag() or _pynative_executor.high_order()):
+            self.is_top_cell = True
             _pynative_executor.set_grad_flag(True)
             _pynative_executor.new_graph(self, *args, **kwargs)
         elif self._dynamic_shape_inputs is not None:
@@ -770,8 +1308,9 @@ class Cell(Cell_):
         """
         Process cell info after call construct
         """
-        if self.requires_grad:
+        if self.requires_grad and self.is_top_cell:
             _pynative_executor.end_graph(self, output, *args, **kwargs)
+            self.is_top_cell = False
         elif self._dynamic_shape_inputs is not None:
             _pynative_executor.set_cell_use_dynamic_shape_process(False)
@@ -816,52 +1355,41 @@ class Cell(Cell_):
             self._add_attr(key, value)
         self._attr_synced = True
-    def _set_attr_for_parameter(self, name, value):
-        """Set attr for parameter."""
-        cells = self.__dict__.get('_cells')
-        params = self.__dict__.get('_params')
-        if params is None:
-            raise AttributeError("For 'Cell', can not assign params before Cell.__init__() is called.")
-        if name in self.__dict__:
-            if self.__dict__[name] is not None:
-                raise TypeError(f"For 'Cell', the {name} should not be Parameter.")
-            del self.__dict__[name]
-        if cells and name in cells:
-            raise TypeError(f"For 'Cell', the {name} must be Cell, but got Parameter.")
-        self.insert_param_to_cell(name, value)
-    def _set_attr_for_parameter_tuple(self, name, value):
-        """Set attr for parameter in ParameterTuple."""
-        params = self.__dict__.get('_params')
-        params_list = self.__dict__.get('_params_list')
-        if params is None:
-            raise AttributeError("For 'Cell', can not assign params before Cell.__init__() is called.")
-        exist_names = set("")
-        exist_objs = set()
-        for item in value:
-            if item in exist_objs:
-                # If there are multiple identical objects, their names only check once.
-                continue
-            exist_objs.add(item)
-            if item.name == PARAMETER_NAME_DEFAULT:
-                logger.warning("For 'Cell', the parameter definition is deprecated.\n"
-                               "Please set a unique name for the parameter in ParameterTuple '{}'.".format(value))
-                item.name = item.name + "$" + str(self._id)
-                self._id += 1
-            self.insert_param_to_cell(item.name, item, check_name_contain_dot=False)
-            if item.name in exist_names:
-                raise ValueError("The value {} , its name '{}' already exists. "
-                                 "Please set a unique name for the parameter.".format(value, item.name))
-            exist_names.add(item.name)
-        if context._get_mode() == context.PYNATIVE_MODE:
+    def _set_attr_for_param_or_param_tuple(self, name, value):
+        """Set attr for a Parameter or a ParameterTuple."""
+        if isinstance(value, Parameter):
             if name in self.__dict__:
                 del self.__dict__[name]
-            if name in params:
-                del params[name]
-            params_list[name] = value
-        else:
-            object.__setattr__(self, name, value)
+            self.insert_param_to_cell(name, value)
+        elif isinstance(value, ParameterTuple):
+            exist_names = set("")
+            exist_objs = set()
+            for item in value:
+                if item in exist_objs:
+                    # If there are multiple identical objects, their names only check once.
+                    continue
+                exist_objs.add(item)
+                if item.name == PARAMETER_NAME_DEFAULT:
+                    logger.warning("For 'Cell', the parameter definition is deprecated.\n"
+                                   "Please set a unique name for the parameter in ParameterTuple '{}'.".format(value))
+                    item.name = item.name + "$" + str(self._id)
+                    self._id += 1
+                self.insert_param_to_cell(item.name, item, check_name_contain_dot=False)
+                if item.name in exist_names:
+                    raise ValueError("The value {} , its name '{}' already exists. "
+                                     "Please set a unique name for the parameter.".format(value, item.name))
+                exist_names.add(item.name)
+            if context._get_mode() == context.PYNATIVE_MODE:
+                if name in self.__dict__:
+                    del self.__dict__[name]
+                params = self.__dict__.get('_params')
+                if name in params:
+                    del params[name]
+                params_list = self.__dict__.get('_params_list')
+                params_list[name] = value
+            else:
+                object.__setattr__(self, name, value)
     def _set_attr_for_parameter_in_list_or_tuple(self, name, value):
         """Set attr for parameter in list or tuple."""
@@ -874,24 +1402,18 @@ class Cell(Cell_):
                 item.name = item.name + "$" + str(self._id)
                 self._id += 1
             if item.name in self.exist_names:
-                raise ValueError("The value {} , its name '{}' already exists. "
-                                 "Please set a unique name for the parameter.".format(value, item.name))
+                raise ValueError(f"The value {value} , its name '{item.name}' already exists. "
+                                 "Please set a unique name for the parameter.")
             self.exist_names.add(item.name)
         object.__setattr__(self, name, value)
     def _set_attr_for_cell(self, name, value):
         """Set attr for cell."""
-        cells = self.__dict__.get('_cells')
-        params = self.__dict__.get('_params')
-        if cells is None:
-            raise AttributeError("For 'Cell', can not assign cells before Cell.__init__() is called.")
         if name in self.__dict__:
             del self.__dict__[name]
-        if params and name in params:
-            raise TypeError(f"For 'Cell', the {name} must be Parameter, but got Cell.")
         if self._auto_prefix:
             value.update_parameters_name(name + '.')
-        cells[name] = value
+        self.insert_child_to_cell(name, value)
         if hasattr(self, '_cell_init_args'):
             self.cell_init_args += str({name: value})
@@ -904,30 +1426,57 @@ class Cell(Cell_):
         else:
             self.insert_param_to_cell(name, None)
-    def __setattr__(self, name, value):
-        cells = self.__dict__.get('_cells')
+    def _set_attr_for_object(self, name, value):
+        """Set attr for py object."""
         params = self.__dict__.get('_params')
-        if isinstance(value, Parameter):
-            self._set_attr_for_parameter(name, value)
-        elif isinstance(value, ParameterTuple):
-            self._set_attr_for_parameter_tuple(name, value)
-        elif isinstance(value, (list, tuple)) and value and _check_param_list_tuple(value):
+        if params is not None and name in params:
+            if value is not None:
+                if isinstance(value, Tensor):
+                    params[name].set_data(value)
+                    return
+                raise TypeError(
+                    f"Parameter '{name}' already exists in network, "
+                    f"can not assign this type: '{type(value)}' as a parameter.")
+            params[name] = None
+            return
+        cells = self.__dict__.get('_cells')
+        if cells is not None and name in cells:
+            if value is not None:
+                raise TypeError(
+                    f"Sub cell '{name}' already exists in network, "
+                    f"can not assign this type: '{type(value)}' as a cell.")
+            cells[name] = None
+            return
+        buffers = self.__dict__.get('_buffers')
+        if buffers is not None and name in buffers:
+            if value is not None:
+                raise TypeError(
+                    f"Buffer '{name}' already exists in network, "
+                    f"can not assign this type: '{type(value)}' as a buffer.")
+            buffers[name] = None
+            return
+        object.__setattr__(self, name, value)
+    def __setattr__(self, name, value):
+        if isinstance(value, (Parameter, ParameterTuple)):
+            self._set_attr_for_param_or_param_tuple(name, value)
+        elif _is_parameter_list_or_tuple(value):
             self._set_attr_for_parameter_in_list_or_tuple(name, value)
         elif isinstance(value, Cell):
             self._set_attr_for_cell(name, value)
-        elif params and name in params:
-            self._set_attr_for_params(name, value)
-        elif cells and name in cells:
-            if value is not None:
-                raise TypeError(f"For 'Cell', the type of {name} must be cell, but got {type(value).__name__}.")
-            self._cells[name] = None
-        else:
-            if isinstance(value, Primitive):
-                value.set_prim_instance_name(name)
-                self._primitives[name] = value
+        elif isinstance(value, _Buffer):
+            if name in self.__dict__:
+                del self.__dict__[name]
+            self.register_buffer(name, value)
+        elif isinstance(value, Primitive):
+            value.set_prim_instance_name(name)
+            self._primitives[name] = value
             object.__setattr__(self, name, value)
-        if name not in Cell.IGNORE_LIST:
-            self._attr_synced = False
+        else:
+            self._set_attr_for_object(name, value)
+    def _get_name(self):
+        """Return the name of this cell's class, used as the heading of its repr."""
+        cls = self.__class__
+        return cls.__name__
     def extend_repr(self):
         """
@@ -941,19 +1490,28 @@ class Cell(Cell_):
         return self.__repr__()
     def __repr__(self):
-        extra_str = self.extend_repr()
-        info_str = self.__class__.__name__ + '<'
-        if self._cells:
-            sub_str = '\n'
-            if extra_str:
-                sub_str += '{}\n'.format(self.extend_repr())
-            for key, value in self._cells.items():
-                sub_str += '({}): {}\n'.format(key, repr(value))
-            sub_str = sub_str.replace('\n', '\n  ') + '>'
-            info_str += sub_str
-        else:
-            info_str += extra_str + '>'
-        return info_str
+        extra_lines = []
+        extend_repr = self.extend_repr()
+        # empty string will be split into list ['']
+        if extend_repr:
+            extra_lines = extend_repr.split("\n")
+        child_lines = []
+        for key, cell in self._cells.items():
+            cell_str = repr(cell)
+            cell_str = _addindent(cell_str, 2)
+            child_lines.append("(" + key + "): " + cell_str)
+        lines = extra_lines + child_lines
+        main_str = self._get_name() + "("
+        if lines:
+            # simple one-liner info, which most builtin Modules will use
+            if len(extra_lines) == 1 and not child_lines:
+                main_str += extra_lines[0]
+            else:
+                main_str += "\n  " + "\n  ".join(lines) + "\n"
+        main_str += ")"
+        return main_str
     def load_parameter_slice(self, params):
         """
@@ -1119,9 +1677,11 @@ class Cell(Cell_):
             args (tuple): Args of the Cell object.
             kwargs (dict): Kwargs of the Cell object.
         """
+        _init_auto_parallel_context(self)
         self._compile_args = self._get_compile_args(args)
         _cell_graph_executor.compile(self, *self._compile_args, phase=self.phase,
                                      jit_config_dict=self._jit_config_dict, **kwargs)
+        _clear_auto_parallel_context(self)
     def compile_and_run(self, *args, **kwargs):
         """
@@ -1252,9 +1812,9 @@ class Cell(Cell_):
             >>> net2 = nn.Dense(2, 2)
             >>> net1.insert_child_to_cell("child", net2)
             >>> print(net1)
-            ReLU<
-              (child): Dense<input_channels=2, output_channels=2, has_bias=True>
-              >
+            ReLU(
+              (child): Dense(input_channels=2, output_channels=2, has_bias=True)
+            )
         """
         if not isinstance(child_name, str):
             raise TypeError(f"For 'insert_child_to_cell', the type of parameter 'child_name' must be str, "
@@ -1312,13 +1872,22 @@ class Cell(Cell_):
                         new_param_tuple.append(param)
                     cell.__dict__[key] = ParameterTuple(new_param_tuple)
+    def _get_cell_parallel_mode(self):
+        """Report whether any parameter of this cell has `param_info.is_param_init` set."""
+        # Stops at the first parameter whose flag is set, like the explicit loop would.
+        return any(param.param_info.is_param_init for _, param in self.parameters_and_names())
     def init_parameters_data(self, auto_parallel_mode=False):
         """
         Initialize all parameters and replace the original saved parameters in cell.
         Note:
             trainable_params() and other similar interfaces may return different parameter instance after
-            `init_parameters_data`, do not save these results.
+            `init_parameters_data`. It is not recommended to save these results.
         Args:
             auto_parallel_mode (bool): If running in auto_parallel_mode. Default: ``False`` .
@@ -1350,15 +1919,24 @@ class Cell(Cell_):
         def _updata(param):
             if param in replace:
                 return replace.get(param)
-            new_p = param.init_data(None, set_sliced=False)
+            new_p = param.init_data(None, set_sliced=param.sliced)
             replace[param] = new_p
             return new_p
         # replace all original usage.
         cells = self.cells_and_names()
+        is_parallel_mode = self._get_cell_parallel_mode()
+        is_graph_mode = context.get_context('mode') == context.GRAPH_MODE
         for _, cell in cells:
             params = cell._params.items()
             for param_name, param in params:
+                not_sliced = not param.sliced
+                judgment = not_sliced
+                if param.param_info.is_pipeline_shared_param:
+                    continue
+                if is_graph_mode and is_parallel_mode and judgment:
+                    continue
                 if not auto_parallel_mode:
                     cell._params[param_name] = _updata(param)
                     continue
@@ -1370,6 +1948,12 @@ class Cell(Cell_):
                     param_tuple = cell_dict[key]
                     new_param_tuple = []
                     for param in param_tuple:
+                        not_sliced = not param.sliced
+                        judgment = not_sliced
+                        if param.param_info.is_pipeline_shared_param:
+                            continue
+                        if is_graph_mode and is_parallel_mode and judgment:
+                            continue
                         if not auto_parallel_mode:
                             new_param_tuple.append(_updata(param))
                             continue
@@ -1677,7 +2261,7 @@ class Cell(Cell_):
             ...         return x
             >>> net = Net()
             >>> print(net.cells())
-            odict_values([Dense<input_channels=2, output_channels=2, has_bias=True>])
+            odict_values([Dense(input_channels=2, output_channels=2, has_bias=True)])
         """
         return self.name_cells().values()
@@ -1738,7 +2322,7 @@ class Cell(Cell_):
             ...         return x
             >>> net = Net()
             >>> print(net.name_cells())
-            OrderedDict([('dense', Dense<input_channels=2, output_channels=2, has_bias=True>)])
+            OrderedDict([('dense', Dense(input_channels=2, output_channels=2, has_bias=True))])
         """
         value_set = set()
         cells = OrderedDict()
@@ -1779,10 +2363,10 @@ class Cell(Cell_):
             ...     if isinstance(cell, nn.Dense):
             ...         cell.weight.set_data(initializer(One(), cell.weight.shape, cell.weight.dtype))
             >>> net.apply(func)
-            SequentialCell<
-              (0): Dense<input_channels=2, output_channels=2, has_bias=True>
-              (1): Dense<input_channels=2, output_channels=2, has_bias=True>
-              >
+            SequentialCell(
+              (0): Dense(input_channels=2, output_channels=2, has_bias=True)
+              (1): Dense(input_channels=2, output_channels=2, has_bias=True)
+            )
             >>> print(net[0].weight.asnumpy())
             [[1. 1.]
              [1. 1.]]
@@ -1914,8 +2498,8 @@ class Cell(Cell_):
             >>>
             >>> net = nn.Conv2d(120, 240, 4, has_bias=False, weight_init='normal')
             >>> net.to_float(mstype.float16)
-            Conv2d<input_channels=120, output_channels=240, kernel_size=(4, 4), stride=(1, 1), pad_mode=same,
-            padding=0, dilation=(1, 1), group=1, has_bias=False, weight_init=normal, bias_init=None, format=NCHW>
+            Conv2d(input_channels=120, output_channels=240, kernel_size=(4, 4), stride=(1, 1), pad_mode=same,
+            padding=0, dilation=(1, 1), group=1, has_bias=False, weight_init=normal, bias_init=None, format=NCHW)
         """
         if dst_type not in (mstype.float16, mstype.float32, mstype.bfloat16):
             raise ValueError("For 'to_float', the argument 'dst_type' must be mstype.float32, mstype.float16 or "
@@ -1955,9 +2539,8 @@ class Cell(Cell_):
     def set_grad(self, requires_grad=True):
         """
-        Sets the cell flag for gradient. In pynative mode, this parameter specifies whether the network requires
-        gradients. If ``true`` , the backward network needed to compute the gradients will be generated when the forward
-        network is executed.
+        Sets the cell flag for gradient.
         Args:
             requires_grad (bool): Specifies if the net need to grad, if it is
@@ -2121,8 +2704,7 @@ class Cell(Cell_):
         """
         if context._get_mode() == context.GRAPH_MODE:
             return HookHandle()
-        if not check_hook_fn("register_forward_pre_hook", hook_fn):
-            return HookHandle()
+        check_hook_fn(hook_fn)
         handle = HookHandle(self._forward_pre_hook)
         self._forward_pre_hook[handle.handle_id] = hook_fn
         return handle
@@ -2217,10 +2799,11 @@ class Cell(Cell_):
             (Tensor(shape=[1], dtype=Float32, value= [ 2.00000000e+00]), Tensor(shape=[1], dtype=Float32,
             value= [ 2.00000000e+00]))
         """
-        if context._get_mode() == context.GRAPH_MODE:
+        if self.has_bprop:
             return HookHandle()
-        if not check_hook_fn("register_forward_hook", hook_fn):
+        if context._get_mode() == context.GRAPH_MODE:
             return HookHandle()
+        check_hook_fn(hook_fn)
         handle = HookHandle(self._forward_hook)
         self._forward_hook[handle.handle_id] = hook_fn
         return handle
@@ -2310,8 +2893,7 @@ class Cell(Cell_):
         """
         if context._get_mode() == context.GRAPH_MODE:
             return HookHandle()
-        if not check_hook_fn("register_backward_pre_hook", hook_fn):
-            return HookHandle()
+        check_hook_fn(hook_fn)
         handle = HookHandle(self._backward_pre_hook)
         self._backward_pre_hook[handle.handle_id] = hook_fn
         if self._cell_backward_pre_hook is None:
@@ -2334,9 +2916,12 @@ class Cell(Cell_):
         Supported Platforms:
         ``Ascend`` ``GPU`` ``CPU``
         """
-        ret = self._cell_backward_pre_hook(outputs)
         if isinstance(outputs, tuple):
-            if not isinstance(ret, tuple):
+            ret = self._cell_backward_pre_hook(*outputs)
+        else:
+            ret = self._cell_backward_pre_hook(outputs)
+        if isinstance(outputs, tuple):
+            if len(outputs) == 1:
                 ret = (ret,)
             if len(ret) != len(outputs):
                 raise TypeError(
@@ -2344,6 +2929,527 @@ class Cell(Cell_):
                         len(ret), len(outputs)))
         return ret
+    def get_extra_state(self) -> Any:
+        """Return the extra state to store in the cell's state_dict.
+        Override this method together with ``set_extra_state`` in a subclass that needs
+        to persist additional state. It is only invoked while the state_dict is built
+        when a subclass overrides it; this base implementation is a placeholder.
+        The extra state should be picklable so that the state_dict can be serialized.
+        Backwards compatibility is only guaranteed for serialized tensors; other objects
+        may break it if their pickled form changes.
+        Returns:
+            object, any extra state to store in the cell's state_dict.
+        Raises:
+            RuntimeError: Always, in this base implementation.
+        """
+        message = "Reached a code path in Cell.get_extra_state() that should never be called."
+        raise RuntimeError(message)
+    def set_extra_state(self, state: Any) -> None:
+        """Restore the extra state found in a loaded `state_dict`.
+        Override this method together with ``get_extra_state`` in a subclass that stores
+        extra state in its `state_dict`. It is only invoked while a state_dict is loaded
+        when a subclass overrides it; this base implementation is a placeholder.
+        Args:
+            state (Any): Extra state from the `state_dict`.
+        Raises:
+            RuntimeError: Always, in this base implementation.
+        """
+        message = "Reached a code path in Cell.set_extra_state() that should never be called."
+        raise RuntimeError(message)
+    @jit_forbidden_register
+    def register_state_dict_post_hook(self, hook):
+        r"""Register a hook that runs at the end of :func:`mindspore.nn.Cell.state_dict`.
+        The hook is called as
+        hook(cell, state_dict, prefix, local_metadata) -> None
+        and may modify ``state_dict`` in place. It must return ``None``.
+        Args:
+            hook (Callable): The hook function after `state_dict` is called.
+        Returns:
+            A handle that can be used to remove the added hook by calling
+            `handle.remove()`.
+        """
+        from mindspore.utils.hooks import _RemovableHandle
+        post_hooks = self._state_dict_hooks
+        removable = _RemovableHandle(post_hooks)
+        # The hook is stored under the handle's id.
+        post_hooks[removable.id] = hook
+        return removable
+    @jit_forbidden_register
+    def register_state_dict_pre_hook(self, hook):
+        r"""Register a hook that runs at the start of :func:`mindspore.nn.Cell.state_dict`.
+        The hook is called as
+        hook(cell, prefix, keep_vars) -> None
+        and can be used to perform pre-processing before the cell's state is collected.
+        Args:
+            hook (Callable): The hook function before `state_dict` is called.
+        Returns:
+            A handle that can be used to remove the added hook by calling
+            `handle.remove()`.
+        Examples:
+            >>> import mindspore
+            ...
+            ...
+            >>> class NetA(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_a", mindspore.tensor([1, 2, 3]))
+            ...         self.param_a = mindspore.Parameter(mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_a + self.param_a
+            ...
+            ...
+            >>> def _add_extra_param(cell, prefix, keep_vars):
+            ...     cell._params["extra_param"] = mindspore.Parameter(mindspore.tensor([4, 5, 6]))
+            ...
+            ...
+            >>> net = NetA()
+            >>> handle = net.register_state_dict_pre_hook(_add_extra_param)
+            >>> net_state_dict = net.state_dict()
+            >>> handle.remove()
+            >>> print("extra_param" in net_state_dict)
+            True
+        """
+        from mindspore.utils.hooks import _RemovableHandle
+        pre_hooks = self._state_dict_pre_hooks
+        removable = _RemovableHandle(pre_hooks)
+        # The hook is stored under the handle's id.
+        pre_hooks[removable.id] = hook
+        return removable
+    def _save_to_state_dict(self, destination, prefix, keep_vars):
+        r"""Write this cell's own state into `destination`, leaving sub cells out.
+        :func:`mindspore.nn.Cell.state_dict` calls this once per cell. Subclasses may
+        override it when they need class-specific saving logic.
+        Args:
+            destination (dict): a dict where state will be stored
+            prefix (str): the prefix for parameters and buffers used in this
+                cell
+            keep_vars (bool): accepted for interface compatibility; not read by
+                this implementation
+        """
+        # Parameters first; entries set to None are skipped.
+        for param_name, param in self._params.items():
+            if param is None:
+                continue
+            destination[prefix + param_name] = param
+        # Then buffers, skipping None entries and non-persistent buffers.
+        for buf_name, buf in self._buffers.items():
+            if buf is None or buf_name in self._non_persistent_buffers_set:
+                continue
+            destination[prefix + buf_name] = buf
+        extra_state_key = prefix + _EXTRA_STATE_KEY_SUFFIX
+        # Extra state is stored only when the class overrides Cell.get_extra_state.
+        class_getter = getattr(self.__class__, "get_extra_state", Cell.get_extra_state)
+        if class_getter is not Cell.get_extra_state:
+            destination[extra_state_key] = self.get_extra_state()
+    # The user can pass an optional arbitrary mappable object to `state_dict`, in which case `state_dict` returns
+    # back that same object. But if they pass nothing, an `OrderedDict` is created and returned.
+    T_destination = TypeVar("T_destination", bound=Dict[str, Any])
+    @jit_forbidden_register
+    def state_dict(self, *args, destination=None, prefix="", keep_vars=False):
+        r"""Return a dictionary containing references to the whole state of the cell.
+        Both parameters and persistent buffers (e.g. running averages) are
+        included. Keys are corresponding parameter and buffer names.
+        Parameters and buffers set to ``None`` are not included.
+        .. note::
+            The returned object is a shallow copy. It contains references
+            to the cell's parameters and buffers.
+        .. warning::
+            - Currently ``state_dict()`` also accepts positional arguments for
+              ``destination``, ``prefix`` and ``keep_vars`` in order. However,
+              this is being deprecated and keyword arguments will be enforced in
+              future releases.
+            - Please avoid the use of argument ``destination`` as it is not
+              designed for end-users.
+        Args:
+            destination (dict, optional): If provided, the state of cell will
+                be updated into the dict and the same object is returned.
+                Otherwise, an ``OrderedDict`` will be created and returned.
+                Default: ``None``.
+            prefix (str, optional): A prefix added to parameter and buffer
+                names to compose the keys in state_dict. Default: ``''``.
+            keep_vars (bool, optional): Forwarded unchanged to the registered pre-hooks,
+                to ``_save_to_state_dict`` and to the sub cells. The default
+                ``_save_to_state_dict`` does not read it, so the returned entries are
+                references either way. Default: ``False``.
+        Returns:
+            Dict, a dictionary containing a whole state of the cell.
+        Raises:
+            TypeError: If `destination` is neither ``None`` nor a dict, if `prefix` is not
+                a str, or if `keep_vars` is not a bool.
+            RuntimeError: If a registered post-hook returns anything other than ``None``.
+        Examples:
+            >>> import mindspore
+            >>> class Model(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...         self.param_a = mindspore.Parameter(mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_a + self.param_a
+            ...
+            ...
+            >>> model = Model()
+            >>> print(model.state_dict())
+            OrderedDict([('param_a', Parameter (name=param_a, shape=(3,), dtype=Int64, requires_grad=True)), \
+            ('buffer_a', Tensor(shape=[3], dtype=Int64, value= [4, 5, 6]))])
+        """
+        # TODO: Remove `args` and the parsing logic when BC allows.
+        if args:
+            # FutureWarning is used because DeprecationWarning is ignored by default.
+            warnings.warn(
+                "Positional args are being deprecated, use kwargs instead. Refer to "
+                "https://www.mindspore.cn/docs/zh-CN/master/api_python/nn/mindspore.nn.Cell.html"
+                " for details.",
+                FutureWarning,
+                stacklevel=2,
+            )
+            # A positional value is only used when the matching keyword still has its default.
+            if destination is None:
+                destination = args[0]
+            if len(args) > 1 and prefix == "":
+                prefix = args[1]
+            if len(args) > 2 and keep_vars is False:
+                keep_vars = args[2]
+        if destination is not None and not isinstance(destination, dict):
+            # Any dict is accepted here, so the message names dict rather than OrderedDict.
+            raise TypeError(f"The type of destination must be dict, but got {type(destination)}")
+        if not isinstance(prefix, str):
+            raise TypeError(f"The type of prefix must be string, but got {type(prefix)}")
+        if not isinstance(keep_vars, bool):
+            raise TypeError(f"The type of keep_vars must be bool, but got {type(keep_vars)}")
+        if destination is None:
+            destination = OrderedDict()
+            destination._metadata = OrderedDict()
+        local_metadata = {}
+        # A caller-supplied plain dict has no `_metadata`; metadata is then not recorded.
+        if hasattr(destination, "_metadata"):
+            # prefix[:-1] drops the trailing "." of the prefix.
+            destination._metadata[prefix[:-1]] = local_metadata
+        for hook in self._state_dict_pre_hooks.values():
+            hook(self, prefix, keep_vars)
+        self._save_to_state_dict(destination, prefix, keep_vars)
+        # Recurse into the sub cells, extending the prefix with each child's name.
+        for name, cell in self._cells.items():
+            if cell is not None:
+                cell.state_dict(
+                    destination=destination,
+                    prefix=prefix + name + ".",
+                    keep_vars=keep_vars,
+                )
+        for hook in self._state_dict_hooks.values():
+            hook_result = hook(self, destination, prefix, local_metadata)
+            if hook_result is not None:
+                raise RuntimeError("state_dict post-hook must return None")
+        return destination
+    @jit_forbidden_register
+    def register_load_state_dict_pre_hook(self, hook):
+        r"""Register a hook that runs before this cell's state is loaded from a state_dict.
+        The hook is called as
+        hook(cell, state_dict, prefix, local_metadata, strict, missing_keys, unexpected_keys, error_msgs) -> None
+        Args:
+            hook (Callable): The hook function before `load_state_dict` is called.
+        Returns:
+            A handle that can be used to remove the added hook by calling
+            `handle.remove()`.
+        """
+        from mindspore.utils.hooks import _RemovableHandle
+        pre_hooks = self._load_state_dict_pre_hooks
+        removable = _RemovableHandle(pre_hooks)
+        # The hook is stored under the handle's id.
+        pre_hooks[removable.id] = hook
+        return removable
+    @jit_forbidden_register
+    def register_load_state_dict_post_hook(self, hook):
+        r"""Register a hook that runs after the cell's :func:`mindspore.nn.Cell.load_state_dict` is called.
+        The hook is called as
+        hook(cell, incompatible_keys) -> None
+        ``cell`` is the cell the hook is registered on. ``incompatible_keys`` is a
+        ``NamedTuple`` with the attributes ``missing_keys`` and ``unexpected_keys``,
+        each a ``list`` of ``str``.
+        The hook may modify ``incompatible_keys`` in place.
+        Such modifications affect the checks that :func:`load_state_dict` performs with
+        ``strict=True``: adding keys to either list causes an error to be raised, and
+        clearing both lists avoids the error.
+        Args:
+            hook (Callable): The hook function after `load_state_dict` is called.
+        Returns:
+            A handle that can be used to remove the added hook by calling
+            `handle.remove()`.
+        """
+        from mindspore.utils.hooks import _RemovableHandle
+        post_hooks = self._load_state_dict_post_hooks
+        removable = _RemovableHandle(post_hooks)
+        # The hook is stored under the handle's id.
+        post_hooks[removable.id] = hook
+        return removable
+    def _load_from_state_dict(
+            self,
+            state_dict,
+            prefix,
+            local_metadata,
+            strict,
+            missing_keys,
+            unexpected_keys,
+            error_msgs,
+    ):
+        r"""Copy parameters and buffers from :attr:`state_dict` into only this cell, but not its descendants.
+        This is called on every sub cell
+        in :func:`mindspore.nn.Cell.load_state_dict`. Metadata saved for this
+        cell in input :attr:`state_dict` is provided as :attr:`local_metadata`.
+        For state dicts without metadata, :attr:`local_metadata` is empty.
+        Subclasses can achieve class-specific backward compatible loading using
+        the version number at `local_metadata.get("version", None)`.
+        .. note::
+            :attr:`state_dict` is not the same object as the input
+            :attr:`state_dict` to :func:`mindspore.nn.Cell.load_state_dict`. So
+            it can be modified.
+        Args:
+            state_dict (dict): a dict containing parameters and
+                persistent buffers.
+            prefix (str): the prefix for parameters and buffers used in this
+                cell
+            local_metadata (dict): a dict containing the metadata for this cell.
+                See
+            strict (bool): whether to strictly enforce that the keys in
+                :attr:`state_dict` with :attr:`prefix` match the names of
+                parameters and buffers in this cell
+            missing_keys (list of str): if ``strict=True``, add missing keys to
+                this list
+            unexpected_keys (list of str): if ``strict=True``, add unexpected
+                keys to this list
+            error_msgs (list of str): error messages should be added to this
+                list, and will be reported together in
+                :func:`mindspore.nn.Cell.load_state_dict`
+        """
+        for hook in self._load_state_dict_pre_hooks.values():
+            hook(
+                self,
+                state_dict,
+                prefix,
+                local_metadata,
+                strict,
+                missing_keys,
+                unexpected_keys,
+                error_msgs,
+            )
+        persistent_buffers = {
+            k: v
+            for k, v in self._buffers.items()
+            if k not in self._non_persistent_buffers_set
+        }
+        local_name_params = itertools.chain(
+            self._params.items(), persistent_buffers.items()
+        )
+        local_state = {k: v for k, v in local_name_params if v is not None}
+        for name, param in local_state.items():
+            key = prefix + name
+            if key in state_dict:
+                input_param = state_dict[key]
+                if not isinstance(input_param, Tensor):
+                    error_msgs.append(
+                        f'While copying the parameter named "{key}", '
+                        "expected Tensor or Tensor-like object from checkpoint but "
+                        f"received {type(input_param)}"
+                    )
+                    continue
+                if input_param.shape != param.shape:
+                    # local shape should match the one in checkpoint
+                    error_msgs.append(
+                        f"size mismatch for {key}: copying a param with shape {input_param.shape} from checkpoint, "
+                        f"the shape in current model is {param.shape}."
+                    )
+                    continue
+                try:
+                    param.assign_value(Tensor(input_param.asnumpy(), dtype=param.dtype))
+                except Exception as ex:  # pylint: disable=W0703
+                    error_msgs.append(
+                        f'While copy the parameter named "{key}", '
+                        f"whose shape in the model are {param.shape} and "
+                        f"whose shape in the checkpoint are {input_param.shape}, "
+                        f"an exception occurred : {ex.args}."
+                    )
+            elif strict:
+                missing_keys.append(key)
+        extra_state_key = prefix + _EXTRA_STATE_KEY_SUFFIX
+        if getattr(self.__class__, "set_extra_state", Cell.set_extra_state) is not Cell.set_extra_state:
+            if extra_state_key in state_dict:
+                self.set_extra_state(state_dict[extra_state_key])
+            elif strict:
+                missing_keys.append(extra_state_key)
+        elif strict and (extra_state_key in state_dict):
+            unexpected_keys.append(extra_state_key)
+        if strict:
+            for key in state_dict.keys():
+                if key.startswith(prefix) and key != extra_state_key:
+                    input_name = key[len(prefix):].split(".", 1)
+                    # Must be a cell if it has attributes
+                    if len(input_name) > 1:
+                        if input_name[0] not in self._cells:
+                            unexpected_keys.append(key)
+                    elif input_name[0] not in local_state:
+                        unexpected_keys.append(key)
+    @jit_forbidden_register
+    def load_state_dict(self, state_dict: Mapping[str, Any], strict: bool = True):
+        r"""Copy parameters and buffers from :attr:`state_dict` into this cell and its descendants.
+        If :attr:`strict` is ``True``, then
+        the keys of :attr:`state_dict` must exactly match the keys returned
+        by this cell's :func:`mindspore.nn.Cell.state_dict` function.
+        Args:
+            state_dict (dict): A dict containing parameters and
+                persistent buffers.
+            strict (bool, optional): Whether to strictly enforce that the keys
+                in input `state_dict` match the keys returned by this cell's
+                :func:`mindspore.nn.Cell.state_dict` function. Default ``True`` .
+        Returns:
+            A namedtuple with ``missing_keys`` and ``unexpected_keys`` fields,
+            - `missing_keys` is a list of str containing any keys that are expected
+              by this cell but missing from the provided ``state_dict``.
+            - `unexpected_keys` is a list of str containing the keys that are not
+              expected by this cell but present in the provided ``state_dict``.
+        Note:
+            If `strict` is ``True`` and a parameter or buffer is registered as ``None`` but its corresponding key
+            exists in :attr:`state_dict`, :func:`mindspore.nn.Cell.load_state_dict` will raise a ``RuntimeError``.
+        Examples:
+            >>> import mindspore
+            >>> import os
+            >>> class Model(mindspore.nn.Cell):
+            ...     def __init__(self):
+            ...         super().__init__()
+            ...         self.register_buffer("buffer_a", mindspore.tensor([4, 5, 6]))
+            ...         self.param_a = mindspore.Parameter(mindspore.tensor([1, 2, 3]))
+            ...
+            ...     def construct(self, x):
+            ...         return x + self.buffer_a + self.param_a
+            ...
+            ...
+            >>> model = Model()
+            >>> print(model.state_dict())
+            >>> mindspore.save_checkpoint(model.state_dict(), './model_state_dict_ckpt')
+            >>> new_model = Model()
+            >>> new_model.load_state_dict(mindspore.load_checkpoint('./model_state_dict_ckpt'))
+            >>> print(new_model.state_dict())
+            >>> os.remove('./model_state_dict_ckpt')
+            OrderedDict([('param_a', Parameter (name=param_a, shape=(3,), dtype=Int64, requires_grad=True)), \
+            ('buffer_a', Tensor(shape=[3], dtype=Int64, value= [4, 5, 6]))])
+            OrderedDict([('param_a', Parameter (name=param_a, shape=(3,), dtype=Int64, requires_grad=True)), \
+            ('buffer_a', Tensor(shape=[3], dtype=Int64, value= [4, 5, 6]))])
+        """
+        if not isinstance(state_dict, Mapping):
+            raise TypeError(
+                f"Expected state_dict to be dict-like, got {type(state_dict)}."
+            )
+        missing_keys: List[str] = []
+        unexpected_keys: List[str] = []
+        error_msgs: List[str] = []
+        # copy state_dict so _load_from_state_dict can modify it
+        metadata = getattr(state_dict, "_metadata", None)
+        state_dict = OrderedDict(state_dict)
+        if metadata is not None:
+            # mypy isn't aware that "_metadata" exists in state_dict
+            state_dict._metadata = metadata  # type: ignore[attr-defined]
+        def load(cell, local_state_dict, prefix=""):
+            local_metadata = {} if metadata is None else metadata.get(prefix[:-1], {})
+            cell._load_from_state_dict(
+                local_state_dict, prefix, local_metadata, True, missing_keys, unexpected_keys, error_msgs,
+            )
+            for name, child in cell._cells.items():
+                if child is not None:
+                    child_prefix = prefix + name + "."
+                    child_state_dict = {k: v for k, v in local_state_dict.items() if k.startswith(child_prefix)}
+                    load(child, child_state_dict, child_prefix)  # noqa: F821
+            # Note that the hook can modify missing_keys and unexpected_keys.
+            incompatible_keys = _IncompatibleKeys(missing_keys, unexpected_keys)
+            for hook in cell._load_state_dict_post_hooks.values():
+                out = hook(cell, incompatible_keys)
+                if out is not None:
+                    raise RuntimeError(
+                        "Hooks registered with ``register_load_state_dict_post_hook`` are not"
+                        "expected to return new values, if incompatible_keys need to be modified,"
+                        "it should be done inplace."
+                    )
+        load(self, state_dict)
+        del load
+        if strict:
+            if unexpected_keys:
+                error_msgs.insert(
+                    0,
+                    "Unexpected key(s) in state_dict: {}. ".format(
+                        ", ".join(f'"{k}"' for k in unexpected_keys)
+                    ),
+                )
+            if missing_keys:
+                error_msgs.insert(
+                    0,
+                    "Missing key(s) in state_dict: {}. ".format(
+                        ", ".join(f'"{k}"' for k in missing_keys)
+                    ),
+                )
+        if error_msgs:
+            raise RuntimeError(
+                "Error(s) in loading state_dict for {}:\n\t{}".format(
+                    self.__class__.__name__, "\n\t".join(error_msgs)
+                )
+            )
+        return _IncompatibleKeys(missing_keys, unexpected_keys)
     def register_backward_hook(self, hook_fn):
         """
         Register the backward hook function.
@@ -2403,8 +3509,7 @@ class Cell(Cell_):
         """
         if context._get_mode() == context.GRAPH_MODE:
             return HookHandle()
-        if not check_hook_fn("register_backward_hook", hook_fn):
-            return HookHandle()
+        check_hook_fn(hook_fn)
         handle = HookHandle(self._backward_hook)
         self._backward_hook[handle.handle_id] = hook_fn
         if self._cell_backward_hook is None:
@@ -2452,9 +3557,14 @@ class Cell(Cell_):
                 outputs = self.construct(*outputs, **kwargs)
             else:
                 outputs = self.construct(outputs, **kwargs)
-        outputs = self._cell_backward_hook(outputs)
-        return outputs
+        if isinstance(outputs, tuple):
+            new_outputs = self._cell_backward_hook(*outputs)
+        else:
+            new_outputs = self._cell_backward_hook(outputs)
+        # if outputs is (X,) and new_outputs is X, wrap new_outputs back into a one-element tuple
+        if isinstance(outputs, tuple) and len(outputs) == 1:
+            new_outputs = (new_outputs,)
+        return new_outputs
     def set_param_ps(self, recurse=True, init_in_server=False):
         """
@@ -2543,8 +3653,9 @@ class Cell(Cell_):
         if not self._has_config_recompute:
             self._has_config_recompute = True
         else:
-            raise RuntimeError("The recompute interface can be configured only once."
-                               " When the parent cell is configured, the child cell should not be configured")
+            logger.info("The recompute interface can be configured only once."
+                        " When the parent cell is configured, the child cell should not be configured")
+            return
         self._set_recompute_scope(mode)
         if mode and not output_recompute:
             self.add_flags(output_no_recompute=True)
@@ -2584,18 +3695,13 @@ class Cell(Cell_):
         """
         if context.get_context("mode") == context.PYNATIVE_MODE:
             self._recompute_cell = recompute_registry.get()(self.construct)
-            self._add_recompute_flag()
-            return
         self._recompute()
         if 'mp_comm_recompute' in kwargs.keys():
             self._mp_comm_recompute(kwargs.get('mp_comm_recompute', False))
         if 'parallel_optimizer_comm_recompute' in kwargs.keys():
-            if (kwargs.get('parallel_optimizer_comm_recompute', False) and
-                    context.get_auto_parallel_context("pipeline_stages") > 1):
+            if kwargs.get('parallel_optimizer_comm_recompute', False):
                 logger.warning("Currently, the communication operator allgathers introduced by optimizer shard "
-                               "are not support recomputation in pipeline parallel.")
-            elif context.get_auto_parallel_context("pipeline_stages") == 1:
-                self._parallel_optimizer_comm_recompute(kwargs.get('parallel_optimizer_comm_recompute', False))
+                               "is replaced with zero3.")
         if 'recompute_slice_activation' in kwargs:
             self._recompute_slice_activation(kwargs.get('recompute_slice_activation', False))
@@ -2687,17 +3793,91 @@ class Cell(Cell_):
         if hasattr(network, "_amp_level"):
             self._amp_level = getattr(network, "_amp_level")
-    def _add_recompute_flag(self):
-        """
-        Set pynative cell recomputed.
+    def _register_parameters_hook(self, forward_hook=None, backward_hook=None, all=False):
         """
-        if not self._has_config_recompute:
-            self._has_config_recompute = True
+        Register the forward hook for parameters and register the backward hook for the corresponding gradient.
+        .. warning::
+            This is an experimental prototype that is subject to change and/or deletion.
+        Note:
+            - The `_register_parameters_hook(forward_hook, backward_hook)` only works in graph mode.
+            - The `forward_hook` must be defined with the following parameter.
+              `parameters`: the tuple of the trainable parameters of the Cell, each element in the tuple should be
+               in the format of `(param_name, Parameter)`.
+            - The `forward_hook` should have the following signature:
+              forward_hook(parameters) -> None.
+            - The `backward_hook` must be defined with the following parameter.
+              `gradients`: the tuple of the gradients corresponding to the trainable parameters of the Cell, each
+               element in the tuple should be in the format of `(param_name, gradient)`.
+            - The `backward_hook` should have the following signature:
+              backward_hook(gradients) -> New gradients.
+        Args:
+            forward_hook (function, optional): Forward hook function, or ``None``. Default: ``None`` .
+            backward_hook (function, optional): Backward hook function, or ``None``. Default: ``None`` .
+            all (bool, optional): Whether to set hooks for all sub cells recursively. Default: ``False`` .
+        Returns:
+            None
+        Raises:
+            RuntimeError: If the `forward_hook` or `backward_hook` has unsupported syntax under GRAPH MODE.
+            TypeError: If the `forward_hook` or `backward_hook` is not defined as required.
+        Supported Platforms:
+            ``Ascend`` ``GPU`` ``CPU``
+        Examples:
+            >>> import numpy as np
+            >>> import mindspore as ms
+            >>> from mindspore import Tensor, nn, ops, Parameter
+            >>> ms.set_context(mode=ms.GRAPH_MODE)
+            >>> def parameter_hook(parameters):
+            ...     print("--- enter parameter hook ---")
+            ...     for name, param in parameters:
+            ...         print (name, param)
+            ...     print("--- leave parameter hook ---")
+            ...
+            >>> def gradient_hook(gradients):
+            ...     print("--- enter gradient hook ---")
+            ...     outs = []
+            ...     for name, gradient in gradients:
+            ...         print(name, gradient)
+            ...         outs.append(gradient * 2) # double gradient
+            ...     print("--- leave gradient hook ---")
+            ...     return outs
+            ...
+            >>> class Net(nn.Cell):
+            ...     def __init__(self):
+            ...         super(Net, self).__init__()
+            ...         self.w = Parameter(Tensor(np.array([3.0], np.float32)), name='w')
+            ...     def construct(self, x):
+            ...         return self.w * x
+            ...
+            >>> grad = ops.GradOperation(get_by_list=True)
+            >>> net = Net()
+            >>> net._register_parameters_hook(forward_hook=parameter_hook, backward_hook=gradient_hook)
+            >>> x = Tensor(np.array([4.0]).astype(np.float32))
+            >>> output = grad(net, net.trainable_params())(x)
+            --- enter parameter hook ---
+            w
+            Tensor(shape=[1], dtype=Float32, value=[ 3.00000000e+00])
+            --- leave parameter hook ---
+            --- enter gradient hook ---
+            w
+            Tensor(shape=[1], dtype=Float32, value=[ 4.00000000e+00])
+            --- leave gradient hook ---
+            >>> print("doubled grad: ", output)
+            doubled grad: (Tensor(shape=[1], dtype=Float32, value=[ 8.00000000e+00]),)
+        """
+        if not all:
+            self._parameters_forward_hook = forward_hook
+            self._parameters_backward_hook = backward_hook
         else:
-            logger.info("The recompute interface can be configured only once."
-                        " If the parent cell is configured, the child cell should not be configured")
-        for cell in self.cells():
-            cell._add_recompute_flag()
+            for _, cell in self.cells_and_names():
+                cell._parameters_forward_hook = forward_hook
+                cell._parameters_backward_hook = backward_hook
 class GraphCell(Cell):
@@ -2713,12 +3893,10 @@ class GraphCell(Cell):
             The key is the parameter name whose type is str, and the value is a Tensor or Parameter.
             If the parameter exists in the graph according to the name, update it's value.
             If the parameter does not exist, ignore it. Default: ``None`` .
-        obf_random_seed (Union[int, None]): The random seed used for dynamic obfuscation. "dynamic obfuscation" is
-            used for model protection, which can refer to :func:`mindspore.obfuscate_model`. If the input `graph` is
-            a func_graph loaded from a mindir file obfuscated with `obf_random_seed` , then `obf_random_seed` should be
-            provided. `obf_random_seed` should be in (0, 9223372036854775807]. default: ``None`` .
+        obf_random_seed (Union[int, None]): The random seed used for dynamic obfuscation, which is not supported now.
+            Must be left as ``None`` . Default: ``None`` .
     Raises:
+        NotImplementedError: If `obf_random_seed` is not ``None`` (dynamic structure obfuscation is not supported now).
         TypeError: If the `graph` is not a FuncGraph.
         TypeError: If the `params_init` is not a dict.
         TypeError: If the key of the `params_init` is not a str.
@@ -2748,20 +3926,12 @@ class GraphCell(Cell):
     def __init__(self, graph, params_init=None, obf_random_seed=None):
         super(GraphCell, self).__init__(auto_prefix=True)
+        if obf_random_seed is not None:
+            raise NotImplementedError("Dynamic structure obfuscation is not supported now.")
         if not isinstance(graph, FuncGraph):
             raise TypeError(f"For 'GraphCell', the argument 'graph' must be a FuncGraph loaded from MindIR, "
                             f"but got type {type(graph)}.")
         self.graph = graph
-        self.obf_random_seed = obf_random_seed
-        if obf_random_seed is not None:
-            if not isinstance(obf_random_seed, int):
-                raise TypeError("'obf_random_seed' must be int, but got {}.".format(type(obf_random_seed)))
-            int_64_max = 9223372036854775807
-            if obf_random_seed <= 0 or obf_random_seed > int_64_max:
-                raise ValueError(
-                    "'obf_random_seed' must be larger than 0, and less or equal than int64 ({}),"
-                    "but got {}.".format(int_64_max, obf_random_seed))
-            self._branch_control_input = _generate_branch_control_input(self.obf_random_seed)
         params_init = {} if params_init is None else params_init
         if not isinstance(params_init, dict):
             raise TypeError(f"For 'GraphCell', the argument 'params_init' must be a dict, but got {type(params_init)}.")
@@ -2781,19 +3951,30 @@ class GraphCell(Cell):
     def __call__(self, *args, **kwargs):
         self.phase = "graph_load_from_mindir"
         self._add_attr("graph_load_from_mindir", self.graph)
-        if not self.obf_random_seed:
-            return self.compile_and_run(*args, **kwargs)
-        append_input = Tensor((numpy.ones((1,)) * self._branch_control_input).astype(numpy.int32))
-        return self.compile_and_run(*args, append_input, **kwargs)
+        return self.compile_and_run(*args, **kwargs)
-def _check_param_list_tuple(value):
+def _is_parameter_list_or_tuple(value):
     """
     Check whether the input is a non-empty list or tuple in which every item is a Parameter.
     :param value: the object to check.
     :return: True if value is a non-empty list or tuple containing only Parameter items, otherwise False.
     """
-    for item in value:
-        if not isinstance(item, Parameter):
-            return False
-    return True
+    if isinstance(value, (list, tuple)) and value:
+        for item in value:
+            if not isinstance(item, Parameter):
+                return False
+        return True
+    return False
+def _addindent(s_, num_spaces):
+    s = s_.split("\n")
+    # don't do anything for single-line stuff
+    if len(s) == 1:
+        return s_
+    first = s.pop(0)
+    s = [(num_spaces * " ") + line for line in s]
+    s = "\n".join(s)
+    s = first + "\n" + s
+    return s