mindspore 2.6.0__cp311-cp311-win_amd64.whl → 2.7.0__cp311-cp311-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic.

Files changed (455)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
  3. mindspore/Newtonsoft.Json.dll +0 -0
  4. mindspore/__init__.py +2 -2
  5. mindspore/_c_dataengine.cp311-win_amd64.pyd +0 -0
  6. mindspore/_c_expression.cp311-win_amd64.pyd +0 -0
  7. mindspore/_c_mindrecord.cp311-win_amd64.pyd +0 -0
  8. mindspore/_checkparam.py +42 -11
  9. mindspore/_extends/builtin_operations.py +3 -3
  10. mindspore/{_deprecated → _extends/optimize}/__init__.py +9 -3
  11. mindspore/_extends/optimize/cell_utils.py +96 -0
  12. mindspore/_extends/parallel_compile/akg_compiler/custom.py +1109 -0
  13. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  14. mindspore/_extends/parse/__init__.py +3 -3
  15. mindspore/_extends/parse/compile_config.py +44 -22
  16. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +1 -2
  17. mindspore/_extends/parse/parser.py +64 -83
  18. mindspore/_extends/parse/resources.py +39 -0
  19. mindspore/_extends/parse/standard_method.py +47 -14
  20. mindspore/_extends/parse/trope.py +8 -1
  21. mindspore/_extends/pijit/__init__.py +1 -2
  22. mindspore/_extends/pijit/pijit_func_white_list.py +2 -5
  23. mindspore/amp.py +4 -22
  24. mindspore/atlprov.dll +0 -0
  25. mindspore/avcodec-59.dll +0 -0
  26. mindspore/avdevice-59.dll +0 -0
  27. mindspore/avfilter-8.dll +0 -0
  28. mindspore/avformat-59.dll +0 -0
  29. mindspore/avutil-57.dll +0 -0
  30. mindspore/boost/adasum.py +1 -1
  31. mindspore/boost/boost_cell_wrapper.py +4 -4
  32. mindspore/c1.dll +0 -0
  33. mindspore/c1xx.dll +0 -0
  34. mindspore/c2.dll +0 -0
  35. mindspore/common/__init__.py +43 -12
  36. mindspore/common/_grad_function.py +2 -1
  37. mindspore/common/_pijit_context.py +28 -7
  38. mindspore/common/_stub_tensor.py +1 -209
  39. mindspore/common/_tensor_cpp_method.py +1 -1
  40. mindspore/common/_tensor_docs.py +177 -52
  41. mindspore/common/_utils.py +9 -1
  42. mindspore/common/api.py +338 -208
  43. mindspore/common/dtype.py +108 -57
  44. mindspore/common/dump.py +11 -16
  45. mindspore/common/dynamic_shape/__init__.py +0 -0
  46. mindspore/common/{auto_dynamic_shape.py → dynamic_shape/auto_dynamic_shape.py} +17 -23
  47. mindspore/common/dynamic_shape/enable_dynamic.py +197 -0
  48. mindspore/common/file_system.py +59 -9
  49. mindspore/common/generator.py +2 -3
  50. mindspore/common/hook_handle.py +33 -5
  51. mindspore/common/jit_config.py +1 -1
  52. mindspore/common/jit_trace.py +84 -105
  53. mindspore/common/np_dtype.py +3 -3
  54. mindspore/common/parameter.py +27 -29
  55. mindspore/common/recompute.py +5 -7
  56. mindspore/common/sparse_tensor.py +0 -3
  57. mindspore/common/symbol.py +0 -1
  58. mindspore/common/tensor.py +84 -133
  59. mindspore/communication/_comm_helper.py +46 -4
  60. mindspore/communication/management.py +79 -7
  61. mindspore/context.py +47 -38
  62. mindspore/dataset/__init__.py +1 -1
  63. mindspore/dataset/audio/transforms.py +1 -1
  64. mindspore/dataset/core/config.py +38 -4
  65. mindspore/dataset/engine/datasets.py +350 -322
  66. mindspore/dataset/engine/datasets_user_defined.py +69 -23
  67. mindspore/dataset/engine/iterators.py +2 -2
  68. mindspore/dataset/engine/obs/config_loader.py +2 -2
  69. mindspore/dataset/engine/obs/obs_mindrecord_dataset.py +8 -0
  70. mindspore/dataset/transforms/c_transforms.py +2 -2
  71. mindspore/dataset/transforms/py_transforms.py +7 -3
  72. mindspore/dataset/transforms/transforms.py +10 -6
  73. mindspore/dataset/vision/__init__.py +1 -1
  74. mindspore/dataset/vision/py_transforms.py +8 -8
  75. mindspore/dataset/vision/transforms.py +17 -5
  76. mindspore/dataset/vision/utils.py +632 -21
  77. mindspore/dataset/vision/validators.py +1 -0
  78. mindspore/device_context/ascend/device.py +1 -1
  79. mindspore/device_context/ascend/op_tuning.py +35 -1
  80. mindspore/device_context/gpu/__init__.py +2 -2
  81. mindspore/device_context/gpu/device.py +1 -1
  82. mindspore/device_context/gpu/op_precision.py +4 -2
  83. mindspore/device_context/gpu/op_tuning.py +6 -3
  84. mindspore/device_manager.py +16 -9
  85. mindspore/dnnl.dll +0 -0
  86. mindspore/dpcmi.dll +0 -0
  87. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +5 -4
  88. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  89. mindspore/experimental/optim/adadelta.py +13 -20
  90. mindspore/experimental/optim/adagrad.py +15 -22
  91. mindspore/experimental/optim/adam.py +17 -24
  92. mindspore/experimental/optim/adamax.py +14 -22
  93. mindspore/experimental/optim/adamw.py +28 -34
  94. mindspore/experimental/optim/asgd.py +15 -25
  95. mindspore/experimental/optim/lr_scheduler.py +27 -45
  96. mindspore/experimental/optim/nadam.py +14 -24
  97. mindspore/experimental/optim/optimizer.py +13 -23
  98. mindspore/experimental/optim/radam.py +18 -24
  99. mindspore/experimental/optim/rmsprop.py +14 -25
  100. mindspore/experimental/optim/rprop.py +15 -26
  101. mindspore/experimental/optim/sgd.py +9 -19
  102. mindspore/hal/__init__.py +4 -4
  103. mindspore/hal/contiguous_tensors_handle.py +2 -2
  104. mindspore/hal/memory.py +1 -0
  105. mindspore/include/api/cell.h +65 -5
  106. mindspore/include/api/cfg.h +24 -7
  107. mindspore/include/api/context.h +1 -0
  108. mindspore/include/api/delegate.h +10 -2
  109. mindspore/include/api/dual_abi_helper.h +100 -19
  110. mindspore/include/api/graph.h +14 -1
  111. mindspore/include/api/kernel.h +16 -3
  112. mindspore/include/api/kernel_api.h +9 -1
  113. mindspore/include/api/metrics/accuracy.h +9 -0
  114. mindspore/include/api/model.h +8 -1
  115. mindspore/include/api/model_group.h +4 -0
  116. mindspore/include/api/model_parallel_runner.h +2 -0
  117. mindspore/include/api/status.h +48 -10
  118. mindspore/include/api/types.h +8 -3
  119. mindspore/include/c_api/model_c.h +0 -58
  120. mindspore/include/c_api/tensor_c.h +0 -26
  121. mindspore/include/dataset/constants.h +9 -0
  122. mindspore/include/dataset/vision_ascend.h +1 -1
  123. mindspore/jpeg62.dll +0 -0
  124. mindspore/mindrecord/tools/cifar10.py +61 -11
  125. mindspore/mindrecord/tools/cifar10_to_mr.py +5 -0
  126. mindspore/mindspore_backend_common.dll +0 -0
  127. mindspore/mindspore_backend_manager.dll +0 -0
  128. mindspore/mindspore_common.dll +0 -0
  129. mindspore/mindspore_core.dll +0 -0
  130. mindspore/mindspore_cpu_res_manager.dll +0 -0
  131. mindspore/mindspore_dump.dll +0 -0
  132. mindspore/mindspore_frontend.dll +0 -0
  133. mindspore/mindspore_glog.dll +0 -0
  134. mindspore/mindspore_memory_pool.dll +0 -0
  135. mindspore/mindspore_ms_backend.dll +0 -0
  136. mindspore/mindspore_ops.dll +0 -0
  137. mindspore/mindspore_ops_host.dll +0 -0
  138. mindspore/mindspore_ops_kernel_common.dll +0 -0
  139. mindspore/mindspore_profiler.dll +0 -0
  140. mindspore/mindspore_pyboost.dll +0 -0
  141. mindspore/mindspore_pynative.dll +0 -0
  142. mindspore/mindspore_res_manager.dll +0 -0
  143. mindspore/mindspore_runtime_pipeline.dll +0 -0
  144. mindspore/mint/__init__.py +4 -44
  145. mindspore/mint/distributed/__init__.py +5 -0
  146. mindspore/mint/distributed/distributed.py +425 -19
  147. mindspore/mint/nn/__init__.py +1 -1
  148. mindspore/mint/nn/functional.py +53 -6
  149. mindspore/mint/nn/layer/_functions.py +163 -294
  150. mindspore/mint/nn/layer/activation.py +8 -6
  151. mindspore/mint/nn/layer/conv.py +125 -101
  152. mindspore/mint/nn/layer/normalization.py +11 -25
  153. mindspore/mint/optim/adam.py +19 -18
  154. mindspore/mint/optim/adamw.py +14 -8
  155. mindspore/mint/optim/sgd.py +5 -5
  156. mindspore/msobj140.dll +0 -0
  157. mindspore/mspdb140.dll +0 -0
  158. mindspore/mspdbcore.dll +0 -0
  159. mindspore/mspdbst.dll +0 -0
  160. mindspore/mspft140.dll +0 -0
  161. mindspore/msvcdis140.dll +0 -0
  162. mindspore/msvcp140_1.dll +0 -0
  163. mindspore/msvcp140_2.dll +0 -0
  164. mindspore/msvcp140_atomic_wait.dll +0 -0
  165. mindspore/msvcp140_codecvt_ids.dll +0 -0
  166. mindspore/nn/cell.py +488 -620
  167. mindspore/nn/grad/cell_grad.py +11 -12
  168. mindspore/nn/layer/activation.py +36 -36
  169. mindspore/nn/layer/basic.py +74 -77
  170. mindspore/nn/layer/channel_shuffle.py +4 -4
  171. mindspore/nn/layer/combined.py +4 -2
  172. mindspore/nn/layer/conv.py +86 -85
  173. mindspore/nn/layer/dense.py +9 -7
  174. mindspore/nn/layer/embedding.py +50 -52
  175. mindspore/nn/layer/image.py +38 -40
  176. mindspore/nn/layer/math.py +111 -112
  177. mindspore/nn/layer/normalization.py +56 -44
  178. mindspore/nn/layer/pooling.py +58 -63
  179. mindspore/nn/layer/rnn_cells.py +33 -33
  180. mindspore/nn/layer/rnns.py +56 -56
  181. mindspore/nn/layer/thor_layer.py +74 -73
  182. mindspore/nn/layer/transformer.py +11 -1
  183. mindspore/nn/learning_rate_schedule.py +20 -20
  184. mindspore/nn/loss/loss.py +79 -81
  185. mindspore/nn/optim/adam.py +2 -4
  186. mindspore/nn/optim/adasum.py +2 -2
  187. mindspore/nn/optim/lamb.py +1 -3
  188. mindspore/nn/optim/optimizer.py +1 -1
  189. mindspore/nn/optim/tft_wrapper.py +2 -3
  190. mindspore/nn/optim/thor.py +2 -2
  191. mindspore/nn/probability/distribution/_utils/utils.py +2 -2
  192. mindspore/nn/probability/distribution/exponential.py +2 -1
  193. mindspore/nn/probability/distribution/poisson.py +2 -1
  194. mindspore/nn/sparse/sparse.py +3 -3
  195. mindspore/nn/wrap/cell_wrapper.py +73 -42
  196. mindspore/nn/wrap/grad_reducer.py +37 -52
  197. mindspore/nn/wrap/loss_scale.py +72 -74
  198. mindspore/numpy/array_creations.py +7 -7
  199. mindspore/numpy/fft.py +1 -1
  200. mindspore/numpy/math_ops.py +1 -1
  201. mindspore/numpy/utils_const.py +1 -1
  202. mindspore/opencv_core452.dll +0 -0
  203. mindspore/opencv_imgcodecs452.dll +0 -0
  204. mindspore/opencv_imgproc452.dll +0 -0
  205. mindspore/ops/_grad_experimental/grad_comm_ops.py +51 -13
  206. mindspore/ops/_grad_experimental/grad_debug_ops.py +14 -0
  207. mindspore/ops/_grad_experimental/grad_inner_ops.py +0 -9
  208. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  209. mindspore/{experimental/es/__init__.py → ops/_op_impl/cpu/joinedstr_op.py} +12 -6
  210. mindspore/ops/_vmap/vmap_array_ops.py +6 -13
  211. mindspore/ops/_vmap/vmap_nn_ops.py +8 -16
  212. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +29 -10
  213. mindspore/ops/auto_generate/gen_extend_func.py +5 -55
  214. mindspore/ops/auto_generate/gen_ops_def.py +753 -273
  215. mindspore/ops/auto_generate/gen_ops_prim.py +1687 -958
  216. mindspore/ops/auto_generate/pyboost_inner_prim.py +31 -1
  217. mindspore/ops/composite/__init__.py +10 -0
  218. mindspore/ops/composite/base.py +9 -5
  219. mindspore/ops/composite/multitype_ops/__init__.py +12 -1
  220. mindspore/ops/composite/multitype_ops/_compile_utils.py +132 -108
  221. mindspore/ops/composite/multitype_ops/_constexpr_utils.py +1 -1
  222. mindspore/ops/composite/multitype_ops/add_impl.py +70 -2
  223. mindspore/ops/composite/multitype_ops/div_impl.py +49 -0
  224. mindspore/ops/composite/multitype_ops/floordiv_impl.py +29 -0
  225. mindspore/ops/composite/multitype_ops/getitem_impl.py +11 -0
  226. mindspore/ops/composite/multitype_ops/mod_impl.py +5 -3
  227. mindspore/ops/composite/multitype_ops/mul_impl.py +49 -0
  228. mindspore/ops/composite/multitype_ops/setitem_impl.py +57 -0
  229. mindspore/ops/composite/multitype_ops/sub_impl.py +34 -0
  230. mindspore/ops/composite/multitype_ops/zeros_like_impl.py +14 -0
  231. mindspore/ops/function/__init__.py +4 -1
  232. mindspore/ops/function/_add_attr_func.py +11 -6
  233. mindspore/ops/function/array_func.py +17 -100
  234. mindspore/ops/function/debug_func.py +8 -5
  235. mindspore/ops/function/grad/grad_func.py +5 -13
  236. mindspore/ops/function/math_func.py +65 -399
  237. mindspore/ops/function/nn_func.py +44 -61
  238. mindspore/ops/function/other_func.py +4 -1
  239. mindspore/ops/function/random_func.py +31 -4
  240. mindspore/ops/functional.py +2 -3
  241. mindspore/ops/functional_overload.py +486 -18
  242. mindspore/ops/op_info_register.py +21 -0
  243. mindspore/ops/operations/__init__.py +5 -2
  244. mindspore/ops/operations/_custom_ops_utils.py +675 -8
  245. mindspore/ops/operations/_inner_ops.py +14 -18
  246. mindspore/ops/operations/_sequence_ops.py +1 -1
  247. mindspore/ops/operations/array_ops.py +4 -50
  248. mindspore/ops/operations/comm_ops.py +186 -41
  249. mindspore/ops/operations/custom_ops.py +244 -175
  250. mindspore/ops/operations/debug_ops.py +55 -4
  251. mindspore/ops/operations/image_ops.py +13 -13
  252. mindspore/ops/operations/manually_defined/ops_def.py +27 -28
  253. mindspore/ops/operations/math_ops.py +8 -9
  254. mindspore/ops/operations/nn_ops.py +6 -7
  255. mindspore/ops/primitive.py +9 -20
  256. mindspore/ops/tensor_method.py +52 -11
  257. mindspore/ops_generate/api/cpp_create_prim_instance_helper_generator.py +1 -1
  258. mindspore/ops_generate/api/functional_map_cpp_generator.py +10 -9
  259. mindspore/ops_generate/api/functions_cc_generator.py +58 -10
  260. mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +1 -1
  261. mindspore/ops_generate/common/base_generator.py +14 -0
  262. mindspore/ops_generate/common/gen_constants.py +7 -2
  263. mindspore/ops_generate/common/gen_utils.py +0 -19
  264. mindspore/ops_generate/common/op_proto.py +11 -4
  265. mindspore/ops_generate/common/template.py +88 -11
  266. mindspore/ops_generate/gen_ops.py +1 -1
  267. mindspore/ops_generate/op_def/lite_ops_cpp_generator.py +4 -4
  268. mindspore/ops_generate/op_def/ops_name_h_generator.py +0 -3
  269. mindspore/ops_generate/op_def/ops_primitive_h_generator.py +0 -4
  270. mindspore/ops_generate/op_def_py/op_prim_py_generator.py +5 -2
  271. mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +49 -8
  272. mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +2 -2
  273. mindspore/ops_generate/pyboost/gen_pyboost_func.py +31 -16
  274. mindspore/ops_generate/pyboost/op_template_parser.py +98 -72
  275. mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +70 -273
  276. mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +14 -6
  277. mindspore/ops_generate/pyboost/pyboost_functions_impl_cpp_generator.py +316 -0
  278. mindspore/ops_generate/pyboost/pyboost_functions_py_generator.py +1 -1
  279. mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +5 -3
  280. mindspore/ops_generate/pyboost/pyboost_inner_prim_generator.py +1 -1
  281. mindspore/ops_generate/pyboost/pyboost_internal_functions_cpp_generator.py +76 -0
  282. mindspore/ops_generate/pyboost/pyboost_internal_functions_h_generator.py +76 -0
  283. mindspore/ops_generate/pyboost/pyboost_internal_kernel_info_adapter_generator.py +125 -0
  284. mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +4 -3
  285. mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +348 -61
  286. mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +1 -1
  287. mindspore/ops_generate/pyboost/pyboost_utils.py +118 -9
  288. mindspore/ops_generate/tensor_py_cc_generator.py +1 -24
  289. mindspore/parallel/_auto_parallel_context.py +9 -17
  290. mindspore/parallel/_cell_wrapper.py +106 -40
  291. mindspore/parallel/_parallel_serialization.py +4 -3
  292. mindspore/parallel/_ps_context.py +4 -6
  293. mindspore/parallel/_tensor.py +167 -12
  294. mindspore/parallel/_transformer/moe.py +1 -1
  295. mindspore/parallel/_transformer/transformer.py +17 -12
  296. mindspore/parallel/_utils.py +5 -11
  297. mindspore/parallel/auto_parallel.py +33 -12
  298. mindspore/parallel/checkpoint_convert.py +3 -3
  299. mindspore/parallel/checkpoint_transform.py +5 -1
  300. mindspore/parallel/cluster/process_entity/_api.py +88 -49
  301. mindspore/parallel/cluster/process_entity/_utils.py +95 -7
  302. mindspore/parallel/cluster/run.py +48 -7
  303. mindspore/parallel/function/__init__.py +8 -1
  304. mindspore/parallel/function/reshard_func.py +7 -6
  305. mindspore/parallel/nn/__init__.py +15 -2
  306. mindspore/parallel/nn/parallel_cell_wrapper.py +50 -14
  307. mindspore/parallel/nn/parallel_grad_reducer.py +7 -14
  308. mindspore/parallel/shard.py +9 -23
  309. mindspore/parallel/transform_safetensors.py +468 -174
  310. mindspore/pgodb140.dll +0 -0
  311. mindspore/pgort140.dll +0 -0
  312. mindspore/profiler/__init__.py +2 -1
  313. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +7 -7
  314. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +3 -0
  315. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +3 -0
  316. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +3 -3
  317. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +3 -3
  318. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +4 -4
  319. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +3 -3
  320. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +4 -1
  321. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +2 -1
  322. mindspore/profiler/analysis/task_manager.py +1 -1
  323. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +5 -1
  324. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +2 -1
  325. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +10 -9
  326. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +43 -23
  327. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +3 -2
  328. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +9 -5
  329. mindspore/profiler/analysis/viewer/ms_operator_details_viewer.py +132 -0
  330. mindspore/profiler/common/constant.py +16 -0
  331. mindspore/profiler/common/msprof_cmd_tool.py +2 -2
  332. mindspore/profiler/common/path_manager.py +9 -0
  333. mindspore/profiler/common/profiler_context.py +50 -29
  334. mindspore/profiler/common/profiler_info.py +0 -16
  335. mindspore/profiler/common/profiler_meta_data.py +1 -0
  336. mindspore/profiler/common/profiler_op_analyse.py +239 -0
  337. mindspore/profiler/common/profiler_output_path.py +23 -8
  338. mindspore/profiler/common/profiler_parameters.py +128 -35
  339. mindspore/profiler/dynamic_profile/__init__.py +0 -0
  340. mindspore/profiler/dynamic_profile/dynamic_monitor_proxy.py +39 -0
  341. mindspore/profiler/dynamic_profile/dynamic_profiler_config_context.py +666 -0
  342. mindspore/profiler/dynamic_profile/dynamic_profiler_utils.py +62 -0
  343. mindspore/profiler/dynamic_profiler.py +374 -338
  344. mindspore/profiler/envprofiler.py +42 -12
  345. mindspore/profiler/experimental_config.py +112 -7
  346. mindspore/profiler/mstx.py +33 -12
  347. mindspore/profiler/platform/__init__.py +2 -3
  348. mindspore/profiler/platform/cpu_profiler.py +10 -4
  349. mindspore/profiler/platform/npu_profiler.py +30 -20
  350. mindspore/profiler/profiler.py +218 -154
  351. mindspore/profiler/profiler_action_controller.py +65 -77
  352. mindspore/profiler/profiler_interface.py +2 -2
  353. mindspore/profiler/schedule.py +10 -4
  354. mindspore/rewrite/common/config.py +1 -0
  355. mindspore/rewrite/common/namer.py +1 -0
  356. mindspore/rewrite/common/namespace.py +1 -0
  357. mindspore/rewrite/node/node.py +31 -11
  358. mindspore/rewrite/parsers/assign_parser.py +1 -1
  359. mindspore/rewrite/symbol_tree/symbol_tree.py +2 -2
  360. mindspore/run_check/_check_version.py +7 -10
  361. mindspore/runtime/__init__.py +8 -6
  362. mindspore/runtime/event.py +10 -4
  363. mindspore/runtime/executor.py +87 -45
  364. mindspore/runtime/memory.py +22 -30
  365. mindspore/runtime/thread_bind_core.py +299 -165
  366. mindspore/safeguard/rewrite_obfuscation.py +12 -13
  367. mindspore/swresample-4.dll +0 -0
  368. mindspore/swscale-6.dll +0 -0
  369. mindspore/tbbmalloc.dll +0 -0
  370. mindspore/tinyxml2.dll +0 -0
  371. mindspore/train/_utils.py +9 -5
  372. mindspore/train/amp.py +43 -23
  373. mindspore/train/callback/__init__.py +5 -5
  374. mindspore/train/callback/_callback.py +2 -1
  375. mindspore/train/callback/_checkpoint.py +4 -14
  376. mindspore/train/callback/_flops_collector.py +11 -7
  377. mindspore/train/callback/_landscape.py +0 -1
  378. mindspore/train/callback/_train_fault_tolerance.py +72 -18
  379. mindspore/train/data_sink.py +15 -6
  380. mindspore/train/dataset_helper.py +14 -5
  381. mindspore/train/model.py +49 -47
  382. mindspore/train/serialization.py +168 -126
  383. mindspore/train/summary/summary_record.py +13 -2
  384. mindspore/train/train_thor/model_thor.py +2 -2
  385. mindspore/turbojpeg.dll +0 -0
  386. mindspore/utils/__init__.py +3 -2
  387. mindspore/utils/dryrun.py +0 -6
  388. mindspore/utils/runtime_execution_order_check.py +162 -78
  389. mindspore/utils/sdc_detect.py +68 -0
  390. mindspore/utils/utils.py +14 -17
  391. mindspore/vcmeta.dll +0 -0
  392. mindspore/vcruntime140.dll +0 -0
  393. mindspore/vcruntime140_1.dll +0 -0
  394. mindspore/version.py +1 -1
  395. {mindspore-2.6.0.dist-info → mindspore-2.7.0.dist-info}/METADATA +5 -4
  396. {mindspore-2.6.0.dist-info → mindspore-2.7.0.dist-info}/RECORD +400 -439
  397. mindspore/_deprecated/jit.py +0 -198
  398. mindspore/_extends/remote/kernel_build_server_ascend.py +0 -75
  399. mindspore/communication/_hccl_management.py +0 -297
  400. mindspore/experimental/es/embedding_service.py +0 -891
  401. mindspore/experimental/es/embedding_service_layer.py +0 -581
  402. mindspore/profiler/common/validator/__init__.py +0 -14
  403. mindspore/profiler/common/validator/validate_path.py +0 -84
  404. mindspore/profiler/parser/__init__.py +0 -14
  405. mindspore/profiler/parser/aicpu_data_parser.py +0 -272
  406. mindspore/profiler/parser/ascend_analysis/__init__.py +0 -14
  407. mindspore/profiler/parser/ascend_analysis/constant.py +0 -71
  408. mindspore/profiler/parser/ascend_analysis/file_manager.py +0 -180
  409. mindspore/profiler/parser/ascend_analysis/function_event.py +0 -185
  410. mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +0 -136
  411. mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +0 -131
  412. mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +0 -104
  413. mindspore/profiler/parser/ascend_analysis/path_manager.py +0 -313
  414. mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +0 -123
  415. mindspore/profiler/parser/ascend_analysis/tlv_decoder.py +0 -86
  416. mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +0 -75
  417. mindspore/profiler/parser/ascend_cluster_generator.py +0 -116
  418. mindspore/profiler/parser/ascend_communicate_generator.py +0 -314
  419. mindspore/profiler/parser/ascend_flops_generator.py +0 -116
  420. mindspore/profiler/parser/ascend_fpbp_generator.py +0 -82
  421. mindspore/profiler/parser/ascend_hccl_generator.py +0 -271
  422. mindspore/profiler/parser/ascend_integrate_generator.py +0 -42
  423. mindspore/profiler/parser/ascend_memory_generator.py +0 -185
  424. mindspore/profiler/parser/ascend_msprof_exporter.py +0 -282
  425. mindspore/profiler/parser/ascend_msprof_generator.py +0 -187
  426. mindspore/profiler/parser/ascend_op_generator.py +0 -334
  427. mindspore/profiler/parser/ascend_steptrace_generator.py +0 -94
  428. mindspore/profiler/parser/ascend_timeline_generator.py +0 -545
  429. mindspore/profiler/parser/base_timeline_generator.py +0 -483
  430. mindspore/profiler/parser/container.py +0 -229
  431. mindspore/profiler/parser/cpu_gpu_timeline_generator.py +0 -697
  432. mindspore/profiler/parser/flops_parser.py +0 -531
  433. mindspore/profiler/parser/framework_enum.py +0 -111
  434. mindspore/profiler/parser/framework_parser.py +0 -464
  435. mindspore/profiler/parser/framework_struct.py +0 -61
  436. mindspore/profiler/parser/gpu_analysis/__init__.py +0 -14
  437. mindspore/profiler/parser/gpu_analysis/function_event.py +0 -44
  438. mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +0 -89
  439. mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +0 -72
  440. mindspore/profiler/parser/hccl_parser.py +0 -573
  441. mindspore/profiler/parser/hwts_log_parser.py +0 -122
  442. mindspore/profiler/parser/integrator.py +0 -526
  443. mindspore/profiler/parser/memory_usage_parser.py +0 -277
  444. mindspore/profiler/parser/minddata_analyzer.py +0 -800
  445. mindspore/profiler/parser/minddata_parser.py +0 -186
  446. mindspore/profiler/parser/minddata_pipeline_parser.py +0 -299
  447. mindspore/profiler/parser/op_intermediate_parser.py +0 -149
  448. mindspore/profiler/parser/optime_parser.py +0 -250
  449. mindspore/profiler/parser/profiler_info.py +0 -213
  450. mindspore/profiler/parser/step_trace_parser.py +0 -666
  451. mindspore/utils/hooks.py +0 -81
  452. /mindspore/common/{_auto_dynamic.py → dynamic_shape/_auto_dynamic.py} +0 -0
  453. {mindspore-2.6.0.dist-info → mindspore-2.7.0.dist-info}/WHEEL +0 -0
  454. {mindspore-2.6.0.dist-info → mindspore-2.7.0.dist-info}/entry_points.txt +0 -0
  455. {mindspore-2.6.0.dist-info → mindspore-2.7.0.dist-info}/top_level.txt +0 -0
@@ -1189,7 +1189,7 @@ class PixelShuffle(Cell):
  >>> pixel_shuffle = mint.nn.PixelShuffle(3)
  >>> input = mint.randn(1, 9, 4, 4)
  >>> output = pixel_shuffle(input)
- >>> print(output.shape())
+ >>> print(output.shape)
  [1, 1, 12, 12]
  """

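Editor's note: the doc fix above is needed because `Tensor.shape` is a property in MindSpore, so the old doctest's `output.shape()` would raise a TypeError. The doctest's shape arithmetic also checks out; a minimal sketch of the pixel-shuffle shape rule (illustrative only, not part of the diff):

    # PixelShuffle with upscale factor r maps (N, C*r*r, H, W) -> (N, C, H*r, W*r).
    r = 3
    n, c_in, h, w = 1, 9, 4, 4                      # the doctest's input shape
    out_shape = (n, c_in // (r * r), h * r, w * r)  # -> (1, 1, 12, 12), as printed above
    assert out_shape == (1, 1, 12, 12)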
@@ -67,7 +67,7 @@ from mindspore.ops.auto_generate import prelu
  # 20

  # 21
- from mindspore.ops.function.nn_func import conv3d_ext as conv3d
+ from mindspore.ops.functional_overload import conv3d
  # 22

  # 23
@@ -118,7 +118,8 @@ from mindspore.ops.auto_generate import soft_margin_loss
  # 45

  # 46
- from mindspore.ops.functional import silu
+ from mindspore.ops.auto_generate import silu as silu_func
+ from mindspore.ops.auto_generate import inplace_silu
  # 47

  # 48
@@ -283,6 +284,52 @@ from mindspore.ops.functional import adaptive_avg_pool2d_ext as adaptive_avg_poo
  from mindspore.ops.function.nn_func import cross_entropy_ext as cross_entropy
  from mindspore.ops.function.nn_func import nll_loss_ext as nll_loss

+ def silu(input, inplace=False):
+     r"""
+     Computes Sigmoid Linear Unit of input element-wise. The SiLU function is defined as:
+
+     .. math::
+
+         \text{SiLU}(x) = x * \sigma(x),
+
+     where :math:`x` is an element of the input and :math:`\sigma(x)` is the Sigmoid function.
+
+     .. math::
+
+         \sigma(x_i) = \frac{1}{1 + \exp(-x_i)},
+
+     SiLU Function Graph:
+
+     .. image:: ../images/SiLU.png
+         :align: center
+
+     Args:
+         input (Tensor): `input` is :math:`x` in the preceding formula. Input with the data type
+             float16 or float32.
+         inplace (bool, optional): If ``True``, enable the in-place update function. Default value: ``False``.
+
+     Returns:
+         Tensor, with the same type and shape as the `input`.
+
+     Raises:
+         TypeError: If dtype of `input` is neither float16 nor float32.
+
+     Supported Platforms:
+         ``Ascend`` ``GPU`` ``CPU``
+
+     Examples:
+         >>> import mindspore
+         >>> from mindspore import Tensor, mint
+         >>> import numpy as np
+         >>> input = Tensor(np.array([-1, 2, -3, 2, -1]), mindspore.float16)
+         >>> output = mint.nn.functional.silu(input, inplace=False)
+         >>> print(output)
+         [-0.269 1.762 -0.1423 1.762 -0.269]
+     """
+     if inplace:
+         return inplace_silu(input)
+     return silu_func(input)
+

  def elu(input, alpha=1.0, inplace=False):
      r"""
@@ -511,7 +558,10 @@ def binary_cross_entropy(input, target, weight=None, reduction='mean'):
      \end{cases}

  .. warning::
-     - The value of `input` must range from `0` to `1`.
+     The value of `input` must range from `0` to `1`.
+
+ .. note::
+     Currently, when the platform is Ascend, all gradient calculations are performed on the NPU.

  Args:
      input (Tensor): The predictive value whose data type must be float16 or float32.
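Editor's note: the `0` to `1` constraint above follows from the binary cross entropy formula, which takes log(input) and log(1 - input); outside that range the logarithms are undefined. A quick NumPy sketch of the per-element loss (illustrative only):

    import numpy as np

    # BCE per element: -(target * log(input) + (1 - target) * log(1 - input)).
    # log() is only finite for input inside (0, 1), hence the range warning.
    inp = np.array([0.2, 0.7])
    tgt = np.array([0.0, 1.0])
    bce = -(tgt * np.log(inp) + (1 - tgt) * np.log(1 - inp))
    print(np.round(bce, 4))   # [0.2231 0.3567]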
@@ -955,9 +1005,6 @@ def threshold(input, threshold, value, inplace=False):  # pylint: disable=W0621
          \text{value}, &\text{ otherwise }
      \end{cases}

- .. warning::
-     This is an experimental API that is subject to change or deletion.
-
  Args:
      input (Tensor): The input Tensor.
      threshold (Union[int, float]): The value of the threshold.
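Editor's note: the cases formula above keeps elements greater than `threshold` and substitutes `value` elsewhere; in NumPy terms (a sketch of the semantics, not the MindSpore kernel):

    import numpy as np

    # y = x where x > threshold, else value.
    x = np.array([-1.0, 0.5, 2.0])
    threshold, value = 0.1, 20.0
    y = np.where(x > threshold, x, value)
    print(y)   # [20.   0.5  2. ]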
@@ -1,323 +1,192 @@
+ # Copyright 2025 Huawei Technologies Co., Ltd
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ============================================================================
+ """functions for mint"""
  import mindspore
- from mindspore import Tensor
- from mindspore import context
- import mindspore.communication
- import mindspore.communication.comm_func
+ from mindspore import ops, mint
+ from mindspore import _checkparam as validator
  from mindspore.nn.cell import Cell
+ from mindspore.communication.comm_func import all_gather_into_tensor
+ from mindspore.communication.comm_func import all_reduce
+ from mindspore.communication.management import get_rank, get_group_size, GlobalComm, _get_group
  from mindspore.ops.auto_generate.gen_ops_prim import BatchNormReduceGrad
  from mindspore.ops.auto_generate.gen_ops_prim import BatchNormElemtGrad
- from mindspore.communication import GlobalComm
- from mindspore.ops import ReduceOp
- from mindspore._c_expression import TensorPy as Tensor_
- from mindspore.communication._comm_helper import _get_size_helper, HCCL_WORLD_COMM_GROUP
- from mindspore.ops._primitive_cache import _get_cache_prim
- from mindspore.communication.comm_func import all_gather_into_tensor as all_gather_into_tensor_dy
- from mindspore.ops import operations as P
- from mindspore import ops, mint
-
-
- DEFAULT_WORLD_COMM_GROUP = HCCL_WORLD_COMM_GROUP
+ from mindspore.ops.primitive import Primitive, prim_arg_register, PrimitiveWithInfer, prim_attr_register
+ from mindspore.ops.operations.comm_ops import ReduceOp, check_collective_target_dtype

  batch_norm_reduce_grad = BatchNormReduceGrad()
  batch_norm_elemt_grad = BatchNormElemtGrad()
- shape = P.Shape()
-
-
- def _deal_comm_outputs(output, async_op):
-     if isinstance(output, tuple):
-         if not async_op:
-             output[1].wait()
-         return output[0]
+ shape = ops.Shape()
+
+
+ class AllGather(PrimitiveWithInfer):
+     @prim_arg_register
+     def __init__(self, group=GlobalComm.WORLD_COMM_GROUP):
+         super(AllGather, self).__init__(self.__class__.__name__)
+         self.group = _get_group(group)
+         validator.check_value_type('group', self.group, (str,), self.name)
+         self.rank = get_rank(self.group)
+         self.rank_size = get_group_size(self.group)
+         validator.check('rank', self.rank, 'rank_size', self.rank_size, validator.LT, self.name)
+         self.add_prim_attr('rank_size', self.rank_size)
+         self.add_prim_attr('group', self.group)
+         self.add_prim_attr('fusion', 0)
+         self.add_prim_attr('mean_flag', False)
+         self.add_prim_attr('no_eliminate', True)
+
+     def __call__(self, combined):
+         output, _ = all_gather_into_tensor(combined, group=self.group)
          return output

-     if not async_op:
+     def infer_shape(self, x_shape):
+         validator.check_positive_int(len(x_shape), "x shape", self.name)
+         if x_shape[0] > 0:
+             x_shape[0] = x_shape[0] * self.rank_size
+         return x_shape
+
+     def infer_dtype(self, x_dtype):
+         check_collective_target_dtype('x', x_dtype, self.name)
+         return x_dtype
+
+
+ class AllReduce(Primitive):
+     @prim_attr_register
+     def __init__(self, op=ReduceOp.SUM, group=GlobalComm.WORLD_COMM_GROUP):
+         """Initialize AllReduce."""
+         super().__init__(name="AllReduce")
+         self.group = _get_group(group)
+         if not isinstance(op, type(ReduceOp.SUM)):
+             raise TypeError(f"For '{self.name}', the 'op' must be str, but got {type(op).__name__}.")
+         if not isinstance(self.group, str):
+             raise TypeError(f"For '{self.name}', the 'group' must be str, "
+                             f"but got {type(self.group).__name__}.")
+         self.op = op
+         self.add_prim_attr('group', self.group)
+         self.add_prim_attr('fusion', 0)
+         self.add_prim_attr('index', 0)
+         self.add_prim_attr('no_eliminate', True)
+
+     def __call__(self, combined):
+         output, _ = all_reduce(combined, group=self.group)
          return output
-     return output
-
-
- def get_group_size(group=GlobalComm.WORLD_COMM_GROUP):
-     if not isinstance(group, str):
-         raise TypeError("For 'get_group_size', the argument 'group' must be type of string, "
-                         "but got 'group' type : {}.".format(type(group)))
-     return _get_size_helper(group=_get_group(group))
-
-
- def _contiguous(tensor):
-     if not tensor.is_contiguous() or tensor.storage_offset() != 0:
-         tensor = tensor.contiguous()
-     return tensor


- def _get_group(group):
-     """Return the world communication group if the `group` is `DEFAULT_WORLD_COMM_GROUP`."""
-     if group == DEFAULT_WORLD_COMM_GROUP:
-         return GlobalComm.WORLD_COMM_GROUP
-     return group
-
-
- def all_gather_into_tensor(tensor, group=GlobalComm.WORLD_COMM_GROUP, async_op=False):
-     if not isinstance(tensor, (Tensor, Tensor_)):
-         raise TypeError(
-             "For all_gather_into_tensor, the input tensor must be tensor")
-     group = _get_group(group)
-     tensor = _contiguous(tensor)
-     all_gather_op = _get_cache_prim(P.AllGather)(group=group)
-     output = all_gather_op(tensor)
-     return _deal_comm_outputs(output, async_op)
-
-
- def all_reduce(tensor, op=ReduceOp.SUM, group=GlobalComm.WORLD_COMM_GROUP, async_op=False):
-     if not isinstance(tensor, (Tensor, Tensor_)):
-         raise TypeError("For all_reduce, the input tensor must be tensor")
-     if not isinstance(op, str):
-         raise TypeError("For all_reduce, the input op type must be str")
-     if op not in ('sum', 'prod', 'min', 'max'):
-         raise TypeError(
-             "For all_reduce, the input op value must be one of sum, prod, min, max")
-     group = _get_group(group)
-     tensor = _contiguous(tensor)
-     all_reduce_op = _get_cache_prim(P.AllReduce)(op=op, group=group)
-     output = all_reduce_op(tensor)
-     return _deal_comm_outputs(output, async_op)
-
-
- def bprop_pynative(input_x, weight, bias, running_mean, running_var, eps, momentum,
-                    process_group, world_size, output, doutput):
-     _, mean_param, invstd_param, count_all_param = output
-     dout, _, _, _ = doutput
-
-     # KBK mode is not supported
-     if not dout.is_contiguous():
-         dout = dout.contiguous()
-
-     grad_input = grad_weight = grad_bias = None
-
-     inputG = True
-     weightG = True
-     biasG = True
-
-     # calculate local stats as well as grad_weight / grad_bias
-     sum_dy, sum_dy_xmu, grad_weight, grad_bias = batch_norm_reduce_grad(
-         dout,
-         input_x,
-         mean_param,
-         invstd_param,
-         weight,
-         inputG,
-         weightG,
-         biasG
-     )
-
-     if inputG:
-         # synchronizing stats used to calculate input gradient.
-         sum_dy_shape = shape(sum_dy)
-         num_channels = sum_dy_shape[0]
-         combined = mint.cat([sum_dy, sum_dy_xmu], dim=0)
-
-         new_combined, _ = mindspore.communication.comm_func.all_reduce(
-             combined, group=process_group)
-
-         sum_dy, sum_dy_xmu = mint.split(new_combined, num_channels)
-
-         # backward pass for gradient calculation
-         grad_input = batch_norm_elemt_grad(
-             dout,
-             input_x,
-             mean_param,
-             invstd_param,
-             weight,
-             sum_dy,
-             sum_dy_xmu,
-             count_all_param
-         )
-
-     # synchronizing of grad_weight / grad_bias is not needed as distributed
-     # training would handle all reduce.
-     if weight is None or not weightG:
-         grad_weight = None
-
-     if weight is None or not biasG:
-         grad_bias = None
-
-     return grad_input, grad_weight, grad_bias, None, None, None, None, None, None
+ class SyncBatchNormInner(Cell):
+     def __init__(self, self_num_features, self_world_size):
+         super(SyncBatchNormInner, self).__init__()
+         self.num_features = self_num_features
+         self.world_size = self_world_size

+     def construct(self, input, weight, bias, running_mean, running_var, eps, momentum, process_group, world_size):
+         if self.world_size != world_size:
+             raise ValueError('World Size Error')
+         input = input.contiguous()
+         if weight is not None:
+             weight = weight.contiguous()
+
+         input_shape = shape(input)
+         input_numel = ops.numel(input)
+         size = int(input_numel // input_shape[1])
+         if size == 1 and world_size < 2:
+             raise ValueError(
+                 'Expected more than 1 value per channel when training, got input size {}'.format(size))
+
+         # calculate mean/invstd for input.
+         mean, invstd = mint.batch_norm_stats(input, eps)
+         count = mint.full((1,), input_numel // input_shape[1], dtype=mean.dtype)
+
+         num_channels = input_shape[1]
+         if self.num_features != num_channels:
+             raise ValueError('Features Error')
+         # C, C, 1 -> (2C + 1)
+         combined = mint.cat([mean, invstd, count], dim=0)
+         # Use allgather instead of allreduce because count could be different across
+         # ranks, simple all reduce op can not give correct results.
+         # batch_norm_gather_stats_with_counts calculates global mean & invstd based on
+         # all gathered mean, invstd and count.
+         # world_size * (2C + 1)
+         all_gather_op = AllGather(process_group)
+         combined = all_gather_op(combined)
+         combined = ops.reshape(combined, [world_size, -1])
+         # world_size * (2C + 1) -> world_size * C, world_size * C, world_size * 1
+         mean_val_all, invstd_val_all, count_val_all = mint.split(
+             combined, num_channels, dim=1)
+         # calculate global mean & invstd
+         mean, invstd = mint.batch_norm_gather_stats_with_counts(input, mean_val_all, invstd_val_all, running_mean,
+                                                                 running_var, momentum, eps, count_val_all.view(-1))
+
+         # apply element-wise normalization
+         out = mint.batch_norm_elemt(input, weight, bias, mean, invstd, eps)
+         return (out, mean, invstd, count_val_all.view(-1))

- def bprop_kbk(input_x, weight, bias, running_mean, running_var, eps, momentum,
+     def bprop(self, input_x, weight, bias, running_mean, running_var, eps, momentum,
                process_group, world_size, output, doutput):
-     _, mean_param, invstd_param, count_all_param = output
-     dout, _, _, _ = doutput
+         _, mean_param, invstd_param, count_all_param = output
+         dout, _, _, _ = doutput

-     dout = dout.contiguous()
-
-     grad_input = grad_weight = grad_bias = None
-
-     inputG = True
-     weightG = True
-     biasG = True
-
-     # calculate local stats as well as grad_weight / grad_bias
-     sum_dy, sum_dy_xmu, grad_weight, grad_bias = batch_norm_reduce_grad(
-         dout,
-         input_x,
-         mean_param,
-         invstd_param,
-         weight,
-         inputG,
-         weightG,
-         biasG
-     )
-
-     if inputG:
-         # synchronizing stats used to calculate input gradient.
-         sum_dy_shape = shape(sum_dy)
-         num_channels = sum_dy_shape[0]
-         combined = mint.cat([sum_dy, sum_dy_xmu], dim=0)
+         # KBK mode is not supported
+         dout = dout.contiguous()

-         new_combined = all_reduce(combined, group=process_group)
+         grad_input = grad_weight = grad_bias = None

-         sum_dy, sum_dy_xmu = mint.split(new_combined, num_channels)
+         inputG = True
+         weightG = True
+         biasG = True

-         # backward pass for gradient calculation
-         grad_input = batch_norm_elemt_grad(
+         # calculate local stats as well as grad_weight / grad_bias
+         sum_dy, sum_dy_xmu, grad_weight, grad_bias = batch_norm_reduce_grad(
              dout,
              input_x,
              mean_param,
              invstd_param,
              weight,
-             sum_dy,
-             sum_dy_xmu,
-             count_all_param
+             inputG,
+             weightG,
+             biasG
          )

-     # synchronizing of grad_weight / grad_bias is not needed as distributed
-     # training would handle all reduce.
-     if weight is None or not weightG:
-         grad_weight = None
-
-     if weight is None or not biasG:
-         grad_bias = None
-
-     return grad_input, grad_weight, grad_bias, None, None, None, None, None, None
-
-
- def construct_pynative(input, weight, bias, running_mean, running_var, eps, momentum, process_group,
-                        world_size, self_num_features, self_world_size):
-     if self_world_size != world_size:
-         raise ValueError('World Size Error')
-     if not input.is_contiguous():
-         input = input.contiguous()
-     if weight is not None:
-         weight = weight.contiguous()
-
-     input_shape = shape(input)
-     input_numel = ops.numel(input)
-     size = int(input_numel // input_shape[1])
-     if size == 1 and world_size < 2:
-         raise ValueError(
-             'Expected more than 1 value per channel when training, got input size {}'.format(size))
-
-     # calculate mean/invstd for input.
-     mean, invstd = mint.batch_norm_stats(input, eps)
-     count = mint.full((1,), input_numel //
-                       input_shape[1], dtype=mean.dtype)
-
-     num_channels = input_shape[1]
-     if self_num_features != num_channels:
-         raise ValueError('Features Error')
-     # C, C, 1 -> (2C + 1)
-     combined = mint.cat([mean, invstd, count], dim=0)
-     # Use allgather instead of allreduce because count could be different across
-     # ranks, simple all reduce op can not give correct results.
-     # batch_norm_gather_stats_with_counts calculates global mean & invstd based on
-     # all gathered mean, invstd and count.
-     # world_size * (2C + 1)
-     combined, _ = all_gather_into_tensor_dy(combined, process_group)
-     combined = ops.reshape(combined, [world_size, -1])
-     # world_size * (2C + 1) -> world_size * C, world_size * C, world_size * 1
-     mean_val_all, invstd_val_all, count_val_all = mint.split(
-         combined, num_channels, dim=1)
-     # calculate global mean & invstd
-     mean, invstd = mint.batch_norm_gather_stats_with_counts(input, mean_val_all, invstd_val_all, running_mean,
-                                                             running_var, momentum, eps, count_val_all.view(-1))
-
-     # apply element-wise normalization
-     out = mint.batch_norm_elemt(input, weight, bias, mean, invstd, eps)
-     return (out, mean, invstd, count_val_all.view(-1))
-
-
- def construct_kbk(input, weight, bias, running_mean, running_var, eps, momentum, process_group,
-                   world_size, self_num_features, self_world_size):
-     if self_world_size != world_size:
-         raise ValueError('World Size Error')
-     input = input.contiguous()
-     if weight is not None:
-         weight = weight.contiguous()
-
-     input_shape = shape(input)
-     input_numel = ops.numel(input)
-     size = int(input_numel // input_shape[1])
-     if size == 1 and world_size < 2:
-         raise ValueError(
-             'Expected more than 1 value per channel when training, got input size {}'.format(size))
-
-     # calculate mean/invstd for input.
-     mean, invstd = mint.batch_norm_stats(input, eps)
-     count = mint.full((1,), input_numel //
-                       input_shape[1], dtype=mean.dtype)
-
-     num_channels = input_shape[1]
-     if self_num_features != num_channels:
-         raise ValueError('Features Error')
-     # C, C, 1 -> (2C + 1)
-     combined = mint.cat([mean, invstd, count], dim=0)
-     # Use allgather instead of allreduce because count could be different across
-     # ranks, simple all reduce op can not give correct results.
-     # batch_norm_gather_stats_with_counts calculates global mean & invstd based on
-     # all gathered mean, invstd and count.
-     # world_size * (2C + 1)
-     combined = all_gather_into_tensor(combined, process_group)
-     combined = ops.reshape(combined, [world_size, -1])
-     # world_size * (2C + 1) -> world_size * C, world_size * C, world_size * 1
-     mean_all, invstd_all, count_all = mint.split(
-         combined, num_channels, dim=1)
-     # calculate global mean & invstd
-     mean, invstd = mint.batch_norm_gather_stats_with_counts(
-         input,
-         mean_all,
-         invstd_all,
-         running_mean,
-         running_var,
-         momentum,
-         eps,
-         count_all.view(-1)
-     )
-
-     # apply element-wise normalization
-     out = mint.batch_norm_elemt(input, weight, bias, mean, invstd, eps)
-     return (out, mean, invstd, count_all.view(-1))
-
-
- class SyncBatchNormInner(Cell):
-     def __init__(self, self_num_features, self_world_size):
-         super(SyncBatchNormInner, self).__init__()
-         self.num_features = self_num_features
-         self.world_size = self_world_size
-         self.mode = context.get_context("mode")
-         if self.mode == 1:
-             self.fn_bprop = bprop_pynative
-             self.fn_construct = construct_pynative
-         else:
-             self.fn_bprop = bprop_kbk
-             self.fn_construct = construct_kbk
-
-     def construct(self, input, weight, bias, running_mean, running_var, eps, momentum, process_group, world_size):
-         return self.fn_construct(input, weight, bias, running_mean, running_var, eps, momentum, process_group,
-                                  world_size, self.num_features, self.world_size)
-
-     def bprop(self, input_x, weight, bias, running_mean, running_var, eps, momentum,
-               process_group, world_size, output, doutput):
-         return self.fn_bprop(input_x, weight, bias, running_mean, running_var, eps, momentum,
-                              process_group, world_size, output, doutput)
+         if inputG:
+             # synchronizing stats used to calculate input gradient.
+             sum_dy_shape = shape(sum_dy)
+             num_channels = sum_dy_shape[0]
+             combined = mint.cat([sum_dy, sum_dy_xmu], dim=0)
+             all_reduce_op = AllReduce(group=process_group)
+             new_combined = all_reduce_op(combined)
+
+             sum_dy, sum_dy_xmu = mint.split(new_combined, num_channels)
+
+             # backward pass for gradient calculation
+             grad_input = batch_norm_elemt_grad(
+                 dout,
+                 input_x,
+                 mean_param,
+                 invstd_param,
+                 weight,
+                 sum_dy,
+                 sum_dy_xmu,
+                 count_all_param
+             )
+
+         # synchronizing of grad_weight / grad_bias is not needed as distributed
+         # training would handle all reduce.
+         if weight is None or not weightG:
+             grad_weight = None
+
+         if weight is None or not biasG:
+             grad_bias = None
+
+         return grad_input, grad_weight, grad_bias, None, None, None, None, None, None


  class _SyncBatchNorm(Cell):
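Editor's note on the SyncBatchNorm rewrite above: the forward pass all-gathers the per-rank (mean, invstd, count) triples rather than all-reducing them because, as the diff's own comment says, counts can differ across ranks, so an unweighted reduce of the means would be biased. A count-weighted NumPy sketch of the idea (illustrative only; the real combination is done by mint.batch_norm_gather_stats_with_counts):

    import numpy as np

    # Hypothetical per-rank statistics for one channel, with unequal batch sizes.
    means = np.array([1.0, 3.0])     # per-rank means
    counts = np.array([10.0, 30.0])  # per-rank element counts

    naive = means.mean()                               # 2.0 -- ignores counts, biased
    weighted = (means * counts).sum() / counts.sum()   # 2.5 -- count-weighted, correct
    print(naive, weighted)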
@@ -45,6 +45,10 @@ class SiLU(Cell):
      .. warning::
          This is an experimental API that is subject to change or deletion.

+     Args:
+         inplace (bool, optional): If ``True``, enable the in-place update function.
+             Default value: ``False``.
+
      Inputs:
          - **input** (Tensor) - `input` is :math:`x` in the preceding formula.
            Input with the data type float16 or float32. Tensor of any dimension.
@@ -63,18 +67,19 @@ class SiLU(Cell):
      >>> from mindspore import Tensor, mint
      >>> import numpy as np
      >>> input = Tensor(np.array([-1, 2, -3, 2, -1]), mindspore.float16)
-     >>> silu = mint.nn.SiLU()
+     >>> silu = mint.nn.SiLU(inplace=False)
      >>> output = silu(input)
      >>> print(output)
      [-0.269 1.762 -0.1423 1.762 -0.269]
      """

-     def __init__(self):
+     def __init__(self, inplace=False):
          """Initialize SiLU."""
          super(SiLU, self).__init__()
+         self.inplace = inplace

      def construct(self, x):
-         return mint.nn.functional.silu(x)
+         return mint.nn.functional.silu(x, self.inplace)


  class Sigmoid(Cell):
@@ -355,9 +360,6 @@ class Threshold(Cell):
          \text{value}, &\text{ otherwise }
      \end{cases}

- .. warning::
-     This is an experimental API that is subject to change or deletion.
-
  Args:
      threshold (Union[int, float]): The value of the threshold.
      value (Union[int, float]): The value to replace with when element is less than threshold.