PyPI - mindspore - Versions diffs - 2.4.1__cp310-cp310-win_amd64.whl → 2.5.0__cp310-cp310-win_amd64.whl - Mend

mindspore 2.4.1__cp310-cp310-win_amd64.whl → 2.5.0__cp310-cp310-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mindspore might be problematic. Click here for more details.

Files changed (372)

mindspore/.commit_id +1 -1
mindspore/__init__.py +8 -3
mindspore/_c_dataengine.cp310-win_amd64.pyd +0 -0
mindspore/_c_expression.cp310-win_amd64.pyd +0 -0
mindspore/_c_mindrecord.cp310-win_amd64.pyd +0 -0
mindspore/_checkparam.py +0 -5
mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
mindspore/_extends/parse/compile_config.py +64 -0
mindspore/_extends/parse/deprecated/__init__.py +0 -0
mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
mindspore/_extends/parse/parser.py +23 -5
mindspore/_extends/parse/standard_method.py +123 -27
mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
mindspore/amp.py +7 -1
mindspore/avcodec-59.dll +0 -0
mindspore/avdevice-59.dll +0 -0
mindspore/avfilter-8.dll +0 -0
mindspore/avformat-59.dll +0 -0
mindspore/avutil-57.dll +0 -0
mindspore/boost/boost_cell_wrapper.py +136 -41
mindspore/common/__init__.py +3 -1
mindspore/common/_register_for_tensor.py +0 -1
mindspore/common/_stub_tensor.py +25 -4
mindspore/common/_tensor_cpp_method.py +17 -0
mindspore/common/_tensor_docs.py +6132 -0
mindspore/common/api.py +99 -25
mindspore/common/dtype.py +34 -34
mindspore/common/dump.py +2 -1
mindspore/common/file_system.py +8 -1
mindspore/common/generator.py +2 -0
mindspore/common/hook_handle.py +3 -1
mindspore/common/initializer.py +3 -4
mindspore/common/lazy_inline.py +8 -2
mindspore/common/mindir_util.py +10 -2
mindspore/common/parameter.py +30 -27
mindspore/common/tensor.py +713 -1337
mindspore/communication/__init__.py +1 -1
mindspore/communication/_comm_helper.py +10 -0
mindspore/communication/comm_func.py +215 -173
mindspore/communication/management.py +23 -20
mindspore/context.py +292 -193
mindspore/dataset/__init__.py +23 -19
mindspore/dataset/callback/ds_callback.py +2 -1
mindspore/dataset/core/config.py +84 -3
mindspore/dataset/engine/cache_admin.py +3 -3
mindspore/dataset/engine/cache_client.py +5 -4
mindspore/dataset/engine/datasets.py +192 -149
mindspore/dataset/engine/datasets_audio.py +14 -0
mindspore/dataset/engine/datasets_standard_format.py +28 -11
mindspore/dataset/engine/datasets_text.py +38 -1
mindspore/dataset/engine/datasets_user_defined.py +125 -65
mindspore/dataset/engine/datasets_vision.py +81 -8
mindspore/dataset/engine/iterators.py +281 -63
mindspore/dataset/engine/obs/util.py +8 -0
mindspore/dataset/engine/queue.py +40 -0
mindspore/dataset/engine/samplers.py +26 -2
mindspore/dataset/engine/serializer_deserializer.py +1 -1
mindspore/dataset/engine/validators.py +43 -11
mindspore/dataset/transforms/py_transforms_util.py +17 -0
mindspore/dataset/transforms/transforms.py +29 -12
mindspore/dataset/vision/validators.py +1 -2
mindspore/device_context/__init__.py +21 -0
mindspore/device_context/ascend/__init__.py +25 -0
mindspore/device_context/ascend/device.py +72 -0
mindspore/device_context/ascend/op_debug.py +94 -0
mindspore/device_context/ascend/op_precision.py +193 -0
mindspore/device_context/ascend/op_tuning.py +127 -0
mindspore/device_context/cpu/__init__.py +25 -0
mindspore/device_context/cpu/device.py +62 -0
mindspore/device_context/cpu/op_tuning.py +43 -0
mindspore/device_context/gpu/__init__.py +21 -0
mindspore/device_context/gpu/device.py +70 -0
mindspore/device_context/gpu/op_precision.py +67 -0
mindspore/device_context/gpu/op_tuning.py +175 -0
mindspore/device_manager.py +134 -0
mindspore/dnnl.dll +0 -0
mindspore/experimental/llm_boost/__init__.py +3 -2
mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
mindspore/experimental/llm_boost/atb/boost_base.py +239 -64
mindspore/experimental/llm_boost/atb/llama_boost.py +52 -30
mindspore/experimental/llm_boost/atb/qwen_boost.py +47 -24
mindspore/experimental/llm_boost/register.py +1 -0
mindspore/experimental/optim/adadelta.py +26 -22
mindspore/experimental/optim/adam.py +3 -0
mindspore/experimental/optim/lr_scheduler.py +33 -24
mindspore/experimental/optim/radam.py +33 -30
mindspore/hal/device.py +28 -0
mindspore/hal/event.py +17 -0
mindspore/hal/memory.py +94 -3
mindspore/hal/stream.py +91 -6
mindspore/include/api/context.h +1 -2
mindspore/include/dataset/constants.h +2 -2
mindspore/jpeg62.dll +0 -0
mindspore/log.py +12 -0
mindspore/mindrecord/__init__.py +1 -1
mindspore/mindrecord/config.py +17 -316
mindspore/mindrecord/filereader.py +1 -9
mindspore/mindrecord/filewriter.py +5 -15
mindspore/mindrecord/mindpage.py +1 -9
mindspore/mindspore_backend.dll +0 -0
mindspore/mindspore_common.dll +0 -0
mindspore/mindspore_core.dll +0 -0
mindspore/mindspore_glog.dll +0 -0
mindspore/mindspore_ops.dll +0 -0
mindspore/mint/__init__.py +824 -218
mindspore/mint/distributed/__init__.py +66 -4
mindspore/mint/distributed/distributed.py +2594 -44
mindspore/mint/linalg/__init__.py +6 -0
mindspore/mint/nn/__init__.py +473 -14
mindspore/mint/nn/functional.py +486 -11
mindspore/mint/nn/layer/__init__.py +17 -4
mindspore/mint/nn/layer/_functions.py +330 -0
mindspore/mint/nn/layer/activation.py +169 -1
mindspore/mint/nn/layer/basic.py +123 -0
mindspore/mint/nn/layer/conv.py +727 -0
mindspore/mint/nn/layer/normalization.py +215 -19
mindspore/mint/nn/layer/padding.py +797 -0
mindspore/mint/nn/layer/pooling.py +170 -0
mindspore/mint/optim/__init__.py +2 -1
mindspore/mint/optim/adam.py +223 -0
mindspore/mint/optim/adamw.py +26 -19
mindspore/mint/special/__init__.py +2 -1
mindspore/multiprocessing/__init__.py +5 -0
mindspore/nn/__init__.py +2 -0
mindspore/nn/cell.py +142 -21
mindspore/nn/dynamic_lr.py +2 -1
mindspore/nn/layer/activation.py +6 -6
mindspore/nn/layer/basic.py +35 -25
mindspore/nn/layer/channel_shuffle.py +3 -3
mindspore/nn/layer/conv.py +3 -0
mindspore/nn/layer/embedding.py +3 -3
mindspore/nn/layer/normalization.py +8 -7
mindspore/nn/layer/padding.py +4 -3
mindspore/nn/layer/pooling.py +55 -23
mindspore/nn/layer/rnn_cells.py +1 -1
mindspore/nn/layer/rnns.py +2 -1
mindspore/nn/layer/timedistributed.py +5 -5
mindspore/nn/layer/transformer.py +48 -26
mindspore/nn/learning_rate_schedule.py +5 -3
mindspore/nn/loss/loss.py +31 -36
mindspore/nn/optim/ada_grad.py +1 -0
mindspore/nn/optim/adadelta.py +2 -2
mindspore/nn/optim/adam.py +1 -1
mindspore/nn/optim/lars.py +1 -4
mindspore/nn/optim/optimizer.py +1 -1
mindspore/nn/optim/rprop.py +2 -2
mindspore/nn/optim/thor.py +2 -1
mindspore/nn/utils/__init__.py +22 -0
mindspore/nn/utils/init.py +73 -0
mindspore/nn/wrap/cell_wrapper.py +4 -6
mindspore/nn/wrap/loss_scale.py +3 -4
mindspore/numpy/array_creations.py +60 -62
mindspore/numpy/array_ops.py +148 -143
mindspore/numpy/logic_ops.py +41 -42
mindspore/numpy/math_ops.py +361 -359
mindspore/numpy/utils.py +16 -16
mindspore/numpy/utils_const.py +4 -4
mindspore/opencv_core452.dll +0 -0
mindspore/opencv_imgcodecs452.dll +0 -0
mindspore/opencv_imgproc452.dll +0 -0
mindspore/ops/__init__.py +2 -1
mindspore/ops/_grad_experimental/grad_comm_ops.py +107 -8
mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
mindspore/ops/_op_impl/cpu/__init__.py +1 -0
mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
mindspore/ops/_vmap/vmap_array_ops.py +20 -19
mindspore/ops/_vmap/vmap_base.py +0 -2
mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
mindspore/ops/_vmap/vmap_math_ops.py +11 -9
mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
mindspore/ops/auto_generate/gen_extend_func.py +554 -60
mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
mindspore/ops/auto_generate/gen_ops_prim.py +8027 -3411
mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
mindspore/ops/composite/base.py +1 -1
mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
mindspore/ops/function/__init__.py +12 -0
mindspore/ops/function/array_func.py +561 -159
mindspore/ops/function/clip_func.py +64 -0
mindspore/ops/function/debug_func.py +28 -20
mindspore/ops/function/image_func.py +1 -1
mindspore/ops/function/linalg_func.py +5 -4
mindspore/ops/function/math_func.py +1664 -294
mindspore/ops/function/nn_func.py +988 -317
mindspore/ops/function/parameter_func.py +3 -56
mindspore/ops/function/random_func.py +243 -33
mindspore/ops/function/sparse_unary_func.py +1 -1
mindspore/ops/functional.py +18 -5
mindspore/ops/functional_overload.py +897 -0
mindspore/ops/operations/__init__.py +3 -2
mindspore/ops/operations/_embedding_cache_ops.py +4 -4
mindspore/ops/operations/_grad_ops.py +2 -34
mindspore/ops/operations/_infer_ops.py +2 -1
mindspore/ops/operations/_inner_ops.py +38 -8
mindspore/ops/operations/array_ops.py +45 -303
mindspore/ops/operations/comm_ops.py +23 -17
mindspore/ops/operations/custom_ops.py +7 -49
mindspore/ops/operations/debug_ops.py +42 -47
mindspore/ops/operations/inner_ops.py +6 -4
mindspore/ops/operations/linalg_ops.py +3 -2
mindspore/ops/operations/manually_defined/ops_def.py +185 -104
mindspore/ops/operations/math_ops.py +11 -216
mindspore/ops/operations/nn_ops.py +153 -310
mindspore/ops/primitive.py +23 -21
mindspore/ops/tensor_method.py +1669 -0
mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
mindspore/ops_generate/arg_handler.py +0 -61
mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
mindspore/ops_generate/base_generator.py +11 -0
mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
mindspore/ops_generate/functional_overload_py_generator.py +110 -0
mindspore/ops_generate/functions_cc_generator.py +233 -0
mindspore/ops_generate/gen_aclnn_implement.py +110 -114
mindspore/ops_generate/gen_constants.py +157 -3
mindspore/ops_generate/gen_ops.py +245 -990
mindspore/ops_generate/gen_pyboost_func.py +97 -998
mindspore/ops_generate/gen_utils.py +119 -33
mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
mindspore/ops_generate/op_api_proto.py +206 -0
mindspore/ops_generate/op_def_py_generator.py +131 -0
mindspore/ops_generate/op_prim_py_generator.py +480 -0
mindspore/ops_generate/op_proto.py +373 -108
mindspore/ops_generate/op_template_parser.py +436 -0
mindspore/ops_generate/ops_def_cc_generator.py +288 -0
mindspore/ops_generate/ops_def_h_generator.py +74 -0
mindspore/ops_generate/ops_name_h_generator.py +68 -0
mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
mindspore/ops_generate/pyboost_utils.py +92 -33
mindspore/ops_generate/template.py +294 -44
mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
mindspore/parallel/__init__.py +3 -3
mindspore/parallel/_auto_parallel_context.py +44 -34
mindspore/parallel/_cell_wrapper.py +22 -3
mindspore/parallel/_parallel_serialization.py +13 -2
mindspore/parallel/_utils.py +4 -2
mindspore/parallel/algo_parameter_config.py +1 -1
mindspore/parallel/checkpoint_transform.py +44 -0
mindspore/parallel/cluster/process_entity/_api.py +131 -37
mindspore/parallel/cluster/process_entity/_utils.py +41 -6
mindspore/parallel/cluster/run.py +20 -3
mindspore/parallel/parameter_broadcast.py +1 -1
mindspore/parallel/shard.py +3 -0
mindspore/parallel/transform_safetensors.py +119 -253
mindspore/profiler/__init__.py +17 -4
mindspore/profiler/analysis/__init__.py +0 -0
mindspore/profiler/analysis/parser/__init__.py +0 -0
mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
mindspore/profiler/analysis/parser/base_parser.py +158 -0
mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
mindspore/profiler/analysis/task_manager.py +131 -0
mindspore/profiler/analysis/time_converter.py +84 -0
mindspore/profiler/analysis/viewer/__init__.py +0 -0
mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
mindspore/profiler/analysis/work_flow.py +73 -0
mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
mindspore/profiler/common/command_executor.py +90 -0
mindspore/profiler/common/constant.py +174 -3
mindspore/profiler/common/file_manager.py +208 -0
mindspore/profiler/common/log.py +130 -0
mindspore/profiler/common/msprof_cmd_tool.py +202 -0
mindspore/profiler/common/path_manager.py +371 -0
mindspore/profiler/common/process_bar.py +168 -0
mindspore/profiler/common/process_pool.py +9 -3
mindspore/profiler/common/profiler_context.py +476 -0
mindspore/profiler/common/profiler_info.py +304 -0
mindspore/profiler/common/profiler_output_path.py +284 -0
mindspore/profiler/common/profiler_parameters.py +210 -0
mindspore/profiler/common/profiler_path_manager.py +120 -0
mindspore/profiler/common/record_function.py +76 -0
mindspore/profiler/common/tlv_decoder.py +76 -0
mindspore/profiler/common/util.py +75 -2
mindspore/profiler/dynamic_profiler.py +270 -37
mindspore/profiler/envprofiler.py +138 -0
mindspore/profiler/mstx.py +199 -0
mindspore/profiler/platform/__init__.py +21 -0
mindspore/profiler/platform/base_profiler.py +40 -0
mindspore/profiler/platform/cpu_profiler.py +124 -0
mindspore/profiler/platform/gpu_profiler.py +74 -0
mindspore/profiler/platform/npu_profiler.py +309 -0
mindspore/profiler/profiler.py +580 -93
mindspore/profiler/profiler_action_controller.py +187 -0
mindspore/profiler/profiler_interface.py +114 -0
mindspore/profiler/schedule.py +208 -0
mindspore/rewrite/api/symbol_tree.py +1 -2
mindspore/run_check/_check_version.py +18 -13
mindspore/runtime/__init__.py +37 -0
mindspore/runtime/device.py +27 -0
mindspore/runtime/event.py +209 -0
mindspore/runtime/executor.py +148 -0
mindspore/runtime/memory.py +392 -0
mindspore/runtime/stream.py +460 -0
mindspore/runtime/thread_bind_core.py +401 -0
mindspore/swresample-4.dll +0 -0
mindspore/swscale-6.dll +0 -0
mindspore/tinyxml2.dll +0 -0
mindspore/train/__init__.py +2 -2
mindspore/train/_utils.py +53 -18
mindspore/train/amp.py +8 -4
mindspore/train/callback/_checkpoint.py +32 -18
mindspore/train/callback/_early_stop.py +1 -1
mindspore/train/callback/_flops_collector.py +105 -69
mindspore/train/callback/_history.py +1 -1
mindspore/train/callback/_summary_collector.py +44 -6
mindspore/train/callback/_tft_register.py +37 -15
mindspore/train/dataset_helper.py +11 -11
mindspore/train/metrics/precision.py +4 -5
mindspore/train/mind_ir_pb2.py +167 -46
mindspore/train/model.py +13 -14
mindspore/train/serialization.py +461 -72
mindspore/train/summary/summary_record.py +1 -2
mindspore/train/train_thor/model_thor.py +1 -1
mindspore/turbojpeg.dll +0 -0
mindspore/utils/__init__.py +4 -2
mindspore/utils/dryrun.py +138 -0
mindspore/utils/runtime_execution_order_check.py +550 -0
mindspore/version.py +1 -1
{mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/METADATA +3 -4
{mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/RECORD +368 -242
{mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
mindspore/common/_tensor_overload.py +0 -139
mindspore/mindspore_np_dtype.dll +0 -0
mindspore/profiler/envprofiling.py +0 -254
mindspore/profiler/profiling.py +0 -1926
{mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
{mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0

mindspore/ops/operations/comm_ops.py CHANGED

@@ -18,6 +18,7 @@
 from __future__ import absolute_import
 from __future__ import division
+import os
 from mindspore.common import Tensor
 from mindspore import _checkparam as validator
 from mindspore.communication.management import get_rank, get_group_size, GlobalComm, _get_group, _host_distribute
@@ -54,7 +55,7 @@ class ReduceOp:
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with multiple devices.
@@ -100,7 +101,9 @@ def check_collective_target_dtype(data_name, data_dtype, prim_name):
 def check_hcom_group_valid(group, prim_name=None):
     """Check if hcom group is valid."""
     msg_prefix = f"For '{prim_name}', the" if prim_name else "The"
-    if not _host_distribute() and context.get_context("mode") == context.PYNATIVE_MODE and \
+    sim_level = os.getenv("MS_SIMULATION_LEVEL")
+    no_sim = (sim_level is None or sim_level.strip() == '')
+    if no_sim and (not _host_distribute()) and context.get_context("mode") == context.PYNATIVE_MODE and \
             group != GlobalComm.WORLD_COMM_GROUP:
         raise RuntimeError(f"{msg_prefix} 'group' only support 'hccl_world_group' in pynative mode, but got "
                            f"'group': {group}. Please start by using mpi-run.")
@@ -141,7 +144,7 @@ class AllReduce(Primitive):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -231,7 +234,7 @@ class Reduce(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method without any third-party
             or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 4 devices.
@@ -315,7 +318,7 @@ class AllGather(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -538,7 +541,7 @@ class ReduceScatter(Primitive):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -676,7 +679,7 @@ class Broadcast(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -906,7 +909,7 @@ class AlltoAll(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 8 devices.
@@ -988,6 +991,9 @@ class NeighborExchangeV2(Primitive):
         in the same subnet, please check the `details \
         <https://www.mindspore.cn/docs/en/master/api_python/samples/ops/communicate_ops.html#notes>`_.
+        Users need to ensure that the length of the received data `recv_lens` is consistent with that of
+        the sent data `send_lens`.
     Args:
         send_rank_ids (list(int)): Ranks which the data is sent to. 8 rank_ids represents 8 directions, if one
                                    direction is not send to , set it -1.
@@ -1025,7 +1031,7 @@ class NeighborExchangeV2(Primitive):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1142,7 +1148,7 @@ class CollectiveScatter(Primitive):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1227,7 +1233,7 @@ class CollectiveGather(Primitive):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 4 devices.
@@ -1303,7 +1309,7 @@ class Barrier(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1377,7 +1383,7 @@ class Send(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1393,7 +1399,7 @@ class Send(PrimitiveWithInfer):
         >>>     def __init__(self):
         >>>         super(SendNet, self).__init__()
         >>>         self.depend = ops.Depend()
-        >>>         self.send = ops.Send(st_tag=0, dest_rank=8, group="hccl_world_group")
+        >>>         self.send = ops.Send(sr_tag=0, dest_rank=8, group="hccl_world_group")
         >>>
         >>>     def construct(self, x):
         >>>         out = self.depend(x, self.send(x))
@@ -1461,7 +1467,7 @@ class Receive(PrimitiveWithInfer):
             For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1839,7 +1845,7 @@ class BatchISendIRecv(PrimitiveWithInfer):
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.
@@ -1952,7 +1958,7 @@ class AlltoAllV(PrimitiveWithInfer):
             without any third-party or configuration file dependencies.
             Please see the `msrun start up
-            <https://www.mindspore.cn/docs/zh-CN/master/model_train/parallel/msrun_launcher.html>`_
+            <https://www.mindspore.cn/docs/en/master/model_train/parallel/msrun_launcher.html>`_
             for more details.
             This example should be run with 2 devices.

mindspore/ops/operations/custom_ops.py CHANGED

@@ -223,8 +223,6 @@ class Custom(ops.PrimitiveWithInfer):
     .. note::
         The supported platforms are determined by the input `func_type`. The supported platforms are as follows:
-        - "hybrid": supports ["GPU", "CPU"].
-        - "akg": supports ["GPU", "CPU"].
         - "aot": supports ["GPU", "CPU", "Ascend"].
         - "pyfunc": supports ["CPU"].
         - "julia": supports ["CPU"].
@@ -233,11 +231,7 @@ class Custom(ops.PrimitiveWithInfer):
         func (Union[function, str]):
             - function: If func is of function type, then func should be a Python function which describes the
-              computation logic of a user defined operator. The function can be one of the following:
-              1. A AKG operator implementation function, which can use ir builder/tvm compute/hybrid grammar.
-              2. A pure python function
-              3. An kernel decorated function written by the Hybrid DSL.
+              computation logic of a user defined operator.
             - str: If func is of str type, then str should be a path of file along with a function name.
               This could be used when func_type is "aot" or "julia".
@@ -354,7 +348,7 @@ class Custom(ops.PrimitiveWithInfer):
         func_type (str): The implementation type of `func`, should be one of
-            [ ``"hybrid"`` , ``"akg"`` , ``"aot"`` , ``"pyfunc"`` , ``"julia"`` ].
+            [ ``"aot"`` , ``"pyfunc"`` , ``"julia"`` ].
         bprop (function): The back propagation function of `func`. Default: ``None`` .
         reg_info (Union[str, dict, list, tuple]): Represents the registration information(reg info) of `func` with
@@ -398,50 +392,14 @@ class Custom(ops.PrimitiveWithInfer):
         >>> input_x = Tensor(np.ones([16, 16]).astype(np.float32))
         >>> input_y = Tensor(np.ones([16, 16]).astype(np.float32))
         >>>
-        >>> # Example, func_type = "hybrid"
-        >>> # This is the default func_type in Custom,
-        >>> # and both out_shape and out_dtype can be None(default value).
-        >>> # In this case, the input func must be a function written in the Hybrid DSL
-        >>> # and decorated by @kernel.
-        >>> @kernel
-        ... def add_script(a, b):
-        ...     c = output_tensor(a.shape, a.dtype)
-        ...     for i0 in range(a.shape[0]):
-        ...         for i1 in range(a.shape[1]):
-        ...             c[i0, i1] = a[i0, i1] + b[i0, i1]
-        ...     return c
-        >>>
-        >>> test_op_hybrid = ops.Custom(add_script)
-        >>> output = test_op_hybrid(input_x, input_y)
-        >>> # the result will be a 16 * 16 tensor with all elements 2
-        >>> print(output.shape)
-        (16, 16)
-        >>> # Example, func_type = "aot"
-        >>> def test_aot(x, y, out_shapes, out_types):
-        ...     program = ops.Custom("./reorganize.so:CustomReorganize", out_shapes, out_types, "aot")
-        ...     out = program(x, y)
-        ...     return out
-        >>>
         >>> # Example, func_type = "pyfunc"
-        >>> def func_multi_output(x1, x2):
-        ...     return (x1 + x2), (x1 - x2)
+        >>> def func_pyfunc(x1, x2):
+        ...     return x1 + x2
         >>>
-        >>> test_pyfunc = ops.Custom(func_multi_output, lambda x, _: (x, x), lambda x, _: (x, x), "pyfunc")
+        >>> test_pyfunc = ops.Custom(func_pyfunc, lambda x, _: x, lambda x, _: x, "pyfunc")
         >>> output = test_pyfunc(input_x, input_y)
-        >>>
-        >>> # Example, func_type = "julia"
-        >>> # julia code:
-        >>> # add.jl
-        >>> # module Add
-        >>> # function add(x, y, z)
-        >>> #   z .= x + y
-        >>> #   return z
-        >>> # end
-        >>> # end
-        >>> def test_julia(x, y, out_shapes, out_types):
-        ...     program = ops.Custom("./add.jl:Add:add", out_shapes, out_types, "julia")
-        ...     out = program(x, y)
-        ...     return out
+        >>> print(output.shape)
+        (16, 16)
     """
     registered_func = {}

mindspore/ops/operations/debug_ops.py CHANGED Viewed

@@ -13,23 +13,24 @@
 # limitations under the License.
 # ============================================================================
 """debug_ops"""
-import os
 import stat
+from pathlib import Path
 import numpy as np
 from mindspore import log as logger
 from mindspore._c_expression import security, HookType
 from mindspore._c_expression import Tensor as Tensor_
+from mindspore._c_expression import _tensordump_process_file
 from mindspore import _checkparam as validator
 from mindspore.common import dtype as mstype
 from mindspore.common.parameter import Parameter
 from mindspore.common.tensor import Tensor
 from mindspore.ops.primitive import prim_attr_register, Primitive, PrimitiveWithInfer
 from mindspore._checkparam import check_hook_fn
+from mindspore.ops import operations as P
 SUMMARY_TENSOR_CACHE = []
-TENSORDUMP_ID = 0
 def _cache_summary_data(op_name, define_name, tensor):
@@ -64,8 +65,8 @@ class ScalarSummary(Primitive):
     which specify the directory of the summary file. The summary file can
     be loaded and shown by MindInsight, see `MindInsight documents <https://www.mindspore.cn/
     mindinsight/docs/en/master/index.html>`_ for details.
-    In Ascend platform with graph mode, can set environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
-    to solve operator execution failure when calling this operator intensively.
+    In Ascend platform with graph mode, the environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
+    can be set to solve operator execution failure when calling this operator intensively.
     Inputs:
         - **name** (str) - The name of the input variable, it must not be an empty string.
@@ -124,8 +125,8 @@ class ImageSummary(Primitive):
     SummaryRecord or SummaryCollector, which specify the directory of the summary file. The summary file can
     be loaded and shown by MindInsight, see `MindInsight documents <https://www.mindspore.cn/
     mindinsight/docs/en/master/index.html>`_ for details.
-    In Ascend platform with graph mode, can set environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
-    to solve operator execution failure when calling this operator intensively.
+    In Ascend platform with graph mode, the environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
+    can be set to solve operator execution failure when calling this operator intensively.
     Inputs:
         - **name** (str) - The name of the input variable, it must not be an empty string.
@@ -177,8 +178,8 @@ class TensorSummary(Primitive):
     or SummaryCollector, which specify the directory of the summary file. The summary file can
     be loaded and shown by MindInsight, see `MindInsight documents <https://www.mindspore.cn/
     mindinsight/docs/en/master/index.html>`_ for details.
-    In Ascend platform with graph mode, can set environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
-    to solve operator execution failure when calling this operator intensively.
+    In Ascend platform with graph mode, the environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
+    can be set to solve operator execution failure when calling this operator intensively.
     Inputs:
         - **name** (str) - The name of the input variable.
@@ -235,15 +236,15 @@ class TensorDump(Primitive):
     Save the Tensor as an npy file in numpy format.
     .. warning::
-        - If a large amount of data is stored within a short period, it may lead to memory overflow on the device side.
-          Consider slicing the data to reduce the data scale.
-        - Since data saving is processed asynchronously, when the amount of data is too large or the main process exits
-          too quickly, data loss may occur. You need to actively control the destruction time of the main process,
-          such as using sleep.
+        - The parameter input_output will no longer support the value 'all'.
+    .. note::
+        In Ascend platform with graph mode, the environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
+        can be set to solve operator execution failure when outputting large tensors or outputting tensors intensively.
     Args:
         input_output (str, optional): Used to control Tensordump behavior.
-            Available value is one of ['in', 'out', 'all']. Default value is ``out``.
+            Available value is one of ['in', 'out']. Default value is ``out``.
             In case of OpA --> RedistributionOps --> OpB,
             The dump data of OpA's output is not equal to OpB's input (Due to the redistribution operators).
@@ -253,21 +254,19 @@ class TensorDump(Primitive):
             Different requirements of saving dump data can be achieved by configuring parameter input_output:
             - If the input_output is 'out', the dump data contains only OpA's output slice.
-            - If the input_output is 'all', the dump data contains both OpA's output slice and OpB's input slice.
             - If the input_output is 'in', the dump data contains only OpB's input slice.
-            For input_output is 'all' or 'in', the input slice npy file format is:
-            id_fileName_cNodeID_dumpMode_rankID.npy.
+            When input_output is 'in', the input slice npy file format is:
+            fileName_dumpMode_dtype_id.npy.
-            For input_output is 'out' or 'all' the output slice npy file format is:
-            id_fileName.npy.
+            When input_output is 'out', the output slice npy file format is:
+            fileName_dtype_id.npy.
-            - id: An auto increment ID.
             - fileName: Value of the parameter file
               (if parameter file_name is a user-specified path, the value of fileName is the last level of the path).
-            - cNodeID: The node ID of the Tensordump node in the step_parallel_end.ir file.
             - dumpMode: Value of the parameter input_output.
-            - rankID: Logical device id.
+            - dtype: The original data type. Data of type bfloat16 stored in the .npy file will be converted to float32.
+            - id: An auto increment ID.
     Inputs:
         - **file** (str) - The path of the file to be saved.
@@ -285,7 +284,8 @@ class TensorDump(Primitive):
         >>> import mindspore as ms
         >>> import time
         >>> from mindspore import nn, Tensor, ops
-        >>> ms.set_context(mode=ms.GRAPH_MODE, device_target="Ascend")
+        >>> ms.set_context(mode=ms.GRAPH_MODE)
+        >>> ms.set_device(device_target="Ascend")
         >>> class Net(nn.Cell):
         ...     def __init__(self):
         ...         super(Net, self).__init__()
@@ -305,7 +305,7 @@ class TensorDump(Primitive):
         >>> net = Net()
         >>> out = net(input_x)
         >>> time.sleep(0.5)
-        >>> add = np.load('0_add.npy')
+        >>> add = np.load('add_float32_0.npy')
         >>> print(add)
         [[2. 3. 4. 5.]
          [6. 7. 8. 9.]]
@@ -318,25 +318,26 @@ class TensorDump(Primitive):
         self.add_prim_attr("side_effect_io", True)
         self.add_prim_attr("channel_name", "ms_tensor_dump")
+    def _save_file(self, file, data):
+        file = Path(file)
+        if file.exists():
+            file.chmod(stat.S_IWUSR)
+        np.save(file, data)
+        file.chmod(stat.S_IRUSR)
     def __call__(self, file, input_x):
         validator.check_value_type('file', file, [str], self.__class__.__name__)
         if not file:
             raise ValueError("For 'TensorDump', the input argument[file] cannot be an empty string.")
         validator.check_value_type('input_x', input_x, [Tensor], self.__class__.__name__)
-        global TENSORDUMP_ID
-        npy_suffix = ".npy"
-        directory, filename = os.path.split(file)
-        if directory and not os.path.exists(directory):
-            os.makedirs(directory, mode=0o700, exist_ok=True)
-        new_filename = f"{TENSORDUMP_ID}_{filename}"
-        new_file = os.path.join(directory, new_filename)
-        if not new_file.endswith(npy_suffix):
-            new_file += npy_suffix
-        if os.path.exists(new_file):
-            os.chmod(new_file, stat.S_IWUSR)
-        np.save(new_file, input_x.asnumpy())
-        os.chmod(new_file, stat.S_IRUSR)
-        TENSORDUMP_ID += 1
+        dtype = input_x.dtype
+        file = _tensordump_process_file(file, str(dtype))
+        if not file:
+            return
+        if dtype == mstype.bfloat16:
+            input_x = P.Cast()(input_x, mstype.float32)
+        self._save_file(file, input_x.asnumpy())
 class HistogramSummary(Primitive):
@@ -345,8 +346,8 @@ class HistogramSummary(Primitive):
     It must be used with SummaryRecord or SummaryCollector, which specify the directory of the summary file.
     The summary file can be loaded and shown by MindInsight, see `MindInsight documents <https://www.mindspore.cn/
     mindinsight/docs/en/master/index.html>`_ for details.
-    In Ascend platform with graph mode, can set environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
-    to solve operator execution failure when calling this operator intensively.
+    In Ascend platform with graph mode, the environment variables `MS_DUMP_SLICE_SIZE` and `MS_DUMP_WAIT_TIME`
+    can be set to solve operator execution failure when calling this operator intensively.
     Inputs:
         - **name** (str) - The name of the input variable.
@@ -398,7 +399,7 @@ class HistogramSummary(Primitive):
         _cache_summary_data(self.name, args[0], args[1])
-class InsertGradientOf(PrimitiveWithInfer):
+class InsertGradientOf(Primitive):
     """
     Attaches callback to the graph node that will be invoked on the node's gradient.
@@ -464,12 +465,6 @@ class InsertGradientOf(PrimitiveWithInfer):
         self.add_prim_attr('side_effect_backprop', True)
         self.f = f
-    def infer_shape(self, x_shape):
-        return x_shape
-    def infer_dtype(self, x_type):
-        return x_type
 class HookBackward(PrimitiveWithInfer):
     """

mindspore/ops/operations/inner_ops.py CHANGED Viewed

@@ -302,8 +302,8 @@ class FusedWeightScaleApplyMomentum(PrimitiveWithInfer):
           Default: ``0.0`` .
         - **loss_scale** (Tensor) - The loss scale value, must be a scalar tensor with float data type.
           Default: ``1.0`` .
-        - **variable** (Parameter) - Weights to be updated. data type must be float.
-        - **accumulation** (Parameter) - Accumulated gradient value by moment weight.
+        - **variable** (Union[Parameter, Tensor]) - Weights to be updated. data type must be float.
+        - **accumulation** (Union[Parameter, Tensor]) - Accumulated gradient value by moment weight.
           Has the same data type as `variable`.
         - **learning_rate** (Union[Number, Tensor]) - The learning rate value, must be a float number or
           a scalar tensor with float data type.
@@ -425,7 +425,8 @@ class FusedCastAdamWeightDecay(PrimitiveWithInfer):
         ...     def construct(self, lr, beta1, beta2, epsilon, decay, grad, norm):
         ...         out = self.opt(self.var, self.m, self.v, lr, beta1, beta2, epsilon, decay, grad, norm)
         ...         return out
-        >>> ms.set_context(mode=ms.GRAPH_MODE, device_target="CPU")
+        >>> ms.set_context(mode=ms.GRAPH_MODE)
+        >>> ms.set_device(device_target="CPU")
         >>> net = Net()
         >>> gradient = Tensor(np.ones([2, 2]), mstype.float16)
         >>> output = net(0.001, 0.9, 0.999, 1e-8, 0.0, gradient, 1.0)
@@ -560,7 +561,8 @@ class FusedAdaFactor(PrimitiveWithInfer):
         ...         out = self.opt(epsilon, clip_threshold, beta1, beta2, weight_decay, lr, grad, self.param,
         ...                        self.exp_avg, self.exp_avg_sq_row, self.exp_avg_sq_col, self.exp_avg_sq)
         ...         return out
-        >>> ms.set_context(mode=ms.GRAPH_MODE, device_target="CPU")
+        >>> ms.set_context(mode=ms.GRAPH_MODE)
+        >>> ms.set_device(device_target="CPU")
         >>> net = Net()
         >>> gradient = Tensor(np.ones(param_shape), mstype.float32)
         >>> output = net((1e-30, 1e-3), 1.0, 0.9, 0.8, 1e-2, 0.03, gradient)

mindspore/ops/operations/linalg_ops.py CHANGED Viewed

@@ -51,9 +51,10 @@ class Svd(Primitive):
     Examples:
         >>> import numpy as np
-        >>> from mindspore import Tensor, set_context
+        >>> import mindspore as ms
+        >>> from mindspore import Tensor
         >>> from mindspore import ops
-        >>> set_context(device_target="CPU")
+        >>> ms.set_device(device_target="CPU")
         >>> svd = ops.Svd(full_matrices=True, compute_uv=True)
         >>> a = Tensor(np.array([[1, 2], [-4, -5], [2, 1]]).astype(np.float32))
         >>> s, u, v = svd(a)