mindspore-2.7.0rc1-cp310-cp310-win_amd64.whl → mindspore-2.7.1-cp310-cp310-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mindspore/.commit_id +1 -1
- mindspore/__init__.py +5 -2
- mindspore/_c_dataengine.cp310-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp310-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp310-win_amd64.pyd +0 -0
- mindspore/_checkparam.py +2 -2
- mindspore/_extends/builtin_operations.py +3 -3
- mindspore/_extends/parallel_compile/akg_compiler/custom.py +1109 -0
- mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
- mindspore/_extends/parse/__init__.py +3 -3
- mindspore/_extends/parse/compile_config.py +24 -1
- mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +6 -3
- mindspore/_extends/parse/parser.py +28 -22
- mindspore/_extends/parse/resources.py +1 -1
- mindspore/_extends/parse/standard_method.py +23 -2
- mindspore/_extends/parse/trope.py +2 -1
- mindspore/_extends/pijit/pijit_func_white_list.py +9 -27
- mindspore/amp.py +0 -18
- mindspore/avcodec-59.dll +0 -0
- mindspore/avdevice-59.dll +0 -0
- mindspore/avfilter-8.dll +0 -0
- mindspore/avformat-59.dll +0 -0
- mindspore/avutil-57.dll +0 -0
- mindspore/boost/base.py +29 -2
- mindspore/common/__init__.py +18 -12
- mindspore/common/_decorator.py +3 -2
- mindspore/common/_grad_function.py +3 -1
- mindspore/common/_tensor_cpp_method.py +1 -1
- mindspore/common/_tensor_docs.py +371 -96
- mindspore/common/_utils.py +7 -43
- mindspore/common/api.py +434 -135
- mindspore/common/dtype.py +98 -57
- mindspore/common/dump.py +7 -108
- mindspore/common/dynamic_shape/__init__.py +0 -0
- mindspore/common/{auto_dynamic_shape.py → dynamic_shape/auto_dynamic_shape.py} +15 -23
- mindspore/common/dynamic_shape/enable_dynamic.py +197 -0
- mindspore/common/file_system.py +59 -9
- mindspore/common/hook_handle.py +82 -3
- mindspore/common/jit_config.py +5 -1
- mindspore/common/jit_trace.py +27 -12
- mindspore/common/lazy_inline.py +5 -3
- mindspore/common/np_dtype.py +3 -3
- mindspore/common/parameter.py +17 -127
- mindspore/common/recompute.py +4 -13
- mindspore/common/tensor.py +50 -217
- mindspore/communication/_comm_helper.py +11 -1
- mindspore/communication/comm_func.py +138 -4
- mindspore/communication/management.py +85 -1
- mindspore/config/op_info.config +0 -15
- mindspore/context.py +20 -106
- mindspore/dataset/__init__.py +1 -1
- mindspore/dataset/audio/transforms.py +1 -1
- mindspore/dataset/core/config.py +35 -1
- mindspore/dataset/engine/datasets.py +338 -319
- mindspore/dataset/engine/datasets_user_defined.py +38 -22
- mindspore/dataset/engine/datasets_vision.py +1 -1
- mindspore/dataset/engine/validators.py +1 -15
- mindspore/dataset/transforms/c_transforms.py +2 -2
- mindspore/dataset/transforms/transforms.py +3 -3
- mindspore/dataset/vision/__init__.py +1 -1
- mindspore/dataset/vision/py_transforms.py +8 -8
- mindspore/dataset/vision/transforms.py +17 -5
- mindspore/dataset/vision/utils.py +632 -21
- mindspore/device_context/ascend/op_tuning.py +35 -1
- mindspore/dnnl.dll +0 -0
- mindspore/{profiler/common/validator → graph}/__init__.py +9 -1
- mindspore/graph/custom_pass.py +55 -0
- mindspore/include/api/cell.h +28 -4
- mindspore/include/api/cfg.h +24 -7
- mindspore/include/api/context.h +1 -0
- mindspore/include/api/delegate.h +0 -2
- mindspore/include/api/dual_abi_helper.h +100 -19
- mindspore/include/api/graph.h +14 -1
- mindspore/include/api/kernel.h +16 -3
- mindspore/include/api/kernel_api.h +9 -1
- mindspore/include/api/metrics/accuracy.h +9 -0
- mindspore/include/api/model.h +5 -1
- mindspore/include/api/model_group.h +4 -0
- mindspore/include/api/model_parallel_runner.h +2 -0
- mindspore/include/api/status.h +48 -10
- mindspore/include/api/types.h +6 -1
- mindspore/include/dataset/constants.h +9 -0
- mindspore/include/dataset/execute.h +2 -2
- mindspore/jpeg62.dll +0 -0
- mindspore/mindrecord/__init__.py +3 -3
- mindspore/mindrecord/common/exceptions.py +1 -0
- mindspore/mindrecord/config.py +1 -1
- mindspore/{parallel/mpi → mindrecord/core}/__init__.py +4 -1
- mindspore/mindrecord/{shardheader.py → core/shardheader.py} +2 -1
- mindspore/mindrecord/{shardindexgenerator.py → core/shardindexgenerator.py} +1 -1
- mindspore/mindrecord/{shardreader.py → core/shardreader.py} +2 -1
- mindspore/mindrecord/{shardsegment.py → core/shardsegment.py} +2 -2
- mindspore/mindrecord/{shardutils.py → core/shardutils.py} +1 -1
- mindspore/mindrecord/{shardwriter.py → core/shardwriter.py} +1 -1
- mindspore/mindrecord/filereader.py +4 -4
- mindspore/mindrecord/filewriter.py +5 -5
- mindspore/mindrecord/mindpage.py +2 -2
- mindspore/mindrecord/tools/cifar10.py +4 -3
- mindspore/mindrecord/tools/cifar100.py +1 -1
- mindspore/mindrecord/tools/cifar100_to_mr.py +1 -1
- mindspore/mindrecord/tools/cifar10_to_mr.py +6 -6
- mindspore/mindrecord/tools/csv_to_mr.py +1 -1
- mindspore/mindrecord/tools/imagenet_to_mr.py +1 -1
- mindspore/mindrecord/tools/mnist_to_mr.py +1 -1
- mindspore/mindrecord/tools/tfrecord_to_mr.py +1 -1
- mindspore/mindspore_backend_common.dll +0 -0
- mindspore/mindspore_backend_manager.dll +0 -0
- mindspore/mindspore_cluster.dll +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_cpu.dll +0 -0
- mindspore/mindspore_dump.dll +0 -0
- mindspore/mindspore_frontend.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_hardware_abstract.dll +0 -0
- mindspore/mindspore_memory_pool.dll +0 -0
- mindspore/mindspore_ms_backend.dll +0 -0
- mindspore/mindspore_ops.dll +0 -0
- mindspore/{mindspore_ops_host.dll → mindspore_ops_cpu.dll} +0 -0
- mindspore/mindspore_profiler.dll +0 -0
- mindspore/mindspore_pyboost.dll +0 -0
- mindspore/mindspore_pynative.dll +0 -0
- mindspore/mindspore_runtime_pipeline.dll +0 -0
- mindspore/mindspore_runtime_utils.dll +0 -0
- mindspore/mindspore_tools.dll +0 -0
- mindspore/mint/__init__.py +15 -10
- mindspore/mint/distributed/__init__.py +4 -0
- mindspore/mint/distributed/distributed.py +392 -69
- mindspore/mint/nn/__init__.py +2 -16
- mindspore/mint/nn/functional.py +4 -110
- mindspore/mint/nn/layer/__init__.py +0 -2
- mindspore/mint/nn/layer/_functions.py +1 -2
- mindspore/mint/nn/layer/activation.py +0 -6
- mindspore/mint/nn/layer/basic.py +0 -47
- mindspore/mint/nn/layer/conv.py +10 -10
- mindspore/mint/nn/layer/normalization.py +11 -16
- mindspore/mint/nn/layer/pooling.py +0 -4
- mindspore/nn/__init__.py +1 -3
- mindspore/nn/cell.py +231 -239
- mindspore/nn/layer/activation.py +4 -2
- mindspore/nn/layer/basic.py +56 -14
- mindspore/nn/layer/container.py +16 -0
- mindspore/nn/layer/embedding.py +4 -169
- mindspore/nn/layer/image.py +1 -1
- mindspore/nn/layer/normalization.py +2 -1
- mindspore/nn/layer/thor_layer.py +4 -85
- mindspore/nn/optim/ada_grad.py +0 -1
- mindspore/nn/optim/adafactor.py +0 -1
- mindspore/nn/optim/adam.py +32 -127
- mindspore/nn/optim/adamax.py +0 -1
- mindspore/nn/optim/asgd.py +0 -1
- mindspore/nn/optim/ftrl.py +8 -102
- mindspore/nn/optim/lamb.py +1 -4
- mindspore/nn/optim/lars.py +0 -3
- mindspore/nn/optim/lazyadam.py +25 -218
- mindspore/nn/optim/momentum.py +5 -43
- mindspore/nn/optim/optimizer.py +6 -55
- mindspore/nn/optim/proximal_ada_grad.py +0 -1
- mindspore/nn/optim/rmsprop.py +0 -1
- mindspore/nn/optim/rprop.py +0 -1
- mindspore/nn/optim/sgd.py +0 -1
- mindspore/nn/optim/tft_wrapper.py +2 -4
- mindspore/nn/optim/thor.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +7 -8
- mindspore/nn/probability/bijector/gumbel_cdf.py +2 -2
- mindspore/nn/probability/bijector/power_transform.py +20 -21
- mindspore/nn/probability/bijector/scalar_affine.py +5 -5
- mindspore/nn/probability/bijector/softplus.py +13 -14
- mindspore/nn/probability/distribution/_utils/utils.py +2 -2
- mindspore/nn/wrap/cell_wrapper.py +39 -5
- mindspore/nn/wrap/grad_reducer.py +4 -89
- mindspore/numpy/array_creations.py +4 -4
- mindspore/numpy/fft.py +9 -9
- mindspore/numpy/utils_const.py +1 -1
- mindspore/{nn/reinforcement → onnx}/__init__.py +5 -8
- mindspore/onnx/onnx_export.py +137 -0
- mindspore/opencv_core4110.dll +0 -0
- mindspore/opencv_imgcodecs4110.dll +0 -0
- mindspore/{opencv_imgproc452.dll → opencv_imgproc4110.dll} +0 -0
- mindspore/ops/__init__.py +2 -0
- mindspore/ops/_grad_experimental/grad_comm_ops.py +38 -2
- mindspore/ops/_grad_experimental/grad_inner_ops.py +0 -9
- mindspore/ops/_op_impl/aicpu/__init__.py +0 -10
- mindspore/ops/_op_impl/cpu/__init__.py +1 -5
- mindspore/ops/_op_impl/cpu/{buffer_append.py → joinedstr_op.py} +8 -8
- mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +28 -24
- mindspore/ops/auto_generate/gen_extend_func.py +6 -11
- mindspore/ops/auto_generate/gen_ops_def.py +385 -154
- mindspore/ops/auto_generate/gen_ops_prim.py +5676 -5167
- mindspore/ops/communication.py +97 -0
- mindspore/ops/composite/__init__.py +5 -2
- mindspore/ops/composite/base.py +16 -2
- mindspore/ops/composite/multitype_ops/__init__.py +3 -1
- mindspore/ops/composite/multitype_ops/_compile_utils.py +150 -8
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +1 -1
- mindspore/ops/composite/multitype_ops/add_impl.py +7 -0
- mindspore/ops/composite/multitype_ops/mod_impl.py +27 -0
- mindspore/ops/function/__init__.py +2 -0
- mindspore/ops/function/array_func.py +24 -18
- mindspore/ops/function/comm_func.py +3883 -0
- mindspore/ops/function/debug_func.py +7 -6
- mindspore/ops/function/grad/grad_func.py +4 -12
- mindspore/ops/function/math_func.py +89 -86
- mindspore/ops/function/nn_func.py +92 -313
- mindspore/ops/function/random_func.py +9 -18
- mindspore/ops/functional.py +4 -1
- mindspore/ops/functional_overload.py +377 -30
- mindspore/ops/operations/__init__.py +2 -5
- mindspore/ops/operations/_custom_ops_utils.py +7 -9
- mindspore/ops/operations/_inner_ops.py +12 -50
- mindspore/ops/operations/_rl_inner_ops.py +0 -933
- mindspore/ops/operations/array_ops.py +5 -50
- mindspore/ops/operations/comm_ops.py +95 -17
- mindspore/ops/operations/custom_ops.py +237 -22
- mindspore/ops/operations/debug_ops.py +33 -35
- mindspore/ops/operations/manually_defined/ops_def.py +39 -318
- mindspore/ops/operations/math_ops.py +5 -5
- mindspore/ops/operations/nn_ops.py +3 -3
- mindspore/ops/operations/sparse_ops.py +0 -83
- mindspore/ops/primitive.py +4 -27
- mindspore/ops/tensor_method.py +88 -10
- mindspore/ops_generate/aclnn/aclnn_kernel_register_auto_cc_generator.py +5 -5
- mindspore/ops_generate/aclnn/gen_aclnn_implement.py +8 -8
- mindspore/ops_generate/api/functions_cc_generator.py +53 -4
- mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +25 -11
- mindspore/ops_generate/common/gen_constants.py +11 -10
- mindspore/ops_generate/common/op_proto.py +18 -1
- mindspore/ops_generate/common/template.py +102 -245
- mindspore/ops_generate/common/template_utils.py +212 -0
- mindspore/ops_generate/gen_custom_ops.py +69 -0
- mindspore/ops_generate/op_def/ops_def_cc_generator.py +78 -7
- mindspore/ops_generate/op_def_py/base_op_prim_py_generator.py +360 -0
- mindspore/ops_generate/op_def_py/custom_op_prim_py_generator.py +140 -0
- mindspore/ops_generate/op_def_py/op_def_py_generator.py +54 -7
- mindspore/ops_generate/op_def_py/op_prim_py_generator.py +5 -312
- mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +74 -17
- mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +22 -5
- mindspore/ops_generate/pyboost/gen_pyboost_func.py +0 -16
- mindspore/ops_generate/pyboost/op_template_parser.py +3 -2
- mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +21 -5
- mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +2 -2
- mindspore/ops_generate/pyboost/pyboost_functions_impl_cpp_generator.py +30 -10
- mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +10 -3
- mindspore/ops_generate/pyboost/pyboost_internal_kernel_info_adapter_generator.py +1 -1
- mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +19 -9
- mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +71 -28
- mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +10 -9
- mindspore/ops_generate/pyboost/pyboost_utils.py +27 -16
- mindspore/ops_generate/resources/yaml_loader.py +13 -0
- mindspore/ops_generate/tensor_py_cc_generator.py +2 -2
- mindspore/parallel/_auto_parallel_context.py +5 -15
- mindspore/parallel/_cell_wrapper.py +1 -1
- mindspore/parallel/_parallel_serialization.py +4 -6
- mindspore/parallel/_ps_context.py +2 -2
- mindspore/parallel/_utils.py +34 -17
- mindspore/parallel/auto_parallel.py +23 -9
- mindspore/parallel/checkpoint_transform.py +20 -2
- mindspore/parallel/cluster/process_entity/_api.py +28 -33
- mindspore/parallel/cluster/process_entity/_utils.py +9 -5
- mindspore/parallel/cluster/run.py +5 -3
- mindspore/{experimental/llm_boost/ascend_native → parallel/distributed}/__init__.py +21 -22
- mindspore/parallel/distributed/distributed_data_parallel.py +393 -0
- mindspore/parallel/distributed/flatten_grad_buffer.py +295 -0
- mindspore/parallel/function/reshard_func.py +6 -5
- mindspore/parallel/nn/parallel_cell_wrapper.py +40 -3
- mindspore/parallel/nn/parallel_grad_reducer.py +0 -8
- mindspore/parallel/shard.py +7 -21
- mindspore/parallel/strategy.py +336 -0
- mindspore/parallel/transform_safetensors.py +127 -20
- mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +13 -9
- mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +1 -1
- mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +1 -1
- mindspore/profiler/common/constant.py +5 -0
- mindspore/profiler/common/file_manager.py +9 -0
- mindspore/profiler/common/msprof_cmd_tool.py +40 -4
- mindspore/profiler/common/path_manager.py +65 -24
- mindspore/profiler/common/profiler_context.py +27 -14
- mindspore/profiler/common/profiler_info.py +3 -3
- mindspore/profiler/common/profiler_meta_data.py +1 -0
- mindspore/profiler/common/profiler_op_analyse.py +10 -6
- mindspore/profiler/common/profiler_path_manager.py +13 -0
- mindspore/profiler/common/util.py +30 -3
- mindspore/profiler/dynamic_profiler.py +91 -46
- mindspore/profiler/envprofiler.py +30 -5
- mindspore/profiler/experimental_config.py +18 -2
- mindspore/profiler/platform/cpu_profiler.py +10 -4
- mindspore/profiler/platform/npu_profiler.py +34 -7
- mindspore/profiler/profiler.py +193 -145
- mindspore/profiler/profiler_action_controller.py +1 -1
- mindspore/profiler/profiler_interface.py +2 -2
- mindspore/rewrite/symbol_tree/symbol_tree.py +1 -1
- mindspore/run_check/_check_version.py +108 -24
- mindspore/runtime/__init__.py +9 -6
- mindspore/runtime/executor.py +35 -0
- mindspore/runtime/memory.py +113 -0
- mindspore/runtime/thread_bind_core.py +1 -1
- mindspore/swresample-4.dll +0 -0
- mindspore/swscale-6.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/{experimental/llm_boost → tools}/__init__.py +5 -5
- mindspore/tools/data_dump.py +130 -0
- mindspore/tools/sdc_detect.py +91 -0
- mindspore/tools/stress_detect.py +63 -0
- mindspore/train/__init__.py +6 -6
- mindspore/train/_utils.py +8 -21
- mindspore/train/amp.py +6 -7
- mindspore/train/callback/_callback.py +2 -1
- mindspore/train/callback/_checkpoint.py +1 -17
- mindspore/train/callback/_flops_collector.py +10 -6
- mindspore/train/callback/_train_fault_tolerance.py +72 -25
- mindspore/train/data_sink.py +5 -9
- mindspore/train/dataset_helper.py +5 -5
- mindspore/train/model.py +41 -230
- mindspore/train/serialization.py +160 -401
- mindspore/train/train_thor/model_thor.py +2 -2
- mindspore/turbojpeg.dll +0 -0
- mindspore/utils/__init__.py +6 -3
- mindspore/utils/dlpack.py +92 -0
- mindspore/utils/dryrun.py +1 -1
- mindspore/utils/runtime_execution_order_check.py +10 -0
- mindspore/utils/sdc_detect.py +14 -12
- mindspore/utils/stress_detect.py +43 -0
- mindspore/utils/utils.py +152 -16
- mindspore/version.py +1 -1
- {mindspore-2.7.0rc1.dist-info → mindspore-2.7.1.dist-info}/METADATA +3 -2
- {mindspore-2.7.0rc1.dist-info → mindspore-2.7.1.dist-info}/RECORD +330 -344
- mindspore/_extends/remote/kernel_build_server_ascend.py +0 -75
- mindspore/communication/_hccl_management.py +0 -297
- mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +0 -207
- mindspore/experimental/llm_boost/ascend_native/llm_boost.py +0 -52
- mindspore/experimental/llm_boost/atb/__init__.py +0 -23
- mindspore/experimental/llm_boost/atb/boost_base.py +0 -385
- mindspore/experimental/llm_boost/atb/llama_boost.py +0 -137
- mindspore/experimental/llm_boost/atb/qwen_boost.py +0 -124
- mindspore/experimental/llm_boost/register.py +0 -130
- mindspore/experimental/llm_boost/utils.py +0 -31
- mindspore/include/OWNERS +0 -7
- mindspore/mindspore_cpu_res_manager.dll +0 -0
- mindspore/mindspore_ops_kernel_common.dll +0 -0
- mindspore/mindspore_res_manager.dll +0 -0
- mindspore/nn/optim/_dist_optimizer_registry.py +0 -111
- mindspore/nn/reinforcement/_batch_read_write.py +0 -142
- mindspore/nn/reinforcement/_tensors_queue.py +0 -152
- mindspore/nn/reinforcement/tensor_array.py +0 -145
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/ops/_op_impl/aicpu/priority_replay_buffer.py +0 -113
- mindspore/ops/_op_impl/aicpu/reservoir_replay_buffer.py +0 -96
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +0 -42
- mindspore/ops/_op_impl/cpu/buffer_get.py +0 -28
- mindspore/ops/_op_impl/cpu/buffer_sample.py +0 -28
- mindspore/ops/_op_impl/cpu/priority_replay_buffer.py +0 -42
- mindspore/ops/operations/_tensor_array.py +0 -359
- mindspore/ops/operations/rl_ops.py +0 -288
- mindspore/parallel/_offload_context.py +0 -275
- mindspore/parallel/_recovery_context.py +0 -115
- mindspore/parallel/_transformer/__init__.py +0 -35
- mindspore/parallel/_transformer/layers.py +0 -765
- mindspore/parallel/_transformer/loss.py +0 -251
- mindspore/parallel/_transformer/moe.py +0 -693
- mindspore/parallel/_transformer/op_parallel_config.py +0 -222
- mindspore/parallel/_transformer/transformer.py +0 -3124
- mindspore/parallel/mpi/_mpi_config.py +0 -116
- mindspore/profiler/common/validator/validate_path.py +0 -84
- mindspore/train/memory_profiling_pb2.py +0 -298
- mindspore/utils/hooks.py +0 -81
- /mindspore/common/{_auto_dynamic.py → dynamic_shape/_auto_dynamic.py} +0 -0
- {mindspore-2.7.0rc1.dist-info → mindspore-2.7.1.dist-info}/WHEEL +0 -0
- {mindspore-2.7.0rc1.dist-info → mindspore-2.7.1.dist-info}/entry_points.txt +0 -0
- {mindspore-2.7.0rc1.dist-info → mindspore-2.7.1.dist-info}/top_level.txt +0 -0
mindspore/ops/operations/array_ops.py

@@ -42,7 +42,7 @@ from ..auto_generate import (
                             NonZero, ResizeNearestNeighbor, Identity, Split, CumSum, CumProd,
                             MaskedSelect, Cummax, Cummin, Argmin, Concat, UnsortedSegmentSum, UniqueConsecutive,
                             ScalarToTensor, Triu, BroadcastTo, StridedSlice, Select, TopkExt,
-                            SearchSorted, Meshgrid, Squeeze, Slice, TransposeExtView)
+                            SearchSorted, Meshgrid, Squeeze, Slice, TransposeExtView, MaskedScatter)
 from .manually_defined import Rank, Shape, Tile, Cast, Ones, Zeros, TypeAs
 from ..auto_generate import ArgMaxWithValue, ArgMinWithValue
 from ..auto_generate import TensorScatterElements as TensorScatterElementsExt
@@ -1048,11 +1048,11 @@ class Fill(PrimitiveWithCheck):
         self.init_prim_io_names(inputs=['type', 'shape', 'value'], outputs=['y'])

     def __call__(self, dtype, dims, x):
-        if dtype not in mstype.all_types
+        if dtype not in mstype.all_types:
             raise TypeError(
                 f"For \'{self.name}\', the supported data type is ['bool', 'int8', 'int16', 'int32', 'int64', 'uint8', "
                 "'uint16', 'uint32', 'uint64','float16', 'float32', 'float64'], but got an invalid dtype!.")
-        x_nptype = mstype.dtype_to_nptype(dtype)
+        x_nptype = mstype._dtype_to_nptype(dtype)  # pylint:disable=protected-access
         if not isinstance(dims, Tensor) and not isinstance(dims, tuple):
             raise TypeError(f"For \'{self.name}\', input[1] must be tensor.")
         if not isinstance(x, Tensor) and not isinstance(x, float) and not isinstance(x, int):
@@ -1065,7 +1065,7 @@ class Fill(PrimitiveWithCheck):
             return Tensor(ret, dtype=dtype)

     def infer_value(self, dtype, dims, x):
-        x_nptype = mstype.dtype_to_nptype(dtype)
+        x_nptype = mstype._dtype_to_nptype(dtype)  # pylint:disable=protected-access
         if dims is not None and None not in dims and x is not None:
             if isinstance(dims, Tensor):
                 dims = dims.asnumpy()
@@ -1157,6 +1157,7 @@ class FillV2(PrimitiveWithCheck):
             init_func = Zero()
             init_func.__enable_zero_dim__ = True
             out = Tensor(shape=dims, dtype=x.dtype, init=init_func)
+            out.init_data()
             return out
         return Tensor(np.full(dims, x.asnumpy()))
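Both Fill hunks track a rename of the dtype conversion helper: the removed lines appear to call the public `mstype.dtype_to_nptype`, while 2.7.1 calls the underscored `_dtype_to_nptype` and silences pylint. A minimal migration sketch, assuming the public alias is no longer available in 2.7.1:

    # Hedged sketch: mirrors the rename visible in the hunks above.
    import numpy as np
    from mindspore.common import dtype as mstype

    # 2.7.0rc1 (inferred from the truncated removed lines):
    #     np_type = mstype.dtype_to_nptype(mstype.float32)
    # 2.7.1 (as the added lines call it):
    np_type = mstype._dtype_to_nptype(mstype.float32)  # pylint: disable=protected-access
    assert np_type is np.float32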
@@ -3974,52 +3975,6 @@ class RangeV2(Primitive):
         validator.check_positive_int(maxlen, "maxlen", self.name)


-class MaskedScatter(Primitive):
-    """
-    Updates the value in the input with value in `updates` according to the `mask`.
-
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
-    Inputs:
-        - **x** (Tensor): The input Tensor to be updated.
-        - **mask** (Tensor[bool]): The mask Tensor indicating which elements should be modified or replaced.
-          The shapes of `mask` and `x` must be the same or broadcastable.
-        - **updates** (Tensor): The values to scatter into the target tensor `x`. It has the same data type as `x`. The
-          number of elements must be greater than or equal to the number of True's in `mask`.
-
-    Outputs:
-        Tensor, with the same type and shape as `x`.
-
-    Raises:
-        TypeError: If `x`, `mask` or `updates` is not a Tensor.
-        TypeError: If data type of `x` is not be supported.
-        TypeError: If dtype of `mask` is not bool.
-        TypeError: If the dim of `x` less than the dim of `mask`.
-        ValueError: If `mask` can not be broadcastable to `x`.
-        ValueError: If the number of elements in `updates` is less than number of True's in `mask`.
-
-    Supported Platforms:
-        ``Ascend`` ``CPU``
-
-    Examples:
-        >>> import mindspore
-        >>> import numpy as np
-        >>> from mindspore import Tensor, ops
-        >>> input_x = Tensor(np.array([1., 2., 3., 4.]), mindspore.float32)
-        >>> mask = Tensor(np.array([True, True, False, True]), mindspore.bool_)
-        >>> updates = Tensor(np.array([5., 6., 7.]), mindspore.float32)
-        >>> output = ops.MaskedScatter()(input_x, mask, updates)
-        >>> print(output)
-        [5. 6. 3. 7.]
-    """
-
-    @prim_attr_register
-    def __init__(self):
-        """Initialize MaskedScatter"""
-        self.init_prim_io_names(inputs=['x', 'mask', 'updates'], outputs=['y'])
-
-
 class _TensorScatterOp(PrimitiveWithInfer):
     """
     Defines TensorScatter Base Operators
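The class body removed here is not a feature removal: the first hunk in this file adds `MaskedScatter` to the `..auto_generate` import list, so the primitive is now generated rather than hand-written. Call sites should be unaffected; the sketch below simply reuses the example from the removed docstring.

    import mindspore
    import numpy as np
    from mindspore import Tensor, ops

    input_x = Tensor(np.array([1., 2., 3., 4.]), mindspore.float32)
    mask = Tensor(np.array([True, True, False, True]), mindspore.bool_)
    updates = Tensor(np.array([5., 6., 7.]), mindspore.float32)
    output = ops.MaskedScatter()(input_x, mask, updates)
    print(output)  # expected: [5. 6. 3. 7.]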
mindspore/ops/operations/comm_ops.py

@@ -18,10 +18,9 @@
 from __future__ import absolute_import
 from __future__ import division

-import os
 from mindspore.common import Tensor
 from mindspore import _checkparam as validator
-from mindspore.communication.management import get_rank, get_group_size, GlobalComm, _get_group, _host_distribute
+from mindspore.communication.management import get_rank, get_group_size, GlobalComm, _get_group
 from mindspore.common import dtype as mstype
 from mindspore.ops.primitive import PrimitiveWithInfer, PrimitiveWithCheck, Primitive, prim_attr_register
 from mindspore.common.api import context
@@ -98,17 +97,6 @@ def check_collective_target_dtype(data_name, data_dtype, prim_name):
     validator.check_tensor_dtype_valid(data_name, data_dtype, valid_dtype, prim_name)


-def check_hcom_group_valid(group, prim_name=None):
-    """Check if hcom group is valid."""
-    msg_prefix = f"For '{prim_name}', the" if prim_name else "The"
-    sim_level = os.getenv("MS_SIMULATION_LEVEL")
-    no_sim = (sim_level is None or sim_level.strip() == '')
-    if no_sim and (not _host_distribute()) and context.get_context("mode") == context.PYNATIVE_MODE and \
-            group != GlobalComm.WORLD_COMM_GROUP:
-        raise RuntimeError(f"{msg_prefix} 'group' only support 'hccl_world_group' in pynative mode, but got "
-                           f"'group': {group}. Please start by using mpi-run.")
-
-
 class AllReduce(Primitive):
     """
     Reduces tensors across all devices in such a way that all devices will get the same final result,
@@ -187,7 +175,6 @@ class AllReduce(Primitive):
         if not isinstance(self.group, str):
             raise TypeError(f"For '{self.name}', the 'group' must be str, "
                             f"but got {type(self.group).__name__}.")
-        check_hcom_group_valid(self.group, prim_name=self.name)
         self.op = op
         self.add_prim_attr('group', self.group)
         self.add_prim_attr('fusion', 0)
@@ -720,7 +707,6 @@ class Broadcast(PrimitiveWithInfer):
         """Initialize Broadcast."""
         validator.check_value_type('root_rank', root_rank, (int,), self.name)
         validator.check_value_type('group', _get_group(group), (str,), self.name)
-        check_hcom_group_valid(group, prim_name=self.name)
         self.add_prim_attr('group', _get_group(group))
         self.add_prim_attr('no_eliminate', True)

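Dropping `check_hcom_group_valid` (and its call sites in `AllReduce` and `Broadcast`) removes the PyNative-mode restriction that collectives could only target `hccl_world_group` unless the job was launched through MPI. A hedged sketch of what this appears to permit; the group name and rank list are illustrative and assume a two-device job with a working HCCL setup:

    # Illustrative sketch only: assumes init() succeeds under msrun/mpirun.
    import mindspore as ms
    from mindspore import ops
    from mindspore.communication import init, create_group

    ms.set_context(mode=ms.PYNATIVE_MODE)
    init()
    create_group("sub_group_0", [0, 1])  # hypothetical sub-group
    # Before this change, constructing the primitive with a non-world group
    # in PyNative mode raised RuntimeError from check_hcom_group_valid.
    all_reduce = ops.AllReduce(op=ops.ReduceOp.SUM, group="sub_group_0")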
@@ -1954,7 +1940,7 @@ class BatchISendIRecv(PrimitiveWithInfer):


 class AlltoAllV(PrimitiveWithInfer):
-    """
+    r"""
     AllToAllV which support uneven scatter and gather compared with AllToAll.

     Note:
@@ -2015,7 +2001,7 @@ class AlltoAllV(PrimitiveWithInfer):
         ...    send_tensor = Tensor([0, 1, 2.])
         ...    send_numel_list = [1, 2]
         ...    recv_numel_list = [1, 2]
-
+        ... elif rank == 1:
         ...    send_tensor = Tensor([3, 4, 5.])
         ...    send_numel_list = [2, 1]
         ...    recv_numel_list = [2, 1]
@@ -2027,6 +2013,10 @@ class AlltoAllV(PrimitiveWithInfer):
         rank 1:
         [1. 2. 5]

+    Tutorial Examples:
+        - `Distributed Set Communication Primitives - AlltoAllV
+          <https://www.mindspore.cn/docs/en/master/api_python/samples/ops/communicate_ops.html#alltoallv>`_
+
     """

     @prim_attr_register
@@ -2038,6 +2028,94 @@ class AlltoAllV(PrimitiveWithInfer):
         self.add_prim_attr('block_size', self.block_size)


+class AlltoAllVC(PrimitiveWithInfer):
+    r"""
+    AllToAllVC passes in the sending and receiving parameters of all ranks through the input parameter
+    `send_count_matrix`. Compared to AllToAllV, AllToAllVC does not require the aggregation of all rank
+    sending and receiving parameters, thus offering superior performance.
+
+    Note:
+        Only one-dimensional input is supported; the input data must be flattened into a one-dimensional
+        array before using this interface.
+
+    Args:
+        group (str, optional): The communication group to work on. Default: ``GlobalComm.WORLD_COMM_GROUP``, which
+            means ``"hccl_world_group"`` in Ascend.
+        block_size (int, optional): The basic units for splitting and gathering numel by `send_count_matrix`.
+            Default: ``1``.
+        transpose (bool, optional): Indicates whether the `send_count_matrix` needs to undergo a transpose
+            operation, this parameter is used in reverse calculation scenarios. Default: ``False``.
+
+    Inputs:
+        - **input_x** (Tensor) - flatten tensor to scatter. The shape of tensor is :math:`(x_1)`.
+        - **send_count_matrix** (Union[list[int], Tensor]) - The sending and receiving parameters of
+          all ranks, :math:`\text{send_count_matrix}[i*\text{rank_size}+j]` represents the amount of data sent by
+          rank i to rank j, and the basic unit is the number of bytes of Tensor's dtype. Among them, `rank_size`
+          indicates the size of the communication group.
+
+    Outputs:
+        Tensor. Flattened and concatenated tensor gather from remote ranks.
+        If gather result is empty, it will return a Tensor with shape `()`, and value has no actual meaning.
+
+    Supported Platforms:
+        ``Ascend``
+
+    Examples:
+        .. note::
+            Before running the following examples, you need to configure the communication environment variables.
+
+            For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
+            without any third-party or configuration file dependencies.
+
+            Please see the `msrun start up
+            <https://www.mindspore.cn/tutorials/en/master/parallel/msrun_launcher.html>`_
+            for more details.
+
+            This example should be run with 2 devices.
+
+        >>> from mindspore.ops import AlltoAllVC
+        >>> import mindspore.nn as nn
+        >>> from mindspore.communication import init, get_rank
+        >>> from mindspore import Tensor
+        >>>
+        >>> init()
+        >>> rank = get_rank()
+        >>> class Net(nn.Cell):
+        ...     def __init__(self):
+        ...         super(Net, self).__init__()
+        ...         self.all_to_all_v_c = AlltoAllVC()
+        ...
+        ...     def construct(self, x, send_count_matrix):
+        ...         return self.all_to_all_v_c(x, send_count_matrix)
+        >>> send_count_matrix = Tensor([[0, 3], [3, 0]])
+        >>> send_tensor = Tensor([0, 1, 2.]) * rank
+        >>> net = Net()
+        >>> output = net(send_tensor, send_count_matrix)
+        >>> print(output)
+        rank 0:
+        [0. 1. 2]
+        rank 1:
+        [0. 0. 0]
+
+    Tutorial Examples:
+        - `Distributed Set Communication Primitives - AlltoAllVC
+          <https://www.mindspore.cn/docs/en/master/api_python/samples/ops/communicate_ops.html#alltoallvc>`_
+
+    """
+
+    @prim_attr_register
+    def __init__(self, group=GlobalComm.WORLD_COMM_GROUP, block_size=1, transpose=False):
+        self.group = GlobalComm.WORLD_COMM_GROUP if group is None else _get_group(group)
+        self.rank_size = get_group_size(self.group)
+        self.add_prim_attr('rank_size', self.rank_size)
+        self.add_prim_attr('group', self.group)
+        self.rank_id = get_rank(_get_group(self.group))
+        self.add_prim_attr('rank_id', self.rank_id)
+        validator.check_value_type("block_size", block_size, [int], self.name)
+        self.add_prim_attr('block_size', self.block_size)
+        self.add_prim_attr('transpose', self.transpose)
+
+
 class AllGatherV(PrimitiveWithInfer):
     """
     Gathers uneven tensors from the specified communication group and returns the tensor which is all gathered.
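The `send_count_matrix` indexing convention in the new `AlltoAllVC` docstring is easy to misread, so here is a small self-contained sanity check (plain Python, no devices needed): row i of the flattened matrix holds rank i's send counts, and what rank j receives is column j.

    rank_size = 2
    # Flattened form of the docstring example Tensor([[0, 3], [3, 0]]).
    send_count_matrix = [0, 3,   # rank 0 sends 0 to itself, 3 to rank 1
                         3, 0]   # rank 1 sends 3 to rank 0, 0 to itself

    def send_counts(rank):
        return send_count_matrix[rank * rank_size:(rank + 1) * rank_size]

    def recv_counts(rank):
        return [send_count_matrix[i * rank_size + rank] for i in range(rank_size)]

    # Rank 0 sends its whole 3-element tensor to rank 1 and receives 3
    # elements back, matching the printed outputs in the docstring example.
    assert send_counts(0) == [0, 3] and recv_counts(0) == [0, 3]
    assert send_counts(1) == [3, 0] and recv_counts(1) == [3, 0]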
mindspore/ops/operations/custom_ops.py

@@ -18,6 +18,7 @@ from __future__ import absolute_import
 import json
 import os
 import re
+import sys
 import ast
 import hashlib
 import stat
@@ -26,6 +27,7 @@ import inspect
 import importlib
 import platform
 import subprocess
+import shutil
 import numpy as np
 import mindspore as ms
 from mindspore._c_expression import Oplib, typing
@@ -37,6 +39,7 @@ from mindspore.ops import DataType
 from mindspore import log as logger
 from mindspore import ops
 from mindspore.communication.management import get_rank, GlobalComm
+from mindspore import _checkparam as validator
 from ._ms_kernel import determine_variable_usage
 from ._custom_grad import autodiff_bprop
 from ._pyfunc_registry import add_pyfunc
@@ -1075,17 +1078,18 @@ class Custom(ops.PrimitiveWithInfer):
                 if isinstance(arg_dtype, mstype.TensorType):
                     arg_dtype = arg_dtype.element_type()
                 fake_arg = np.zeros(arg["shape"]).astype(
-                    mstype.dtype_to_nptype(arg_dtype))
+                    mstype._dtype_to_nptype(arg_dtype))  # pylint:disable=protected-access
                 fake_input.append(fake_arg)

         fake_output = self.func(*fake_input)

         if hasattr(fake_output, 'shape'):
             infer_shape = fake_output.shape
-            infer_dtype = mstype.TensorType(mstype.pytype_to_dtype(fake_output.dtype))
+            # pylint:disable=protected-access
+            infer_dtype = mstype.TensorType(mstype._pytype_to_dtype(fake_output.dtype))
         else:
             infer_shape = (1,)
-            infer_dtype = mstype.pytype_to_dtype(fake_output.dtype)
+            infer_dtype = mstype._pytype_to_dtype(fake_output.dtype)  # pylint:disable=protected-access

         infer_value = Tensor(fake_output) if enable_infer_value else None
@@ -1184,6 +1188,54 @@ class Custom(ops.PrimitiveWithInfer):
         return ops.primitive._run_op(self, self.name, args)


+class _MultiSoProxy:
+    """
+    A thin wrapper that transparently multiplexes attribute access between a
+    pure-Python fallback module and an optional compiled shared-object (SO)
+    module, honoring MindSpore's current execution mode (GRAPH vs. PYNATIVE).
+    """
+
+    def __init__(self, func_module, so_module):
+        """
+        Args:
+            func_module (module or None): Python module to serve as the fallback implementation source.
+                May be ``None`` if no Python fallback is available.
+            so_module (module): Compiled shared-object module that provides
+                optimized kernels accessible only in ``PYNATIVE_MODE``.
+        """
+        self.func_module = func_module
+        self.so_module = so_module
+
+    def __getattr__(self, name: str):
+        """
+        Intercepts every attribute lookup and resolves it against the wrapped
+        modules according to the documented precedence rules.
+
+        Args:
+            name (str): Name of the custom operation being requested.
+
+        Returns:
+            Any: The requested callable or attribute from either ``func_module`` or ``so_module``.
+
+        Raises:
+            AttributeError: If the attribute is not found in any applicable module or
+                is incompatible with the current execution mode.
+        """
+        if self.func_module is not None and hasattr(self.func_module, name):
+            return getattr(self.func_module, name)
+        if context.get_context("mode") == ms.PYNATIVE_MODE:
+            if hasattr(self.so_module, name):
+                return getattr(self.so_module, name)
+            raise AttributeError(
+                f"Custom op '{name}' is neither in func_module nor in so_module."
+            )
+
+        raise AttributeError(
+            f"Custom op '{name}' does not support GRAPH mode. "
+            f"Please register it for GRAPH mode or switch to PYNATIVE mode."
+        )
+
+
 class CustomOpBuilder:
     r"""
     CustomOpBuilder is used to initialize and configure custom operators for MindSpore.
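The precedence implemented by `_MultiSoProxy.__getattr__` is: Python fallback module first (in any mode), then the compiled module (PyNative only), then `AttributeError`. A minimal sketch with stand-in namespaces, assuming the private class defined in the hunk above is in scope:

    from types import SimpleNamespace

    func_module = SimpleNamespace(my_op=lambda x: x + 1)        # Python fallback
    so_module = SimpleNamespace(my_op=lambda x: x + 2,          # compiled module
                                so_only_op=lambda x: x * 2)

    proxy = _MultiSoProxy(func_module, so_module)
    proxy.my_op(1)       # -> 2: the Python fallback always wins
    proxy.so_only_op(3)  # -> 6 in PYNATIVE_MODE; AttributeError in GRAPH mode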
@@ -1199,10 +1251,11 @@ class CustomOpBuilder:

     Args:
         name (str): The unique name of the custom operator module, used to identify the operator.
-        sources (Union[str, list[str]]): The source file(s) of the custom operator. It can be a single
-            file path or a list of file paths.
+        sources (Union[list[str], tuple[str], str]): The source file(s) of the custom operator. It can be a single
+            file path or a list of file paths.
         backend (str, optional): The target backend for the operator, such as "CPU" or "Ascend". Default: ``None``.
-        include_paths (list[str], optional): Additionally included paths needed during compilation. Default: ``None``.
+        include_paths (Union[list[str], tuple[str], str], optional): Additionally included paths needed during
+            compilation. Default: ``None``.
         cflags (str, optional): Extra C++ compiler flags to be used during compilation. Default: ``None``.
         ldflags (str, optional): Extra linker flags to be used during linking. Default: ``None``.
         kwargs (dict, optional): Additional keyword arguments for future extensions or specific custom requirements.
@@ -1216,6 +1269,17 @@ class CustomOpBuilder:
         - enable_atb (bool, optional): Whether to call ATB (Ascend Transformer Boost) operator. If set to ``True``,
           the `backend` must be ``Ascend`` or left empty. Default: ``False``.

+        - enable_asdsip (bool, optional): Whether to call ASDSIP (Ascend SiP Boost) operator. If set to ``True``,
+          the `backend` must be ``Ascend`` or left empty. Default: ``False``.
+
+        - op_def (Union[list[str], tuple[str], str], optional): Path(s) to the operator definition
+          file(s) (YAML format). When using custom operators in graph mode, this parameter is mandatory.
+          It can be a single file path string or a list of file path strings. Default: ``None``.
+
+        - op_doc (Union[list[str], tuple[str], str], optional): Path(s) to the operator documentation
+          file(s) (YAML format). This parameter is optional and used to provide additional documentation
+          for the operator. It can be a single file path string or a list of file path strings. Default: ``None``.
+
     .. note::
         - If the `backend` argument is provided, additional default flags will be automatically added to
           the compilation and linking steps to support the operator's target backend. The default options
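Putting the new keyword arguments together, a graph-mode-capable builder call might look like the sketch below; the file names are placeholders, not values taken from this diff:

    from mindspore.ops import CustomOpBuilder

    builder = CustomOpBuilder(
        name="my_custom_ops",
        sources=["my_op.cpp"],        # str, list or tuple accepted after 2.7.1
        backend="Ascend",
        op_def="my_op.yaml",          # per the new docs, mandatory in graph mode
        op_doc="my_op_doc.yaml",      # optional documentation YAML
    )
    mod = builder.load()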
@@ -1238,20 +1302,20 @@ class CustomOpBuilder:
     _loaded_ops = {}

     def __init__(self, name, sources, backend=None, include_paths=None, cflags=None, ldflags=None, **kwargs):
-        self.name = name
-        self.source = sources
-        self.backend = backend
-        self.include_paths = include_paths
-        self.cflags = cflags
-        self.ldflags = ldflags
-        self.build_dir = kwargs.get("build_dir")
-        self.enable_atb = kwargs.get("enable_atb", False)
+        self._check_and_get_args(name, sources, backend, include_paths, cflags, ldflags, **kwargs)
+
         self._ms_path = os.path.dirname(os.path.abspath(ms.__file__))
+        self.auto_generate = self.name + "_auto_generate"
         if self.enable_atb:
             if backend is not None and backend != "Ascend":
                 raise ValueError("For 'CustomOpBuilder', when 'enable_atb' is set to True, the 'backend' must be "
                                  f"'Ascend' (or left implicit), but got '{backend}'")
             self.backend = "Ascend"
+        if self.enable_asdsip:
+            if backend is not None and backend != "Ascend":
+                raise ValueError("For 'CustomOpBuilder', when 'enable_asdsip' is set to True, the 'backend' must be "
+                                 f"'Ascend' (or left implicit), but got '{backend}'")
+            self.backend = "Ascend"
         if self.backend == "Ascend":
             ascend_opp_path = os.getenv("ASCEND_OPP_PATH")
             if not ascend_opp_path:
@@ -1263,6 +1327,115 @@ class CustomOpBuilder:
         if not self.atb_home_path:
             raise ValueError("Environment variable 'ATB_HOME_PATH' must be set when 'enable_atb' is True.")

+    def _check_and_get_args(self, name, sources, backend=None, include_paths=None,
+                            cflags=None, ldflags=None, **kwargs):
+        """
+        Validate and normalize all arguments to meet custom-op build requirements.
+        """
+
+        def _check_str_or_list_str(key, val):
+            if val is None:
+                return val
+            if isinstance(val, str):
+                val = [val]
+            val = validator.check_value_type(key, val, [list, tuple])
+            val = list(val)
+            validator.check_element_type_of_iterable(key, val, [str])
+            return val
+
+        self.name = validator.check_value_type("name", name, [str])
+        self.source = _check_str_or_list_str("sources", sources)
+        self.backend = validator.check_value_type("backend", backend, [str, type(None)])
+        if self.backend is not None and self.backend not in {"CPU", "Ascend"}:
+            raise ValueError(
+                f"For 'backend', only 'CPU' or 'Ascend' are allowed, but got '{self.backend}'.")
+
+        self.include_paths = _check_str_or_list_str("include_paths", include_paths)
+
+        self.cflags = validator.check_value_type("cflags", cflags, [str, type(None)])
+        self.ldflags = validator.check_value_type("ldflags", ldflags, [str, type(None)])
+
+        self.build_dir = validator.check_value_type("build_dir",
+                                                    kwargs.get("build_dir"),
+                                                    [str, type(None)])
+
+        self.debug_mode = validator.check_bool(kwargs.get("debug_mode", False), "debug_mode")
+        self.enable_asdsip = validator.check_bool(kwargs.get("enable_asdsip", False), "enable_asdsip")
+        self.yaml = _check_str_or_list_str("op_def", kwargs.get("op_def"))
+        self.doc = _check_str_or_list_str("op_doc", kwargs.get("op_doc"))
+
+        self.enable_atb = validator.check_bool(kwargs.get("enable_atb", False))
+
+    def _generate_custom_op_def(self, module: str, input_path: str, doc_path: str, output_path: str) -> None:
+        """Call gen_custom_ops.py to generate custom operator definition"""
+        file_path = os.path.join(self._ms_path, "ops_generate/gen_custom_ops.py")
+        cmd = [
+            sys.executable,
+            file_path,
+            "-i", input_path,
+            "-o", output_path,
+            "-m", module,
+            "-d", doc_path
+        ]
+
+        try:
+            subprocess.run(
+                cmd,
+                check=True,
+                text=True,
+                capture_output=True
+            )
+        except subprocess.CalledProcessError as exc:
+            raise RuntimeError(
+                f"gen_custom_op.py failed with exit code {exc.returncode}.\n"
+                f"stdout: {exc.stdout}\n"
+                f"stderr: {exc.stderr}"
+            ) from None
+
+    def _get_op_def(self):
+        """
+        Generate C++ operator-definition source files from one or more YAML specification files.
+        """
+        if self.yaml is None:
+            return []
+
+        if self.doc is None:
+            logger.info("Missing required 'doc': no YAML document was provided.")
+
+        build_path = self._get_build_directory()
+        yaml_path = os.path.join(build_path, "yaml")
+        op_def_path = os.path.join(build_path, self.auto_generate)
+        if os.path.exists(op_def_path):
+            shutil.rmtree(op_def_path)
+        os.makedirs(op_def_path, exist_ok=True)
+
+        def copy_files(yaml_files, dest_path):
+            if os.path.exists(dest_path):
+                shutil.rmtree(dest_path)
+            os.makedirs(dest_path, exist_ok=True)
+            for file_path in yaml_files:
+                if not os.path.isfile(file_path):
+                    raise FileNotFoundError(f"File not found: {file_path}")
+
+                filename = os.path.basename(file_path)
+                file_ext = os.path.splitext(filename)[1].lower()
+                if file_ext not in ('.yaml', '.yml'):
+                    raise ValueError(f"Invalid file extension: {file_ext} for {filename}")
+
+                _dest_path = os.path.join(dest_path, filename)
+                shutil.copy2(file_path, _dest_path)
+
+        yaml_files = [self.yaml] if isinstance(self.yaml, str) else self.yaml
+        copy_files(yaml_files, yaml_path)
+        doc_path = ""
+        if self.doc is not None:
+            doc_path = os.path.join(build_path, "doc")
+            doc_files = [self.doc] if isinstance(self.doc, str) else self.doc
+            copy_files(doc_files, doc_path)
+
+        self._generate_custom_op_def(self.name, yaml_path, doc_path, op_def_path)
+        return [os.path.join(op_def_path, "gen_custom_ops_def.cc")]
+
     def get_sources(self):
         """
         Get the source files for the custom operator.
@@ -1270,7 +1443,8 @@ class CustomOpBuilder:
         Returns:
             str or list[str], The source file(s) for the operator.
         """
-        return self.source
+        self.source = [self.source] if isinstance(self.source, str) else self.source
+        return self.source + self._get_op_def()

     def get_include_paths(self):
         """
@@ -1297,6 +1471,7 @@ class CustomOpBuilder:
         """include paths for inner module interface."""
         ms_inner_path = os.path.join(self._ms_path, "include", "mindspore")
         include_list = []
+        include_list.append(os.path.join(ms_inner_path, "include"))
         include_list.append(os.path.join(ms_inner_path, "core", "include"))
         include_list.append(os.path.join(ms_inner_path, "core", "mindrt", "include"))
         include_list.append(os.path.join(ms_inner_path, "core", "mindrt"))
@@ -1316,10 +1491,16 @@ class CustomOpBuilder:
         """
         flags = [f'-DMS_EXTENSION_NAME={self.name}', '-D_GLIBCXX_USE_CXX11_ABI=0', '-DENABLE_FAST_HASH_TABLE=1']
         flags += ['-std=c++17', '-fstack-protector-all', '-fPIC', '-pie']
+        if self.debug_mode:
+            flags.append('-g')
+        else:
+            flags.append('-O2')
         if self.backend == "Ascend":
             flags.append('-DCUSTOM_ASCEND_OP')
         if self.enable_atb:
             flags.append('-DCUSTOM_ENABLE_ATB')
+        if self.enable_asdsip:
+            flags.append('-DCUSTOM_ENABLE_ASDSIP')
         if self.cflags is not None:
             flags.append(self.cflags)
         return flags
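A quick check of the new `debug_mode` switch, assuming these flag lists are exposed through the builder's public flag getters (`get_cflags`/`get_ldflags`, names not shown in this diff) and that a CPU build needs no Ascend environment:

    from mindspore.ops import CustomOpBuilder

    dbg = CustomOpBuilder("my_op_dbg", "my_op.cpp", backend="CPU", debug_mode=True)
    assert '-g' in dbg.get_cflags()        # debug build: symbols, no -O2
    assert '-s' not in dbg.get_ldflags()   # not stripped (see the next hunk)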
@@ -1332,24 +1513,31 @@ class CustomOpBuilder:
             list[str], A list of linker flags.
         """
         flags = ['-shared']
-        flags += ['-Wl,-z,relro,-z,now,-z,noexecstack', '-Wl,--disable-new-dtags,--rpath', '-s']
+        flags += ['-Wl,-z,relro,-z,now,-z,noexecstack', '-Wl,--disable-new-dtags,--rpath']
+        if not self.debug_mode:
+            flags.append('-s')  # strip
         flags += [
             f"-L{os.path.abspath(os.path.join(self._ms_path, 'lib'))}",
             '-lmindspore_core',
             '-lmindspore_ms_backend',
             '-lmindspore_pynative',
-            '-lmindspore_pyboost',
+            '-lmindspore_pyboost'
         ]
         if self.backend == "Ascend":
-            flags.append(f"-L{os.path.abspath(os.path.join(self._ms_path, 'lib', 'plugin'))}")
             flags.append(f"-L{os.path.abspath(os.path.join(self.ascend_cann_path, 'lib64'))}")
             flags.append('-lascendcl')
+            plugin_path = os.path.abspath(os.path.join(self._ms_path, 'lib', 'plugin'))
+            flags.append(f"-L{plugin_path}")
+            flags.append(f"-L{os.path.join(plugin_path, 'ascend')}")
             flags.append('-l:libmindspore_ascend.so.2')
+            flags.append('-lmindspore_extension_ascend_aclnn')
         if self.enable_atb:
-            flags.append(f"-L{os.path.abspath(os.path.join(self._ms_path, 'lib', 'plugin', 'ascend'))}")
             flags.append('-lmindspore_extension_ascend_atb')
             flags.append(f"-L{os.path.abspath(os.path.join(self.atb_home_path, 'lib'))}")
             flags.append('-latb')
+        if self.enable_asdsip:
+            flags.append(f"-L{os.path.abspath(os.path.join(self._ms_path, 'lib', 'plugin', 'ascend'))}")
+            flags.append('-lmindspore_extension_ascend_asdsip')
         if self.ldflags is not None:
             flags.append(self.ldflags)
         return flags
@@ -1380,15 +1568,42 @@ class CustomOpBuilder:
         """
         if self.name in CustomOpBuilder._loaded_ops:
             return CustomOpBuilder._loaded_ops[self.name]
+
         module_path = self.build()
-        mod = self._import_module(module_path)
+        so_module = CustomOpBuilder._import_module(module_path)
+        func_module = None
+        if self.yaml is not None:
+            module_path = os.path.join(self.build_dir, self.auto_generate, "gen_ops_def.py")
+            sys.path.append(os.path.join(self.build_dir, self.auto_generate))
+            sys.path.append(os.path.join(self.build_dir))
+            func_module = self._import_module(module_path, True)
+        mod = _MultiSoProxy(func_module, so_module)
         CustomOpBuilder._loaded_ops[self.name] = mod
         return mod

-    def _import_module(self, module_path):
+    @staticmethod
+    def _import_module(module_path, is_yaml_build=False):
         """Import module from library."""
-        spec = importlib.util.spec_from_file_location(self.name, module_path)
+        module_path = os.path.abspath(module_path)
+        module_dir = os.path.dirname(module_path)
+        module_name = os.path.splitext(os.path.basename(module_path))[0]
+
+        if is_yaml_build:
+            package_name = os.path.basename(module_dir)
+            if module_dir not in sys.path:
+                sys.path.append(module_dir)
+
+            if package_name not in sys.modules:
+                pkg_spec = importlib.machinery.ModuleSpec(package_name, None, is_package=True)
+                pkg = importlib.util.module_from_spec(pkg_spec)
+                pkg.__path__ = [module_dir]
+                sys.modules[package_name] = pkg
+
+            module_name = f"{package_name}.{module_name}"
+
+        spec = importlib.util.spec_from_file_location(module_name, module_path)
         module = importlib.util.module_from_spec(spec)
+        sys.modules[module_name] = module
         spec.loader.exec_module(module)
         return module

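After this change, `load()` no longer hands back the compiled module directly: it wraps it in the `_MultiSoProxy` defined earlier, and when `op_def` YAML was supplied it also imports the generated `gen_ops_def.py` as the Python-side member. A hedged usage sketch with placeholder names:

    from mindspore.ops import CustomOpBuilder

    mod = CustomOpBuilder("my_ops", "my_ops.cpp", backend="CPU").load()
    # 'mod' is a _MultiSoProxy; attribute lookup tries the generated Python
    # module first (present only if op_def was given), then the built .so
    # (PYNATIVE mode only).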