mindspore 2.3.0__cp39-cp39-win_amd64.whl → 2.4.1__cp39-cp39-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mindspore/.commit_id +1 -1
- mindspore/__init__.py +3 -1
- mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
- mindspore/_checkparam.py +50 -9
- mindspore/_extends/parse/compile_config.py +41 -0
- mindspore/_extends/parse/parser.py +9 -7
- mindspore/_extends/parse/standard_method.py +52 -14
- mindspore/_extends/pijit/pijit_func_white_list.py +350 -24
- mindspore/amp.py +24 -10
- mindspore/avcodec-59.dll +0 -0
- mindspore/avdevice-59.dll +0 -0
- mindspore/avfilter-8.dll +0 -0
- mindspore/avformat-59.dll +0 -0
- mindspore/avutil-57.dll +0 -0
- mindspore/common/__init__.py +6 -4
- mindspore/common/_pijit_context.py +190 -0
- mindspore/common/_register_for_tensor.py +2 -1
- mindspore/common/_tensor_overload.py +139 -0
- mindspore/common/api.py +102 -87
- mindspore/common/dump.py +5 -6
- mindspore/common/generator.py +1 -7
- mindspore/common/hook_handle.py +14 -26
- mindspore/common/initializer.py +51 -15
- mindspore/common/mindir_util.py +2 -2
- mindspore/common/parameter.py +62 -15
- mindspore/common/recompute.py +39 -9
- mindspore/common/sparse_tensor.py +7 -3
- mindspore/common/tensor.py +183 -37
- mindspore/communication/__init__.py +1 -1
- mindspore/communication/_comm_helper.py +38 -3
- mindspore/communication/comm_func.py +315 -60
- mindspore/communication/management.py +14 -14
- mindspore/context.py +132 -22
- mindspore/dataset/__init__.py +1 -1
- mindspore/dataset/audio/__init__.py +1 -1
- mindspore/dataset/core/config.py +7 -0
- mindspore/dataset/core/validator_helpers.py +7 -0
- mindspore/dataset/engine/cache_client.py +1 -1
- mindspore/dataset/engine/datasets.py +72 -44
- mindspore/dataset/engine/datasets_audio.py +7 -7
- mindspore/dataset/engine/datasets_standard_format.py +53 -3
- mindspore/dataset/engine/datasets_text.py +20 -20
- mindspore/dataset/engine/datasets_user_defined.py +174 -104
- mindspore/dataset/engine/datasets_vision.py +33 -33
- mindspore/dataset/engine/iterators.py +29 -0
- mindspore/dataset/engine/obs/util.py +7 -0
- mindspore/dataset/engine/queue.py +114 -60
- mindspore/dataset/engine/serializer_deserializer.py +2 -2
- mindspore/dataset/engine/validators.py +34 -14
- mindspore/dataset/text/__init__.py +1 -4
- mindspore/dataset/transforms/__init__.py +0 -3
- mindspore/dataset/utils/line_reader.py +2 -0
- mindspore/dataset/vision/__init__.py +1 -4
- mindspore/dataset/vision/utils.py +1 -1
- mindspore/dataset/vision/validators.py +2 -1
- mindspore/dnnl.dll +0 -0
- mindspore/{nn/extend → experimental/es}/__init__.py +4 -11
- mindspore/experimental/es/embedding_service.py +883 -0
- mindspore/{nn/layer → experimental/es}/embedding_service_layer.py +218 -30
- mindspore/experimental/llm_boost/__init__.py +21 -0
- mindspore/{nn/extend/layer → experimental/llm_boost/atb}/__init__.py +4 -8
- mindspore/experimental/llm_boost/atb/boost_base.py +211 -0
- mindspore/experimental/llm_boost/atb/llama_boost.py +115 -0
- mindspore/experimental/llm_boost/atb/qwen_boost.py +101 -0
- mindspore/experimental/llm_boost/register.py +129 -0
- mindspore/experimental/llm_boost/utils.py +31 -0
- mindspore/experimental/optim/adamw.py +85 -0
- mindspore/experimental/optim/optimizer.py +3 -0
- mindspore/hal/__init__.py +3 -3
- mindspore/hal/contiguous_tensors_handle.py +175 -0
- mindspore/hal/stream.py +18 -0
- mindspore/include/api/model_group.h +13 -1
- mindspore/include/api/types.h +10 -10
- mindspore/include/dataset/config.h +2 -2
- mindspore/include/dataset/constants.h +2 -2
- mindspore/include/dataset/execute.h +2 -2
- mindspore/include/dataset/vision.h +4 -0
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +1 -1
- mindspore/mindrecord/filewriter.py +68 -51
- mindspore/mindspore_backend.dll +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_np_dtype.dll +0 -0
- mindspore/mindspore_ops.dll +0 -0
- mindspore/mint/__init__.py +983 -46
- mindspore/mint/distributed/__init__.py +31 -0
- mindspore/mint/distributed/distributed.py +254 -0
- mindspore/mint/nn/__init__.py +268 -23
- mindspore/mint/nn/functional.py +125 -19
- mindspore/mint/nn/layer/__init__.py +39 -0
- mindspore/mint/nn/layer/activation.py +133 -0
- mindspore/mint/nn/layer/normalization.py +477 -0
- mindspore/mint/nn/layer/pooling.py +110 -0
- mindspore/mint/optim/adamw.py +26 -13
- mindspore/mint/special/__init__.py +63 -0
- mindspore/multiprocessing/__init__.py +2 -1
- mindspore/nn/__init__.py +0 -1
- mindspore/nn/cell.py +276 -96
- mindspore/nn/layer/activation.py +211 -44
- mindspore/nn/layer/basic.py +137 -10
- mindspore/nn/layer/embedding.py +137 -2
- mindspore/nn/layer/normalization.py +101 -5
- mindspore/nn/layer/padding.py +34 -48
- mindspore/nn/layer/pooling.py +161 -7
- mindspore/nn/layer/transformer.py +3 -3
- mindspore/nn/loss/__init__.py +2 -2
- mindspore/nn/loss/loss.py +84 -6
- mindspore/nn/optim/__init__.py +2 -1
- mindspore/nn/optim/adadelta.py +1 -1
- mindspore/nn/optim/adam.py +1 -1
- mindspore/nn/optim/lamb.py +1 -1
- mindspore/nn/optim/tft_wrapper.py +124 -0
- mindspore/nn/wrap/cell_wrapper.py +12 -23
- mindspore/nn/wrap/grad_reducer.py +5 -5
- mindspore/nn/wrap/loss_scale.py +17 -3
- mindspore/numpy/__init__.py +1 -1
- mindspore/numpy/array_creations.py +65 -68
- mindspore/numpy/array_ops.py +64 -60
- mindspore/numpy/fft.py +610 -75
- mindspore/numpy/logic_ops.py +11 -10
- mindspore/numpy/math_ops.py +85 -84
- mindspore/numpy/utils_const.py +4 -4
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +6 -4
- mindspore/ops/_grad_experimental/grad_array_ops.py +0 -11
- mindspore/ops/_grad_experimental/grad_comm_ops.py +67 -4
- mindspore/ops/_grad_experimental/grad_math_ops.py +0 -22
- mindspore/ops/_vmap/vmap_array_ops.py +2 -4
- mindspore/ops/_vmap/vmap_math_ops.py +17 -1
- mindspore/ops/_vmap/vmap_nn_ops.py +43 -2
- mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +91 -7
- mindspore/ops/auto_generate/gen_arg_dtype_cast.py +2 -0
- mindspore/ops/auto_generate/gen_extend_func.py +767 -13
- mindspore/ops/auto_generate/gen_ops_def.py +2452 -364
- mindspore/ops/auto_generate/gen_ops_prim.py +5442 -1756
- mindspore/ops/auto_generate/pyboost_inner_prim.py +176 -56
- mindspore/ops/composite/base.py +85 -48
- mindspore/ops/composite/multitype_ops/_compile_utils.py +1 -0
- mindspore/ops/composite/multitype_ops/not_in_impl.py +2 -2
- mindspore/ops/function/__init__.py +22 -0
- mindspore/ops/function/array_func.py +492 -153
- mindspore/ops/function/debug_func.py +113 -1
- mindspore/ops/function/fft_func.py +15 -2
- mindspore/ops/function/grad/grad_func.py +3 -2
- mindspore/ops/function/math_func.py +564 -207
- mindspore/ops/function/nn_func.py +817 -383
- mindspore/ops/function/other_func.py +3 -2
- mindspore/ops/function/random_func.py +402 -12
- mindspore/ops/function/reshard_func.py +13 -11
- mindspore/ops/function/sparse_unary_func.py +1 -1
- mindspore/ops/function/vmap_func.py +3 -2
- mindspore/ops/functional.py +24 -14
- mindspore/ops/op_info_register.py +3 -3
- mindspore/ops/operations/__init__.py +7 -2
- mindspore/ops/operations/_grad_ops.py +2 -76
- mindspore/ops/operations/_infer_ops.py +1 -1
- mindspore/ops/operations/_inner_ops.py +71 -94
- mindspore/ops/operations/array_ops.py +14 -146
- mindspore/ops/operations/comm_ops.py +63 -53
- mindspore/ops/operations/custom_ops.py +83 -19
- mindspore/ops/operations/debug_ops.py +42 -10
- mindspore/ops/operations/manually_defined/_inner.py +12 -0
- mindspore/ops/operations/manually_defined/ops_def.py +273 -20
- mindspore/ops/operations/math_ops.py +12 -223
- mindspore/ops/operations/nn_ops.py +20 -114
- mindspore/ops/operations/other_ops.py +7 -4
- mindspore/ops/operations/random_ops.py +46 -1
- mindspore/ops/primitive.py +18 -6
- mindspore/ops_generate/arg_dtype_cast.py +2 -0
- mindspore/ops_generate/gen_aclnn_implement.py +11 -11
- mindspore/ops_generate/gen_constants.py +36 -0
- mindspore/ops_generate/gen_ops.py +67 -52
- mindspore/ops_generate/gen_ops_inner_prim.py +1 -1
- mindspore/ops_generate/gen_pyboost_func.py +131 -47
- mindspore/ops_generate/op_proto.py +10 -3
- mindspore/ops_generate/pyboost_utils.py +14 -1
- mindspore/ops_generate/template.py +43 -21
- mindspore/parallel/__init__.py +3 -1
- mindspore/parallel/_auto_parallel_context.py +31 -9
- mindspore/parallel/_cell_wrapper.py +85 -0
- mindspore/parallel/_parallel_serialization.py +47 -19
- mindspore/parallel/_tensor.py +127 -13
- mindspore/parallel/_utils.py +53 -22
- mindspore/parallel/algo_parameter_config.py +5 -5
- mindspore/parallel/checkpoint_transform.py +46 -39
- mindspore/parallel/cluster/process_entity/__init__.py +1 -1
- mindspore/parallel/cluster/process_entity/_api.py +31 -23
- mindspore/parallel/cluster/process_entity/_utils.py +2 -27
- mindspore/parallel/parameter_broadcast.py +3 -4
- mindspore/parallel/shard.py +162 -31
- mindspore/parallel/transform_safetensors.py +1146 -0
- mindspore/profiler/__init__.py +2 -1
- mindspore/profiler/common/constant.py +29 -0
- mindspore/profiler/common/registry.py +47 -0
- mindspore/profiler/common/util.py +28 -0
- mindspore/profiler/dynamic_profiler.py +694 -0
- mindspore/profiler/envprofiling.py +17 -19
- mindspore/profiler/parser/ascend_analysis/constant.py +18 -0
- mindspore/profiler/parser/ascend_analysis/file_manager.py +25 -4
- mindspore/profiler/parser/ascend_analysis/function_event.py +43 -19
- mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +31 -26
- mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +56 -10
- mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +55 -8
- mindspore/profiler/parser/ascend_analysis/path_manager.py +313 -0
- mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +27 -20
- mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +9 -2
- mindspore/profiler/parser/ascend_msprof_exporter.py +5 -4
- mindspore/profiler/parser/ascend_timeline_generator.py +27 -25
- mindspore/profiler/parser/base_timeline_generator.py +19 -25
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +25 -12
- mindspore/profiler/parser/framework_parser.py +1 -391
- mindspore/profiler/parser/gpu_analysis/__init__.py +14 -0
- mindspore/profiler/parser/gpu_analysis/function_event.py +44 -0
- mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +89 -0
- mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +72 -0
- mindspore/profiler/parser/memory_usage_parser.py +0 -154
- mindspore/profiler/parser/profiler_info.py +78 -6
- mindspore/profiler/profiler.py +153 -0
- mindspore/profiler/profiling.py +285 -413
- mindspore/rewrite/__init__.py +1 -2
- mindspore/rewrite/common/namespace.py +4 -4
- mindspore/rewrite/symbol_tree/symbol_tree.py +3 -3
- mindspore/run_check/_check_version.py +39 -104
- mindspore/safeguard/rewrite_obfuscation.py +591 -247
- mindspore/swresample-4.dll +0 -0
- mindspore/swscale-6.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +4 -3
- mindspore/train/_utils.py +105 -19
- mindspore/train/amp.py +171 -53
- mindspore/train/callback/__init__.py +2 -2
- mindspore/train/callback/_callback.py +4 -4
- mindspore/train/callback/_checkpoint.py +97 -31
- mindspore/train/callback/_cluster_monitor.py +1 -1
- mindspore/train/callback/_flops_collector.py +1 -0
- mindspore/train/callback/_loss_monitor.py +3 -3
- mindspore/train/callback/_on_request_exit.py +145 -31
- mindspore/train/callback/_summary_collector.py +5 -5
- mindspore/train/callback/_tft_register.py +375 -0
- mindspore/train/dataset_helper.py +15 -3
- mindspore/train/metrics/metric.py +3 -3
- mindspore/train/metrics/roc.py +4 -4
- mindspore/train/mind_ir_pb2.py +44 -39
- mindspore/train/model.py +154 -58
- mindspore/train/serialization.py +342 -128
- mindspore/turbojpeg.dll +0 -0
- mindspore/utils/__init__.py +21 -0
- mindspore/utils/utils.py +60 -0
- mindspore/version.py +1 -1
- {mindspore-2.3.0.dist-info → mindspore-2.4.1.dist-info}/METADATA +13 -7
- {mindspore-2.3.0.dist-info → mindspore-2.4.1.dist-info}/RECORD +260 -254
- {mindspore-2.3.0.dist-info → mindspore-2.4.1.dist-info}/WHEEL +1 -1
- mindspore/include/c_api/ms/abstract.h +0 -67
- mindspore/include/c_api/ms/attribute.h +0 -197
- mindspore/include/c_api/ms/base/handle_types.h +0 -43
- mindspore/include/c_api/ms/base/macros.h +0 -32
- mindspore/include/c_api/ms/base/status.h +0 -33
- mindspore/include/c_api/ms/base/types.h +0 -283
- mindspore/include/c_api/ms/context.h +0 -102
- mindspore/include/c_api/ms/graph.h +0 -160
- mindspore/include/c_api/ms/node.h +0 -606
- mindspore/include/c_api/ms/tensor.h +0 -161
- mindspore/include/c_api/ms/value.h +0 -84
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/nn/extend/basic.py +0 -140
- mindspore/nn/extend/embedding.py +0 -143
- mindspore/nn/extend/layer/normalization.py +0 -109
- mindspore/nn/extend/pooling.py +0 -117
- mindspore/nn/layer/embedding_service.py +0 -531
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +0 -93
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +0 -66
- mindspore/ops/extend/__init__.py +0 -53
- mindspore/ops/extend/array_func.py +0 -218
- mindspore/ops/extend/math_func.py +0 -76
- mindspore/ops/extend/nn_func.py +0 -308
- mindspore/ops/silent_check.py +0 -162
- mindspore/profiler/parser/msadvisor_analyzer.py +0 -82
- mindspore/profiler/parser/msadvisor_parser.py +0 -240
- mindspore/train/callback/_mindio_ttp.py +0 -443
- {mindspore-2.3.0.dist-info → mindspore-2.4.1.dist-info}/entry_points.txt +0 -0
- {mindspore-2.3.0.dist-info → mindspore-2.4.1.dist-info}/top_level.txt +0 -0
mindspore/ops/function/vmap_func.py CHANGED

@@ -27,8 +27,9 @@ def vmap(fn, in_axes=0, out_axes=0):
     Vmap is pioneered by Jax and it removes the restriction of batch dimension on the operator, and provides a
     more convenient and unified operator expression. Moreover, it allows users to composite with other functional
     modules such as :func:`mindspore.grad`, to improve the development efficiency, please refer to the
-    `Automatic Vectorization (Vmap) <https://www.mindspore.cn/
-    for more detail.
+    `Automatic Vectorization (Vmap) <https://www.mindspore.cn/docs/en/master/model_train/train_process/optimize/vmap.html>`_
+    tutorial for more detail.
+    In addition, the vectorizing map does not execute loops outside the function, but sinks loops
     into the primitive operations of the function for better performance. When combined with `Graph Kernel Fusion`,
     operational efficiency would be further improved.
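The docstring change above describes composing vmap with :func:`mindspore.grad`; a minimal sketch of that pattern (function, shapes, and values are illustrative, not taken from the diff):

```python
import mindspore as ms
import mindspore.numpy as mnp

def scalar_fn(x, w):
    # Per-sample scalar loss: dot product of one sample with the shared weights.
    return (x * w).sum()

# Differentiate w.r.t. x, then vectorize over the leading batch axis of x
# while broadcasting w to every sample.
batched_grad = ms.vmap(ms.grad(scalar_fn, grad_position=0), in_axes=(0, None))

x = mnp.ones((4, 3))
w = mnp.arange(3).astype(ms.float32)
print(batched_grad(x, w).shape)  # (4, 3): one gradient row per sample
```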
mindspore/ops/functional.py CHANGED
@@ -1,6 +1,6 @@
 # This is the Python adaptation and derivative work of Myia (https://github.com/mila-iqia/myia/).
 #
-# Copyright 2021-
+# Copyright 2021-2024 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -19,7 +19,7 @@
 from mindspore.common._register_for_tensor import tensor_operator_registry
 from mindspore.ops import _constants
 from mindspore.ops.function import *
-from mindspore.ops.function.array_func import
+from mindspore.ops.function.array_func import chunk_ext, zero_
 from mindspore.ops.function.math_func import all, argmax_ext
 from mindspore.ops.function.random_func import uniform_ext
 from mindspore.ops import operations as P
@@ -34,14 +34,15 @@ from mindspore.ops.operations.math_ops import Roll
 from mindspore.ops.composite.math_ops import mm
 from mindspore.ops.function.math_func import dot
 from mindspore.ops import auto_generate
+from mindspore.ops.auto_generate import cast
 from mindspore.ops_generate.gen_ops_inner_prim import DtypeToEnum
-from mindspore.ops.operations.manually_defined.ops_def import scalar_div, scalar_mod, scalar_add, scalar_mul
-    scalar_sub, scalar_gt, scalar_ge, scalar_le, scalar_lt, scalar_eq, scalar_floordiv, scalar_log, scalar_pow
+from mindspore.ops.operations.manually_defined.ops_def import scalar_div, scalar_mod, scalar_add, scalar_mul, \
+    scalar_sub, scalar_gt, scalar_ge, scalar_le, scalar_lt, scalar_eq, scalar_floordiv, scalar_log, scalar_pow, \
     scalar_uadd, scalar_usub, flash_attention_score

 typeof = Primitive('typeof')
 hastype = Primitive('hastype')
-
+_cast = P.Cast()
 dtype = P.DType()
 isconstant = _inner_ops.IsConstant()
 isconstant.set_const_prim(True)
@@ -116,7 +117,8 @@ reduced_shape = Primitive("reduced_shape")
 # shape_mul:input must be shape multiply elements in tuple(shape)
 shape_mul = _sequence_ops.shape_mul()

-setattr(tensor_operator_registry, 'tuple_to_tensor',
+setattr(tensor_operator_registry, 'tuple_to_tensor',
+        _sequence_ops.TupleToTensor)
 setattr(tensor_operator_registry, 'add', add)
 setattr(tensor_operator_registry, 'softmax', softmax)
 setattr(tensor_operator_registry, 'addr', addr)
@@ -136,6 +138,7 @@ setattr(tensor_operator_registry, 'rsqrt', rsqrt)
 setattr(tensor_operator_registry, 'bincount', bincount)
 setattr(tensor_operator_registry, 'slogdet', slogdet)
 setattr(tensor_operator_registry, 'trace', trace)
+setattr(tensor_operator_registry, 'tracev2', auto_generate.trace_v2_op)
 setattr(tensor_operator_registry, 'tril', tril)
 setattr(tensor_operator_registry, 'chunk', chunk)
 setattr(tensor_operator_registry, 'count_nonzero', count_nonzero)
@@ -210,7 +213,8 @@ setattr(tensor_operator_registry, 'dot', dot)
 setattr(tensor_operator_registry, 'outer', outer)
 setattr(tensor_operator_registry, 'log1p', log1p)
 setattr(tensor_operator_registry, 'logdet', logdet)
-setattr(tensor_operator_registry,
+setattr(tensor_operator_registry,
+        'log_matrix_determinant', log_matrix_determinant)
 setattr(tensor_operator_registry, 'matrix_determinant', matrix_determinant)
 setattr(tensor_operator_registry, 'ceil', ceil)
 setattr(tensor_operator_registry, 'fillv2', P.FillV2)
@@ -223,6 +227,7 @@ setattr(tensor_operator_registry, 'vsplit', vsplit)
 setattr(tensor_operator_registry, 'hsplit', hsplit)
 setattr(tensor_operator_registry, 'dsplit', dsplit)
 setattr(tensor_operator_registry, 'zeros_like', zeros_like)
+setattr(tensor_operator_registry, 'zero_', zero_)
 setattr(tensor_operator_registry, 'scalar_to_tensor', scalar_to_tensor)
 setattr(tensor_operator_registry, 'stop_gradient', stop_gradient)
 setattr(tensor_operator_registry, 'masked_fill', masked_fill)
@@ -264,6 +269,7 @@ setattr(tensor_operator_registry, 'tanh', tanh)
 setattr(tensor_operator_registry, 'exp', exp)
 setattr(tensor_operator_registry, 'addbmm', addbmm)
 setattr(tensor_operator_registry, 'addmm', addmm)
+setattr(tensor_operator_registry, 'addmm_', auto_generate.inplace_addmm_op)
 setattr(tensor_operator_registry, 'addmv', addmv)
 setattr(tensor_operator_registry, 'adjoint', adjoint)
 setattr(tensor_operator_registry, 'asinh', asinh)
@@ -314,7 +320,7 @@ setattr(tensor_operator_registry, 'unsqueeze', unsqueeze)
 setattr(tensor_operator_registry, 'expand_dims', expand_dims)
 setattr(tensor_operator_registry, 'contiguous', auto_generate.contiguous)
 # support GE backend for no compare operators
-setattr(tensor_operator_registry, 'cast',
+setattr(tensor_operator_registry, 'cast', _cast)
 setattr(tensor_operator_registry, 'shape_mul', shape_mul)
 setattr(tensor_operator_registry, 'concatenate', concat)
 setattr(tensor_operator_registry, 'fill', fill)
@@ -392,12 +398,13 @@ setattr(tensor_operator_registry, 'argwhere', argwhere)
 setattr(tensor_operator_registry, 'coo_add', coo_add)
 setattr(tensor_operator_registry, 'topk', topk)
 setattr(tensor_operator_registry, 'isfinite', isfinite)
-setattr(tensor_operator_registry, 'to',
-setattr(tensor_operator_registry, 'bool',
-setattr(tensor_operator_registry, 'float',
-setattr(tensor_operator_registry, 'half',
-setattr(tensor_operator_registry, 'int',
-setattr(tensor_operator_registry, 'long',
+setattr(tensor_operator_registry, 'to', _cast)
+setattr(tensor_operator_registry, 'bool', _cast)
+setattr(tensor_operator_registry, 'float', _cast)
+setattr(tensor_operator_registry, 'half', _cast)
+setattr(tensor_operator_registry, 'int', _cast)
+setattr(tensor_operator_registry, 'long', _cast)
+setattr(tensor_operator_registry, 'byte', _cast)
 setattr(tensor_operator_registry, 'cholesky', cholesky)
 setattr(tensor_operator_registry, 'cholesky_inverse', cholesky_inverse)
 setattr(tensor_operator_registry, 'cholesky_solve', cholesky_solve)
@@ -440,6 +447,9 @@ setattr(tensor_operator_registry, 'imag', imag)
 setattr(tensor_operator_registry, 'repeat_interleave', repeat_interleave)
 setattr(tensor_operator_registry, 'rad2deg', rad2deg)
 setattr(tensor_operator_registry, 'deg2rad', deg2rad)
+setattr(tensor_operator_registry, 'copy_', auto_generate.copy_ext)
+setattr(tensor_operator_registry, 'add_', auto_generate.inplace_add_ext)
+setattr(tensor_operator_registry, 'adds_', auto_generate.inplace_adds_ext)
 setattr(tensor_operator_registry, 'copysign', copysign)
 setattr(tensor_operator_registry, 'roll', Roll)
 setattr(tensor_operator_registry, 'rot90', rot90)
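The registry entries above back Tensor conversion methods such as Tensor.to(), Tensor.float() and Tensor.int(), all of which now route to a single Cast primitive. A minimal sketch of the equivalent public-API behaviour (values are illustrative):

```python
import mindspore as ms
from mindspore import Tensor, ops

x = Tensor([[1.5, 2.5]], ms.float32)

y = x.int()                  # dtype-conversion method, dispatched through the registry
z = ops.cast(x, ms.float16)  # explicit functional cast
print(y.dtype, z.dtype)      # Int32 Float16
```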
mindspore/ops/operations/custom_ops.py CHANGED

@@ -82,7 +82,7 @@ class _CustomInstaller:
         for dir_name in dir_names:
             if not os.path.isdir(dir_name):
                 try:
-                    os.makedirs(dir_name, exist_ok=True)
+                    os.makedirs(dir_name, mode=0o700, exist_ok=True)
                 except OSError as err:
                     if err.errno == 17:  # File exists
                         pass
@@ -121,7 +121,7 @@ class _CustomInstaller:

     def _find_ai_cpu_so_path(self, so_file):
         """find the absolute path of so"""
-        current_path = os.path.dirname(os.path.
+        current_path = os.path.dirname(os.path.realpath(__file__))
         search_paths = [current_path + "/../lib", current_path + "/../lib/plugin/ascend"]
         for path in search_paths:
             so_path = os.path.join(path, so_file)
@@ -235,7 +235,7 @@ class _CustomInstaller:
         # generate and copy reg info file
         op_info = self._gen_ai_core_reg_info(imply_path, self.func.__name__)
         self._copy_file(imply_path, self.ai_core_impl_dir)
-        for arc_name in ["ascend910", "ascend910b", "
+        for arc_name in ["ascend910", "ascend910b", "ascend910_93", "ascend310p"]:
             arc_dir = os.path.join(self.ai_core_config_dir, arc_name)
             _CustomInstaller._create_dir(arc_dir)
             self._save_op_info(arc_dir, "aic-{}-ops-info.json".format(arc_name), op_info)
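The makedirs change above tightens permissions on directories created by the custom-op installer. A small, generic sketch of the same pattern (the path is hypothetical, not from the package):

```python
import os
import stat

# Owner-only directory; exist_ok=True makes a pre-existing directory a no-op,
# so the errno 17 ("File exists") fallback is only needed for other OSErrors.
cache_dir = os.path.expanduser("~/.my_tool/cache")  # hypothetical path
os.makedirs(cache_dir, mode=0o700, exist_ok=True)
print(stat.filemode(os.stat(cache_dir).st_mode))  # typically 'drwx------'
```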
mindspore/ops/operations/__init__.py CHANGED

@@ -55,7 +55,7 @@ from .comm_ops import (AllGather, AllReduce, Reduce, NeighborExchange, NeighborE
                        _MirrorOperator, _MirrorMiniStepOperator, _MiniStepAllGather, ReduceOp, _VirtualDataset,
                        _VirtualOutput, _VirtualDiv, _GetTensorSlice, _VirtualAdd, _VirtualAssignAdd, _VirtualAccuGrad,
                        _HostAllGather, _HostReduceScatter, _MirrorMicroStepOperator, _MicroStepAllGather,
-                       _VirtualPipelineEnd, AlltoAllV, ReduceScatter)
+                       _VirtualPipelineEnd, AlltoAllV, ReduceScatter, _VirtualAssignKvCache)
 from .control_ops import GeSwitch, Merge
 from .custom_ops import (Custom)
 from .debug_ops import (ImageSummary, InsertGradientOf, HookBackward, ScalarSummary,
@@ -96,7 +96,7 @@ from .nn_ops import (LSTM, SGD, Adam, AdamWeightDecay, FusedSparseAdam, FusedSpa
                      InstanceNorm,
                      GeLU, FastGeLU, Elu, CeLU,
                      GetNext, L2Normalize, LayerNorm, L2Loss, CTCLoss, CTCLossV2, CTCLossV2Grad, CTCGreedyDecoder,
-                     LogSoftmax, MaxPool3D, AvgPool3D,
+                     LogSoftmax, LogSoftmaxExt, MaxPool3D, AvgPool3D,
                      MaxPool, DataFormatDimMap,
                      AvgPool, Conv2DBackpropInput, ComputeAccidentalHits,
                      MaxPoolWithArgmaxV2, OneHot, Pad, MirrorPad, Mish, PReLU, ReLU, ReLU6,
@@ -136,6 +136,7 @@ from ..deprecated import (identity, DropoutDoMask, MaxPoolWithArgmax, DropoutGen
                           TensorAdd, InplaceUpdate, ScatterNonAliasingAdd,
                           BatchToSpaceND, Unpack, GatherV2, DynamicShape, ScalarToArray, Pack)
 from .manually_defined._inner import ScalarCast
+from .manually_defined import WhileLoop, Scan, ForiLoop
 from .reshard_ops import (Reshard)

 __all__ = [
@@ -203,6 +204,7 @@ __all__ = [
     'Softmax',
     'Softsign',
     'LogSoftmax',
+    'LogSoftmaxExt',
     'SoftmaxCrossEntropyWithLogits',
     'BCEWithLogitsLoss',
     'ROIAlign',
@@ -337,6 +339,9 @@ __all__ = [
     'TupleToArray',
     'GeSwitch',
     'Merge',
+    'WhileLoop',
+    'Scan',
+    'ForiLoop',
     'CheckValid',
     'BartlettWindow',
     'BlackmanWindow',
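WhileLoop, Scan and ForiLoop are newly exported control-flow primitives. A sketch of ForiLoop usage, assuming it follows a JAX-style (lower, upper, body, init) calling convention; treat the exact signature as an assumption, not a confirmed API:

```python
import mindspore as ms
from mindspore import Tensor, ops

def body(i, carry):
    # Fold the loop index into the carried value.
    return carry + i

# Assumed calling convention: instantiate once, then call with
# (lower, upper, body_fn, init_value) and receive the final carry.
fori_loop = ops.ForiLoop()
result = fori_loop(0, 5, body, Tensor(0, ms.int32))
print(result)  # 0 + 1 + 2 + 3 + 4 = 10
```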
mindspore/ops/operations/_grad_ops.py CHANGED

@@ -35,8 +35,8 @@ from ..auto_generate import (AbsGrad, ACosGrad, LogitGrad, AcoshGrad, AsinGrad,
                              SigmoidGrad, HSwishGrad, NLLLossGrad, AtanGrad, GridSampler3DGrad, GridSampler2DGrad,
                              ResizeBicubicGrad, HSigmoidGrad, CholeskyGrad, ResizeNearestNeighborGrad, LayerNormGrad,
                              HShrinkGrad, LayerNormGradGrad, SiLUGrad, MaximumGrad, MaximumGradGrad, RmsNormGrad,
-                             FlashAttentionScoreGrad, UpsampleTrilinear3DGrad, UpsampleNearest3DGrad,
-                             BinaryCrossEntropyGrad)
+                             FlashAttentionScoreGrad, UpsampleTrilinear3DGrad, UpsampleNearest3DGrad, MaskedSelectGrad,
+                             BinaryCrossEntropyGrad, SoftShrinkGrad, SeluGrad)


 class SparseFillEmptyRowsGrad(Primitive):
@@ -1658,35 +1658,6 @@ class SoftMarginLossGrad(Primitive):
         self.reduction = validator.check_string(reduction, ['none', 'sum', 'mean'], 'reduction', self.name)


-class StridedSliceV2Grad(Primitive):
-    """
-    Performs grad of StridedSliceV2 operation.
-
-    Inputs:
-        - **shapex** (Tensor) - StridedSliceV2 shape of input
-        - **begin** (tuple[int]) - A tuple which represents the location where to start. Only
-          constant value is allowed.
-        - **end** (tuple[int]) - A tuple or which represents the maximum location where to end.
-          Only constant value is allowed.
-        - **strides** (tuple[int]) - A tuple which represents the stride is continuously added
-          before reaching the maximum location. Only constant value is allowed.
-        - **dy** (Tensor) - The output of StridedSliceV2
-
-    Outputs:
-        Tensor, the shape same as the input of StridedSliceV2
-    """
-
-    @prim_attr_register
-    def __init__(self,
-                 begin_mask=0,
-                 end_mask=0,
-                 ellipsis_mask=0,
-                 new_axis_mask=0,
-                 shrink_axis_mask=0):
-        """Initialize StridedSliceV2Grad"""
-        self.init_prim_io_names(inputs=['shapex', 'begin', 'end', 'strides', 'dy'], outputs=['output'])
-
-
 class StridedSliceGrad(Primitive):
     """
     Performs grad of StridedSlice operation.
@@ -1991,51 +1962,6 @@ class MvlgammaGrad(Primitive):
         self.p = validator.check_value_type('p', p, [int], self.name)


-class MaskedSelectGrad(PrimitiveWithInfer):
-    """Computes gradient for MaskedSelect."""
-
-    @prim_attr_register
-    def __init__(self):
-        pass
-
-    def infer_shape(self, x, mask, grad):
-        return x
-
-    def infer_dtype(self, x, mask, grad):
-        return x
-
-
-class SoftShrinkGrad(Primitive):
-    r"""
-    Gradients for SoftShrink operation.
-
-    Args:
-        lambd - The \lambda (must be no less than zero) value for the Softshrink formulation. Default: 0.5.
-
-    Inputs:
-        - **input_grad** (Tensor) - The input gradient.
-        - **input_x** (Tensor) - The input of SoftShrink with data type of float16 or float32.
-          Any number of additional dimensions.
-
-    Outputs:
-        output - Tensor, has the same shape and data type as input_x.
-
-    Raises:
-        TypeError: If lambd is not a float.
-        TypeError: If dtype of input_x is neither float16 nor float32.
-        ValueError: If lambd is less than to 0.
-
-    Supported Platforms:
-        ``Ascend``
-    """
-
-    @prim_attr_register
-    def __init__(self, lambd=0.5):
-        self.init_prim_io_names(inputs=['input_grad', 'input_x'], outputs=['output'])
-        validator.check_value_type("lambd", lambd, [float], self.name)
-        validator.check_number("lambd", lambd, 0, validator.GE, self.name)
-
-
 class CdistGrad(Primitive):
     """Computes gradient for Cdist."""

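The handwritten MaskedSelectGrad and SoftShrinkGrad primitives are dropped here in favour of the generated ones imported at the top of the hunk; the user-facing op is unchanged. A short forward/backward sketch using the public API (values illustrative):

```python
import mindspore as ms
from mindspore import Tensor, ops

x = Tensor([[1.0, 2.0], [3.0, 4.0]], ms.float32)
mask = Tensor([[True, False], [True, False]])

def select_sum(inp):
    # masked_select flattens the selected elements into a 1-D tensor.
    return ops.masked_select(inp, mask).sum()

print(select_sum(x))           # 4.0
print(ms.grad(select_sum)(x))  # ones where mask is True, zeros elsewhere
```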
mindspore/ops/operations/_infer_ops.py CHANGED

@@ -16,4 +16,4 @@
 """Operator of infer net"""
 # pylint: disable=unused-import
 from ..auto_generate import (QuantV2, DynamicQuantExt, QuantBatchMatmul, WeightQuantBatchMatmul, KVCacheScatterUpdate,
-                             FusedInferAttentionScore, GroupedMatmul, MoeFinalizeRouting)
+                             FusedInferAttentionScore, GroupedMatmul, MoeFinalizeRouting, QuantLinearSparse)
mindspore/ops/operations/_inner_ops.py CHANGED

@@ -17,6 +17,7 @@
 from types import FunctionType, MethodType
 from collections.abc import Iterable
 import os
+import weakref
 import numpy as np

 from mindspore.common import Tensor
@@ -29,7 +30,7 @@ from mindspore.ops.operations.math_ops import _infer_shape_reduce
 from mindspore.ops.primitive import PrimitiveWithCheck, PrimitiveWithInfer, prim_attr_register, Primitive, \
     _run_op, _check_contains_variable
 from mindspore._c_expression import Tensor as Tensor_
-from mindspore._c_expression import typing
+from mindspore._c_expression import typing, HookType
 from mindspore import _checkparam as validator
 from mindspore.common import dtype as mstype
 from mindspore.common.parameter import Parameter
@@ -1535,7 +1536,7 @@ class CellBackwardHook(PrimitiveWithInfer):
     ...         print(grad)
     ...
     >>> hook = inner.CellBackwardHook()
-    >>> hook_fn_key = hook.register_backward_hook(
+    >>> hook_fn_key = hook.register_backward_hook()
     >>> def hook_test(x, y):
     ...     z = x * y
     ...     z = hook(z)
@@ -1556,16 +1557,19 @@ class CellBackwardHook(PrimitiveWithInfer):
     (Tensor(shape=[], dtype=Float32, value= 4), Tensor(shape=[], dtype=Float32, value= 4))
     """

-    def __init__(self, cell_id=""):
+    def __init__(self, cell_id="", cell=None, hook_dict=None):
         """Initialize CellBackwardHook"""
         super(CellBackwardHook, self).__init__(self.__class__.__name__)
         self.cell_id = cell_id
+        self.cell = cell
+        self.hook_dict = weakref.ref(hook_dict)
         self.add_prim_attr("cell_id", cell_id)
-        self.
+        self.grad_output = None

-    def __call__(self, args):
-
-
+    def __call__(self, *args):
+        # If args is empty, just return.
+        if not args:
+            return args
         return _run_op(self, self.name, args)

     def infer_shape(self, *inputs_shape):
@@ -1578,51 +1582,76 @@ class CellBackwardHook(PrimitiveWithInfer):
             return inputs_type[0]
         return inputs_type

-    def register_backward_hook(self
-
-
-        mode.
-
-        Note:
-            The 'hook_fn' must be defined as the following code.
-            `cell_id` is the information of registered cell. `grad_input` is the gradient passed to the cell.
-            `grad_output` is the gradient computed and passed to the next cell or primitive, which may be modified by
-            returning a new output gradient.
-            The 'hook_fn' should have the following signature:
-            hook_fn(cell_id, grad_input, grad_output) -> New output gradient or none.
-            The 'hook_fn' is executed in the python environment.
+    def register_backward_hook(self):
+        """
+        Register the backward hook function.

         Args:
-
+            None

         Returns:
-
-
-
+            None
+
+        Supported Platforms:
+            ``Ascend`` ``GPU`` ``CPU``
         """
-        if not isinstance(hook_fn, (FunctionType, MethodType)):
-            raise TypeError(f"When using 'register_backward_hook(hook_fn)', the type of 'hook_fn' must be python "
-                            f"function, but got {type(hook_fn)}.")
-        key = self.add_backward_hook_fn(hook_fn)
-        return key

-
-
-
-
-
-
-
-
+        def hook_backward_grad(grad):
+            if self.grad_output is None:
+                self.grad_output = grad
+                # Indicates the first time of call backward hook, and need to wait for the second time call
+                return self.cell_id
+            backward_hook_grad_input = grad
+            if self.hook_dict():
+                backward_hooks = self.hook_dict().values()
+                for hook in backward_hooks:
+                    res = hook(self.cell, backward_hook_grad_input, self.grad_output)
+                    if res is None:
+                        continue
+                    if not isinstance(res, tuple):
+                        res = (res,)
+                    if len(res) != len(grad):
+                        raise TypeError(
+                            "The backward hook return value size is {} not equal to expect grad input size {}".format(
+                                len(res), len(grad)))
+                    backward_hook_grad_input = res
+            self.grad_output = None
+            return backward_hook_grad_input
+
+        self.set_hook_fn(hook_backward_grad, HookType.BackwardHook)
+
+    def register_backward_pre_hook(self):
+        """
+        Register the backward pre hook function.

         Args:
-
+            None

         Returns:
-            None
+            None
+
+        Supported Platforms:
+            ``Ascend`` ``GPU`` ``CPU``
         """
-
+
+        def hook_backward_pre_grad(grad):
+            backward_pre_hook_grad = grad
+            if self.hook_dict():
+                backward_pre_hooks = self.hook_dict().values()
+                for hook in backward_pre_hooks:
+                    res = hook(self.cell, backward_pre_hook_grad)
+                    if res is None:
+                        continue
+                    if not isinstance(res, tuple):
+                        res = (res,)
+                    if len(res) != len(grad):
+                        raise TypeError(
+                            "The backward pre hook return value size is {} not equal to expect output size {}".format(
+                                len(res), len(grad)))
+                    backward_pre_hook_grad = res
+            return backward_pre_hook_grad
+
+        self.set_hook_fn(hook_backward_pre_grad, HookType.BackwardPreHook)


 class Format(PrimitiveWithInfer):
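These CellBackwardHook changes move hook bookkeeping into the primitive (a weak reference to the cell's hook dict plus HookType registration). At the nn.Cell level the user-facing pattern looks roughly like the sketch below; the hook signature (cell, grad_input, grad_output) is inferred from the hook(...) call order in the added code and should be treated as an assumption:

```python
import mindspore as ms
from mindspore import nn, Tensor

ms.set_context(mode=ms.PYNATIVE_MODE)  # backward hooks run in PyNative mode

def backward_hook(cell, grad_input, grad_output):
    # Inspect gradients flowing through the cell; return None to leave them
    # unchanged, or return new gradient(s) to override them.
    print("hook fired for", type(cell).__name__)
    return None

net = nn.Dense(3, 2)
handle = net.register_backward_hook(backward_hook)

x = Tensor([[1.0, 2.0, 3.0]], ms.float32)
_ = ms.grad(lambda inp: net(inp).sum())(x)

handle.remove()  # detach the hook when it is no longer needed
```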
@@ -2478,60 +2507,6 @@ class FFN(Primitive):
         validator.check_value_type("inner_precise", inner_precise, [int], cls_name)


-class _MirrorSilentCheck(PrimitiveWithInfer):
-    """
-    The operator _MirrorSilentCheck implements accuracy-sensitive detection on the tensor input in backpropagator.
-    Call _MirrorSilentCheck in method __call__ of derived class to implement accuracy-sensitive detection.
-
-    Inputs:
-        - **input** (Tensor) : The tensor used for detection.
-          Its data type must be mindspore.float16, mindspore.float32 or mindspore.bfloat16.
-        - **pre_val** (Parameter(Tensor)) : Support parameter in accuracy-sensitive detection.
-          Please only generated by method generate_params() of ASDBase.
-        - **min_val** (Parameter(Tensor)) : Support parameter in accuracy-sensitive detection.
-          Please only generated by method generate_params() of ASDBase.
-        - **max_val** (Parameter(Tensor)) : Support parameter in accuracy-sensitive detection.
-          Please only generated by method generate_params() of ASDBase.
-        - **cnt** (Parameter(Tensor)) : Support parameter in accuracy-sensitive detection.
-          Please only generated by method generate_params() of ASDBase.
-          After each invocation of _MirrorSilentCheck, increment the value of cnt by one.
-
-    Outputs:
-        - **output** (Tensor) - Same shape, type and value as `input`.
-    """
-    @prim_attr_register
-    def __init__(self, min_steps=8):
-        upper_thresh, sigma_thresh = self.get_thresh()
-        self.min_steps = min_steps
-        self.thresh_l1 = upper_thresh[0]
-        self.coeff_l1 = sigma_thresh[0]
-        self.thresh_l2 = upper_thresh[1]
-        self.coeff_l2 = sigma_thresh[1]
-        self.add_prim_attr('side_effect_mem', True)
-
-    def parse_thresh(self, env_var_name, default_value, min_value):
-        env_var = os.environ.get(env_var_name, default=default_value)
-        thresh = [value.strip() for value in env_var.split(",")]
-        if len(thresh) != 2 or not all(value.isdigit() for value in thresh):
-            thresh = default_value.split(",")
-        thresh = [float(max(int(value), min_value)) for value in thresh]
-        if thresh[0] <= thresh[1]:
-            thresh = [float(value) for value in default_value.split(",")]
-
-        return thresh
-
-    def get_thresh(self):
-        upper_thresh = self.parse_thresh("NPU_ASD_UPPER_THRESH", "1000000,10000", 3)
-        sigma_thresh = self.parse_thresh("NPU_ASD_SIGMA_THRESH", "100000,5000", 3)
-        return upper_thresh, sigma_thresh
-
-    def infer_shape(self, x_shape, pre_shape, min_shape, max_shape, n_step, loss_scale_shape):
-        return x_shape
-
-    def infer_dtype(self, x_dtype, pre_dtype, min_dtype, max_dtype, n_dtype, loss_scale_dtype):
-        return x_dtype
-
-
 class _VirtualConverterEnd(PrimitiveWithInfer):
     """
     Auto parallel virtual operator.
@@ -2560,6 +2535,8 @@ class _VirtualConverterBegin(PrimitiveWithInfer):
         self.output_nums = output_nums

     def infer_shape(self, arg):
+        if self.output_nums == 0:
+            return ValueError("output_nums can\'t be zero.")
         new_arg = (arg[0] / self.output_nums,) + tuple(arg[1:])
         return (new_arg,) * self.output_nums