mindspore 2.3.0-cp39-cp39-win_amd64.whl → 2.4.0-cp39-cp39-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of mindspore has been flagged as possibly problematic.
- mindspore/.commit_id +1 -1
- mindspore/__init__.py +3 -1
- mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
- mindspore/_checkparam.py +50 -9
- mindspore/_extends/parse/compile_config.py +41 -0
- mindspore/_extends/parse/parser.py +9 -7
- mindspore/_extends/parse/standard_method.py +52 -14
- mindspore/_extends/pijit/pijit_func_white_list.py +350 -24
- mindspore/amp.py +24 -10
- mindspore/avcodec-59.dll +0 -0
- mindspore/avdevice-59.dll +0 -0
- mindspore/avfilter-8.dll +0 -0
- mindspore/avformat-59.dll +0 -0
- mindspore/avutil-57.dll +0 -0
- mindspore/common/__init__.py +6 -4
- mindspore/common/_pijit_context.py +190 -0
- mindspore/common/_register_for_tensor.py +2 -1
- mindspore/common/_tensor_overload.py +139 -0
- mindspore/common/api.py +102 -87
- mindspore/common/dump.py +5 -6
- mindspore/common/generator.py +1 -7
- mindspore/common/hook_handle.py +14 -26
- mindspore/common/mindir_util.py +2 -2
- mindspore/common/parameter.py +46 -13
- mindspore/common/recompute.py +39 -9
- mindspore/common/sparse_tensor.py +7 -3
- mindspore/common/tensor.py +209 -29
- mindspore/communication/__init__.py +1 -1
- mindspore/communication/_comm_helper.py +38 -3
- mindspore/communication/comm_func.py +310 -55
- mindspore/communication/management.py +14 -14
- mindspore/context.py +123 -22
- mindspore/dataset/__init__.py +1 -1
- mindspore/dataset/audio/__init__.py +1 -1
- mindspore/dataset/core/config.py +7 -0
- mindspore/dataset/core/validator_helpers.py +7 -0
- mindspore/dataset/engine/cache_client.py +1 -1
- mindspore/dataset/engine/datasets.py +72 -44
- mindspore/dataset/engine/datasets_audio.py +7 -7
- mindspore/dataset/engine/datasets_standard_format.py +53 -3
- mindspore/dataset/engine/datasets_text.py +20 -20
- mindspore/dataset/engine/datasets_user_defined.py +174 -104
- mindspore/dataset/engine/datasets_vision.py +33 -33
- mindspore/dataset/engine/iterators.py +29 -0
- mindspore/dataset/engine/obs/util.py +7 -0
- mindspore/dataset/engine/queue.py +114 -60
- mindspore/dataset/engine/serializer_deserializer.py +2 -2
- mindspore/dataset/engine/validators.py +34 -14
- mindspore/dataset/text/__init__.py +1 -4
- mindspore/dataset/transforms/__init__.py +0 -3
- mindspore/dataset/utils/line_reader.py +2 -0
- mindspore/dataset/vision/__init__.py +1 -4
- mindspore/dataset/vision/utils.py +1 -1
- mindspore/dataset/vision/validators.py +2 -1
- mindspore/dnnl.dll +0 -0
- mindspore/{nn/extend → experimental/es}/__init__.py +4 -11
- mindspore/experimental/es/embedding_service.py +883 -0
- mindspore/{nn/layer → experimental/es}/embedding_service_layer.py +218 -30
- mindspore/experimental/llm_boost/__init__.py +21 -0
- mindspore/{nn/extend/layer → experimental/llm_boost/atb}/__init__.py +4 -8
- mindspore/experimental/llm_boost/atb/boost_base.py +211 -0
- mindspore/experimental/llm_boost/atb/llama_boost.py +115 -0
- mindspore/experimental/llm_boost/atb/qwen_boost.py +101 -0
- mindspore/experimental/llm_boost/register.py +129 -0
- mindspore/experimental/llm_boost/utils.py +31 -0
- mindspore/experimental/optim/adamw.py +85 -0
- mindspore/experimental/optim/optimizer.py +3 -0
- mindspore/hal/__init__.py +3 -3
- mindspore/hal/contiguous_tensors_handle.py +175 -0
- mindspore/hal/stream.py +18 -0
- mindspore/include/api/model_group.h +13 -1
- mindspore/include/api/types.h +10 -10
- mindspore/include/dataset/config.h +2 -2
- mindspore/include/dataset/constants.h +2 -2
- mindspore/include/dataset/execute.h +2 -2
- mindspore/include/dataset/vision.h +4 -0
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +1 -1
- mindspore/mindrecord/filewriter.py +68 -51
- mindspore/mindspore_backend.dll +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_np_dtype.dll +0 -0
- mindspore/mindspore_ops.dll +0 -0
- mindspore/mint/__init__.py +495 -46
- mindspore/mint/distributed/__init__.py +31 -0
- mindspore/mint/distributed/distributed.py +254 -0
- mindspore/mint/nn/__init__.py +266 -21
- mindspore/mint/nn/functional.py +125 -19
- mindspore/mint/nn/layer/__init__.py +39 -0
- mindspore/mint/nn/layer/activation.py +133 -0
- mindspore/mint/nn/layer/normalization.py +477 -0
- mindspore/mint/nn/layer/pooling.py +110 -0
- mindspore/mint/optim/adamw.py +28 -7
- mindspore/mint/special/__init__.py +63 -0
- mindspore/multiprocessing/__init__.py +2 -1
- mindspore/nn/__init__.py +0 -1
- mindspore/nn/cell.py +275 -93
- mindspore/nn/layer/activation.py +211 -44
- mindspore/nn/layer/basic.py +113 -3
- mindspore/nn/layer/embedding.py +120 -2
- mindspore/nn/layer/normalization.py +101 -5
- mindspore/nn/layer/padding.py +34 -48
- mindspore/nn/layer/pooling.py +161 -7
- mindspore/nn/layer/transformer.py +3 -3
- mindspore/nn/loss/__init__.py +2 -2
- mindspore/nn/loss/loss.py +84 -6
- mindspore/nn/optim/__init__.py +2 -1
- mindspore/nn/optim/adadelta.py +1 -1
- mindspore/nn/optim/adam.py +1 -1
- mindspore/nn/optim/lamb.py +1 -1
- mindspore/nn/optim/tft_wrapper.py +127 -0
- mindspore/nn/wrap/cell_wrapper.py +12 -23
- mindspore/nn/wrap/grad_reducer.py +5 -5
- mindspore/nn/wrap/loss_scale.py +17 -3
- mindspore/numpy/__init__.py +1 -1
- mindspore/numpy/array_creations.py +65 -68
- mindspore/numpy/array_ops.py +64 -60
- mindspore/numpy/fft.py +610 -75
- mindspore/numpy/logic_ops.py +11 -10
- mindspore/numpy/math_ops.py +85 -84
- mindspore/numpy/utils_const.py +4 -4
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +6 -4
- mindspore/ops/_grad_experimental/grad_comm_ops.py +47 -3
- mindspore/ops/_grad_experimental/grad_math_ops.py +0 -22
- mindspore/ops/_vmap/vmap_array_ops.py +2 -4
- mindspore/ops/_vmap/vmap_math_ops.py +17 -1
- mindspore/ops/_vmap/vmap_nn_ops.py +43 -2
- mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +85 -7
- mindspore/ops/auto_generate/gen_arg_dtype_cast.py +2 -0
- mindspore/ops/auto_generate/gen_extend_func.py +734 -13
- mindspore/ops/auto_generate/gen_ops_def.py +2420 -381
- mindspore/ops/auto_generate/gen_ops_prim.py +5196 -1659
- mindspore/ops/auto_generate/pyboost_inner_prim.py +176 -56
- mindspore/ops/composite/base.py +85 -48
- mindspore/ops/composite/multitype_ops/_compile_utils.py +1 -0
- mindspore/ops/composite/multitype_ops/not_in_impl.py +2 -2
- mindspore/ops/function/__init__.py +22 -0
- mindspore/ops/function/array_func.py +490 -153
- mindspore/ops/function/debug_func.py +113 -1
- mindspore/ops/function/fft_func.py +15 -2
- mindspore/ops/function/grad/grad_func.py +3 -2
- mindspore/ops/function/math_func.py +558 -207
- mindspore/ops/function/nn_func.py +817 -383
- mindspore/ops/function/other_func.py +3 -2
- mindspore/ops/function/random_func.py +184 -8
- mindspore/ops/function/reshard_func.py +13 -11
- mindspore/ops/function/sparse_unary_func.py +1 -1
- mindspore/ops/function/vmap_func.py +3 -2
- mindspore/ops/functional.py +24 -14
- mindspore/ops/op_info_register.py +3 -3
- mindspore/ops/operations/__init__.py +6 -1
- mindspore/ops/operations/_grad_ops.py +2 -76
- mindspore/ops/operations/_infer_ops.py +1 -1
- mindspore/ops/operations/_inner_ops.py +71 -94
- mindspore/ops/operations/array_ops.py +12 -146
- mindspore/ops/operations/comm_ops.py +42 -53
- mindspore/ops/operations/custom_ops.py +83 -19
- mindspore/ops/operations/debug_ops.py +42 -10
- mindspore/ops/operations/manually_defined/_inner.py +12 -0
- mindspore/ops/operations/manually_defined/ops_def.py +265 -10
- mindspore/ops/operations/math_ops.py +12 -223
- mindspore/ops/operations/nn_ops.py +20 -114
- mindspore/ops/operations/other_ops.py +7 -4
- mindspore/ops/operations/random_ops.py +46 -1
- mindspore/ops/primitive.py +18 -6
- mindspore/ops_generate/arg_dtype_cast.py +2 -0
- mindspore/ops_generate/gen_aclnn_implement.py +11 -11
- mindspore/ops_generate/gen_constants.py +36 -0
- mindspore/ops_generate/gen_ops.py +67 -52
- mindspore/ops_generate/gen_ops_inner_prim.py +1 -1
- mindspore/ops_generate/gen_pyboost_func.py +131 -47
- mindspore/ops_generate/op_proto.py +10 -3
- mindspore/ops_generate/pyboost_utils.py +14 -1
- mindspore/ops_generate/template.py +43 -21
- mindspore/parallel/__init__.py +3 -1
- mindspore/parallel/_auto_parallel_context.py +28 -8
- mindspore/parallel/_cell_wrapper.py +83 -0
- mindspore/parallel/_parallel_serialization.py +47 -19
- mindspore/parallel/_tensor.py +81 -11
- mindspore/parallel/_utils.py +13 -1
- mindspore/parallel/algo_parameter_config.py +5 -5
- mindspore/parallel/checkpoint_transform.py +46 -39
- mindspore/parallel/cluster/process_entity/__init__.py +1 -1
- mindspore/parallel/cluster/process_entity/_api.py +31 -23
- mindspore/parallel/cluster/process_entity/_utils.py +2 -27
- mindspore/parallel/parameter_broadcast.py +3 -4
- mindspore/parallel/shard.py +162 -31
- mindspore/parallel/transform_safetensors.py +993 -0
- mindspore/profiler/__init__.py +2 -1
- mindspore/profiler/common/constant.py +29 -0
- mindspore/profiler/common/registry.py +47 -0
- mindspore/profiler/common/util.py +28 -0
- mindspore/profiler/dynamic_profiler.py +694 -0
- mindspore/profiler/envprofiling.py +17 -19
- mindspore/profiler/parser/ascend_analysis/constant.py +18 -0
- mindspore/profiler/parser/ascend_analysis/file_manager.py +25 -4
- mindspore/profiler/parser/ascend_analysis/function_event.py +43 -19
- mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +31 -26
- mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +56 -10
- mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +55 -8
- mindspore/profiler/parser/ascend_analysis/path_manager.py +313 -0
- mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +27 -20
- mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +9 -2
- mindspore/profiler/parser/ascend_msprof_exporter.py +5 -4
- mindspore/profiler/parser/ascend_timeline_generator.py +27 -25
- mindspore/profiler/parser/base_timeline_generator.py +19 -25
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +25 -12
- mindspore/profiler/parser/framework_parser.py +1 -391
- mindspore/profiler/parser/gpu_analysis/__init__.py +14 -0
- mindspore/profiler/parser/gpu_analysis/function_event.py +44 -0
- mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +89 -0
- mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +72 -0
- mindspore/profiler/parser/memory_usage_parser.py +0 -154
- mindspore/profiler/parser/profiler_info.py +78 -6
- mindspore/profiler/profiler.py +153 -0
- mindspore/profiler/profiling.py +280 -412
- mindspore/rewrite/__init__.py +1 -2
- mindspore/rewrite/common/namespace.py +4 -4
- mindspore/rewrite/symbol_tree/symbol_tree.py +3 -3
- mindspore/run_check/_check_version.py +36 -103
- mindspore/safeguard/rewrite_obfuscation.py +591 -247
- mindspore/swresample-4.dll +0 -0
- mindspore/swscale-6.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +4 -3
- mindspore/train/_utils.py +28 -2
- mindspore/train/amp.py +171 -53
- mindspore/train/callback/__init__.py +2 -2
- mindspore/train/callback/_callback.py +4 -4
- mindspore/train/callback/_checkpoint.py +85 -22
- mindspore/train/callback/_cluster_monitor.py +1 -1
- mindspore/train/callback/_flops_collector.py +1 -0
- mindspore/train/callback/_loss_monitor.py +3 -3
- mindspore/train/callback/_on_request_exit.py +134 -31
- mindspore/train/callback/_summary_collector.py +5 -5
- mindspore/train/callback/_tft_register.py +352 -0
- mindspore/train/dataset_helper.py +7 -3
- mindspore/train/metrics/metric.py +3 -3
- mindspore/train/metrics/roc.py +4 -4
- mindspore/train/mind_ir_pb2.py +44 -39
- mindspore/train/model.py +134 -58
- mindspore/train/serialization.py +336 -112
- mindspore/turbojpeg.dll +0 -0
- mindspore/utils/__init__.py +21 -0
- mindspore/utils/utils.py +60 -0
- mindspore/version.py +1 -1
- {mindspore-2.3.0.dist-info → mindspore-2.4.0.dist-info}/METADATA +6 -2
- {mindspore-2.3.0.dist-info → mindspore-2.4.0.dist-info}/RECORD +258 -252
- mindspore/include/c_api/ms/abstract.h +0 -67
- mindspore/include/c_api/ms/attribute.h +0 -197
- mindspore/include/c_api/ms/base/handle_types.h +0 -43
- mindspore/include/c_api/ms/base/macros.h +0 -32
- mindspore/include/c_api/ms/base/status.h +0 -33
- mindspore/include/c_api/ms/base/types.h +0 -283
- mindspore/include/c_api/ms/context.h +0 -102
- mindspore/include/c_api/ms/graph.h +0 -160
- mindspore/include/c_api/ms/node.h +0 -606
- mindspore/include/c_api/ms/tensor.h +0 -161
- mindspore/include/c_api/ms/value.h +0 -84
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/nn/extend/basic.py +0 -140
- mindspore/nn/extend/embedding.py +0 -143
- mindspore/nn/extend/layer/normalization.py +0 -109
- mindspore/nn/extend/pooling.py +0 -117
- mindspore/nn/layer/embedding_service.py +0 -531
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +0 -93
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +0 -66
- mindspore/ops/extend/__init__.py +0 -53
- mindspore/ops/extend/array_func.py +0 -218
- mindspore/ops/extend/math_func.py +0 -76
- mindspore/ops/extend/nn_func.py +0 -308
- mindspore/ops/silent_check.py +0 -162
- mindspore/profiler/parser/msadvisor_analyzer.py +0 -82
- mindspore/profiler/parser/msadvisor_parser.py +0 -240
- mindspore/train/callback/_mindio_ttp.py +0 -443
- {mindspore-2.3.0.dist-info → mindspore-2.4.0.dist-info}/WHEEL +0 -0
- {mindspore-2.3.0.dist-info → mindspore-2.4.0.dist-info}/entry_points.txt +0 -0
- {mindspore-2.3.0.dist-info → mindspore-2.4.0.dist-info}/top_level.txt +0 -0
mindspore/ops/auto_generate/pyboost_inner_prim.py CHANGED

@@ -26,6 +26,8 @@ from mindspore._c_expression import BroadcastToPrim_
 from mindspore._c_expression import ConcatPrim_
 from mindspore._c_expression import ConvolutionGradPrim_
 from mindspore._c_expression import ConvolutionPrim_
+from mindspore._c_expression import CrossPrim_
+from mindspore._c_expression import CummaxPrim_
 from mindspore._c_expression import EluExtPrim_
 from mindspore._c_expression import FFNExtPrim_
 from mindspore._c_expression import FlashAttentionScoreGradPrim_
@@ -34,20 +36,30 @@ from mindspore._c_expression import GridSampler2DGradPrim_
 from mindspore._c_expression import GridSampler2DPrim_
 from mindspore._c_expression import GridSampler3DGradPrim_
 from mindspore._c_expression import GridSampler3DPrim_
+from mindspore._c_expression import HShrinkGradPrim_
+from mindspore._c_expression import HShrinkPrim_
+from mindspore._c_expression import IncreFlashAttentionPrim_
 from mindspore._c_expression import IsClosePrim_
+from mindspore._c_expression import LogSoftmaxGradPrim_
+from mindspore._c_expression import LogSoftmaxPrim_
 from mindspore._c_expression import MatMulPrim_
 from mindspore._c_expression import MaxPoolGradWithIndicesPrim_
 from mindspore._c_expression import MaxPoolGradWithMaskPrim_
 from mindspore._c_expression import MaxPoolWithIndicesPrim_
 from mindspore._c_expression import MaxPoolWithMaskPrim_
+from mindspore._c_expression import NanToNumPrim_
 from mindspore._c_expression import OneHotExtPrim_
 from mindspore._c_expression import ReduceAllPrim_
 from mindspore._c_expression import ReduceAnyPrim_
 from mindspore._c_expression import ReverseV2Prim_
 from mindspore._c_expression import RmsNormPrim_
+from mindspore._c_expression import RollPrim_
 from mindspore._c_expression import SearchSortedPrim_
 from mindspore._c_expression import SoftmaxPrim_
+from mindspore._c_expression import SoftShrinkGradPrim_
+from mindspore._c_expression import SoftShrinkPrim_
 from mindspore._c_expression import StackExtPrim_
+from mindspore._c_expression import TrilExtPrim_
 from mindspore._c_expression import TriuPrim_
 from mindspore._c_expression import UpsampleTrilinear3DGradPrim_
 from mindspore._c_expression import UpsampleTrilinear3DPrim_
@@ -94,8 +106,8 @@ batch_norm_grad_ext_impl = _PyboostBatchNormGradExtPrim()
 
 class _PyboostBinaryCrossEntropyGradPrim(BinaryCrossEntropyGradPrim_):
     def __call__(self, input, target, grad_output, weight, reduction):
-        converted_reduction = str_to_enum(reduction)
-        return _convert_stub(super().__call__(input, target, grad_output, weight,
+        converted_reduction = str_to_enum('binary_cross_entropy_grad', 'reduction', reduction)
+        return _convert_stub(super().__call__(input, target, grad_output, weight, converted_reduction))
 
 
 binary_cross_entropy_grad_impl = _PyboostBinaryCrossEntropyGradPrim()
@@ -103,8 +115,8 @@ binary_cross_entropy_grad_impl = _PyboostBinaryCrossEntropyGradPrim()
 
 class _PyboostBinaryCrossEntropyPrim(BinaryCrossEntropyPrim_):
     def __call__(self, input, target, weight, reduction):
-        converted_reduction = str_to_enum(reduction)
-        return _convert_stub(super().__call__(input, target, weight,
+        converted_reduction = str_to_enum('binary_cross_entropy', 'reduction', reduction)
+        return _convert_stub(super().__call__(input, target, weight, converted_reduction))
 
 
 binary_cross_entropy_impl = _PyboostBinaryCrossEntropyPrim()
@@ -112,8 +124,8 @@ binary_cross_entropy_impl = _PyboostBinaryCrossEntropyPrim()
 
 class _PyboostBCEWithLogitsLossPrim(BCEWithLogitsLossPrim_):
     def __call__(self, input, target, weight, posWeight, reduction):
-        converted_reduction = str_to_enum(reduction)
-        return _convert_stub(super().__call__(input, target, weight, posWeight,
+        converted_reduction = str_to_enum('binary_cross_entropy_with_logits', 'reduction', reduction)
+        return _convert_stub(super().__call__(input, target, weight, posWeight, converted_reduction))
 
 
 binary_cross_entropy_with_logits_impl = _PyboostBCEWithLogitsLossPrim()
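A pattern worth calling out across these generated wrappers: every converter call (str_to_enum here, and the shape converters further down) now receives the operator name and the argument name ahead of the value, plausibly so that conversion failures can name the offending operator and argument. A minimal sketch of the idea, with a hypothetical one-enum table rather than MindSpore's real helper:

    # Hypothetical sketch of the new converter convention, not MindSpore's
    # implementation: the op and argument names make the error message precise.
    _REDUCTION_ENUM = {'none': 0, 'mean': 1, 'sum': 2}

    def str_to_enum(op_name, arg_name, value):
        try:
            return _REDUCTION_ENUM[value]
        except KeyError:
            raise ValueError(f"For '{op_name}', the value of '{arg_name}' must be one of "
                             f"{list(_REDUCTION_ENUM)}, but got '{value}'.") from None

    print(str_to_enum('binary_cross_entropy', 'reduction', 'mean'))  # 1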
@@ -139,11 +151,11 @@ concat_impl = _PyboostConcatPrim()
 
 class _PyboostConvolutionGradPrim(ConvolutionGradPrim_):
     def __call__(self, dout, input, weight, bias, stride, padding, dilation, transposed, output_padding, groups, output_mask):
-        converted_stride = to_strides(stride)
-        converted_padding = to_2d_paddings(padding)
-        converted_dilation = to_dilations(dilation)
-        converted_output_padding = to_output_padding(output_padding)
-        return _convert_stub(super().__call__(dout, input, weight, bias,
+        converted_stride = to_strides('convolution_grad', 'stride', stride)
+        converted_padding = to_2d_paddings('convolution_grad', 'padding', padding)
+        converted_dilation = to_dilations('convolution_grad', 'dilation', dilation)
+        converted_output_padding = to_output_padding('convolution_grad', 'output_padding', output_padding)
+        return _convert_stub(super().__call__(dout, input, weight, bias, converted_stride, converted_padding, converted_dilation, transposed, converted_output_padding, groups, output_mask))
 
 
 convolution_grad_impl = _PyboostConvolutionGradPrim()
@@ -151,16 +163,34 @@ convolution_grad_impl = _PyboostConvolutionGradPrim()
 
 class _PyboostConvolutionPrim(ConvolutionPrim_):
     def __call__(self, input, weight, bias, stride, padding, dilation, transposed, output_padding, groups):
-        converted_stride = to_strides(stride)
-        converted_padding = to_2d_paddings(padding)
-        converted_dilation = to_dilations(dilation)
-        converted_output_padding = to_output_padding(output_padding)
-        return _convert_stub(super().__call__(input, weight, bias,
+        converted_stride = to_strides('convolution', 'stride', stride)
+        converted_padding = to_2d_paddings('convolution', 'padding', padding)
+        converted_dilation = to_dilations('convolution', 'dilation', dilation)
+        converted_output_padding = to_output_padding('convolution', 'output_padding', output_padding)
+        return _convert_stub(super().__call__(input, weight, bias, converted_stride, converted_padding, converted_dilation, transposed, converted_output_padding, groups))
 
 
 convolution_impl = _PyboostConvolutionPrim()
 
 
+class _PyboostCrossPrim(CrossPrim_):
+    def __call__(self, input, other, dim):
+
+        return _convert_stub(super().__call__(input, other, dim))
+
+
+cross_impl = _PyboostCrossPrim()
+
+
+class _PyboostCummaxPrim(CummaxPrim_):
+    def __call__(self, input, axis):
+
+        return _convert_stub(super().__call__(input, axis))
+
+
+cummax_impl = _PyboostCummaxPrim()
+
+
 class _PyboostEluExtPrim(EluExtPrim_):
     def __call__(self, input, alpha):
 
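The geometry converters change the same way: to_strides, to_2d_paddings, to_dilations, and to_output_padding all gain the leading op-name and arg-name parameters. A hedged sketch of what such a normalizer can look like (illustrative behaviour, assumed rather than taken from MindSpore):

    # Illustrative normalizer only; the real to_strides lives in MindSpore's
    # generated helpers and may differ.
    def to_strides(op_name, arg_name, value):
        if isinstance(value, int):
            return (value, value)            # broadcast a scalar stride
        if isinstance(value, (tuple, list)) and all(isinstance(v, int) for v in value):
            return tuple(value)              # pass sequences through as tuples
        raise TypeError(f"For '{op_name}', '{arg_name}' must be an int or a "
                        f"sequence of ints, but got {value!r}.")

    print(to_strides('convolution', 'stride', 2))       # (2, 2)
    print(to_strides('convolution', 'stride', (1, 2)))  # (1, 2)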
@@ -172,8 +202,8 @@ elu_ext_impl = _PyboostEluExtPrim()
 
 class _PyboostFFNExtPrim(FFNExtPrim_):
     def __call__(self, x, weight1, weight2, expertTokens, bias1, bias2, scale, offset, deqScale1, deqScale2, antiquant_scale1, antiquant_scale2, antiquant_offset1, antiquant_offset2, activation, inner_precise):
-        converted_activation = str_to_enum(activation)
-        return _convert_stub(super().__call__(x, weight1, weight2, expertTokens, bias1, bias2, scale, offset, deqScale1, deqScale2, antiquant_scale1, antiquant_scale2, antiquant_offset1, antiquant_offset2,
+        converted_activation = str_to_enum('ffn_ext', 'activation', activation)
+        return _convert_stub(super().__call__(x, weight1, weight2, expertTokens, bias1, bias2, scale, offset, deqScale1, deqScale2, antiquant_scale1, antiquant_scale2, antiquant_offset1, antiquant_offset2, converted_activation, inner_precise))
 
 
 ffn_ext_impl = _PyboostFFNExtPrim()
@@ -181,8 +211,8 @@ ffn_ext_impl = _PyboostFFNExtPrim()
 
 class _PyboostFlashAttentionScoreGradPrim(FlashAttentionScoreGradPrim_):
     def __call__(self, query, key, value, dy, pse_shift, drop_mask, padding_mask, atten_mask, softmax_max, softmax_sum, softmax_in, attention_in, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise, input_layout, sparse_mode):
-        converted_input_layout = str_to_enum(input_layout)
-        return _convert_stub(super().__call__(query, key, value, dy, pse_shift, drop_mask, padding_mask, atten_mask, softmax_max, softmax_sum, softmax_in, attention_in, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise,
+        converted_input_layout = str_to_enum('flash_attention_score_grad', 'input_layout', input_layout)
+        return _convert_stub(super().__call__(query, key, value, dy, pse_shift, drop_mask, padding_mask, atten_mask, softmax_max, softmax_sum, softmax_in, attention_in, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise, converted_input_layout, sparse_mode))
 
 
 flash_attention_score_grad_impl = _PyboostFlashAttentionScoreGradPrim()
@@ -190,8 +220,8 @@ flash_attention_score_grad_impl = _PyboostFlashAttentionScoreGradPrim()
 
 class _PyboostFlashAttentionScorePrim(FlashAttentionScorePrim_):
     def __call__(self, query, key, value, real_shift, drop_mask, padding_mask, attn_mask, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise, input_layout, sparse_mode):
-        converted_input_layout = str_to_enum(input_layout)
-        return _convert_stub(super().__call__(query, key, value, real_shift, drop_mask, padding_mask, attn_mask, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise,
+        converted_input_layout = str_to_enum('flash_attention_score', 'input_layout', input_layout)
+        return _convert_stub(super().__call__(query, key, value, real_shift, drop_mask, padding_mask, attn_mask, prefix, actual_seq_qlen, actual_seq_kvlen, head_num, keep_prob, scale_value, pre_tokens, next_tokens, inner_precise, converted_input_layout, sparse_mode))
 
 
 flash_attention_score_impl = _PyboostFlashAttentionScorePrim()
@@ -199,9 +229,9 @@ flash_attention_score_impl = _PyboostFlashAttentionScorePrim()
 
 class _PyboostGridSampler2DGradPrim(GridSampler2DGradPrim_):
     def __call__(self, grad, input_x, grid, interpolation_mode, padding_mode, align_corners):
-        converted_interpolation_mode = str_to_enum(interpolation_mode)
-        converted_padding_mode = str_to_enum(padding_mode)
-        return _convert_stub(super().__call__(grad, input_x, grid,
+        converted_interpolation_mode = str_to_enum('grid_sampler_2d_grad', 'interpolation_mode', interpolation_mode)
+        converted_padding_mode = str_to_enum('grid_sampler_2d_grad', 'padding_mode', padding_mode)
+        return _convert_stub(super().__call__(grad, input_x, grid, converted_interpolation_mode, converted_padding_mode, align_corners))
 
 
 grid_sampler_2d_grad_impl = _PyboostGridSampler2DGradPrim()
@@ -209,9 +239,9 @@ grid_sampler_2d_grad_impl = _PyboostGridSampler2DGradPrim()
 
 class _PyboostGridSampler2DPrim(GridSampler2DPrim_):
     def __call__(self, input_x, grid, interpolation_mode, padding_mode, align_corners):
-        converted_interpolation_mode = str_to_enum(interpolation_mode)
-        converted_padding_mode = str_to_enum(padding_mode)
-        return _convert_stub(super().__call__(input_x, grid,
+        converted_interpolation_mode = str_to_enum('grid_sampler_2d', 'interpolation_mode', interpolation_mode)
+        converted_padding_mode = str_to_enum('grid_sampler_2d', 'padding_mode', padding_mode)
+        return _convert_stub(super().__call__(input_x, grid, converted_interpolation_mode, converted_padding_mode, align_corners))
 
 
 grid_sampler_2d_impl = _PyboostGridSampler2DPrim()
@@ -219,9 +249,9 @@ grid_sampler_2d_impl = _PyboostGridSampler2DPrim()
 
 class _PyboostGridSampler3DGradPrim(GridSampler3DGradPrim_):
     def __call__(self, grad, input_x, grid, interpolation_mode, padding_mode, align_corners):
-        converted_interpolation_mode = str_to_enum(interpolation_mode)
-        converted_padding_mode = str_to_enum(padding_mode)
-        return _convert_stub(super().__call__(grad, input_x, grid,
+        converted_interpolation_mode = str_to_enum('grid_sampler_3d_grad', 'interpolation_mode', interpolation_mode)
+        converted_padding_mode = str_to_enum('grid_sampler_3d_grad', 'padding_mode', padding_mode)
+        return _convert_stub(super().__call__(grad, input_x, grid, converted_interpolation_mode, converted_padding_mode, align_corners))
 
 
 grid_sampler_3d_grad_impl = _PyboostGridSampler3DGradPrim()
@@ -229,14 +259,41 @@ grid_sampler_3d_grad_impl = _PyboostGridSampler3DGradPrim()
 
 class _PyboostGridSampler3DPrim(GridSampler3DPrim_):
     def __call__(self, input_x, grid, interpolation_mode, padding_mode, align_corners):
-        converted_interpolation_mode = str_to_enum(interpolation_mode)
-        converted_padding_mode = str_to_enum(padding_mode)
-        return _convert_stub(super().__call__(input_x, grid,
+        converted_interpolation_mode = str_to_enum('grid_sampler_3d', 'interpolation_mode', interpolation_mode)
+        converted_padding_mode = str_to_enum('grid_sampler_3d', 'padding_mode', padding_mode)
+        return _convert_stub(super().__call__(input_x, grid, converted_interpolation_mode, converted_padding_mode, align_corners))
 
 
 grid_sampler_3d_impl = _PyboostGridSampler3DPrim()
 
 
+class _PyboostHShrinkGradPrim(HShrinkGradPrim_):
+    def __call__(self, gradients, features, lambd):
+
+        return _convert_stub(super().__call__(gradients, features, lambd))
+
+
+hshrink_grad_impl = _PyboostHShrinkGradPrim()
+
+
+class _PyboostHShrinkPrim(HShrinkPrim_):
+    def __call__(self, input, lambd):
+
+        return _convert_stub(super().__call__(input, lambd))
+
+
+hshrink_impl = _PyboostHShrinkPrim()
+
+
+class _PyboostIncreFlashAttentionPrim(IncreFlashAttentionPrim_):
+    def __call__(self, query, key, value, attn_mask, actual_seq_lengths, pse_shift, dequant_scale1, quant_scale1, dequant_scale2, quant_scale2, quant_offset2, antiquant_scale, antiquant_offset, block_table, kv_padding_size, num_heads, input_layout, scale_value, num_key_value_heads, block_size, inner_precise):
+        converted_input_layout = str_to_enum('incre_flash_attention', 'input_layout', input_layout)
+        return _convert_stub(super().__call__(query, key, value, attn_mask, actual_seq_lengths, pse_shift, dequant_scale1, quant_scale1, dequant_scale2, quant_scale2, quant_offset2, antiquant_scale, antiquant_offset, block_table, kv_padding_size, num_heads, converted_input_layout, scale_value, num_key_value_heads, block_size, inner_precise))
+
+
+incre_flash_attention_impl = _PyboostIncreFlashAttentionPrim()
+
+
 class _PyboostIsClosePrim(IsClosePrim_):
     def __call__(self, input, other, rtol, atol, equal_nan):
 
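All of the newly added wrappers (Cross, Cummax, HShrink, SoftShrink, NanToNum, Roll, TrilExt, LogSoftmax, and so on) share one generated shape: a thin Python subclass of a compiled primitive whose __call__ forwards straight to the C++ kernel and wraps the result. A runnable mock-up of that shape with stand-in stubs, since the real base classes come from the compiled mindspore._c_expression module:

    class HShrinkPrim_:
        # Stand-in for the compiled primitive exported by mindspore._c_expression.
        def __call__(self, *args):
            return ('HShrink', args)

    def _convert_stub(out):
        # Stand-in for the real stub-tensor conversion helper.
        return out

    class _PyboostHShrinkPrim(HShrinkPrim_):
        def __call__(self, input, lambd):
            return _convert_stub(super().__call__(input, lambd))

    hshrink_impl = _PyboostHShrinkPrim()
    print(hshrink_impl([1.0, -0.2, 0.7], 0.5))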
@@ -246,6 +303,24 @@ class _PyboostIsClosePrim(IsClosePrim_):
 isclose_impl = _PyboostIsClosePrim()
 
 
+class _PyboostLogSoftmaxGradPrim(LogSoftmaxGradPrim_):
+    def __call__(self, logits, grad, axis):
+
+        return _convert_stub(super().__call__(logits, grad, axis))
+
+
+log_softmax_grad_impl = _PyboostLogSoftmaxGradPrim()
+
+
+class _PyboostLogSoftmaxPrim(LogSoftmaxPrim_):
+    def __call__(self, logits, axis):
+
+        return _convert_stub(super().__call__(logits, axis))
+
+
+log_softmax_impl = _PyboostLogSoftmaxPrim()
+
+
 class _PyboostMatMulPrim(MatMulPrim_):
     def __call__(self, input, mat2, transpose_a, transpose_b):
 
@@ -257,11 +332,11 @@ matmul_impl = _PyboostMatMulPrim()
 
 class _PyboostMaxPoolGradWithIndicesPrim(MaxPoolGradWithIndicesPrim_):
     def __call__(self, x, grad, argmax, kernel_size, strides, pads, dilation, ceil_mode, argmax_type):
-        converted_kernel_size = to_kernel_size(kernel_size)
-        converted_strides = to_strides(strides)
-        converted_pads = to_output_padding(pads)
-        converted_dilation = to_dilations(dilation)
-        return _convert_stub(super().__call__(x, grad, argmax,
+        converted_kernel_size = to_kernel_size('max_pool_grad_with_indices', 'kernel_size', kernel_size)
+        converted_strides = to_strides('max_pool_grad_with_indices', 'strides', strides)
+        converted_pads = to_output_padding('max_pool_grad_with_indices', 'pads', pads)
+        converted_dilation = to_dilations('max_pool_grad_with_indices', 'dilation', dilation)
+        return _convert_stub(super().__call__(x, grad, argmax, converted_kernel_size, converted_strides, converted_pads, converted_dilation, ceil_mode, argmax_type))
 
 
 max_pool_grad_with_indices_impl = _PyboostMaxPoolGradWithIndicesPrim()
@@ -269,11 +344,11 @@ max_pool_grad_with_indices_impl = _PyboostMaxPoolGradWithIndicesPrim()
 
 class _PyboostMaxPoolGradWithMaskPrim(MaxPoolGradWithMaskPrim_):
     def __call__(self, x, grad, mask, kernel_size, strides, pads, dilation, ceil_mode, argmax_type):
-        converted_kernel_size = to_kernel_size(kernel_size)
-        converted_strides = to_strides(strides)
-        converted_pads = to_output_padding(pads)
-        converted_dilation = to_dilations(dilation)
-        return _convert_stub(super().__call__(x, grad, mask,
+        converted_kernel_size = to_kernel_size('max_pool_grad_with_mask', 'kernel_size', kernel_size)
+        converted_strides = to_strides('max_pool_grad_with_mask', 'strides', strides)
+        converted_pads = to_output_padding('max_pool_grad_with_mask', 'pads', pads)
+        converted_dilation = to_dilations('max_pool_grad_with_mask', 'dilation', dilation)
+        return _convert_stub(super().__call__(x, grad, mask, converted_kernel_size, converted_strides, converted_pads, converted_dilation, ceil_mode, argmax_type))
 
 
 max_pool_grad_with_mask_impl = _PyboostMaxPoolGradWithMaskPrim()
@@ -281,11 +356,11 @@ max_pool_grad_with_mask_impl = _PyboostMaxPoolGradWithMaskPrim()
 
 class _PyboostMaxPoolWithIndicesPrim(MaxPoolWithIndicesPrim_):
    def __call__(self, x, kernel_size, strides, pads, dilation, ceil_mode, argmax_type):
-        converted_kernel_size = to_kernel_size(kernel_size)
-        converted_strides = to_strides(strides)
-        converted_pads = to_output_padding(pads)
-        converted_dilation = to_dilations(dilation)
-        return _convert_stub(super().__call__(x,
+        converted_kernel_size = to_kernel_size('max_pool_with_indices', 'kernel_size', kernel_size)
+        converted_strides = to_strides('max_pool_with_indices', 'strides', strides)
+        converted_pads = to_output_padding('max_pool_with_indices', 'pads', pads)
+        converted_dilation = to_dilations('max_pool_with_indices', 'dilation', dilation)
+        return _convert_stub(super().__call__(x, converted_kernel_size, converted_strides, converted_pads, converted_dilation, ceil_mode, argmax_type))
 
 
 max_pool_with_indices_impl = _PyboostMaxPoolWithIndicesPrim()
@@ -293,16 +368,25 @@ max_pool_with_indices_impl = _PyboostMaxPoolWithIndicesPrim()
 
 class _PyboostMaxPoolWithMaskPrim(MaxPoolWithMaskPrim_):
     def __call__(self, x, kernel_size, strides, pads, dilation, ceil_mode, argmax_type):
-        converted_kernel_size = to_kernel_size(kernel_size)
-        converted_strides = to_strides(strides)
-        converted_pads = to_output_padding(pads)
-        converted_dilation = to_dilations(dilation)
-        return _convert_stub(super().__call__(x,
+        converted_kernel_size = to_kernel_size('max_pool_with_mask', 'kernel_size', kernel_size)
+        converted_strides = to_strides('max_pool_with_mask', 'strides', strides)
+        converted_pads = to_output_padding('max_pool_with_mask', 'pads', pads)
+        converted_dilation = to_dilations('max_pool_with_mask', 'dilation', dilation)
+        return _convert_stub(super().__call__(x, converted_kernel_size, converted_strides, converted_pads, converted_dilation, ceil_mode, argmax_type))
 
 
 max_pool_with_mask_impl = _PyboostMaxPoolWithMaskPrim()
 
 
+class _PyboostNanToNumPrim(NanToNumPrim_):
+    def __call__(self, input, nan, posinf, neginf):
+
+        return _convert_stub(super().__call__(input, nan, posinf, neginf))
+
+
+nan_to_num_impl = _PyboostNanToNumPrim()
+
+
 class _PyboostOneHotExtPrim(OneHotExtPrim_):
     def __call__(self, tensor, num_classes, on_value, off_value, axis):
 
@@ -348,6 +432,15 @@ class _PyboostRmsNormPrim(RmsNormPrim_):
 rms_norm_impl = _PyboostRmsNormPrim()
 
 
+class _PyboostRollPrim(RollPrim_):
+    def __call__(self, input, shift, axis):
+
+        return _convert_stub(super().__call__(input, shift, axis))
+
+
+roll_impl = _PyboostRollPrim()
+
+
 class _PyboostSearchSortedPrim(SearchSortedPrim_):
     def __call__(self, sorted_sequence, values, sorter, dtype, right):
 
@@ -366,6 +459,24 @@ class _PyboostSoftmaxPrim(SoftmaxPrim_):
 softmax_impl = _PyboostSoftmaxPrim()
 
 
+class _PyboostSoftShrinkGradPrim(SoftShrinkGradPrim_):
+    def __call__(self, input_grad, input_x, lambd):
+
+        return _convert_stub(super().__call__(input_grad, input_x, lambd))
+
+
+softshrink_grad_impl = _PyboostSoftShrinkGradPrim()
+
+
+class _PyboostSoftShrinkPrim(SoftShrinkPrim_):
+    def __call__(self, input, lambd):
+
+        return _convert_stub(super().__call__(input, lambd))
+
+
+softshrink_impl = _PyboostSoftShrinkPrim()
+
+
 class _PyboostStackExtPrim(StackExtPrim_):
     def __call__(self, tensors, dim):
 
@@ -375,6 +486,15 @@ class _PyboostStackExtPrim(StackExtPrim_):
 stack_ext_impl = _PyboostStackExtPrim()
 
 
+class _PyboostTrilExtPrim(TrilExtPrim_):
+    def __call__(self, input, diagonal):
+
+        return _convert_stub(super().__call__(input, diagonal))
+
+
+tril_ext_impl = _PyboostTrilExtPrim()
+
+
 class _PyboostTriuPrim(TriuPrim_):
     def __call__(self, input, diagonal):
 
@@ -412,9 +532,9 @@ grouped_matmul_impl = _PyboostGroupedMatmulPrim()
 
 
 class _PyboostQuantBatchMatmulPrim(QuantBatchMatmulPrim_):
-    def __call__(self, x1, x2, scale, offset, bias, transpose_x1, transpose_x2, dtype):
+    def __call__(self, x1, x2, scale, offset, bias, pertokenScaleOptional, transpose_x1, transpose_x2, dtype):
 
-        return _convert_stub(super().__call__(x1, x2, scale, offset, bias, transpose_x1, transpose_x2, dtype))
+        return _convert_stub(super().__call__(x1, x2, scale, offset, bias, pertokenScaleOptional, transpose_x1, transpose_x2, dtype))
 
 
 quant_batch_matmul_impl = _PyboostQuantBatchMatmulPrim()
mindspore/ops/composite/base.py CHANGED
@@ -30,7 +30,7 @@ from mindspore._c_expression import GradOperation_, HyperMap_, Map_, MultitypeFu
     SequenceSliceGetItem_, ListSliceSetItem_, VmapOperation_, TaylorOperation_, ListPop_, \
     ListClear_, ListReverse_, ListExtend_, DictClear_, DictHasKey_, DictUpdate_, DictFromKeys_, \
     ZerosLike_, TensorIndexGetitem_, TensorIndexSetitem_, ListAdd_, DictSetItem_, \
-    HandleBoolTensor_, PreSetitemByTuple_, StarredGetItem_
+    HandleBoolTensor_, PreSetitemByTuple_, StarredGetItem_, \
     StarredUnpack_, StarredUnpackMerge_, IterConverter_, HasNext_, Next_, MSContext
 from mindspore.common import dtype as mstype
 from mindspore.common.api import jit, _pynative_executor, _wrap_func
@@ -346,9 +346,11 @@ class GradOperation(GradOperation_):
         self.grad_position = (0,)
 
     def __call__(self, fn, weights=None):
-        weights_id =
-        if
-
+        weights_id = ''
+        if context.get_context("mode") == context.GRAPH_MODE:
+            weights_id = _get_grad_weights_id(weights)
+        if self.grad_fn is not None and self.fn == fn and self.weights_id == weights_id:
+            return self.grad_fn
         grad_ = GradOperation(self.get_all, self.get_by_list, self.sens_param)
         # If calling Grad in GRAPH_MODE or calling Grad in functions decorated with 'jit', do grad in GRAPH_MODE
         # If calling Grad in pure PYNATIVE_MODE do grad in PYNATIVE_MODE
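The rewritten __call__ short-circuits: in GRAPH_MODE the cached grad function is keyed on both the forward fn and an id derived from the weights, so repeated calls with the same pair reuse the compiled grad graph instead of rebuilding it. A simplified stand-alone model of that caching (hypothetical names; _get_grad_weights_id is approximated with id()):

    class CachedGrad:
        def __init__(self):
            self.fn = None
            self.weights_id = None
            self.grad_fn = None

        def __call__(self, fn, weights=None, graph_mode=True):
            # Graph mode keys the cache on the weights identity as well.
            weights_id = str(id(weights)) if graph_mode else ''
            if self.grad_fn is not None and self.fn is fn and self.weights_id == weights_id:
                return self.grad_fn  # cache hit: reuse the compiled grad graph
            def grad_fn(*args):
                return ('grad', fn.__name__, args)  # stand-in for real compilation
            self.fn, self.weights_id, self.grad_fn = fn, weights_id, grad_fn
            return grad_fn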
@@ -374,8 +376,8 @@ class GradOperation(GradOperation_):
 
             @_wrap_func
             def after_grad(*args, **kwargs):
-                self._pynative_forward_run(fn, grad_, weights, args, kwargs)
-                out = _pynative_executor.grad(fn, grad_, weights, self.grad_position, *
+                run_args = self._pynative_forward_run(fn, grad_, weights, *args, **kwargs)
+                out = _pynative_executor.grad(fn, grad_, weights, self.grad_position, *run_args)
                 out = _grads_divided_by_device_num_if_recomputation(out)
                 return out
         else:
@@ -396,26 +398,39 @@ class GradOperation(GradOperation_):
             self.weights_id = weights_id
         return self.grad_fn
 
-    def _pynative_forward_run(self, fn, grad, weights, args, kwargs):
-        """
-
+    def _pynative_forward_run(self, fn, grad, weights, *args, **kwargs):
+        """ PyNative forward run to build grad graph. """
+        sens = None
         if self.sens_param:
-            if 'sens'
-
+            if 'sens' in kwargs.keys():
+                sens = kwargs.pop('sens')
             else:
-
-
+                # default use args last elem as sens
+                sens = args[-1]
+                args = args[:-1]
+        run_args = args
+        if kwargs:
+            run_args = args + tuple(kwargs.values())
+
+        # check run exclude sens
         if isinstance(fn, (FunctionType, MethodType)):
-            if not _pynative_executor.check_run(grad, fn, weights, None, *
+            if not _pynative_executor.check_run(grad, fn, weights, None, *run_args):
                 _pynative_executor.set_grad_flag(True)
-                _pynative_executor.new_graph(fn, *args, **
-                output = fn(*args, **
-                _pynative_executor.end_graph(fn, output, *args, **
+                _pynative_executor.new_graph(fn, *args, **kwargs)
+                output = fn(*args, **kwargs)
+                _pynative_executor.end_graph(fn, output, *args, **kwargs)
         else:
-            # Check if fn
-            if not _pynative_executor.check_run(grad, fn, weights, None, *
-
-            fn
+            # Check if fn has run already
+            if not _pynative_executor.check_run(grad, fn, weights, None, *run_args):
+                requires_grad = fn.requires_grad
+                fn.requires_grad = True
+                fn(*args, **kwargs)
+                fn.requires_grad = requires_grad
+
+        # If it has sens, keep sens as the last element
+        if sens is not None:
+            run_args += (sens,) if sens is not isinstance(run_args, tuple) else sens
+        return run_args
 
 
 class _TaylorOperation(TaylorOperation_):
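_pynative_forward_run now takes *args and **kwargs directly. It peels the sensitivity value off first (the 'sens' keyword if present, otherwise the last positional argument), flattens any remaining kwargs into the positional run_args used by check_run and grad, and re-appends sens at the end. A simplified, standalone sketch of just that argument plumbing (the tuple test is written the conventional way here):

    def split_sens(sens_param, *args, **kwargs):
        sens = None
        if sens_param:
            if 'sens' in kwargs:
                sens = kwargs.pop('sens')
            else:
                sens = args[-1]      # default: last positional argument is sens
                args = args[:-1]
        run_args = args + tuple(kwargs.values()) if kwargs else args
        if sens is not None:
            run_args += sens if isinstance(sens, tuple) else (sens,)  # sens stays last
        return run_args

    print(split_sens(True, 1, 2, 3))  # (1, 2, 3): sens=3 is peeled off and re-appended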
@@ -552,13 +567,15 @@ class _Grad(GradOperation_):
         self.weights_id = None
 
     def __call__(self, fn, weights=None, grad_position=0):
-        weights_id =
-        if
-
-
+        weights_id = ''
+        if context.get_context("mode") == context.GRAPH_MODE:
+            weights_id = _get_grad_weights_id(weights)
+        if self.grad_fn is not None and self.fn == fn and self.grad_position == grad_position and \
+                self.weights_id == weights_id:
+            return self.grad_fn
 
-        def aux_fn(*args):
-            outputs = fn(*args)
+        def aux_fn(*args, **kwargs):
+            outputs = fn(*args, **kwargs)
             if not isinstance(outputs, tuple) or len(outputs) < 2:
                 raise ValueError("When has_aux is True, origin fn requires more than one outputs.")
             res = (outputs[0],)
@@ -597,8 +614,8 @@ class _Grad(GradOperation_):
 
             @_wrap_func
             def after_grad(*args, **kwargs):
-                res = self._pynative_forward_run(fn, grad_, weights, args, kwargs)
-                out = _pynative_executor.grad(fn, grad_, weights, grad_position, *
+                run_args, res = self._pynative_forward_run(fn, grad_, weights, *args, **kwargs)
+                out = _pynative_executor.grad(fn, grad_, weights, grad_position, *run_args)
                 out = _grads_divided_by_device_num_if_recomputation(out)
                 if self.return_ids and out:
                     out = _combine_with_ids(grad_position, weights, out)
@@ -633,32 +650,49 @@ class _Grad(GradOperation_):
             self.weights_id = weights_id
         return self.grad_fn
 
-    def _pynative_forward_run(self, fn, grad, weights, args, kwargs):
-        """
-
-        outputs = ()
+    def _pynative_forward_run(self, fn, grad, weights, *args, **kwargs):
+        """ PyNative forward runs to build grad graph. """
+        sens = None
         if self.sens_param:
             if 'sens' in kwargs.keys():
-
-                new_kwargs.pop('sens')
+                sens = kwargs.pop('sens')
             else:
+                # default use args last elem as sens
+                sens = args[-1]
                 args = args[:-1]
+        run_args = args
+        if kwargs:
+            run_args = args + tuple(kwargs.values())
+
+        # check run exclude sens
+        outputs = ()
+        run_forward = False
         if isinstance(fn, (FunctionType, MethodType)):
-            if not _pynative_executor.check_run(grad, fn, weights, self.grad_position, *
+            if not _pynative_executor.check_run(grad, fn, weights, self.grad_position, *run_args):
                 _pynative_executor.set_grad_flag(True)
-                _pynative_executor.new_graph(fn, *args, **
-                outputs = fn(*args, **
-                _pynative_executor.end_graph(fn, outputs, *args, **
-
+                _pynative_executor.new_graph(fn, *args, **kwargs)
+                outputs = fn(*args, **kwargs)
+                _pynative_executor.end_graph(fn, outputs, *args, **kwargs)
+                run_forward = True
         else:
             # Check if fn has run already.
-            if not _pynative_executor.check_run(grad, fn, weights, self.grad_position, *
-
-
-
+            if not _pynative_executor.check_run(grad, fn, weights, self.grad_position, *run_args):
+                requires_grad = fn.requires_grad
+                fn.requires_grad = True
+                outputs = fn(*args, **kwargs)
+                fn.requires_grad = requires_grad
+                run_forward = True
+        # If it has sens, keep sens as the last element
+        if sens is not None:
+            run_args += (sens,) if sens is not isinstance(run_args, tuple) else sens
+
+        # Normal run grad
+        if run_forward:
+            return run_args, outputs
+
         if (self.get_value or self.has_aux) and not outputs:
-            outputs = fn(*args, **
-            return outputs
+            outputs = fn(*args, **kwargs)
+        return run_args, outputs
 
 
 class _Vmap(VmapOperation_):
@@ -806,10 +840,12 @@ class MultitypeFuncGraph(MultitypeFuncGraph_):
 
 class HyperMap(HyperMap_):
     """
-
+    HyperMap will apply the set operation to input sequences.
 
     Apply the operations to every element of the sequence or nested sequence. Different
-    from `mindspore.ops.Map`, the `HyperMap` supports to apply on nested structure.
+    from `mindspore.ops.Map`, the `HyperMap` supports to apply on nested structure. The
+    `HyperMap` also supports dynamic sequences as input, but it does not extend this
+    support to nested dynamic sequences.
 
     Args:
         ops (Union[MultitypeFuncGraph, None], optional): `ops` is the operation to apply. If `ops` is `None`,
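The docstring now states the nesting behaviour explicitly: HyperMap applies an operation element-wise over possibly nested sequences, and supports dynamic sequences only at the top level. A plain-Python analogue of the nested application, purely conceptual rather than MindSpore graph code:

    def hyper_map(fn, *seqs):
        # Recurse into nested tuples/lists element-wise; apply fn at the leaves.
        if isinstance(seqs[0], (list, tuple)):
            return type(seqs[0])(hyper_map(fn, *items) for items in zip(*seqs))
        return fn(*seqs)

    print(hyper_map(lambda a, b: a + b, (1, (2, 3)), (10, (20, 30))))  # (11, (22, 33))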
@@ -959,6 +995,7 @@ class _ListAppend(ListAppend_):
     Args:
         name (str): The name of the metafuncgraph object.
     """
+
     # `__init__` method removed entirely
     def __call__(self, *args):
         pass
mindspore/ops/composite/multitype_ops/_compile_utils.py CHANGED

@@ -483,6 +483,7 @@ def format_index_tensor(index, arg):
             index[format_idx] = F.select(index_tensor < 0, index_tensor + format_dim, index_tensor)
         return index
     index = Tensor(index)
+    format_dims = Tensor(format_dims)
     return F.select(index < 0, index + format_dims, index)
 
 
mindspore/ops/composite/multitype_ops/not_in_impl.py CHANGED

@@ -41,7 +41,7 @@ def _number_not_in_tuple(x, y):
     Returns:
         bool, if x not in y return true, x in y return false.
     """
-    if F.
+    if F.is_sequence_value_unknown(y) or not F.isconstant(x):
         return not InSequence()(x, y)
     return not const_utils.scalar_in_sequence(x, y)
 
@@ -58,7 +58,7 @@ def _number_not_in_list(x, y):
     Returns:
         bool, if x not in y return true, x in y return false.
     """
-    if F.
+    if F.is_sequence_value_unknown(y) or not F.isconstant(x):
         return not InSequence()(x, y)
     return not const_utils.scalar_in_sequence(x, y)
 
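Both not-in specializations now fall back to the runtime InSequence check whenever the sequence's value is unknown at compile time (for example a dynamic-length sequence) or x is not a compile-time constant; only fully static operands are folded by const_utils.scalar_in_sequence. A conceptual analogue of that dispatch in plain Python:

    def fold_not_in(x, y, x_is_constant, y_value_known):
        if y_value_known and x_is_constant:
            return ('const', x not in y)        # fold at "compile time"
        return ('runtime', lambda: x not in y)  # defer: InSequence analogue

    kind, value = fold_not_in(3, (1, 2), x_is_constant=True, y_value_known=True)
    print(kind, value)  # const True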