mindspore 2.7.0-cp310-cp310-win_amd64.whl → 2.7.1-cp310-cp310-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of mindspore might be problematic.
- mindspore/.commit_id +1 -1
- mindspore/__init__.py +4 -1
- mindspore/_c_dataengine.cp310-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp310-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp310-win_amd64.pyd +0 -0
- mindspore/_extends/parse/compile_config.py +24 -1
- mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +6 -2
- mindspore/_extends/parse/resources.py +1 -1
- mindspore/_extends/parse/standard_method.py +8 -1
- mindspore/_extends/parse/trope.py +2 -1
- mindspore/_extends/pijit/pijit_func_white_list.py +7 -22
- mindspore/avcodec-59.dll +0 -0
- mindspore/avdevice-59.dll +0 -0
- mindspore/avfilter-8.dll +0 -0
- mindspore/avformat-59.dll +0 -0
- mindspore/avutil-57.dll +0 -0
- mindspore/boost/base.py +29 -2
- mindspore/common/_decorator.py +3 -2
- mindspore/common/_grad_function.py +3 -1
- mindspore/common/_tensor_cpp_method.py +1 -1
- mindspore/common/_tensor_docs.py +275 -64
- mindspore/common/_utils.py +0 -44
- mindspore/common/api.py +285 -35
- mindspore/common/dump.py +7 -108
- mindspore/common/dynamic_shape/auto_dynamic_shape.py +1 -3
- mindspore/common/hook_handle.py +60 -0
- mindspore/common/jit_config.py +5 -1
- mindspore/common/jit_trace.py +27 -12
- mindspore/common/lazy_inline.py +5 -3
- mindspore/common/parameter.py +13 -107
- mindspore/common/recompute.py +4 -11
- mindspore/common/tensor.py +16 -169
- mindspore/communication/_comm_helper.py +11 -1
- mindspore/communication/comm_func.py +138 -4
- mindspore/communication/management.py +85 -1
- mindspore/config/op_info.config +0 -15
- mindspore/context.py +5 -85
- mindspore/dataset/engine/datasets.py +8 -4
- mindspore/dataset/engine/datasets_vision.py +1 -1
- mindspore/dataset/engine/validators.py +1 -15
- mindspore/dnnl.dll +0 -0
- mindspore/{experimental/llm_boost/ascend_native → graph}/__init__.py +7 -7
- mindspore/graph/custom_pass.py +55 -0
- mindspore/include/dataset/execute.h +2 -2
- mindspore/jpeg62.dll +0 -0
- mindspore/mindrecord/__init__.py +3 -3
- mindspore/mindrecord/common/exceptions.py +1 -0
- mindspore/mindrecord/config.py +1 -1
- mindspore/{parallel/mpi → mindrecord/core}/__init__.py +4 -1
- mindspore/mindrecord/{shardheader.py → core/shardheader.py} +2 -1
- mindspore/mindrecord/{shardindexgenerator.py → core/shardindexgenerator.py} +1 -1
- mindspore/mindrecord/{shardreader.py → core/shardreader.py} +2 -1
- mindspore/mindrecord/{shardsegment.py → core/shardsegment.py} +2 -2
- mindspore/mindrecord/{shardutils.py → core/shardutils.py} +1 -1
- mindspore/mindrecord/{shardwriter.py → core/shardwriter.py} +1 -1
- mindspore/mindrecord/filereader.py +4 -4
- mindspore/mindrecord/filewriter.py +5 -5
- mindspore/mindrecord/mindpage.py +2 -2
- mindspore/mindrecord/tools/cifar10.py +1 -1
- mindspore/mindrecord/tools/cifar100.py +1 -1
- mindspore/mindrecord/tools/cifar100_to_mr.py +1 -1
- mindspore/mindrecord/tools/cifar10_to_mr.py +1 -1
- mindspore/mindrecord/tools/csv_to_mr.py +1 -1
- mindspore/mindrecord/tools/imagenet_to_mr.py +1 -1
- mindspore/mindrecord/tools/mnist_to_mr.py +1 -1
- mindspore/mindrecord/tools/tfrecord_to_mr.py +1 -1
- mindspore/mindspore_backend_common.dll +0 -0
- mindspore/mindspore_backend_manager.dll +0 -0
- mindspore/mindspore_cluster.dll +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_cpu.dll +0 -0
- mindspore/mindspore_dump.dll +0 -0
- mindspore/mindspore_frontend.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_hardware_abstract.dll +0 -0
- mindspore/mindspore_memory_pool.dll +0 -0
- mindspore/mindspore_ms_backend.dll +0 -0
- mindspore/mindspore_ops.dll +0 -0
- mindspore/{mindspore_ops_host.dll → mindspore_ops_cpu.dll} +0 -0
- mindspore/mindspore_profiler.dll +0 -0
- mindspore/mindspore_pyboost.dll +0 -0
- mindspore/mindspore_pynative.dll +0 -0
- mindspore/mindspore_runtime_pipeline.dll +0 -0
- mindspore/mindspore_runtime_utils.dll +0 -0
- mindspore/mindspore_tools.dll +0 -0
- mindspore/mint/__init__.py +15 -10
- mindspore/mint/distributed/distributed.py +182 -62
- mindspore/mint/nn/__init__.py +2 -16
- mindspore/mint/nn/functional.py +4 -110
- mindspore/mint/nn/layer/__init__.py +0 -2
- mindspore/mint/nn/layer/activation.py +0 -6
- mindspore/mint/nn/layer/basic.py +0 -47
- mindspore/mint/nn/layer/conv.py +4 -4
- mindspore/mint/nn/layer/normalization.py +8 -13
- mindspore/mint/nn/layer/pooling.py +0 -4
- mindspore/nn/__init__.py +1 -3
- mindspore/nn/cell.py +16 -66
- mindspore/nn/layer/basic.py +49 -1
- mindspore/nn/layer/container.py +16 -0
- mindspore/nn/layer/embedding.py +4 -169
- mindspore/nn/layer/normalization.py +2 -1
- mindspore/nn/layer/thor_layer.py +4 -85
- mindspore/nn/optim/ada_grad.py +0 -1
- mindspore/nn/optim/adafactor.py +0 -1
- mindspore/nn/optim/adam.py +31 -124
- mindspore/nn/optim/adamax.py +0 -1
- mindspore/nn/optim/asgd.py +0 -1
- mindspore/nn/optim/ftrl.py +8 -102
- mindspore/nn/optim/lamb.py +0 -1
- mindspore/nn/optim/lars.py +0 -3
- mindspore/nn/optim/lazyadam.py +25 -218
- mindspore/nn/optim/momentum.py +5 -43
- mindspore/nn/optim/optimizer.py +6 -55
- mindspore/nn/optim/proximal_ada_grad.py +0 -1
- mindspore/nn/optim/rmsprop.py +0 -1
- mindspore/nn/optim/rprop.py +0 -1
- mindspore/nn/optim/sgd.py +0 -1
- mindspore/nn/optim/tft_wrapper.py +0 -1
- mindspore/nn/optim/thor.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +7 -8
- mindspore/nn/probability/bijector/gumbel_cdf.py +2 -2
- mindspore/nn/probability/bijector/power_transform.py +20 -21
- mindspore/nn/probability/bijector/scalar_affine.py +5 -5
- mindspore/nn/probability/bijector/softplus.py +13 -14
- mindspore/nn/wrap/grad_reducer.py +4 -74
- mindspore/numpy/array_creations.py +2 -2
- mindspore/numpy/fft.py +9 -9
- mindspore/{nn/reinforcement → onnx}/__init__.py +5 -8
- mindspore/onnx/onnx_export.py +137 -0
- mindspore/opencv_core4110.dll +0 -0
- mindspore/opencv_imgcodecs4110.dll +0 -0
- mindspore/{opencv_imgproc452.dll → opencv_imgproc4110.dll} +0 -0
- mindspore/ops/__init__.py +2 -0
- mindspore/ops/_grad_experimental/grad_comm_ops.py +38 -2
- mindspore/ops/_op_impl/aicpu/__init__.py +0 -10
- mindspore/ops/_op_impl/cpu/__init__.py +0 -5
- mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +16 -22
- mindspore/ops/auto_generate/gen_extend_func.py +2 -7
- mindspore/ops/auto_generate/gen_ops_def.py +98 -141
- mindspore/ops/auto_generate/gen_ops_prim.py +12708 -12686
- mindspore/ops/communication.py +97 -0
- mindspore/ops/composite/__init__.py +5 -2
- mindspore/ops/composite/base.py +15 -1
- mindspore/ops/composite/multitype_ops/__init__.py +3 -1
- mindspore/ops/composite/multitype_ops/_compile_utils.py +150 -8
- mindspore/ops/composite/multitype_ops/add_impl.py +7 -0
- mindspore/ops/composite/multitype_ops/mod_impl.py +27 -0
- mindspore/ops/function/__init__.py +1 -0
- mindspore/ops/function/array_func.py +14 -12
- mindspore/ops/function/comm_func.py +3883 -0
- mindspore/ops/function/debug_func.py +3 -4
- mindspore/ops/function/math_func.py +45 -54
- mindspore/ops/function/nn_func.py +75 -294
- mindspore/ops/function/random_func.py +9 -18
- mindspore/ops/functional.py +2 -0
- mindspore/ops/functional_overload.py +354 -18
- mindspore/ops/operations/__init__.py +2 -5
- mindspore/ops/operations/_custom_ops_utils.py +7 -9
- mindspore/ops/operations/_inner_ops.py +1 -38
- mindspore/ops/operations/_rl_inner_ops.py +0 -933
- mindspore/ops/operations/array_ops.py +1 -0
- mindspore/ops/operations/comm_ops.py +94 -2
- mindspore/ops/operations/custom_ops.py +228 -19
- mindspore/ops/operations/debug_ops.py +27 -29
- mindspore/ops/operations/manually_defined/ops_def.py +27 -306
- mindspore/ops/operations/nn_ops.py +2 -2
- mindspore/ops/operations/sparse_ops.py +0 -83
- mindspore/ops/primitive.py +1 -17
- mindspore/ops/tensor_method.py +72 -3
- mindspore/ops_generate/aclnn/aclnn_kernel_register_auto_cc_generator.py +5 -5
- mindspore/ops_generate/aclnn/gen_aclnn_implement.py +8 -8
- mindspore/ops_generate/api/functions_cc_generator.py +53 -4
- mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +25 -11
- mindspore/ops_generate/common/gen_constants.py +11 -10
- mindspore/ops_generate/common/op_proto.py +18 -1
- mindspore/ops_generate/common/template.py +102 -245
- mindspore/ops_generate/common/template_utils.py +212 -0
- mindspore/ops_generate/gen_custom_ops.py +69 -0
- mindspore/ops_generate/op_def/ops_def_cc_generator.py +78 -7
- mindspore/ops_generate/op_def_py/base_op_prim_py_generator.py +360 -0
- mindspore/ops_generate/op_def_py/custom_op_prim_py_generator.py +140 -0
- mindspore/ops_generate/op_def_py/op_def_py_generator.py +54 -7
- mindspore/ops_generate/op_def_py/op_prim_py_generator.py +5 -312
- mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +74 -17
- mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +22 -5
- mindspore/ops_generate/pyboost/op_template_parser.py +3 -2
- mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +21 -5
- mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +2 -2
- mindspore/ops_generate/pyboost/pyboost_functions_impl_cpp_generator.py +30 -10
- mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +10 -3
- mindspore/ops_generate/pyboost/pyboost_internal_kernel_info_adapter_generator.py +1 -1
- mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +19 -9
- mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +71 -28
- mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +10 -9
- mindspore/ops_generate/pyboost/pyboost_utils.py +27 -16
- mindspore/ops_generate/resources/yaml_loader.py +13 -0
- mindspore/ops_generate/tensor_py_cc_generator.py +2 -2
- mindspore/parallel/_cell_wrapper.py +1 -1
- mindspore/parallel/_parallel_serialization.py +1 -4
- mindspore/parallel/_utils.py +29 -6
- mindspore/parallel/checkpoint_transform.py +18 -2
- mindspore/parallel/cluster/process_entity/_api.py +24 -32
- mindspore/parallel/cluster/process_entity/_utils.py +9 -5
- mindspore/{experimental/llm_boost/atb → parallel/distributed}/__init__.py +21 -23
- mindspore/parallel/distributed/distributed_data_parallel.py +393 -0
- mindspore/parallel/distributed/flatten_grad_buffer.py +295 -0
- mindspore/parallel/strategy.py +336 -0
- mindspore/parallel/transform_safetensors.py +117 -16
- mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +3 -0
- mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +1 -1
- mindspore/profiler/common/constant.py +5 -0
- mindspore/profiler/common/file_manager.py +9 -0
- mindspore/profiler/common/msprof_cmd_tool.py +38 -2
- mindspore/profiler/common/path_manager.py +56 -24
- mindspore/profiler/common/profiler_context.py +2 -12
- mindspore/profiler/common/profiler_info.py +3 -3
- mindspore/profiler/common/profiler_path_manager.py +13 -0
- mindspore/profiler/common/util.py +30 -3
- mindspore/profiler/experimental_config.py +2 -1
- mindspore/profiler/platform/npu_profiler.py +33 -6
- mindspore/run_check/_check_version.py +108 -24
- mindspore/runtime/__init__.py +3 -2
- mindspore/runtime/executor.py +11 -3
- mindspore/runtime/memory.py +112 -0
- mindspore/swresample-4.dll +0 -0
- mindspore/swscale-6.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/{experimental/llm_boost → tools}/__init__.py +5 -5
- mindspore/tools/data_dump.py +130 -0
- mindspore/tools/sdc_detect.py +91 -0
- mindspore/tools/stress_detect.py +63 -0
- mindspore/train/__init__.py +6 -6
- mindspore/train/_utils.py +5 -18
- mindspore/train/amp.py +6 -4
- mindspore/train/callback/_checkpoint.py +0 -9
- mindspore/train/callback/_train_fault_tolerance.py +69 -18
- mindspore/train/data_sink.py +1 -5
- mindspore/train/model.py +38 -211
- mindspore/train/serialization.py +126 -387
- mindspore/turbojpeg.dll +0 -0
- mindspore/utils/__init__.py +6 -3
- mindspore/utils/dlpack.py +92 -0
- mindspore/utils/dryrun.py +1 -1
- mindspore/utils/runtime_execution_order_check.py +10 -0
- mindspore/utils/sdc_detect.py +14 -12
- mindspore/utils/stress_detect.py +43 -0
- mindspore/utils/utils.py +144 -8
- mindspore/version.py +1 -1
- {mindspore-2.7.0.dist-info → mindspore-2.7.1.dist-info}/METADATA +3 -2
- {mindspore-2.7.0.dist-info → mindspore-2.7.1.dist-info}/RECORD +254 -267
- mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +0 -210
- mindspore/experimental/llm_boost/ascend_native/llm_boost.py +0 -52
- mindspore/experimental/llm_boost/atb/boost_base.py +0 -385
- mindspore/experimental/llm_boost/atb/llama_boost.py +0 -137
- mindspore/experimental/llm_boost/atb/qwen_boost.py +0 -124
- mindspore/experimental/llm_boost/register.py +0 -130
- mindspore/experimental/llm_boost/utils.py +0 -31
- mindspore/include/OWNERS +0 -7
- mindspore/mindspore_cpu_res_manager.dll +0 -0
- mindspore/mindspore_ops_kernel_common.dll +0 -0
- mindspore/mindspore_res_manager.dll +0 -0
- mindspore/nn/optim/_dist_optimizer_registry.py +0 -111
- mindspore/nn/reinforcement/_batch_read_write.py +0 -142
- mindspore/nn/reinforcement/_tensors_queue.py +0 -152
- mindspore/nn/reinforcement/tensor_array.py +0 -145
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/ops/_op_impl/aicpu/priority_replay_buffer.py +0 -113
- mindspore/ops/_op_impl/aicpu/reservoir_replay_buffer.py +0 -96
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +0 -42
- mindspore/ops/_op_impl/cpu/buffer_append.py +0 -28
- mindspore/ops/_op_impl/cpu/buffer_get.py +0 -28
- mindspore/ops/_op_impl/cpu/buffer_sample.py +0 -28
- mindspore/ops/_op_impl/cpu/priority_replay_buffer.py +0 -42
- mindspore/ops/operations/_tensor_array.py +0 -359
- mindspore/ops/operations/rl_ops.py +0 -288
- mindspore/parallel/_offload_context.py +0 -275
- mindspore/parallel/_recovery_context.py +0 -115
- mindspore/parallel/_transformer/__init__.py +0 -35
- mindspore/parallel/_transformer/layers.py +0 -765
- mindspore/parallel/_transformer/loss.py +0 -251
- mindspore/parallel/_transformer/moe.py +0 -693
- mindspore/parallel/_transformer/op_parallel_config.py +0 -222
- mindspore/parallel/_transformer/transformer.py +0 -3124
- mindspore/parallel/mpi/_mpi_config.py +0 -116
- mindspore/train/memory_profiling_pb2.py +0 -298
- {mindspore-2.7.0.dist-info → mindspore-2.7.1.dist-info}/WHEEL +0 -0
- {mindspore-2.7.0.dist-info → mindspore-2.7.1.dist-info}/entry_points.txt +0 -0
- {mindspore-2.7.0.dist-info → mindspore-2.7.1.dist-info}/top_level.txt +0 -0
mindspore/mint/nn/functional.py
CHANGED
@@ -15,10 +15,7 @@
 """mint nn functional."""
 from __future__ import absolute_import
 import mindspore.ops as ops
-import mindspore.mint as mint
-from mindspore import log as logger
 from mindspore import _checkparam as validator
-from mindspore.ops.primitive import constexpr
 from mindspore.ops.function.nn_func import max_pool2d_ext as max_pool2d
 from mindspore.ops.functional import (
     conv_transpose2d,
@@ -55,8 +52,9 @@ from mindspore.ops.function.nn_func import relu_
 
 # 14
 from mindspore.ops.function.nn_func import dropout_ext as dropout
+from mindspore.ops.function.nn_func import dropout2d_ext as dropout2d
 # 15
-from mindspore.ops.
+from mindspore.ops.functional_overload import conv1d
 from mindspore.ops.function.nn_func import conv2d_ext as conv2d
 # 16
 from mindspore.ops.function.nn_func import log_softmax_ext as log_softmax
@@ -126,6 +124,7 @@ from mindspore.ops.auto_generate import inplace_silu
 
 # 49
 from mindspore.ops.functional import sigmoid
+from mindspore.ops.functional import inplace_sigmoid as sigmoid_
 # 50
 
 # 51
@@ -502,9 +501,6 @@ def relu6(input, inplace=False):
     .. image:: ../images/ReLU6.png
         :align: center
 
-    .. warning::
-        This is an experimental optimizer API that is subject to change.
-
     Args:
         input (Tensor): input Tensor. Dtype is in int8, int16, int32, int64, uint8, float16, float32, bfloat16.
         inplace (bool, optional): Whether to apply erasing inplace. Default: ``False``.
@@ -770,9 +766,6 @@ def smooth_l1_loss(input, target, reduction='mean', beta=1.0):
     Here :math:`\text{beta}` controls the point where the loss function changes from quadratic to linear.
     :math:`\text{beta} \geq 0` , its default value is ``1.0`` . :math:`N` is the batch size.
 
-    .. warning::
-        This is an experimental optimizer API that is subject to change.
-
     Note:
         - Arg `input` and `target` comply with the implicit type conversion rules to make the data types consistent.
          If they have different data types, the lower precision data type will be converted to relatively the
@@ -837,104 +830,6 @@ def smooth_l1_loss(input, target, reduction='mean', beta=1.0):
     return ops.function.smooth_l1_loss(input, target, beta, reduction)
 
 
-@constexpr
-def log_warning(msg):
-    """Adds warning to logger."""
-    logger.warning(msg)
-
-
-def dropout2d(input, p=0.5, training=True):
-    r"""
-    During training, randomly zeroes some channels of the input tensor with probability `p`
-    from a Bernoulli distribution (For a 4-dimensional tensor with a shape of :math:`(N, C, H, W)`,
-    the channel feature map refers to a 2-dimensional feature map with the shape of :math:`(H, W)`).
-
-    For example, the :math:`j\_th` channel of the :math:`i\_th` sample in the batched input is a to-be-processed
-    `2D` tensor input[i,j].
-    Each channel will be zeroed out independently on every forward call which based on Bernoulli distribution
-    probability `p`.
-    The parper `Dropout: A Simple Way to Prevent Neural Networks from Overfitting
-    <http://www.cs.toronto.edu/~rsalakhu/papers/srivastava14a.pdf>`_ mentioned this technology, and it is proved that
-    it can effectively reduce over fitting and prevent neuronal coadaptation.
-    For more details, refer to `Improving neural networks by preventing co-adaptation of feature detectors
-    <https://arxiv.org/pdf/1207.0580.pdf>`_ .
-
-    `dropout2d` can improve the independence between channel feature maps.
-
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
-    Args:
-        input (Tensor): A `4D` tensor with shape :math:`(N, C, H, W)`, where `N` is the batch size, `C` is the number
-            of channels, `H` is the feature height, and `W` is the feature width.
-        p (float, optional): The dropping probability of a channel, between 0 and 1, e.g. `p` = 0.8,
-            which means dropping out 80% of channels. Default: ``0.5`` .
-        training(bool, optional): If `training` is True, applying dropout, otherwise, not applying. Default: ``True`` .
-
-    Returns:
-        Tensor, output, with the same shape and data type as `input`.
-
-    Raises:
-        TypeError: If `input` is not a Tensor.
-        TypeError: If the data type of `p` is not float.
-        ValueError: If `p` is out of the range `[0.0, 1.0]`.
-
-    Supported Platforms:
-        ``Ascend``
-
-    Examples:
-        >>> import mindspore
-        >>> import numpy as np
-        >>> from mindspore import Tensor, mint
-        >>> input = Tensor(np.ones([2, 1, 2, 3]), mindspore.float32)
-        >>> output = mint.nn.functional.dropout2d(input, 0.5)
-        >>> print(output.shape)
-        (2, 1, 2, 3)
-    """
-    def dropout2d_impl_(input, p, training):
-        if p == 0 or not training or input.numel() == 0:
-            return input
-
-        if p == 1:
-            return mint.mul(input, mint.zeros((), dtype=input.dtype))
-
-        if input.ndim < 2:
-            raise ValueError(f'For dropout2d, input size after unsqueeze must be greater or equal to 2')
-
-        if ops.is_sequence_shape_unknown(input.shape):
-            input_tensor_shape = ops.TensorShape()(input)
-            nosie_tensor_shape = mint.ones_like(input_tensor_shape)
-            nosie_tensor_shape[0] = input_tensor_shape[0]
-            nosie_tensor_shape[1] = input_tensor_shape[1]
-            nosie_shape = ops.TensorToTuple()(nosie_tensor_shape)
-        else:
-            nosie_shape = input.shape[:2] + tuple(1 for _ in range(len(input.shape) - 2))
-        nosie = mint.full(nosie_shape, 1 - p, dtype=input.dtype)
-        nosie = mint.bernoulli(nosie)
-        nosie = mint.div(nosie, 1 - p)
-
-        return mint.mul(input, nosie)
-
-    validator.check_float_range(p, 0.0, 1.0, validator.INC_BOTH, "p", "dropout2d")
-    validator.check_bool(training, "training", "dropout2d")
-
-    if input.ndim not in (3, 4):
-        log_warning(f"dropout2d receviced a {input.ndim}-D input which is not recommended. Please use dropout instead.")
-
-    is_batched = input.ndim == 4
-    if not is_batched:
-        input_shape = input.shape
-        if ops.is_sequence_shape_unknown(input.shape):
-            input_shape = ops.TensorToTuple()(ops.TensorShape()(input))
-        input = input.reshape((1, *input_shape))
-        result = dropout2d_impl_(input, p, training)
-        result = result.reshape(input_shape)
-    else:
-        result = dropout2d_impl_(input, p, training)
-
-    return result
-
-
 def normalize(input, p=2.0, dim=1, eps=1e-12):
     r"""
     Perform normalization of inputs over specified dimension
@@ -1060,7 +955,6 @@ def adaptive_avg_pool3d(input, output_size):
 
     .. warning::
         For Ascend, it is only supported on Atlas A2 Training Series Products.
-        This is an experimental optimizer API that is subject to change or deletion.
 
     Args:
         input (Tensor): The input of adaptive_avg_pool3d, which is a 4D or 5D Tensor.
@@ -1265,6 +1159,7 @@ __all__ = [
 
     # 49
     'sigmoid',
+    'sigmoid_',
     # 50
 
     # 51
@@ -1402,7 +1297,6 @@ __all__ = [
     'adaptive_avg_pool2d',
 
     # 350
-    'conv1d',
 
     # 393
     'dropout2d',
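Taken together, the `mint.nn.functional` changes swap the hand-written `dropout2d` for the generated `dropout2d_ext` binding, source `conv1d` from `functional_overload`, and export an in-place `sigmoid_`. A minimal usage sketch (an illustration, not part of the diff; it assumes the public signatures are unchanged and a backend where the extension ops are available, e.g. Ascend):

    import numpy as np
    import mindspore
    from mindspore import Tensor, mint

    x = Tensor(np.ones([2, 1, 2, 3]), mindspore.float32)

    # dropout2d now binds to the generated dropout2d_ext op rather than the removed
    # pure-Python implementation; the call site itself does not change.
    out = mint.nn.functional.dropout2d(x, p=0.5)
    print(out.shape)  # (2, 1, 2, 3)

    # sigmoid_ is the newly exported alias of inplace_sigmoid.
    y = Tensor(np.array([0.5, -1.0, 2.0]), mindspore.float32)
    mint.nn.functional.sigmoid_(y)  # assumed to update y in place, like sigmoid without a copy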
mindspore/mint/nn/__init__.py
CHANGED
@@ -31,7 +31,6 @@ from mindspore.mint.nn.layer.normalization import SyncBatchNorm
 from mindspore.mint.nn.layer.activation import LogSigmoid
 from mindspore.mint.nn.layer.activation import SiLU
 from mindspore.mint.nn.layer.activation import Threshold
-from mindspore.mint.nn.layer.basic import Dropout2d
 from mindspore.mint.nn.layer.pooling import AdaptiveMaxPool1d
 from mindspore.mint.nn.layer.pooling import AdaptiveAvgPool1d
 from mindspore.mint.nn.layer.pooling import AdaptiveAvgPool2d
@@ -46,7 +45,6 @@ __all__ = [
     'LayerNorm',
     'LogSigmoid',
     'SiLU',
-    'Dropout2d',
     'AdaptiveMaxPool1d',
     'AdaptiveAvgPool1d',
     'AdaptiveAvgPool2d',
mindspore/mint/nn/layer/activation.py
CHANGED
@@ -147,9 +147,6 @@ class LogSigmoid(Cell):
     .. image:: ../images/LogSigmoid.png
         :align: center
 
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
     Inputs:
         - **input** (Tensor) - The input of LogSigmoid with data type of bfloat16, float16 or float32.
           The shape is :math:`(*)` where :math:`*` means, any number of additional dimensions.
@@ -313,9 +310,6 @@ class Tanh(Cell):
     .. image:: ../images/Tanh.png
         :align: center
 
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
     Inputs:
         - **input** (Tensor) - Tensor of any dimension, input with data type of float16 or float32.
 
mindspore/mint/nn/layer/basic.py
CHANGED
@@ -18,52 +18,6 @@ from __future__ import division
 
 from mindspore import mint
 from mindspore.nn.cell import Cell
-from mindspore import _checkparam as validator
-
-
-class Dropout2d(Cell):
-    r"""
-    During training, randomly zeroes some channels of the input tensor with probability `p`
-    from a Bernoulli distribution (For a 4-dimensional tensor with a shape of :math:`NCHW`,
-    the channel feature map refers to a 2-dimensional feature map with the shape of :math:`HW`).
-
-    For example, the :math:`j\_th` channel of the :math:`i\_th` sample in the batched input is a to-be-processed
-    `2D` tensor input[i,j].
-    Each channel will be zeroed out independently on every forward call with probability `p` using samples
-    from a Bernoulli distribution.
-
-    `Dropout2d` can improve the independence between channel feature maps.
-
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
-    Refer to :func:`mindspore.mint.nn.functional.dropout2d` for more details.
-
-    Supported Platforms:
-        ``Ascend``
-
-    Examples:
-        >>> import mindspore
-        >>> from mindspore import Tensor, mint
-        >>> import numpy as np
-        >>> dropout = mint.nn.Dropout2d(p=0.5)
-        >>> x = Tensor(np.ones([2, 1, 2, 3]), mindspore.float32)
-        >>> output = dropout(x)
-        >>> print(output.shape)
-        (2, 1, 2, 3)
-    """
-
-    def __init__(self, p=0.5):
-        """Initialize Dropout2d."""
-        super(Dropout2d, self).__init__()
-        validator.check_float_range(p, 0.0, 1.0, validator.INC_BOTH, "p", self.cls_name)
-        self.p = p
-
-    def construct(self, x):
-        if not self.training or self.p == 0:
-            return x
-
-        return mint.nn.functional.dropout2d(x, self.p)
 
 
 class Flatten(Cell):
@@ -118,6 +72,5 @@ class Flatten(Cell):
 
 
 __all__ = [
-    'Dropout2d',
     'Flatten',
 ]
mindspore/mint/nn/layer/conv.py
CHANGED
@@ -222,10 +222,10 @@ class Conv1d(_Conv):
         dtype (:class:`mindspore.dtype`, optional): Dtype of Parameters. Default: ``None``, using ``mstype.float32``.
 
     Variables:
-        - **weight** (Tensor) - The weight of the convolution layer, with shape
-
-        - **bias** (Tensor) - The bias of the convolution layer, with shape
-
+        - **weight** (Tensor) - The weight of the convolution layer, with shape
+          :math:`(C_{out}, C_{in} / \text{groups}, \text{kernel_size[0]})`.
+        - **bias** (Tensor) - The bias of the convolution layer, with shape
+          :math:`(C_{out})`. If bias is False, this will be None.
 
     Inputs:
         - **input** (Tensor) - Tensor of shape :math:`(N, C_{in}, L_{in})` \
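The Conv1d docstring now states the parameter shapes explicitly. A quick sketch of what those shapes look like in practice (illustrative only; assumes the usual `Conv1d(in_channels, out_channels, kernel_size, ...)` signature):

    from mindspore import mint

    # in_channels=4, out_channels=8, kernel_size=3, groups=2
    conv = mint.nn.Conv1d(4, 8, 3, groups=2, bias=True)

    print(conv.weight.shape)  # documented as (C_out, C_in / groups, kernel_size[0]) -> (8, 2, 3)
    print(conv.bias.shape)    # documented as (C_out,) -> (8,)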
mindspore/mint/nn/layer/normalization.py
CHANGED
@@ -37,7 +37,6 @@ class _NormBase(Cell):
                  dtype=None
     ) -> None:
         super(_NormBase, self).__init__()
-        self.set_train()
         self.shape = ops.Shape()
         self.num_features = num_features
         self.eps = eps
@@ -110,7 +109,6 @@ class _BatchNorm(_NormBase):
                  dtype=None) -> None:
         super(_BatchNorm, self).__init__(num_features, eps, momentum, affine, track_running_stats,
                                          dtype)
-        self.training = True
 
 
     def _check_input_dim(self, input):
@@ -170,7 +168,6 @@ class BatchNorm1d(_BatchNorm):
 
     .. warning::
         This API does not support Dynamic Rank.
-        This is an experimental API that is subject to change or deletion.
 
     Args:
         num_features (int): `C` from an expected input of shape :math:`(N, C, L)`.
@@ -209,8 +206,8 @@ class BatchNorm1d(_BatchNorm):
         >>> net = mint.nn.BatchNorm1d(4)
         >>> output = net(input_x)
         >>> print(output)
-        [[
-        [
+        [[0.6999965  0.4999975  0.4999975  0.59999704]
+         [0.4999975  0.399998   0.59999704 0.89999545]]
     """
 
     def _check_input_dim(self, input):
@@ -239,7 +236,6 @@ class BatchNorm2d(_BatchNorm):
 
     .. warning::
         - This API does not support Dynamic Rank.
-        - This is an experimental API that is subject to change or deletion.
 
     Args:
         num_features (int): `C` from an expected input of shape :math:`(N, C, H, W)`.
@@ -277,10 +273,10 @@ class BatchNorm2d(_BatchNorm):
         >>> net = mint.nn.BatchNorm2d(2)
         >>> output = net(input_x)
         >>> print(output)
-        [[[[
-        [[0.
-
-        [[
+        [[[[0.29999852]]
+          [[0.399998  ]]]
+         [[[0.4999975 ]]
+          [[0.29999852]]]]
     """
 
     def _check_input_dim(self, input):
@@ -309,7 +305,6 @@ class BatchNorm3d(_BatchNorm):
 
     .. warning::
         This API does not support Dynamic Rank.
-        This is an experimental API that is subject to change or deletion.
 
     Args:
         num_features (int): `C` from an expected input of shape :math:`(N, C, D, H, W)`.
@@ -347,8 +342,8 @@ class BatchNorm3d(_BatchNorm):
         >>> net = mint.nn.BatchNorm3d(2)
        >>> output = net(input_x)
         >>> print(output)
-        [[[[[
-        [[[
+        [[[[[0.0999995  0.89999545]]]
+          [[[1.1999941  2.2999885 ]]]]]
     """
 
     def _check_input_dim(self, input):
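With `self.set_train()` dropped from `_NormBase.__init__` and `self.training = True` dropped from `_BatchNorm.__init__`, the mint batch-norm layers apparently no longer force training mode at construction. A sketch of the explicit pattern this implies (an assumption drawn from the removed lines, not stated elsewhere in the diff):

    import numpy as np
    import mindspore
    from mindspore import Tensor, mint

    net = mint.nn.BatchNorm2d(2)
    x = Tensor(np.arange(8).reshape(2, 2, 1, 2), mindspore.float32)

    net.set_train(True)    # training: update running_mean / running_var from batch statistics
    _ = net(x)

    net.set_train(False)   # inference: normalize with the accumulated running statistics
    y = net(x)
    print(y.shape)         # (2, 2, 1, 2)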
mindspore/mint/nn/layer/pooling.py
CHANGED
@@ -73,9 +73,6 @@ class AdaptiveAvgPool2d(_AdaptiveAvgPoolNd):
     The output is of size :math:`H x W` , for any input size.
     The number of output features is equal to the number of input planes.
 
-    .. warning::
-        This is an experimental API that is subject to change or deletion.
-
     Args:
         output_size (Union(int, tuple[int])): the target output size of the image of the form :math:`H x W` .
             Can be a tuple :math:`(H, W)` or a single :math:`H` for square image :math:`H x H` .
@@ -129,7 +126,6 @@ class AdaptiveAvgPool3d(Cell):
 
     .. warning::
         For Ascend, it is only supported on Atlas A2 Training Series Products.
-        This is an experimental optimizer API that is subject to change or deletion.
 
     Args:
         output_size (Union[int, tuple]): The target output size. `output_size` can be a tuple :math:`(D, H, W)`,
mindspore/nn/__init__.py
CHANGED
@@ -21,7 +21,7 @@ from __future__ import absolute_import
 
 __all__ = ["Cell", "GraphCell", "PipelineGradReducer", "PipelineCell", "MicroBatchInterleaved"]
 
-from mindspore.nn import layer, loss, optim, wrap, grad, metrics, probability, sparse, dynamic_lr
+from mindspore.nn import layer, loss, optim, wrap, grad, metrics, probability, sparse, dynamic_lr
 from mindspore.parallel.nn.parallel_grad_reducer import PipelineGradReducer
 from mindspore.parallel.nn.parallel_cell_wrapper import PipelineCell, MicroBatchInterleaved
 from mindspore.nn.learning_rate_schedule import *
@@ -34,7 +34,6 @@ from mindspore.nn.metrics import *
 from mindspore.nn.wrap import *
 from mindspore.nn.grad import Jvp, Vjp
 from mindspore.nn.sparse import *
-from mindspore.nn.reinforcement import *
 from mindspore.nn.utils import *
 
 __all__.extend(layer.__all__)
@@ -46,7 +45,6 @@ __all__.extend(grad.__all__)
 __all__.extend(sparse.__all__)
 __all__.extend(learning_rate_schedule.__all__)
 __all__.extend(dynamic_lr.__all__)
-__all__.extend(reinforcement.__all__)
 __all__.extend(utils.__all__)
 
 __all__.sort()
mindspore/nn/cell.py
CHANGED
@@ -192,6 +192,7 @@ class Cell(Cell_):
         super().__setattr__("_auto_prefix", auto_prefix)
         super().__setattr__("_scope", None)
         super().__setattr__("_phase", 'train')
+        super().__setattr__("_compile_phase", None)
         super().__setattr__("_parameter_layout_dict", None)
         super().__setattr__("_parallel_parameter_name_list", None)
         super().__setattr__("_parallel_parameter_merge_net_dict", None)
@@ -493,6 +494,19 @@ class Cell(Cell_):
             raise TypeError(f"For 'Cell', the property 'phase' must be string type, but got type {type(value)}.")
         self._phase = value
 
+    @property
+    def compile_phase(self):
+        return self._compile_phase
+
+    @compile_phase.setter
+    def compile_phase(self, value):
+        if not isinstance(value, str):
+            raise TypeError(f"For 'Cell', 'compile_phase' must be string type, but got type {type(value)}.")
+        self._compile_phase = value
+        for cell in self._cells.values():
+            if cell is not None:
+                cell.compile_phase = value
+
     @property
     def parameter_layout_dict(self):
         """
@@ -1705,6 +1719,7 @@ class Cell(Cell_):
         _init_auto_parallel_context(self)
         compile_args = self._get_compile_args(args)
         self._has_mutable_args_list = _get_mutable_flags(compile_args)
+        _cell_graph_executor.set_real_args(args, kwargs)
         _cell_graph_executor.compile(self, *compile_args, phase=self.phase,
                                      jit_config_dict=self._jit_config_dict, **kwargs)
         _clear_auto_parallel_context(self)
@@ -2587,23 +2602,6 @@ class Cell(Cell_):
         else:
             self._jit_config_dict = jit_config.jit_config_dict
 
-    def flatten_weights(self, fusion_size=0):
-        """
-        Reset data for weight parameters so that they are using contiguous memory chunks grouped by data type.
-
-        Note:
-            By default, parameters with same data type will using a single contiguous memory chunk. but for
-            some models with huge number of parameters, splitting a large memory chunk into several smaller
-            memory chunks has the potential for performance gains, if this is the case, we can use 'fusion_size'
-            to limit the maximum memory chunk size.
-
-        Args:
-            fusion_size (int): Maximum memory chunk size in bytes, ``0`` for unlimited. Default: ``0`` .
-        """
-        if fusion_size < 0:
-            raise ValueError(f"Negative 'fusion_size' {fusion_size} is invalid.")
-        Tensor._flatten_tensors(self.trainable_params(), fusion_size)  # pylint: disable=W0212
-
     @jit_forbidden_register
     def register_forward_pre_hook(self, hook_fn, with_kwargs=False):
         """
@@ -3507,24 +3505,6 @@ class Cell(Cell_):
         _update_hook_version()
         return handle
 
-    def set_param_ps(self, recurse=True, init_in_server=False):
-        """
-        Set whether the trainable parameters are updated by parameter server and whether the
-        trainable parameters are initialized on server.
-
-        Note:
-            It only works when a running task is in the parameter server mode.
-            It is only supported in graph mode.
-
-        Args:
-            recurse (bool): Whether sets the trainable parameters of subcells. Default: ``True`` .
-            init_in_server (bool): Whether trainable parameters updated by parameter server are
-                initialized on server. Default: ``False`` .
-        """
-        params = self.trainable_params(recurse)
-        for param in params:
-            param.set_param_ps(init_in_server)
-
     def set_comm_fusion(self, fusion_type, recurse=True):
         """
         Set `comm_fusion` for all the parameters in this cell. Please refer to the description of
@@ -3628,8 +3608,7 @@ class Cell(Cell_):
             introduced by optimizer shard are recomputed in auto parallel or semi auto parallel mode.
             Default: ``False`` .
         """
-
-        self._recompute_cell = recompute_registry.get()(self.construct)
+        self._recompute_cell = recompute_registry.get()(self.construct)
         self._recompute()
         if 'mp_comm_recompute' in kwargs.keys():
             self._mp_comm_recompute(kwargs.get('mp_comm_recompute', False))
@@ -3646,35 +3625,6 @@ class Cell(Cell_):
                             "the key kwargs must be 'mp_comm_recompute', "
                             "'parallel_optimizer_comm_recompute', 'recompute_slice_activation'" % key)
 
-    def place(self, role, rank_id):
-        """
-        Set the label for all operators in this cell.
-        This label tells MindSpore compiler on which process this cell should be launched.
-        And each process's identical label consists of input `role` and `rank_id`.
-        So by setting different cells with different labels, which will be launched on different processes,
-        users can launch a distributed training or predicting job.
-
-        Note:
-            - This method is effective only after
-              `mindspore.communication.init()` is called for dynamic cluster building.
-
-        Args:
-            role (str): The role of the process on which this cell will be launched.
-                Only 'MS_WORKER' is supported for now.
-            rank_id (int): The rank id of the process on which this cell will be launched.
-                The rank is unique in processes with the same role.
-
-        Examples:
-            >>> from mindspore import context
-            >>> import mindspore.nn as nn
-            >>> context.set_context(mode=context.GRAPH_MODE)
-            >>> fc = nn.Dense(2, 3)
-            >>> fc.place('MS_WORKER', 0)
-        """
-        all_ops = self._get_prims_recursively()
-        for op in all_ops:
-            op.place(role, rank_id)
-
     def _get_attr_from_cell(self, network):
         if not isinstance(network, Cell):
             return
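The new `compile_phase` property validates its value and then pushes the same string into every child cell, so setting it once on the outermost network tags the whole cell tree. A small sketch of that propagation (illustrative; the diff does not document which phase strings are expected):

    import mindspore.nn as nn

    class Net(nn.Cell):
        def __init__(self):
            super().__init__()
            self.block = nn.SequentialCell([nn.Dense(4, 8), nn.ReLU()])
            self.head = nn.Dense(8, 2)

        def construct(self, x):
            return self.head(self.block(x))

    net = Net()
    net.compile_phase = "train"   # setter walks self._cells recursively
    print(net.block.compile_phase, net.head.compile_phase)  # train train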
mindspore/nn/layer/basic.py
CHANGED
@@ -38,7 +38,7 @@ from mindspore.common.generator import default_generator
 
 __all__ = ['Dropout', 'Flatten', 'Dense', 'Linear', 'ClipByNorm', 'Norm', 'OneHot', 'Pad', 'Unfold', 'Tril', 'Triu',
            'MatrixDiag', 'MatrixDiagPart', 'MatrixSetDiag', 'L1Regularizer', 'Dropout1d',
-           'Dropout2d', 'Dropout3d', 'Upsample', 'Roll', 'Identity', 'Unflatten', 'DropoutExt']
+           'Dropout2d', 'Dropout3d', 'Upsample', 'Roll', 'Identity', 'Unflatten', 'DropoutExt', 'Dropout2dExt']
 
 
 class L1Regularizer(Cell):
@@ -382,6 +382,54 @@ class Dropout2d(Cell):
         return f"p={self.keep_prob}"
 
 
+class Dropout2dExt(Cell):
+    r"""
+    During training, randomly zeroes some channels of the input tensor with probability `p`
+    from a Bernoulli distribution (For a 4-dimensional tensor with a shape of :math:`NCHW`,
+    the channel feature map refers to a 2-dimensional feature map with the shape of :math:`HW`).
+
+    For example, the :math:`j\_th` channel of the :math:`i\_th` sample in the batched input is a to-be-processed
+    `2D` tensor input[i,j].
+    Each channel will be zeroed out independently on every forward call with probability `p` using samples
+    from a Bernoulli distribution.
+
+    `Dropout2d` can improve the independence between channel feature maps.
+
+    .. warning::
+        This is an experimental API that is subject to change or deletion.
+
+    Refer to :func:`mindspore.mint.nn.functional.dropout2d` for more details.
+
+    Supported Platforms:
+        ``Ascend``
+
+    Examples:
+        >>> import mindspore
+        >>> from mindspore import Tensor, mint
+        >>> import numpy as np
+        >>> dropout = mint.nn.Dropout2d(p=0.5)
+        >>> x = Tensor(np.ones([2, 1, 2, 3]), mindspore.float32)
+        >>> output = dropout(x)
+        >>> print(output.shape)
+        (2, 1, 2, 3)
+    """
+
+    def __init__(self, p=0.5, inplace=False):
+        """Initialize Dropout2d."""
+        super(Dropout2dExt, self).__init__()
+        self.p = p
+        self.inplace = inplace
+        self.generator_step = Tensor(12, mstype.int64)
+
+    def construct(self, input):
+        if not self.training or self.p == 0:
+            return input
+
+        seed, offset = default_generator._step(self.generator_step)  # pylint: disable=protected-access
+        return ops.auto_generate.dropout2d_ext_op(input, self.p, self.training, self.inplace, seed, offset)
+
+
 class Dropout3d(Cell):
     r"""
     During training, randomly zeroes some channels of the input tensor
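`Dropout2dExt` is a thin wrapper over the generated `dropout2d_ext_op`, drawing `seed`/`offset` from the default generator on each call. A minimal usage sketch (assuming it is re-exported from `mindspore.nn` like the other names added to `__all__`):

    import numpy as np
    import mindspore
    from mindspore import Tensor, nn

    dropout = nn.Dropout2dExt(p=0.5)
    dropout.set_train(True)   # construct() returns the input unchanged when not training or p == 0

    x = Tensor(np.ones([2, 1, 2, 3]), mindspore.float32)
    out = dropout(x)
    print(out.shape)  # (2, 1, 2, 3)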
mindspore/nn/layer/container.py
CHANGED
@@ -247,6 +247,14 @@ class SequentialCell(Cell):
         self._cells = temp_dict
         self.cell_list = list(self._cells.values())
 
+    def __setattr__(self, name, value):
+        from mindspore.common.recompute import _RecomputeCell
+        if isinstance(value, _RecomputeCell):
+            # RecomputeCell should not be executed
+            object.__setattr__(self, name, value)
+        else:
+            super().__setattr__(name, value)
+
     def __bool__(self):
         return len(self._cells) != 0
 
@@ -594,6 +602,14 @@ class CellDict(_CellDictBase, Cell):
     def __delitem__(self, key):
         del self._cells[key]
 
+    def __setattr__(self, name, value):
+        from mindspore.common.recompute import _RecomputeCell
+        if isinstance(value, _RecomputeCell):
+            # RecomputeCell should not be executed
+            object.__setattr__(self, name, value)
+        else:
+            super().__setattr__(name, value)
+
     def __len__(self):
         return len(self._cells)
 
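Both containers gain the same guard: an attribute whose value is a `_RecomputeCell` is stored with plain `object.__setattr__`, bypassing `Cell.__setattr__`, so it is never registered in `_cells` and never executed as a child of the container. The pattern in isolation, as a standalone illustration rather than MindSpore code:

    class Helper:
        """Stands in for _RecomputeCell: attached to the container but not registered as a child."""


    class Container:
        def __init__(self):
            object.__setattr__(self, "_cells", {})  # registered children live here

        def __setattr__(self, name, value):
            if isinstance(value, Helper):
                # store the helper directly on the instance; skip child registration
                object.__setattr__(self, name, value)
            else:
                self._cells[name] = value             # normal attributes are registered
                object.__setattr__(self, name, value)


    c = Container()
    c.helper = Helper()
    c.child = "an ordinary child"
    print(list(c._cells))  # ['child'] -- the helper was not registered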